diff --git "a/wandb/run-20220301_082052-1y1by2yf/files/wandb-summary.json" "b/wandb/run-20220301_082052-1y1by2yf/files/wandb-summary.json" --- "a/wandb/run-20220301_082052-1y1by2yf/files/wandb-summary.json" +++ "b/wandb/run-20220301_082052-1y1by2yf/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.3516, "train/learning_rate": 1.741654571843251e-07, "train/epoch": 1.0, "train/global_step": 1189, "_runtime": 6714, "_timestamp": 1646129566, "_step": 1191, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 28.0, 680.0, 301.0, 7.0, 1.0], "bins": [-571.5680541992188, -562.168701171875, -552.7693481445312, -543.3699951171875, -533.9706420898438, -524.5712890625, -515.171875, -505.7725524902344, -496.3731689453125, -486.97381591796875, -477.574462890625, -468.1750793457031, -458.7757263183594, -449.3763732910156, -439.9770202636719, -430.5776672363281, -421.1783142089844, -411.7789611816406, -402.3796081542969, -392.980224609375, -383.58087158203125, -374.1815185546875, -364.78216552734375, -355.3828125, -345.98345947265625, -336.5841064453125, -327.18475341796875, -317.7853698730469, -308.3860168457031, -298.9866638183594, -289.5873107910156, -280.1879577636719, -270.78857421875, -261.38922119140625, -251.98985290527344, -242.5904998779297, -233.19113159179688, -223.79177856445312, -214.39242553710938, -204.99307250976562, -195.59368896484375, -186.1943359375, -176.7949676513672, -167.39561462402344, -157.99624633789062, -148.59689331054688, -139.19754028320312, -129.79818725585938, -120.3988265991211, -110.99946594238281, -101.60011291503906, -92.20075225830078, -82.8013916015625, -73.40203094482422, -64.00267028808594, -54.60331726074219, -45.203956604003906, -35.804595947265625, -26.40523910522461, -17.00588035583496, -7.6065216064453125, 1.7928390502929688, 11.192195892333984, 20.591552734375, 29.990915298461914]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 5.0, 3.0, 8.0, 7.0, 9.0, 13.0, 12.0, 15.0, 26.0, 23.0, 30.0, 20.0, 28.0, 43.0, 47.0, 31.0, 42.0, 57.0, 39.0, 53.0, 49.0, 51.0, 40.0, 54.0, 45.0, 24.0, 26.0, 34.0, 19.0, 30.0, 12.0, 17.0, 17.0, 10.0, 11.0, 16.0, 11.0, 7.0, 5.0, 4.0, 0.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.36842346191406, -51.56277847290039, -49.75713348388672, -47.95148849487305, -46.145843505859375, -44.3401985168457, -42.53455352783203, -40.728904724121094, -38.92326354980469, -37.117618560791016, -35.311973571777344, -33.50632858276367, -31.70068359375, -29.895038604736328, -28.089391708374023, -26.28374671936035, -24.478099822998047, -22.672454833984375, -20.866809844970703, -19.06116485595703, -17.25551986694336, -15.449873924255371, -13.644227981567383, -11.838582992553711, -10.032938003540039, -8.227293014526367, -6.421647548675537, -4.616002082824707, -2.810357093811035, -1.0047121047973633, 0.800933837890625, 2.606578826904297, 4.412223815917969, 6.217868804931641, 8.023513793945312, 9.8291597366333, 11.634804725646973, 13.440449714660645, 15.246095657348633, 17.051740646362305, 18.857385635375977, 20.66303062438965, 22.46867561340332, 24.274322509765625, 26.079967498779297, 27.88561248779297, 29.69125747680664, 31.496902465820312, 33.302547454833984, 35.108192443847656, 36.91383743286133, 38.719482421875, 40.52512741088867, 42.330772399902344, 44.13642120361328, 45.94206237792969, 47.747711181640625, 49.5533561706543, 51.35900115966797, 53.16464614868164, 54.97029113769531, 56.775936126708984, 58.581581115722656, 60.387229919433594, 62.19287109375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 10.0, 10.0, 15.0, 17.0, 27.0, 42.0, 51.0, 54.0, 68.0, 81.0, 76.0, 97.0, 91.0, 87.0, 69.0, 55.0, 35.0, 38.0, 23.0, 26.0, 15.0, 9.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.70703125, -7.525390625, -7.34375, -7.162109375, -6.98046875, -6.798828125, -6.6171875, -6.435546875, -6.25390625, -6.072265625, -5.890625, -5.708984375, -5.52734375, -5.345703125, -5.1640625, -4.982421875, -4.80078125, -4.619140625, -4.4375, -4.255859375, -4.07421875, -3.892578125, -3.7109375, -3.529296875, -3.34765625, -3.166015625, -2.984375, -2.802734375, -2.62109375, -2.439453125, -2.2578125, -2.076171875, -1.89453125, -1.712890625, -1.53125, -1.349609375, -1.16796875, -0.986328125, -0.8046875, -0.623046875, -0.44140625, -0.259765625, -0.078125, 0.103515625, 0.28515625, 0.466796875, 0.6484375, 0.830078125, 1.01171875, 1.193359375, 1.375, 1.556640625, 1.73828125, 1.919921875, 2.1015625, 2.283203125, 2.46484375, 2.646484375, 2.828125, 3.009765625, 3.19140625, 3.373046875, 3.5546875, 3.736328125, 3.91796875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 7.0, 11.0, 15.0, 14.0, 26.0, 39.0, 78.0, 114.0, 244.0, 480.0, 1043.0, 2971.0, 12037.0, 112525.0, 3599716.0, 434632.0, 22931.0, 4657.0, 1478.0, 619.0, 279.0, 145.0, 78.0, 56.0, 39.0, 21.0, 15.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.484375, -25.833251953125, -25.18212890625, -24.531005859375, -23.8798828125, -23.228759765625, -22.57763671875, -21.926513671875, -21.275390625, -20.624267578125, -19.97314453125, -19.322021484375, -18.6708984375, -18.019775390625, -17.36865234375, -16.717529296875, -16.06640625, -15.415283203125, -14.76416015625, -14.113037109375, -13.4619140625, -12.810791015625, -12.15966796875, -11.508544921875, -10.857421875, -10.206298828125, -9.55517578125, -8.904052734375, -8.2529296875, -7.601806640625, -6.95068359375, -6.299560546875, -5.6484375, -4.997314453125, -4.34619140625, -3.695068359375, -3.0439453125, -2.392822265625, -1.74169921875, -1.090576171875, -0.439453125, 0.211669921875, 0.86279296875, 1.513916015625, 2.1650390625, 2.816162109375, 3.46728515625, 4.118408203125, 4.76953125, 5.420654296875, 6.07177734375, 6.722900390625, 7.3740234375, 8.025146484375, 8.67626953125, 9.327392578125, 9.978515625, 10.629638671875, 11.28076171875, 11.931884765625, 12.5830078125, 13.234130859375, 13.88525390625, 14.536376953125, 15.1875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 11.0, 8.0, 15.0, 24.0, 39.0, 64.0, 102.0, 186.0, 303.0, 565.0, 924.0, 785.0, 450.0, 247.0, 140.0, 85.0, 46.0, 33.0, 16.0, 11.0, 6.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.0625, -25.4390869140625, -24.815673828125, -24.1922607421875, -23.56884765625, -22.9454345703125, -22.322021484375, -21.6986083984375, -21.0751953125, -20.4517822265625, -19.828369140625, -19.2049560546875, -18.58154296875, -17.9581298828125, -17.334716796875, -16.7113037109375, -16.087890625, -15.4644775390625, -14.841064453125, -14.2176513671875, -13.59423828125, -12.9708251953125, -12.347412109375, -11.7239990234375, -11.1005859375, -10.4771728515625, -9.853759765625, -9.2303466796875, -8.60693359375, -7.9835205078125, -7.360107421875, -6.7366943359375, -6.11328125, -5.4898681640625, -4.866455078125, -4.2430419921875, -3.61962890625, -2.9962158203125, -2.372802734375, -1.7493896484375, -1.1259765625, -0.5025634765625, 0.120849609375, 0.7442626953125, 1.36767578125, 1.9910888671875, 2.614501953125, 3.2379150390625, 3.861328125, 4.4847412109375, 5.108154296875, 5.7315673828125, 6.35498046875, 6.9783935546875, 7.601806640625, 8.2252197265625, 8.8486328125, 9.4720458984375, 10.095458984375, 10.7188720703125, 11.34228515625, 11.9656982421875, 12.589111328125, 13.2125244140625, 13.8359375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 6.0, 14.0, 17.0, 51.0, 73.0, 166.0, 392.0, 1072.0, 4721.0, 3545464.0, 637411.0, 3411.0, 864.0, 309.0, 133.0, 72.0, 33.0, 34.0, 13.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.4375, -78.71484375, -75.9921875, -73.26953125, -70.546875, -67.82421875, -65.1015625, -62.37890625, -59.65625, -56.93359375, -54.2109375, -51.48828125, -48.765625, -46.04296875, -43.3203125, -40.59765625, -37.875, -35.15234375, -32.4296875, -29.70703125, -26.984375, -24.26171875, -21.5390625, -18.81640625, -16.09375, -13.37109375, -10.6484375, -7.92578125, -5.203125, -2.48046875, 0.2421875, 2.96484375, 5.6875, 8.41015625, 11.1328125, 13.85546875, 16.578125, 19.30078125, 22.0234375, 24.74609375, 27.46875, 30.19140625, 32.9140625, 35.63671875, 38.359375, 41.08203125, 43.8046875, 46.52734375, 49.25, 51.97265625, 54.6953125, 57.41796875, 60.140625, 62.86328125, 65.5859375, 68.30859375, 71.03125, 73.75390625, 76.4765625, 79.19921875, 81.921875, 84.64453125, 87.3671875, 90.08984375, 92.8125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 18.0, 74.0, 299.0, 391.0, 176.0, 42.0, 8.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.13645553588867, -28.68865203857422, -25.240848541259766, -21.793045043945312, -18.34524154663086, -14.897438049316406, -11.449634552001953, -8.0018310546875, -4.554027557373047, -1.1062240600585938, 2.3415794372558594, 5.7893829345703125, 9.237186431884766, 12.684989929199219, 16.132793426513672, 19.580596923828125, 23.028400421142578, 26.47620391845703, 29.924007415771484, 33.37181091308594, 36.81961441040039, 40.267417907714844, 43.7152214050293, 47.16302490234375, 50.6108283996582, 54.058631896972656, 57.50643539428711, 60.95423889160156, 64.40203857421875, 67.84984588623047, 71.29765319824219, 74.74545288085938, 78.19325256347656, 81.64105224609375, 85.08885955810547, 88.53666687011719, 91.98446655273438, 95.43226623535156, 98.88007354736328, 102.327880859375, 105.77568054199219, 109.22348022460938, 112.6712875366211, 116.11909484863281, 119.56689453125, 123.01469421386719, 126.4625015258789, 129.91030883789062, 133.3581085205078, 136.805908203125, 140.25372314453125, 143.70152282714844, 147.14932250976562, 150.5971221923828, 154.044921875, 157.49273681640625, 160.94053649902344, 164.38833618164062, 167.83615112304688, 171.28395080566406, 174.73175048828125, 178.17955017089844, 181.62734985351562, 185.07516479492188, 188.52296447753906]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 11.0, 10.0, 13.0, 17.0, 15.0, 22.0, 38.0, 32.0, 40.0, 48.0, 52.0, 58.0, 50.0, 61.0, 57.0, 54.0, 68.0, 48.0, 61.0, 39.0, 43.0, 29.0, 28.0, 23.0, 23.0, 15.0, 10.0, 12.0, 8.0, 4.0, 4.0, 7.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.120880126953125, -53.443641662597656, -51.76640319824219, -50.08916473388672, -48.41192626953125, -46.73468780517578, -45.05744552612305, -43.38020706176758, -41.70296859741211, -40.02573013305664, -38.34849166870117, -36.6712532043457, -34.99401092529297, -33.3167724609375, -31.63953399658203, -29.962295532226562, -28.285057067871094, -26.607818603515625, -24.930580139160156, -23.253339767456055, -21.576101303100586, -19.898862838745117, -18.221622467041016, -16.544384002685547, -14.867145538330078, -13.18990707397461, -11.512667655944824, -9.835428237915039, -8.15818977355957, -6.480951309204102, -4.803711891174316, -3.1264724731445312, -1.4492340087890625, 0.22800493240356445, 1.9052438735961914, 3.5824828147888184, 5.259721755981445, 6.936960220336914, 8.6141996383667, 10.291439056396484, 11.968677520751953, 13.645915985107422, 15.323155403137207, 17.000394821166992, 18.67763328552246, 20.35487174987793, 22.03211212158203, 23.7093505859375, 25.38658905029297, 27.063827514648438, 28.741065979003906, 30.418306350708008, 32.095542907714844, 33.77278137207031, 35.45002365112305, 37.127262115478516, 38.804500579833984, 40.48173904418945, 42.15897750854492, 43.83621597290039, 45.513458251953125, 47.190696716308594, 48.86793518066406, 50.54517364501953, 52.222412109375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 3.0, 13.0, 15.0, 12.0, 16.0, 17.0, 25.0, 26.0, 26.0, 26.0, 43.0, 40.0, 40.0, 49.0, 63.0, 64.0, 65.0, 65.0, 60.0, 67.0, 38.0, 34.0, 34.0, 28.0, 26.0, 19.0, 19.0, 15.0, 17.0, 9.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.9921875, -4.8699951171875, -4.747802734375, -4.6256103515625, -4.50341796875, -4.3812255859375, -4.259033203125, -4.1368408203125, -4.0146484375, -3.8924560546875, -3.770263671875, -3.6480712890625, -3.52587890625, -3.4036865234375, -3.281494140625, -3.1593017578125, -3.037109375, -2.9149169921875, -2.792724609375, -2.6705322265625, -2.54833984375, -2.4261474609375, -2.303955078125, -2.1817626953125, -2.0595703125, -1.9373779296875, -1.815185546875, -1.6929931640625, -1.57080078125, -1.4486083984375, -1.326416015625, -1.2042236328125, -1.08203125, -0.9598388671875, -0.837646484375, -0.7154541015625, -0.59326171875, -0.4710693359375, -0.348876953125, -0.2266845703125, -0.1044921875, 0.0177001953125, 0.139892578125, 0.2620849609375, 0.38427734375, 0.5064697265625, 0.628662109375, 0.7508544921875, 0.873046875, 0.9952392578125, 1.117431640625, 1.2396240234375, 1.36181640625, 1.4840087890625, 1.606201171875, 1.7283935546875, 1.8505859375, 1.9727783203125, 2.094970703125, 2.2171630859375, 2.33935546875, 2.4615478515625, 2.583740234375, 2.7059326171875, 2.828125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 8.0, 19.0, 22.0, 29.0, 48.0, 63.0, 113.0, 149.0, 236.0, 394.0, 601.0, 959.0, 1544.0, 2700.0, 4523.0, 7869.0, 14193.0, 26898.0, 51923.0, 105188.0, 234836.0, 304580.0, 145208.0, 68993.0, 34600.0, 18535.0, 10306.0, 5606.0, 3285.0, 1886.0, 1227.0, 704.0, 442.0, 263.0, 201.0, 138.0, 85.0, 40.0, 33.0, 31.0, 16.0, 16.0, 8.0, 10.0, 7.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56298828125, -0.5443496704101562, -0.5257110595703125, -0.5070724487304688, -0.488433837890625, -0.46979522705078125, -0.4511566162109375, -0.43251800537109375, -0.41387939453125, -0.39524078369140625, -0.3766021728515625, -0.35796356201171875, -0.339324951171875, -0.32068634033203125, -0.3020477294921875, -0.28340911865234375, -0.2647705078125, -0.24613189697265625, -0.2274932861328125, -0.20885467529296875, -0.190216064453125, -0.17157745361328125, -0.1529388427734375, -0.13430023193359375, -0.11566162109375, -0.09702301025390625, -0.0783843994140625, -0.05974578857421875, -0.041107177734375, -0.02246856689453125, -0.0038299560546875, 0.01480865478515625, 0.033447265625, 0.05208587646484375, 0.0707244873046875, 0.08936309814453125, 0.108001708984375, 0.12664031982421875, 0.1452789306640625, 0.16391754150390625, 0.18255615234375, 0.20119476318359375, 0.2198333740234375, 0.23847198486328125, 0.257110595703125, 0.27574920654296875, 0.2943878173828125, 0.31302642822265625, 0.3316650390625, 0.35030364990234375, 0.3689422607421875, 0.38758087158203125, 0.406219482421875, 0.42485809326171875, 0.4434967041015625, 0.46213531494140625, 0.48077392578125, 0.49941253662109375, 0.5180511474609375, 0.5366897583007812, 0.555328369140625, 0.5739669799804688, 0.5926055908203125, 0.6112442016601562, 0.6298828125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 10.0, 9.0, 10.0, 9.0, 9.0, 7.0, 10.0, 19.0, 19.0, 20.0, 21.0, 23.0, 34.0, 25.0, 37.0, 31.0, 39.0, 38.0, 45.0, 36.0, 37.0, 1069.0, 44.0, 24.0, 42.0, 32.0, 37.0, 37.0, 31.0, 25.0, 21.0, 29.0, 24.0, 19.0, 17.0, 19.0, 16.0, 10.0, 10.0, 7.0, 5.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7822265625, -1.7237091064453125, -1.665191650390625, -1.6066741943359375, -1.54815673828125, -1.4896392822265625, -1.431121826171875, -1.3726043701171875, -1.3140869140625, -1.2555694580078125, -1.197052001953125, -1.1385345458984375, -1.08001708984375, -1.0214996337890625, -0.962982177734375, -0.9044647216796875, -0.845947265625, -0.7874298095703125, -0.728912353515625, -0.6703948974609375, -0.61187744140625, -0.5533599853515625, -0.494842529296875, -0.4363250732421875, -0.3778076171875, -0.3192901611328125, -0.260772705078125, -0.2022552490234375, -0.14373779296875, -0.0852203369140625, -0.026702880859375, 0.0318145751953125, 0.09033203125, 0.1488494873046875, 0.207366943359375, 0.2658843994140625, 0.32440185546875, 0.3829193115234375, 0.441436767578125, 0.4999542236328125, 0.5584716796875, 0.6169891357421875, 0.675506591796875, 0.7340240478515625, 0.79254150390625, 0.8510589599609375, 0.909576416015625, 0.9680938720703125, 1.026611328125, 1.0851287841796875, 1.143646240234375, 1.2021636962890625, 1.26068115234375, 1.3191986083984375, 1.377716064453125, 1.4362335205078125, 1.4947509765625, 1.5532684326171875, 1.611785888671875, 1.6703033447265625, 1.72882080078125, 1.7873382568359375, 1.845855712890625, 1.9043731689453125, 1.962890625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 0.0, 6.0, 6.0, 9.0, 21.0, 36.0, 37.0, 60.0, 110.0, 160.0, 235.0, 356.0, 604.0, 885.0, 1563.0, 2494.0, 3972.0, 6892.0, 11570.0, 20294.0, 36413.0, 68491.0, 131573.0, 265142.0, 1237728.0, 142367.0, 74084.0, 39603.0, 21445.0, 12427.0, 7248.0, 4395.0, 2585.0, 1608.0, 1009.0, 607.0, 377.0, 249.0, 179.0, 103.0, 66.0, 36.0, 28.0, 22.0, 18.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.361328125, -0.3503990173339844, -0.33946990966796875, -0.3285408020019531, -0.3176116943359375, -0.3066825866699219, -0.29575347900390625, -0.2848243713378906, -0.273895263671875, -0.2629661560058594, -0.25203704833984375, -0.24110794067382812, -0.2301788330078125, -0.21924972534179688, -0.20832061767578125, -0.19739151000976562, -0.18646240234375, -0.17553329467773438, -0.16460418701171875, -0.15367507934570312, -0.1427459716796875, -0.13181686401367188, -0.12088775634765625, -0.10995864868164062, -0.099029541015625, -0.08810043334960938, -0.07717132568359375, -0.06624221801757812, -0.0553131103515625, -0.044384002685546875, -0.03345489501953125, -0.022525787353515625, -0.0115966796875, -0.000667572021484375, 0.01026153564453125, 0.021190643310546875, 0.0321197509765625, 0.043048858642578125, 0.05397796630859375, 0.06490707397460938, 0.075836181640625, 0.08676528930664062, 0.09769439697265625, 0.10862350463867188, 0.1195526123046875, 0.13048171997070312, 0.14141082763671875, 0.15233993530273438, 0.16326904296875, 0.17419815063476562, 0.18512725830078125, 0.19605636596679688, 0.2069854736328125, 0.21791458129882812, 0.22884368896484375, 0.23977279663085938, 0.250701904296875, 0.2616310119628906, 0.27256011962890625, 0.2834892272949219, 0.2944183349609375, 0.3053474426269531, 0.31627655029296875, 0.3272056579589844, 0.338134765625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 5.0, 16.0, 11.0, 14.0, 10.0, 10.0, 24.0, 24.0, 29.0, 36.0, 39.0, 47.0, 55.0, 75.0, 72.0, 76.0, 80.0, 64.0, 59.0, 44.0, 42.0, 26.0, 27.0, 27.0, 11.0, 23.0, 10.0, 5.0, 7.0, 7.0, 1.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018644332885742188, -0.0018067359924316406, -0.0017490386962890625, -0.0016913414001464844, -0.0016336441040039062, -0.0015759468078613281, -0.00151824951171875, -0.0014605522155761719, -0.0014028549194335938, -0.0013451576232910156, -0.0012874603271484375, -0.0012297630310058594, -0.0011720657348632812, -0.0011143684387207031, -0.001056671142578125, -0.0009989738464355469, -0.0009412765502929688, -0.0008835792541503906, -0.0008258819580078125, -0.0007681846618652344, -0.0007104873657226562, -0.0006527900695800781, -0.0005950927734375, -0.0005373954772949219, -0.00047969818115234375, -0.0004220008850097656, -0.0003643035888671875, -0.0003066062927246094, -0.00024890899658203125, -0.00019121170043945312, -0.000133514404296875, -7.581710815429688e-05, -1.811981201171875e-05, 3.9577484130859375e-05, 9.72747802734375e-05, 0.00015497207641601562, 0.00021266937255859375, 0.0002703666687011719, 0.00032806396484375, 0.0003857612609863281, 0.00044345855712890625, 0.0005011558532714844, 0.0005588531494140625, 0.0006165504455566406, 0.0006742477416992188, 0.0007319450378417969, 0.000789642333984375, 0.0008473396301269531, 0.0009050369262695312, 0.0009627342224121094, 0.0010204315185546875, 0.0010781288146972656, 0.0011358261108398438, 0.0011935234069824219, 0.001251220703125, 0.0013089179992675781, 0.0013666152954101562, 0.0014243125915527344, 0.0014820098876953125, 0.0015397071838378906, 0.0015974044799804688, 0.0016551017761230469, 0.001712799072265625, 0.0017704963684082031, 0.0018281936645507812]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 5.0, 8.0, 6.0, 19.0, 23.0, 31.0, 34.0, 69.0, 99.0, 112.0, 163.0, 222.0, 325.0, 474.0, 1284.0, 1038664.0, 5160.0, 609.0, 354.0, 232.0, 151.0, 133.0, 103.0, 65.0, 69.0, 24.0, 26.0, 18.0, 28.0, 5.0, 8.0, 9.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.044189453125, -0.04287576675415039, -0.04156208038330078, -0.04024839401245117, -0.03893470764160156, -0.03762102127075195, -0.036307334899902344, -0.034993648529052734, -0.033679962158203125, -0.032366275787353516, -0.031052589416503906, -0.029738903045654297, -0.028425216674804688, -0.027111530303955078, -0.02579784393310547, -0.02448415756225586, -0.02317047119140625, -0.02185678482055664, -0.02054309844970703, -0.019229412078857422, -0.017915725708007812, -0.016602039337158203, -0.015288352966308594, -0.013974666595458984, -0.012660980224609375, -0.011347293853759766, -0.010033607482910156, -0.008719921112060547, -0.0074062347412109375, -0.006092548370361328, -0.004778861999511719, -0.0034651756286621094, -0.0021514892578125, -0.0008378028869628906, 0.00047588348388671875, 0.0017895698547363281, 0.0031032562255859375, 0.004416942596435547, 0.005730628967285156, 0.007044315338134766, 0.008358001708984375, 0.009671688079833984, 0.010985374450683594, 0.012299060821533203, 0.013612747192382812, 0.014926433563232422, 0.01624011993408203, 0.01755380630493164, 0.01886749267578125, 0.02018117904663086, 0.02149486541748047, 0.022808551788330078, 0.024122238159179688, 0.025435924530029297, 0.026749610900878906, 0.028063297271728516, 0.029376983642578125, 0.030690670013427734, 0.032004356384277344, 0.03331804275512695, 0.03463172912597656, 0.03594541549682617, 0.03725910186767578, 0.03857278823852539, 0.039886474609375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1008.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006473960820585489, 0.00025259109679609537, 0.0011525782756507397, 0.002052565338090062, 0.0029525526333600283, 0.0038525399286299944, 0.004752526991069317, 0.005652514286339283, 0.006552501581609249, 0.007452488876879215, 0.008352476172149181, 0.009252462536096573, 0.010152449831366539, 0.011052437126636505, 0.011952424421906471, 0.012852411717176437, 0.013752399012446404, 0.01465238630771637, 0.015552373602986336, 0.016452360898256302, 0.017352348193526268, 0.018252335488796234, 0.01915232092142105, 0.020052310079336166, 0.020952295511960983, 0.02185228280723095, 0.022752270102500916, 0.02365225739777088, 0.024552244693040848, 0.025452231988310814, 0.02635221928358078, 0.027252204716205597, 0.028152193874120712, 0.02905218116939068, 0.029952168464660645, 0.03085215575993061, 0.03175214305520058, 0.032652128487825394, 0.03355211764574051, 0.034452103078365326, 0.03535209223628044, 0.03625207766890526, 0.037152066826820374, 0.03805205225944519, 0.038952041417360306, 0.03985202684998512, 0.04075201600790024, 0.041652001440525055, 0.04255198687314987, 0.04345197230577469, 0.044351961463689804, 0.04525194689631462, 0.046151936054229736, 0.04705192148685455, 0.04795191064476967, 0.048851896077394485, 0.0497518852353096, 0.05065187066793442, 0.05155185982584953, 0.05245184525847435, 0.053351834416389465, 0.05425181984901428, 0.0551518090069294, 0.056051794439554214, 0.05695178359746933]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 22.0, 11.0, 31.0, 39.0, 40.0, 62.0, 70.0, 77.0, 54.0, 83.0, 75.0, 79.0, 50.0, 72.0, 75.0, 43.0, 39.0, 24.0, 24.0, 18.0, 10.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020893216133117676, -0.0020346548408269882, -0.001979988068342209, -0.0019253212958574295, -0.0018706545233726501, -0.0018159877508878708, -0.0017613209784030914, -0.001706654205918312, -0.0016519874334335327, -0.0015973206609487534, -0.001542653888463974, -0.0014879871159791946, -0.0014333203434944153, -0.001378653571009636, -0.0013239867985248566, -0.0012693200260400772, -0.0012146532535552979, -0.0011599864810705185, -0.0011053197085857391, -0.0010506529361009598, -0.0009959861636161804, -0.0009413193911314011, -0.0008866526186466217, -0.0008319858461618423, -0.000777319073677063, -0.0007226523011922836, -0.0006679855287075043, -0.0006133187562227249, -0.0005586519837379456, -0.0005039852112531662, -0.00044931843876838684, -0.0003946516662836075, -0.0003399848937988281, -0.00028531812131404877, -0.0002306513488292694, -0.00017598457634449005, -0.0001213178038597107, -6.665103137493134e-05, -1.1984258890151978e-05, 4.268251359462738e-05, 9.734928607940674e-05, 0.0001520160585641861, 0.00020668283104896545, 0.0002613496035337448, 0.00031601637601852417, 0.00037068314850330353, 0.0004253499209880829, 0.00048001669347286224, 0.0005346834659576416, 0.000589350238442421, 0.0006440170109272003, 0.0006986837834119797, 0.000753350555896759, 0.0008080173283815384, 0.0008626841008663177, 0.0009173508733510971, 0.0009720176458358765, 0.0010266844183206558, 0.0010813511908054352, 0.0011360179632902145, 0.001190684735774994, 0.0012453515082597733, 0.0013000182807445526, 0.001354685053229332, 0.0014093518257141113]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 3.0, 14.0, 14.0, 12.0, 16.0, 17.0, 25.0, 26.0, 26.0, 26.0, 43.0, 40.0, 40.0, 49.0, 63.0, 64.0, 65.0, 65.0, 60.0, 67.0, 38.0, 34.0, 34.0, 28.0, 26.0, 19.0, 19.0, 15.0, 17.0, 9.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.9921875, -4.8699951171875, -4.747802734375, -4.6256103515625, -4.50341796875, -4.3812255859375, -4.259033203125, -4.1368408203125, -4.0146484375, -3.8924560546875, -3.770263671875, -3.6480712890625, -3.52587890625, -3.4036865234375, -3.281494140625, -3.1593017578125, -3.037109375, -2.9149169921875, -2.792724609375, -2.6705322265625, -2.54833984375, -2.4261474609375, -2.303955078125, -2.1817626953125, -2.0595703125, -1.9373779296875, -1.815185546875, -1.6929931640625, -1.57080078125, -1.4486083984375, -1.326416015625, -1.2042236328125, -1.08203125, -0.9598388671875, -0.837646484375, -0.7154541015625, -0.59326171875, -0.4710693359375, -0.348876953125, -0.2266845703125, -0.1044921875, 0.0177001953125, 0.139892578125, 0.2620849609375, 0.38427734375, 0.5064697265625, 0.628662109375, 0.7508544921875, 0.873046875, 0.9952392578125, 1.117431640625, 1.2396240234375, 1.36181640625, 1.4840087890625, 1.606201171875, 1.7283935546875, 1.8505859375, 1.9727783203125, 2.094970703125, 2.2171630859375, 2.33935546875, 2.4615478515625, 2.583740234375, 2.7059326171875, 2.828125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 10.0, 6.0, 22.0, 20.0, 26.0, 41.0, 70.0, 77.0, 91.0, 142.0, 198.0, 248.0, 374.0, 517.0, 776.0, 1126.0, 1690.0, 2672.0, 4374.0, 7768.0, 14682.0, 44616.0, 646530.0, 264752.0, 28594.0, 11713.0, 6518.0, 3687.0, 2340.0, 1446.0, 1032.0, 686.0, 487.0, 334.0, 239.0, 177.0, 138.0, 81.0, 77.0, 41.0, 39.0, 24.0, 28.0, 10.0, 7.0, 7.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-16.65625, -16.149169921875, -15.64208984375, -15.135009765625, -14.6279296875, -14.120849609375, -13.61376953125, -13.106689453125, -12.599609375, -12.092529296875, -11.58544921875, -11.078369140625, -10.5712890625, -10.064208984375, -9.55712890625, -9.050048828125, -8.54296875, -8.035888671875, -7.52880859375, -7.021728515625, -6.5146484375, -6.007568359375, -5.50048828125, -4.993408203125, -4.486328125, -3.979248046875, -3.47216796875, -2.965087890625, -2.4580078125, -1.950927734375, -1.44384765625, -0.936767578125, -0.4296875, 0.077392578125, 0.58447265625, 1.091552734375, 1.5986328125, 2.105712890625, 2.61279296875, 3.119873046875, 3.626953125, 4.134033203125, 4.64111328125, 5.148193359375, 5.6552734375, 6.162353515625, 6.66943359375, 7.176513671875, 7.68359375, 8.190673828125, 8.69775390625, 9.204833984375, 9.7119140625, 10.218994140625, 10.72607421875, 11.233154296875, 11.740234375, 12.247314453125, 12.75439453125, 13.261474609375, 13.7685546875, 14.275634765625, 14.78271484375, 15.289794921875, 15.796875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 6.0, 5.0, 4.0, 10.0, 8.0, 7.0, 19.0, 17.0, 19.0, 15.0, 29.0, 27.0, 26.0, 24.0, 31.0, 43.0, 46.0, 45.0, 67.0, 139.0, 304.0, 1485.0, 185.0, 72.0, 64.0, 45.0, 43.0, 40.0, 29.0, 31.0, 30.0, 24.0, 18.0, 19.0, 21.0, 15.0, 11.0, 9.0, 5.0, 6.0, 4.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.421875, -9.138916015625, -8.85595703125, -8.572998046875, -8.2900390625, -8.007080078125, -7.72412109375, -7.441162109375, -7.158203125, -6.875244140625, -6.59228515625, -6.309326171875, -6.0263671875, -5.743408203125, -5.46044921875, -5.177490234375, -4.89453125, -4.611572265625, -4.32861328125, -4.045654296875, -3.7626953125, -3.479736328125, -3.19677734375, -2.913818359375, -2.630859375, -2.347900390625, -2.06494140625, -1.781982421875, -1.4990234375, -1.216064453125, -0.93310546875, -0.650146484375, -0.3671875, -0.084228515625, 0.19873046875, 0.481689453125, 0.7646484375, 1.047607421875, 1.33056640625, 1.613525390625, 1.896484375, 2.179443359375, 2.46240234375, 2.745361328125, 3.0283203125, 3.311279296875, 3.59423828125, 3.877197265625, 4.16015625, 4.443115234375, 4.72607421875, 5.009033203125, 5.2919921875, 5.574951171875, 5.85791015625, 6.140869140625, 6.423828125, 6.706787109375, 6.98974609375, 7.272705078125, 7.5556640625, 7.838623046875, 8.12158203125, 8.404541015625, 8.6875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 3.0, 9.0, 5.0, 15.0, 16.0, 15.0, 16.0, 28.0, 26.0, 31.0, 32.0, 37.0, 49.0, 70.0, 126.0, 359.0, 1690.0, 609565.0, 2530616.0, 1980.0, 440.0, 171.0, 77.0, 63.0, 40.0, 25.0, 27.0, 27.0, 17.0, 20.0, 23.0, 16.0, 15.0, 9.0, 13.0, 7.0, 3.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.0625, -36.7958984375, -35.529296875, -34.2626953125, -32.99609375, -31.7294921875, -30.462890625, -29.1962890625, -27.9296875, -26.6630859375, -25.396484375, -24.1298828125, -22.86328125, -21.5966796875, -20.330078125, -19.0634765625, -17.796875, -16.5302734375, -15.263671875, -13.9970703125, -12.73046875, -11.4638671875, -10.197265625, -8.9306640625, -7.6640625, -6.3974609375, -5.130859375, -3.8642578125, -2.59765625, -1.3310546875, -0.064453125, 1.2021484375, 2.46875, 3.7353515625, 5.001953125, 6.2685546875, 7.53515625, 8.8017578125, 10.068359375, 11.3349609375, 12.6015625, 13.8681640625, 15.134765625, 16.4013671875, 17.66796875, 18.9345703125, 20.201171875, 21.4677734375, 22.734375, 24.0009765625, 25.267578125, 26.5341796875, 27.80078125, 29.0673828125, 30.333984375, 31.6005859375, 32.8671875, 34.1337890625, 35.400390625, 36.6669921875, 37.93359375, 39.2001953125, 40.466796875, 41.7333984375, 43.0]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 530.0, 481.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.5656433105469, -267.69378662109375, -262.8218994140625, -257.9500427246094, -253.0781707763672, -248.206298828125, -243.3344268798828, -238.46255493164062, -233.59068298339844, -228.71881103515625, -223.84693908691406, -218.97506713867188, -214.10321044921875, -209.23133850097656, -204.35946655273438, -199.4875946044922, -194.61572265625, -189.7438507080078, -184.87197875976562, -180.0001220703125, -175.1282501220703, -170.25637817382812, -165.38450622558594, -160.51263427734375, -155.64077758789062, -150.76890563964844, -145.89703369140625, -141.02517700195312, -136.15330505371094, -131.28143310546875, -126.40956115722656, -121.53768920898438, -116.66583251953125, -111.79396057128906, -106.9220962524414, -102.05022430419922, -97.17835235595703, -92.30648803710938, -87.43461608886719, -82.562744140625, -77.69087219238281, -72.81900024414062, -67.94713592529297, -63.07526397705078, -58.203392028808594, -53.33152389526367, -48.45965576171875, -43.58778381347656, -38.71591567993164, -33.84404754638672, -28.97217559814453, -24.10030746459961, -19.228437423706055, -14.3565673828125, -9.484699249267578, -4.612827301025391, 0.25904083251953125, 5.130910396575928, 10.002779960632324, 14.874649047851562, 19.746519088745117, 24.618389129638672, 29.490257263183594, 34.36212921142578, 39.2339973449707]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 4.0, 4.0, 9.0, 11.0, 11.0, 8.0, 11.0, 14.0, 11.0, 24.0, 26.0, 32.0, 17.0, 33.0, 27.0, 24.0, 43.0, 32.0, 34.0, 43.0, 37.0, 39.0, 35.0, 32.0, 48.0, 43.0, 38.0, 31.0, 23.0, 32.0, 23.0, 32.0, 22.0, 16.0, 30.0, 15.0, 6.0, 14.0, 15.0, 11.0, 5.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.228797912597656, -27.306621551513672, -26.384445190429688, -25.462268829345703, -24.540090560913086, -23.6179141998291, -22.695737838745117, -21.773561477661133, -20.851383209228516, -19.92920684814453, -19.007030487060547, -18.084854125976562, -17.162675857543945, -16.24049949645996, -15.318323135375977, -14.396146774291992, -13.473970413208008, -12.551794052124023, -11.629616737365723, -10.707440376281738, -9.785263061523438, -8.863086700439453, -7.940910339355469, -7.018733501434326, -6.096556663513184, -5.174379825592041, -4.252202987670898, -3.330026626586914, -2.4078497886657715, -1.485672950744629, -0.5634965896606445, 0.35868024826049805, 1.2808570861816406, 2.203033924102783, 3.1252105236053467, 4.04738712310791, 4.969563961029053, 5.891740798950195, 6.81391716003418, 7.736093997955322, 8.658270835876465, 9.58044719696045, 10.50262451171875, 11.424800872802734, 12.346977233886719, 13.26915454864502, 14.191330909729004, 15.113508224487305, 16.03568458557129, 16.957860946655273, 17.880037307739258, 18.802215576171875, 19.72439193725586, 20.646568298339844, 21.568744659423828, 22.490921020507812, 23.413097381591797, 24.33527374267578, 25.257450103759766, 26.17962646484375, 27.101804733276367, 28.02398109436035, 28.946157455444336, 29.86833381652832, 30.790512084960938]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 6.0, 5.0, 4.0, 10.0, 13.0, 9.0, 12.0, 14.0, 26.0, 24.0, 26.0, 34.0, 34.0, 31.0, 29.0, 49.0, 47.0, 61.0, 67.0, 57.0, 71.0, 54.0, 61.0, 48.0, 34.0, 25.0, 33.0, 18.0, 23.0, 22.0, 12.0, 15.0, 12.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.90625, -4.779541015625, -4.65283203125, -4.526123046875, -4.3994140625, -4.272705078125, -4.14599609375, -4.019287109375, -3.892578125, -3.765869140625, -3.63916015625, -3.512451171875, -3.3857421875, -3.259033203125, -3.13232421875, -3.005615234375, -2.87890625, -2.752197265625, -2.62548828125, -2.498779296875, -2.3720703125, -2.245361328125, -2.11865234375, -1.991943359375, -1.865234375, -1.738525390625, -1.61181640625, -1.485107421875, -1.3583984375, -1.231689453125, -1.10498046875, -0.978271484375, -0.8515625, -0.724853515625, -0.59814453125, -0.471435546875, -0.3447265625, -0.218017578125, -0.09130859375, 0.035400390625, 0.162109375, 0.288818359375, 0.41552734375, 0.542236328125, 0.6689453125, 0.795654296875, 0.92236328125, 1.049072265625, 1.17578125, 1.302490234375, 1.42919921875, 1.555908203125, 1.6826171875, 1.809326171875, 1.93603515625, 2.062744140625, 2.189453125, 2.316162109375, 2.44287109375, 2.569580078125, 2.6962890625, 2.822998046875, 2.94970703125, 3.076416015625, 3.203125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 6.0, 6.0, 14.0, 24.0, 24.0, 30.0, 58.0, 77.0, 102.0, 154.0, 281.0, 514.0, 930.0, 1923.0, 4757.0, 13803.0, 60827.0, 1049947.0, 2901525.0, 125747.0, 21171.0, 6680.0, 2701.0, 1324.0, 650.0, 363.0, 218.0, 133.0, 88.0, 60.0, 38.0, 31.0, 20.0, 21.0, 11.0, 9.0, 3.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.25, -20.66259765625, -20.0751953125, -19.48779296875, -18.900390625, -18.31298828125, -17.7255859375, -17.13818359375, -16.55078125, -15.96337890625, -15.3759765625, -14.78857421875, -14.201171875, -13.61376953125, -13.0263671875, -12.43896484375, -11.8515625, -11.26416015625, -10.6767578125, -10.08935546875, -9.501953125, -8.91455078125, -8.3271484375, -7.73974609375, -7.15234375, -6.56494140625, -5.9775390625, -5.39013671875, -4.802734375, -4.21533203125, -3.6279296875, -3.04052734375, -2.453125, -1.86572265625, -1.2783203125, -0.69091796875, -0.103515625, 0.48388671875, 1.0712890625, 1.65869140625, 2.24609375, 2.83349609375, 3.4208984375, 4.00830078125, 4.595703125, 5.18310546875, 5.7705078125, 6.35791015625, 6.9453125, 7.53271484375, 8.1201171875, 8.70751953125, 9.294921875, 9.88232421875, 10.4697265625, 11.05712890625, 11.64453125, 12.23193359375, 12.8193359375, 13.40673828125, 13.994140625, 14.58154296875, 15.1689453125, 15.75634765625, 16.34375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 8.0, 16.0, 29.0, 31.0, 65.0, 61.0, 94.0, 152.0, 259.0, 369.0, 574.0, 680.0, 592.0, 363.0, 236.0, 161.0, 130.0, 77.0, 46.0, 35.0, 30.0, 20.0, 11.0, 10.0, 5.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.015625, -15.474853515625, -14.93408203125, -14.393310546875, -13.8525390625, -13.311767578125, -12.77099609375, -12.230224609375, -11.689453125, -11.148681640625, -10.60791015625, -10.067138671875, -9.5263671875, -8.985595703125, -8.44482421875, -7.904052734375, -7.36328125, -6.822509765625, -6.28173828125, -5.740966796875, -5.2001953125, -4.659423828125, -4.11865234375, -3.577880859375, -3.037109375, -2.496337890625, -1.95556640625, -1.414794921875, -0.8740234375, -0.333251953125, 0.20751953125, 0.748291015625, 1.2890625, 1.829833984375, 2.37060546875, 2.911376953125, 3.4521484375, 3.992919921875, 4.53369140625, 5.074462890625, 5.615234375, 6.156005859375, 6.69677734375, 7.237548828125, 7.7783203125, 8.319091796875, 8.85986328125, 9.400634765625, 9.94140625, 10.482177734375, 11.02294921875, 11.563720703125, 12.1044921875, 12.645263671875, 13.18603515625, 13.726806640625, 14.267578125, 14.808349609375, 15.34912109375, 15.889892578125, 16.4306640625, 16.971435546875, 17.51220703125, 18.052978515625, 18.59375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 6.0, 3.0, 8.0, 8.0, 16.0, 17.0, 16.0, 27.0, 43.0, 57.0, 75.0, 125.0, 230.0, 468.0, 1557.0, 26131.0, 4121096.0, 41456.0, 1770.0, 517.0, 242.0, 149.0, 88.0, 51.0, 43.0, 26.0, 16.0, 15.0, 13.0, 7.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.78125, -43.65576171875, -41.5302734375, -39.40478515625, -37.279296875, -35.15380859375, -33.0283203125, -30.90283203125, -28.77734375, -26.65185546875, -24.5263671875, -22.40087890625, -20.275390625, -18.14990234375, -16.0244140625, -13.89892578125, -11.7734375, -9.64794921875, -7.5224609375, -5.39697265625, -3.271484375, -1.14599609375, 0.9794921875, 3.10498046875, 5.23046875, 7.35595703125, 9.4814453125, 11.60693359375, 13.732421875, 15.85791015625, 17.9833984375, 20.10888671875, 22.234375, 24.35986328125, 26.4853515625, 28.61083984375, 30.736328125, 32.86181640625, 34.9873046875, 37.11279296875, 39.23828125, 41.36376953125, 43.4892578125, 45.61474609375, 47.740234375, 49.86572265625, 51.9912109375, 54.11669921875, 56.2421875, 58.36767578125, 60.4931640625, 62.61865234375, 64.744140625, 66.86962890625, 68.9951171875, 71.12060546875, 73.24609375, 75.37158203125, 77.4970703125, 79.62255859375, 81.748046875, 83.87353515625, 85.9990234375, 88.12451171875, 90.25]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [3.0, 6.0, 40.0, 255.0, 494.0, 200.0, 18.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.083255767822266, -16.30394744873047, -11.524641036987305, -6.745333671569824, -1.9660263061523438, 2.813282012939453, 7.592588424682617, 12.371894836425781, 17.151203155517578, 21.930511474609375, 26.70981788635254, 31.489124298095703, 36.2684326171875, 41.0477409362793, 45.827049255371094, 50.606353759765625, 55.38566207885742, 60.16497039794922, 64.94427490234375, 69.72358703613281, 74.50289154052734, 79.28219604492188, 84.06150817871094, 88.84081268310547, 93.6201171875, 98.39942169189453, 103.1787338256836, 107.95803833007812, 112.73735046386719, 117.51665496826172, 122.29595947265625, 127.07527160644531, 131.85458374023438, 136.63389587402344, 141.41319274902344, 146.1925048828125, 150.97181701660156, 155.75112915039062, 160.53042602539062, 165.3097381591797, 170.08905029296875, 174.8683624267578, 179.6476593017578, 184.42697143554688, 189.20628356933594, 193.985595703125, 198.764892578125, 203.54420471191406, 208.32350158691406, 213.10281372070312, 217.88211059570312, 222.6614227294922, 227.44073486328125, 232.22003173828125, 236.9993438720703, 241.77865600585938, 246.55795288085938, 251.33726501464844, 256.1165771484375, 260.8958740234375, 265.6751708984375, 270.4544982910156, 275.2337951660156, 280.0130920410156, 284.79241943359375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 9.0, 6.0, 5.0, 13.0, 8.0, 12.0, 29.0, 24.0, 19.0, 29.0, 32.0, 37.0, 27.0, 40.0, 28.0, 34.0, 42.0, 41.0, 45.0, 39.0, 49.0, 36.0, 42.0, 31.0, 31.0, 36.0, 26.0, 35.0, 29.0, 24.0, 25.0, 24.0, 21.0, 13.0, 10.0, 12.0, 8.0, 8.0, 1.0, 9.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-46.40675354003906, -45.116554260253906, -43.826358795166016, -42.53615951538086, -41.24596405029297, -39.95576477050781, -38.66556930541992, -37.375370025634766, -36.085174560546875, -34.79497528076172, -33.50477981567383, -32.21458053588867, -30.92438507080078, -29.634185791015625, -28.3439884185791, -27.053791046142578, -25.763591766357422, -24.4733943939209, -23.183197021484375, -21.89299964904785, -20.602802276611328, -19.312602996826172, -18.02240562438965, -16.732208251953125, -15.442010879516602, -14.151813507080078, -12.861616134643555, -11.571417808532715, -10.281220436096191, -8.991023063659668, -7.700825214385986, -6.410627365112305, -5.120429992675781, -3.8302323818206787, -2.540034770965576, -1.2498371601104736, 0.040360450744628906, 1.3305578231811523, 2.620755672454834, 3.9109535217285156, 5.201150894165039, 6.4913482666015625, 7.781546115875244, 9.071743965148926, 10.36194133758545, 11.652138710021973, 12.942337036132812, 14.232534408569336, 15.52273178100586, 16.812929153442383, 18.103126525878906, 19.39332389831543, 20.683521270751953, 21.97372055053711, 23.263917922973633, 24.554115295410156, 25.84431266784668, 27.134510040283203, 28.424707412719727, 29.71490478515625, 31.005104064941406, 32.2952995300293, 33.58549880981445, 34.875694274902344, 36.1658935546875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 1.0, 6.0, 3.0, 10.0, 11.0, 9.0, 14.0, 13.0, 14.0, 19.0, 28.0, 26.0, 30.0, 27.0, 32.0, 47.0, 42.0, 43.0, 51.0, 50.0, 67.0, 49.0, 50.0, 45.0, 53.0, 40.0, 35.0, 33.0, 28.0, 25.0, 22.0, 9.0, 22.0, 7.0, 6.0, 11.0, 8.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.49609375, -4.37762451171875, -4.2591552734375, -4.14068603515625, -4.022216796875, -3.90374755859375, -3.7852783203125, -3.66680908203125, -3.54833984375, -3.42987060546875, -3.3114013671875, -3.19293212890625, -3.074462890625, -2.95599365234375, -2.8375244140625, -2.71905517578125, -2.6005859375, -2.48211669921875, -2.3636474609375, -2.24517822265625, -2.126708984375, -2.00823974609375, -1.8897705078125, -1.77130126953125, -1.65283203125, -1.53436279296875, -1.4158935546875, -1.29742431640625, -1.178955078125, -1.06048583984375, -0.9420166015625, -0.82354736328125, -0.705078125, -0.58660888671875, -0.4681396484375, -0.34967041015625, -0.231201171875, -0.11273193359375, 0.0057373046875, 0.12420654296875, 0.24267578125, 0.36114501953125, 0.4796142578125, 0.59808349609375, 0.716552734375, 0.83502197265625, 0.9534912109375, 1.07196044921875, 1.1904296875, 1.30889892578125, 1.4273681640625, 1.54583740234375, 1.664306640625, 1.78277587890625, 1.9012451171875, 2.01971435546875, 2.13818359375, 2.25665283203125, 2.3751220703125, 2.49359130859375, 2.612060546875, 2.73052978515625, 2.8489990234375, 2.96746826171875, 3.0859375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 13.0, 6.0, 23.0, 19.0, 39.0, 53.0, 77.0, 116.0, 183.0, 284.0, 474.0, 747.0, 1227.0, 2047.0, 3547.0, 6184.0, 11355.0, 21021.0, 41068.0, 86923.0, 200200.0, 325293.0, 184761.0, 79960.0, 38326.0, 19745.0, 10609.0, 5810.0, 3377.0, 1961.0, 1163.0, 685.0, 451.0, 260.0, 190.0, 104.0, 77.0, 55.0, 29.0, 30.0, 15.0, 11.0, 13.0, 7.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.669921875, -0.6492767333984375, -0.628631591796875, -0.6079864501953125, -0.58734130859375, -0.5666961669921875, -0.546051025390625, -0.5254058837890625, -0.5047607421875, -0.4841156005859375, -0.463470458984375, -0.4428253173828125, -0.42218017578125, -0.4015350341796875, -0.380889892578125, -0.3602447509765625, -0.339599609375, -0.3189544677734375, -0.298309326171875, -0.2776641845703125, -0.25701904296875, -0.2363739013671875, -0.215728759765625, -0.1950836181640625, -0.1744384765625, -0.1537933349609375, -0.133148193359375, -0.1125030517578125, -0.09185791015625, -0.0712127685546875, -0.050567626953125, -0.0299224853515625, -0.00927734375, 0.0113677978515625, 0.032012939453125, 0.0526580810546875, 0.07330322265625, 0.0939483642578125, 0.114593505859375, 0.1352386474609375, 0.1558837890625, 0.1765289306640625, 0.197174072265625, 0.2178192138671875, 0.23846435546875, 0.2591094970703125, 0.279754638671875, 0.3003997802734375, 0.321044921875, 0.3416900634765625, 0.362335205078125, 0.3829803466796875, 0.40362548828125, 0.4242706298828125, 0.444915771484375, 0.4655609130859375, 0.4862060546875, 0.5068511962890625, 0.527496337890625, 0.5481414794921875, 0.56878662109375, 0.5894317626953125, 0.610076904296875, 0.6307220458984375, 0.6513671875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 7.0, 7.0, 8.0, 12.0, 8.0, 14.0, 22.0, 20.0, 25.0, 29.0, 26.0, 37.0, 41.0, 37.0, 42.0, 43.0, 32.0, 41.0, 1070.0, 48.0, 40.0, 47.0, 43.0, 51.0, 32.0, 26.0, 38.0, 34.0, 14.0, 26.0, 20.0, 12.0, 17.0, 16.0, 7.0, 10.0, 7.0, 6.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.646484375, -2.5726318359375, -2.498779296875, -2.4249267578125, -2.35107421875, -2.2772216796875, -2.203369140625, -2.1295166015625, -2.0556640625, -1.9818115234375, -1.907958984375, -1.8341064453125, -1.76025390625, -1.6864013671875, -1.612548828125, -1.5386962890625, -1.46484375, -1.3909912109375, -1.317138671875, -1.2432861328125, -1.16943359375, -1.0955810546875, -1.021728515625, -0.9478759765625, -0.8740234375, -0.8001708984375, -0.726318359375, -0.6524658203125, -0.57861328125, -0.5047607421875, -0.430908203125, -0.3570556640625, -0.283203125, -0.2093505859375, -0.135498046875, -0.0616455078125, 0.01220703125, 0.0860595703125, 0.159912109375, 0.2337646484375, 0.3076171875, 0.3814697265625, 0.455322265625, 0.5291748046875, 0.60302734375, 0.6768798828125, 0.750732421875, 0.8245849609375, 0.8984375, 0.9722900390625, 1.046142578125, 1.1199951171875, 1.19384765625, 1.2677001953125, 1.341552734375, 1.4154052734375, 1.4892578125, 1.5631103515625, 1.636962890625, 1.7108154296875, 1.78466796875, 1.8585205078125, 1.932373046875, 2.0062255859375, 2.080078125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 7.0, 11.0, 26.0, 23.0, 39.0, 70.0, 110.0, 160.0, 255.0, 354.0, 612.0, 1009.0, 1554.0, 2522.0, 4265.0, 7103.0, 11614.0, 20325.0, 36282.0, 65720.0, 121570.0, 211293.0, 1277478.0, 149742.0, 80383.0, 44400.0, 24601.0, 14130.0, 8389.0, 4950.0, 3010.0, 1829.0, 1257.0, 746.0, 461.0, 305.0, 176.0, 126.0, 77.0, 48.0, 36.0, 23.0, 12.0, 10.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.370361328125, -0.3584785461425781, -0.34659576416015625, -0.3347129821777344, -0.3228302001953125, -0.3109474182128906, -0.29906463623046875, -0.2871818542480469, -0.275299072265625, -0.2634162902832031, -0.25153350830078125, -0.23965072631835938, -0.2277679443359375, -0.21588516235351562, -0.20400238037109375, -0.19211959838867188, -0.18023681640625, -0.16835403442382812, -0.15647125244140625, -0.14458847045898438, -0.1327056884765625, -0.12082290649414062, -0.10894012451171875, -0.09705734252929688, -0.085174560546875, -0.07329177856445312, -0.06140899658203125, -0.049526214599609375, -0.0376434326171875, -0.025760650634765625, -0.01387786865234375, -0.001995086669921875, 0.0098876953125, 0.021770477294921875, 0.03365325927734375, 0.045536041259765625, 0.0574188232421875, 0.06930160522460938, 0.08118438720703125, 0.09306716918945312, 0.104949951171875, 0.11683273315429688, 0.12871551513671875, 0.14059829711914062, 0.1524810791015625, 0.16436386108398438, 0.17624664306640625, 0.18812942504882812, 0.20001220703125, 0.21189498901367188, 0.22377777099609375, 0.23566055297851562, 0.2475433349609375, 0.2594261169433594, 0.27130889892578125, 0.2831916809082031, 0.295074462890625, 0.3069572448730469, 0.31884002685546875, 0.3307228088378906, 0.3426055908203125, 0.3544883728027344, 0.36637115478515625, 0.3782539367675781, 0.39013671875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 8.0, 6.0, 8.0, 11.0, 8.0, 8.0, 14.0, 22.0, 31.0, 47.0, 64.0, 81.0, 91.0, 113.0, 88.0, 104.0, 78.0, 53.0, 48.0, 26.0, 15.0, 17.0, 13.0, 9.0, 5.0, 10.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002483367919921875, -0.0024057626724243164, -0.002328157424926758, -0.0022505521774291992, -0.0021729469299316406, -0.002095341682434082, -0.0020177364349365234, -0.0019401311874389648, -0.0018625259399414062, -0.0017849206924438477, -0.001707315444946289, -0.0016297101974487305, -0.0015521049499511719, -0.0014744997024536133, -0.0013968944549560547, -0.001319289207458496, -0.0012416839599609375, -0.001164078712463379, -0.0010864734649658203, -0.0010088682174682617, -0.0009312629699707031, -0.0008536577224731445, -0.0007760524749755859, -0.0006984472274780273, -0.0006208419799804688, -0.0005432367324829102, -0.00046563148498535156, -0.00038802623748779297, -0.0003104209899902344, -0.00023281574249267578, -0.0001552104949951172, -7.76052474975586e-05, 0.0, 7.76052474975586e-05, 0.0001552104949951172, 0.00023281574249267578, 0.0003104209899902344, 0.00038802623748779297, 0.00046563148498535156, 0.0005432367324829102, 0.0006208419799804688, 0.0006984472274780273, 0.0007760524749755859, 0.0008536577224731445, 0.0009312629699707031, 0.0010088682174682617, 0.0010864734649658203, 0.001164078712463379, 0.0012416839599609375, 0.001319289207458496, 0.0013968944549560547, 0.0014744997024536133, 0.0015521049499511719, 0.0016297101974487305, 0.001707315444946289, 0.0017849206924438477, 0.0018625259399414062, 0.0019401311874389648, 0.0020177364349365234, 0.002095341682434082, 0.0021729469299316406, 0.0022505521774291992, 0.002328157424926758, 0.0024057626724243164, 0.002483367919921875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 2.0, 2.0, 6.0, 10.0, 11.0, 18.0, 17.0, 21.0, 34.0, 25.0, 58.0, 99.0, 184.0, 357.0, 876.0, 1039773.0, 5860.0, 549.0, 222.0, 103.0, 81.0, 58.0, 40.0, 30.0, 17.0, 13.0, 22.0, 12.0, 10.0, 6.0, 5.0, 4.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.057647705078125, -0.0557103157043457, -0.053772926330566406, -0.05183553695678711, -0.04989814758300781, -0.047960758209228516, -0.04602336883544922, -0.04408597946166992, -0.042148590087890625, -0.04021120071411133, -0.03827381134033203, -0.036336421966552734, -0.03439903259277344, -0.03246164321899414, -0.030524253845214844, -0.028586864471435547, -0.02664947509765625, -0.024712085723876953, -0.022774696350097656, -0.02083730697631836, -0.018899917602539062, -0.016962528228759766, -0.015025138854980469, -0.013087749481201172, -0.011150360107421875, -0.009212970733642578, -0.007275581359863281, -0.005338191986083984, -0.0034008026123046875, -0.0014634132385253906, 0.00047397613525390625, 0.002411365509033203, 0.0043487548828125, 0.006286144256591797, 0.008223533630371094, 0.01016092300415039, 0.012098312377929688, 0.014035701751708984, 0.01597309112548828, 0.017910480499267578, 0.019847869873046875, 0.021785259246826172, 0.02372264862060547, 0.025660037994384766, 0.027597427368164062, 0.02953481674194336, 0.031472206115722656, 0.03340959548950195, 0.03534698486328125, 0.03728437423706055, 0.039221763610839844, 0.04115915298461914, 0.04309654235839844, 0.045033931732177734, 0.04697132110595703, 0.04890871047973633, 0.050846099853515625, 0.05278348922729492, 0.05472087860107422, 0.056658267974853516, 0.05859565734863281, 0.06053304672241211, 0.062470436096191406, 0.0644078254699707, 0.06634521484375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1020.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004157747142016888, -0.0025714323855936527, -0.0009851173963397741, 0.0006011975929141045, 0.0021875123493373394, 0.0037738271057605743, 0.005360142327845097, 0.006946456618607044, 0.008532771840691566, 0.010119087062776089, 0.011705401353538036, 0.013291716575622559, 0.014878030866384506, 0.016464345157146454, 0.01805066131055355, 0.0196369756013155, 0.021223291754722595, 0.022809606045484543, 0.02439592219889164, 0.025982236489653587, 0.027568550780415535, 0.029154866933822632, 0.03074118122458458, 0.03232749551534653, 0.033913809806108475, 0.03550012409687042, 0.03708643838763237, 0.03867275267839432, 0.040259070694446564, 0.04184538498520851, 0.04343169927597046, 0.04501801356673241, 0.04660433158278465, 0.0481906458735466, 0.04977696016430855, 0.051363274455070496, 0.05294959247112274, 0.05453590676188469, 0.05612222105264664, 0.057708535343408585, 0.05929484963417053, 0.06088116392493248, 0.06246747821569443, 0.06405379623174667, 0.06564010679721832, 0.06722642481327057, 0.06881274282932281, 0.07039905339479446, 0.07198537141084671, 0.07357168942689896, 0.0751579999923706, 0.07674431800842285, 0.0783306285738945, 0.07991694658994675, 0.0815032571554184, 0.08308957517147064, 0.08467588573694229, 0.08626220375299454, 0.08784851431846619, 0.08943483233451843, 0.09102114289999008, 0.09260746091604233, 0.09419377148151398, 0.09578008949756622, 0.09736640751361847]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 9.0, 13.0, 17.0, 17.0, 25.0, 32.0, 38.0, 59.0, 46.0, 69.0, 64.0, 81.0, 68.0, 65.0, 75.0, 67.0, 54.0, 42.0, 42.0, 28.0, 33.0, 18.0, 16.0, 12.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0023022890090942383, -0.0022492017596960068, -0.0021961145102977753, -0.0021430272608995438, -0.0020899400115013123, -0.0020368527621030807, -0.0019837655127048492, -0.0019306782633066177, -0.0018775910139083862, -0.0018245037645101547, -0.0017714165151119232, -0.0017183292657136917, -0.0016652420163154602, -0.0016121547669172287, -0.0015590675175189972, -0.0015059802681207657, -0.0014528930187225342, -0.0013998057693243027, -0.0013467185199260712, -0.0012936312705278397, -0.0012405440211296082, -0.0011874567717313766, -0.0011343695223331451, -0.0010812822729349136, -0.0010281950235366821, -0.0009751077741384506, -0.0009220205247402191, -0.0008689332753419876, -0.0008158460259437561, -0.0007627587765455246, -0.0007096715271472931, -0.0006565842777490616, -0.0006034970283508301, -0.0005504097789525986, -0.0004973225295543671, -0.00044423528015613556, -0.00039114803075790405, -0.00033806078135967255, -0.00028497353196144104, -0.00023188628256320953, -0.00017879903316497803, -0.00012571178376674652, -7.262453436851501e-05, -1.9537284970283508e-05, 3.3549964427948e-05, 8.66372138261795e-05, 0.000139724463224411, 0.00019281171262264252, 0.000245898962020874, 0.00029898621141910553, 0.00035207346081733704, 0.00040516071021556854, 0.00045824795961380005, 0.0005113352090120316, 0.0005644224584102631, 0.0006175097078084946, 0.0006705969572067261, 0.0007236842066049576, 0.0007767714560031891, 0.0008298587054014206, 0.0008829459547996521, 0.0009360332041978836, 0.0009891204535961151, 0.0010422077029943466, 0.0010952949523925781]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 1.0, 6.0, 3.0, 10.0, 11.0, 9.0, 14.0, 13.0, 14.0, 19.0, 28.0, 26.0, 30.0, 27.0, 32.0, 47.0, 42.0, 43.0, 51.0, 50.0, 67.0, 49.0, 50.0, 45.0, 53.0, 40.0, 35.0, 33.0, 28.0, 25.0, 22.0, 9.0, 22.0, 7.0, 6.0, 11.0, 8.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.49609375, -4.37762451171875, -4.2591552734375, -4.14068603515625, -4.022216796875, -3.90374755859375, -3.7852783203125, -3.66680908203125, -3.54833984375, -3.42987060546875, -3.3114013671875, -3.19293212890625, -3.074462890625, -2.95599365234375, -2.8375244140625, -2.71905517578125, -2.6005859375, -2.48211669921875, -2.3636474609375, -2.24517822265625, -2.126708984375, -2.00823974609375, -1.8897705078125, -1.77130126953125, -1.65283203125, -1.53436279296875, -1.4158935546875, -1.29742431640625, -1.178955078125, -1.06048583984375, -0.9420166015625, -0.82354736328125, -0.705078125, -0.58660888671875, -0.4681396484375, -0.34967041015625, -0.231201171875, -0.11273193359375, 0.0057373046875, 0.12420654296875, 0.24267578125, 0.36114501953125, 0.4796142578125, 0.59808349609375, 0.716552734375, 0.83502197265625, 0.9534912109375, 1.07196044921875, 1.1904296875, 1.30889892578125, 1.4273681640625, 1.54583740234375, 1.664306640625, 1.78277587890625, 1.9012451171875, 2.01971435546875, 2.13818359375, 2.25665283203125, 2.3751220703125, 2.49359130859375, 2.612060546875, 2.73052978515625, 2.8489990234375, 2.96746826171875, 3.0859375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 8.0, 8.0, 5.0, 16.0, 34.0, 34.0, 58.0, 69.0, 99.0, 139.0, 255.0, 349.0, 672.0, 1421.0, 3299.0, 9388.0, 31628.0, 124581.0, 467862.0, 304425.0, 73147.0, 19804.0, 6328.0, 2432.0, 1048.0, 542.0, 305.0, 187.0, 118.0, 79.0, 63.0, 52.0, 32.0, 21.0, 11.0, 14.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.59375, -4.4617919921875, -4.329833984375, -4.1978759765625, -4.06591796875, -3.9339599609375, -3.802001953125, -3.6700439453125, -3.5380859375, -3.4061279296875, -3.274169921875, -3.1422119140625, -3.01025390625, -2.8782958984375, -2.746337890625, -2.6143798828125, -2.482421875, -2.3504638671875, -2.218505859375, -2.0865478515625, -1.95458984375, -1.8226318359375, -1.690673828125, -1.5587158203125, -1.4267578125, -1.2947998046875, -1.162841796875, -1.0308837890625, -0.89892578125, -0.7669677734375, -0.635009765625, -0.5030517578125, -0.37109375, -0.2391357421875, -0.107177734375, 0.0247802734375, 0.15673828125, 0.2886962890625, 0.420654296875, 0.5526123046875, 0.6845703125, 0.8165283203125, 0.948486328125, 1.0804443359375, 1.21240234375, 1.3443603515625, 1.476318359375, 1.6082763671875, 1.740234375, 1.8721923828125, 2.004150390625, 2.1361083984375, 2.26806640625, 2.4000244140625, 2.531982421875, 2.6639404296875, 2.7958984375, 2.9278564453125, 3.059814453125, 3.1917724609375, 3.32373046875, 3.4556884765625, 3.587646484375, 3.7196044921875, 3.8515625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 4.0, 14.0, 6.0, 5.0, 8.0, 9.0, 20.0, 14.0, 14.0, 21.0, 27.0, 30.0, 24.0, 39.0, 33.0, 30.0, 48.0, 50.0, 76.0, 133.0, 1613.0, 322.0, 86.0, 37.0, 33.0, 41.0, 40.0, 30.0, 27.0, 24.0, 25.0, 23.0, 23.0, 19.0, 19.0, 19.0, 8.0, 13.0, 10.0, 5.0, 5.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-11.375, -11.0380859375, -10.701171875, -10.3642578125, -10.02734375, -9.6904296875, -9.353515625, -9.0166015625, -8.6796875, -8.3427734375, -8.005859375, -7.6689453125, -7.33203125, -6.9951171875, -6.658203125, -6.3212890625, -5.984375, -5.6474609375, -5.310546875, -4.9736328125, -4.63671875, -4.2998046875, -3.962890625, -3.6259765625, -3.2890625, -2.9521484375, -2.615234375, -2.2783203125, -1.94140625, -1.6044921875, -1.267578125, -0.9306640625, -0.59375, -0.2568359375, 0.080078125, 0.4169921875, 0.75390625, 1.0908203125, 1.427734375, 1.7646484375, 2.1015625, 2.4384765625, 2.775390625, 3.1123046875, 3.44921875, 3.7861328125, 4.123046875, 4.4599609375, 4.796875, 5.1337890625, 5.470703125, 5.8076171875, 6.14453125, 6.4814453125, 6.818359375, 7.1552734375, 7.4921875, 7.8291015625, 8.166015625, 8.5029296875, 8.83984375, 9.1767578125, 9.513671875, 9.8505859375, 10.1875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 10.0, 7.0, 13.0, 8.0, 18.0, 20.0, 24.0, 12.0, 27.0, 23.0, 34.0, 42.0, 49.0, 79.0, 109.0, 149.0, 359.0, 1111.0, 17289.0, 3096045.0, 27944.0, 1233.0, 394.0, 194.0, 111.0, 77.0, 51.0, 49.0, 27.0, 32.0, 24.0, 28.0, 12.0, 20.0, 10.0, 10.0, 8.0, 5.0, 8.0, 8.0, 7.0, 4.0, 2.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-21.890625, -21.149658203125, -20.40869140625, -19.667724609375, -18.9267578125, -18.185791015625, -17.44482421875, -16.703857421875, -15.962890625, -15.221923828125, -14.48095703125, -13.739990234375, -12.9990234375, -12.258056640625, -11.51708984375, -10.776123046875, -10.03515625, -9.294189453125, -8.55322265625, -7.812255859375, -7.0712890625, -6.330322265625, -5.58935546875, -4.848388671875, -4.107421875, -3.366455078125, -2.62548828125, -1.884521484375, -1.1435546875, -0.402587890625, 0.33837890625, 1.079345703125, 1.8203125, 2.561279296875, 3.30224609375, 4.043212890625, 4.7841796875, 5.525146484375, 6.26611328125, 7.007080078125, 7.748046875, 8.489013671875, 9.22998046875, 9.970947265625, 10.7119140625, 11.452880859375, 12.19384765625, 12.934814453125, 13.67578125, 14.416748046875, 15.15771484375, 15.898681640625, 16.6396484375, 17.380615234375, 18.12158203125, 18.862548828125, 19.603515625, 20.344482421875, 21.08544921875, 21.826416015625, 22.5673828125, 23.308349609375, 24.04931640625, 24.790283203125, 25.53125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 12.0, 286.0, 639.0, 77.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.906078338623047, -4.106780052185059, -2.307481288909912, -0.5081825256347656, 1.2911157608032227, 3.090414047241211, 4.889713287353516, 6.689011573791504, 8.488309860229492, 10.28760814666748, 12.086906433105469, 13.886205673217773, 15.685503959655762, 17.48480224609375, 19.284101486206055, 21.08340072631836, 22.88269805908203, 24.681997299194336, 26.481294631958008, 28.280593872070312, 30.079891204833984, 31.87919044494629, 33.678489685058594, 35.477787017822266, 37.27708435058594, 39.07638168334961, 40.87568283081055, 42.67498016357422, 44.47427749633789, 46.27357482910156, 48.0728759765625, 49.87217330932617, 51.671478271484375, 53.47077560424805, 55.270076751708984, 57.069374084472656, 58.86867141723633, 60.66796875, 62.46726989746094, 64.26657104492188, 66.06586456298828, 67.86516571044922, 69.66445922851562, 71.46376037597656, 73.2630615234375, 75.0623550415039, 76.86165618896484, 78.66095733642578, 80.46025085449219, 82.25955200195312, 84.05884552001953, 85.85814666748047, 87.6574478149414, 89.45674133300781, 91.25604248046875, 93.05534362792969, 94.85464477539062, 96.65394592285156, 98.45323944091797, 100.2525405883789, 102.05184173583984, 103.85113525390625, 105.65043640136719, 107.44973754882812, 109.24903106689453]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 9.0, 7.0, 10.0, 15.0, 14.0, 22.0, 24.0, 31.0, 33.0, 39.0, 34.0, 44.0, 25.0, 46.0, 41.0, 35.0, 50.0, 44.0, 45.0, 44.0, 45.0, 45.0, 33.0, 37.0, 31.0, 20.0, 25.0, 19.0, 23.0, 20.0, 23.0, 9.0, 10.0, 8.0, 8.0, 6.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.88740921020508, -36.67438507080078, -35.461360931396484, -34.24833679199219, -33.03531265258789, -31.822288513183594, -30.609264373779297, -29.396240234375, -28.183216094970703, -26.970191955566406, -25.75716781616211, -24.544143676757812, -23.331119537353516, -22.11809539794922, -20.905071258544922, -19.692047119140625, -18.479022979736328, -17.26599884033203, -16.052974700927734, -14.839950561523438, -13.62692642211914, -12.413902282714844, -11.200878143310547, -9.98785400390625, -8.774829864501953, -7.561805725097656, -6.348781585693359, -5.1357574462890625, -3.9227333068847656, -2.7097091674804688, -1.4966850280761719, -0.283660888671875, 0.9293594360351562, 2.142383575439453, 3.35540771484375, 4.568431854248047, 5.781455993652344, 6.994480133056641, 8.207504272460938, 9.420528411865234, 10.633552551269531, 11.846576690673828, 13.059600830078125, 14.272624969482422, 15.485649108886719, 16.698673248291016, 17.911697387695312, 19.12472152709961, 20.337745666503906, 21.550769805908203, 22.7637939453125, 23.976818084716797, 25.189842224121094, 26.40286636352539, 27.615890502929688, 28.828914642333984, 30.04193878173828, 31.254962921142578, 32.467987060546875, 33.68101119995117, 34.89403533935547, 36.107059478759766, 37.32008361816406, 38.53310775756836, 39.746131896972656]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 4.0, 8.0, 11.0, 7.0, 11.0, 17.0, 14.0, 16.0, 18.0, 32.0, 30.0, 33.0, 24.0, 45.0, 41.0, 48.0, 38.0, 53.0, 61.0, 53.0, 51.0, 50.0, 50.0, 37.0, 36.0, 37.0, 33.0, 31.0, 15.0, 17.0, 13.0, 16.0, 4.0, 11.0, 8.0, 9.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.5, -4.3792724609375, -4.258544921875, -4.1378173828125, -4.01708984375, -3.8963623046875, -3.775634765625, -3.6549072265625, -3.5341796875, -3.4134521484375, -3.292724609375, -3.1719970703125, -3.05126953125, -2.9305419921875, -2.809814453125, -2.6890869140625, -2.568359375, -2.4476318359375, -2.326904296875, -2.2061767578125, -2.08544921875, -1.9647216796875, -1.843994140625, -1.7232666015625, -1.6025390625, -1.4818115234375, -1.361083984375, -1.2403564453125, -1.11962890625, -0.9989013671875, -0.878173828125, -0.7574462890625, -0.63671875, -0.5159912109375, -0.395263671875, -0.2745361328125, -0.15380859375, -0.0330810546875, 0.087646484375, 0.2083740234375, 0.3291015625, 0.4498291015625, 0.570556640625, 0.6912841796875, 0.81201171875, 0.9327392578125, 1.053466796875, 1.1741943359375, 1.294921875, 1.4156494140625, 1.536376953125, 1.6571044921875, 1.77783203125, 1.8985595703125, 2.019287109375, 2.1400146484375, 2.2607421875, 2.3814697265625, 2.502197265625, 2.6229248046875, 2.74365234375, 2.8643798828125, 2.985107421875, 3.1058349609375, 3.2265625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 1.0, 5.0, 9.0, 11.0, 16.0, 10.0, 13.0, 17.0, 20.0, 35.0, 54.0, 70.0, 94.0, 135.0, 255.0, 438.0, 1143.0, 4768.0, 33193.0, 520498.0, 3229445.0, 371754.0, 26251.0, 3902.0, 1009.0, 466.0, 229.0, 133.0, 87.0, 61.0, 41.0, 29.0, 15.0, 20.0, 18.0, 14.0, 7.0, 5.0, 6.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-15.2734375, -14.8543701171875, -14.435302734375, -14.0162353515625, -13.59716796875, -13.1781005859375, -12.759033203125, -12.3399658203125, -11.9208984375, -11.5018310546875, -11.082763671875, -10.6636962890625, -10.24462890625, -9.8255615234375, -9.406494140625, -8.9874267578125, -8.568359375, -8.1492919921875, -7.730224609375, -7.3111572265625, -6.89208984375, -6.4730224609375, -6.053955078125, -5.6348876953125, -5.2158203125, -4.7967529296875, -4.377685546875, -3.9586181640625, -3.53955078125, -3.1204833984375, -2.701416015625, -2.2823486328125, -1.86328125, -1.4442138671875, -1.025146484375, -0.6060791015625, -0.18701171875, 0.2320556640625, 0.651123046875, 1.0701904296875, 1.4892578125, 1.9083251953125, 2.327392578125, 2.7464599609375, 3.16552734375, 3.5845947265625, 4.003662109375, 4.4227294921875, 4.841796875, 5.2608642578125, 5.679931640625, 6.0989990234375, 6.51806640625, 6.9371337890625, 7.356201171875, 7.7752685546875, 8.1943359375, 8.6134033203125, 9.032470703125, 9.4515380859375, 9.87060546875, 10.2896728515625, 10.708740234375, 11.1278076171875, 11.546875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 4.0, 7.0, 19.0, 20.0, 35.0, 39.0, 83.0, 124.0, 179.0, 270.0, 474.0, 672.0, 685.0, 511.0, 330.0, 219.0, 139.0, 88.0, 76.0, 39.0, 20.0, 20.0, 12.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.78125, -18.231201171875, -17.68115234375, -17.131103515625, -16.5810546875, -16.031005859375, -15.48095703125, -14.930908203125, -14.380859375, -13.830810546875, -13.28076171875, -12.730712890625, -12.1806640625, -11.630615234375, -11.08056640625, -10.530517578125, -9.98046875, -9.430419921875, -8.88037109375, -8.330322265625, -7.7802734375, -7.230224609375, -6.68017578125, -6.130126953125, -5.580078125, -5.030029296875, -4.47998046875, -3.929931640625, -3.3798828125, -2.829833984375, -2.27978515625, -1.729736328125, -1.1796875, -0.629638671875, -0.07958984375, 0.470458984375, 1.0205078125, 1.570556640625, 2.12060546875, 2.670654296875, 3.220703125, 3.770751953125, 4.32080078125, 4.870849609375, 5.4208984375, 5.970947265625, 6.52099609375, 7.071044921875, 7.62109375, 8.171142578125, 8.72119140625, 9.271240234375, 9.8212890625, 10.371337890625, 10.92138671875, 11.471435546875, 12.021484375, 12.571533203125, 13.12158203125, 13.671630859375, 14.2216796875, 14.771728515625, 15.32177734375, 15.871826171875, 16.421875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 11.0, 15.0, 18.0, 31.0, 38.0, 63.0, 100.0, 157.0, 279.0, 422.0, 982.0, 4997.0, 154571.0, 3914460.0, 111998.0, 4081.0, 984.0, 412.0, 219.0, 138.0, 98.0, 64.0, 43.0, 24.0, 24.0, 12.0, 10.0, 5.0, 11.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.53125, -27.26123046875, -25.9912109375, -24.72119140625, -23.451171875, -22.18115234375, -20.9111328125, -19.64111328125, -18.37109375, -17.10107421875, -15.8310546875, -14.56103515625, -13.291015625, -12.02099609375, -10.7509765625, -9.48095703125, -8.2109375, -6.94091796875, -5.6708984375, -4.40087890625, -3.130859375, -1.86083984375, -0.5908203125, 0.67919921875, 1.94921875, 3.21923828125, 4.4892578125, 5.75927734375, 7.029296875, 8.29931640625, 9.5693359375, 10.83935546875, 12.109375, 13.37939453125, 14.6494140625, 15.91943359375, 17.189453125, 18.45947265625, 19.7294921875, 20.99951171875, 22.26953125, 23.53955078125, 24.8095703125, 26.07958984375, 27.349609375, 28.61962890625, 29.8896484375, 31.15966796875, 32.4296875, 33.69970703125, 34.9697265625, 36.23974609375, 37.509765625, 38.77978515625, 40.0498046875, 41.31982421875, 42.58984375, 43.85986328125, 45.1298828125, 46.39990234375, 47.669921875, 48.93994140625, 50.2099609375, 51.47998046875, 52.75]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 78.0, 507.0, 393.0, 35.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-412.53875732421875, -405.15386962890625, -397.7689514160156, -390.3840637207031, -382.9991760253906, -375.6142578125, -368.2293701171875, -360.844482421875, -353.4595947265625, -346.07470703125, -338.6897888183594, -331.3049011230469, -323.9200134277344, -316.53509521484375, -309.15020751953125, -301.76531982421875, -294.3804016113281, -286.9955139160156, -279.610595703125, -272.2257080078125, -264.8408203125, -257.4559326171875, -250.07101440429688, -242.68612670898438, -235.30123901367188, -227.9163360595703, -220.5314483642578, -213.14654541015625, -205.76165771484375, -198.3767547607422, -190.99185180664062, -183.60696411132812, -176.22206115722656, -168.837158203125, -161.4522705078125, -154.06736755371094, -146.68247985839844, -139.29757690429688, -131.91268920898438, -124.52778625488281, -117.14288330078125, -109.75798797607422, -102.37309265136719, -94.98818969726562, -87.6032943725586, -80.21839904785156, -72.83350372314453, -65.4486083984375, -58.0637092590332, -50.67881393432617, -43.293914794921875, -35.909019470214844, -28.52412223815918, -21.139225006103516, -13.754329681396484, -6.3694305419921875, 1.0154647827148438, 8.400362014770508, 15.785258293151855, 23.170154571533203, 30.555051803588867, 37.93994903564453, 45.32484436035156, 52.70974349975586, 60.09463882446289]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 7.0, 9.0, 9.0, 8.0, 12.0, 10.0, 21.0, 19.0, 21.0, 21.0, 25.0, 29.0, 21.0, 32.0, 23.0, 30.0, 26.0, 32.0, 34.0, 30.0, 38.0, 40.0, 45.0, 22.0, 43.0, 25.0, 26.0, 39.0, 34.0, 36.0, 27.0, 23.0, 19.0, 20.0, 18.0, 25.0, 20.0, 10.0, 11.0, 12.0, 15.0, 9.0, 5.0, 10.0, 6.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-36.43756103515625, -35.34339904785156, -34.249237060546875, -33.15507507324219, -32.0609130859375, -30.96674919128418, -29.87258529663086, -28.778423309326172, -27.684261322021484, -26.590099334716797, -25.49593734741211, -24.40177345275879, -23.3076114654541, -22.213449478149414, -21.119285583496094, -20.025123596191406, -18.93096160888672, -17.83679962158203, -16.742637634277344, -15.648473739624023, -14.554311752319336, -13.460149765014648, -12.365986824035645, -11.27182388305664, -10.177661895751953, -9.083499908447266, -7.989336967468262, -6.895174503326416, -5.80101203918457, -4.706849575042725, -3.612687110900879, -2.518524646759033, -1.4243621826171875, -0.3301997184753418, 0.7639627456665039, 1.8581252098083496, 2.9522876739501953, 4.046450138092041, 5.140612602233887, 6.234775066375732, 7.328937530517578, 8.423099517822266, 9.51726245880127, 10.611425399780273, 11.705587387084961, 12.799749374389648, 13.893912315368652, 14.988075256347656, 16.082237243652344, 17.17639923095703, 18.27056121826172, 19.36472511291504, 20.458887100219727, 21.553049087524414, 22.647212982177734, 23.741374969482422, 24.83553695678711, 25.929698944091797, 27.023860931396484, 28.118024826049805, 29.212186813354492, 30.30634880065918, 31.4005126953125, 32.49467468261719, 33.588836669921875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 7.0, 6.0, 6.0, 15.0, 15.0, 10.0, 22.0, 25.0, 17.0, 36.0, 39.0, 36.0, 26.0, 42.0, 44.0, 50.0, 46.0, 54.0, 47.0, 55.0, 52.0, 44.0, 60.0, 34.0, 35.0, 22.0, 29.0, 21.0, 23.0, 13.0, 14.0, 12.0, 5.0, 7.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1640625, -4.0396728515625, -3.915283203125, -3.7908935546875, -3.66650390625, -3.5421142578125, -3.417724609375, -3.2933349609375, -3.1689453125, -3.0445556640625, -2.920166015625, -2.7957763671875, -2.67138671875, -2.5469970703125, -2.422607421875, -2.2982177734375, -2.173828125, -2.0494384765625, -1.925048828125, -1.8006591796875, -1.67626953125, -1.5518798828125, -1.427490234375, -1.3031005859375, -1.1787109375, -1.0543212890625, -0.929931640625, -0.8055419921875, -0.68115234375, -0.5567626953125, -0.432373046875, -0.3079833984375, -0.18359375, -0.0592041015625, 0.065185546875, 0.1895751953125, 0.31396484375, 0.4383544921875, 0.562744140625, 0.6871337890625, 0.8115234375, 0.9359130859375, 1.060302734375, 1.1846923828125, 1.30908203125, 1.4334716796875, 1.557861328125, 1.6822509765625, 1.806640625, 1.9310302734375, 2.055419921875, 2.1798095703125, 2.30419921875, 2.4285888671875, 2.552978515625, 2.6773681640625, 2.8017578125, 2.9261474609375, 3.050537109375, 3.1749267578125, 3.29931640625, 3.4237060546875, 3.548095703125, 3.6724853515625, 3.796875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 11.0, 14.0, 30.0, 34.0, 63.0, 97.0, 141.0, 241.0, 382.0, 612.0, 990.0, 1695.0, 3017.0, 5315.0, 9535.0, 17028.0, 30665.0, 56246.0, 111574.0, 234081.0, 281938.0, 141184.0, 69616.0, 36973.0, 20440.0, 11320.0, 6560.0, 3609.0, 2145.0, 1162.0, 664.0, 464.0, 251.0, 163.0, 94.0, 56.0, 45.0, 36.0, 22.0, 14.0, 10.0, 6.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.68408203125, -0.6634521484375, -0.642822265625, -0.6221923828125, -0.6015625, -0.5809326171875, -0.560302734375, -0.5396728515625, -0.51904296875, -0.4984130859375, -0.477783203125, -0.4571533203125, -0.4365234375, -0.4158935546875, -0.395263671875, -0.3746337890625, -0.35400390625, -0.3333740234375, -0.312744140625, -0.2921142578125, -0.271484375, -0.2508544921875, -0.230224609375, -0.2095947265625, -0.18896484375, -0.1683349609375, -0.147705078125, -0.1270751953125, -0.1064453125, -0.0858154296875, -0.065185546875, -0.0445556640625, -0.02392578125, -0.0032958984375, 0.017333984375, 0.0379638671875, 0.05859375, 0.0792236328125, 0.099853515625, 0.1204833984375, 0.14111328125, 0.1617431640625, 0.182373046875, 0.2030029296875, 0.2236328125, 0.2442626953125, 0.264892578125, 0.2855224609375, 0.30615234375, 0.3267822265625, 0.347412109375, 0.3680419921875, 0.388671875, 0.4093017578125, 0.429931640625, 0.4505615234375, 0.47119140625, 0.4918212890625, 0.512451171875, 0.5330810546875, 0.5537109375, 0.5743408203125, 0.594970703125, 0.6156005859375, 0.63623046875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 9.0, 11.0, 9.0, 14.0, 18.0, 15.0, 17.0, 22.0, 19.0, 25.0, 39.0, 42.0, 35.0, 41.0, 31.0, 41.0, 33.0, 31.0, 1063.0, 39.0, 41.0, 45.0, 35.0, 40.0, 41.0, 27.0, 32.0, 24.0, 30.0, 17.0, 19.0, 15.0, 17.0, 18.0, 12.0, 10.0, 13.0, 10.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.140625, -2.070465087890625, -2.00030517578125, -1.930145263671875, -1.8599853515625, -1.789825439453125, -1.71966552734375, -1.649505615234375, -1.579345703125, -1.509185791015625, -1.43902587890625, -1.368865966796875, -1.2987060546875, -1.228546142578125, -1.15838623046875, -1.088226318359375, -1.01806640625, -0.947906494140625, -0.87774658203125, -0.807586669921875, -0.7374267578125, -0.667266845703125, -0.59710693359375, -0.526947021484375, -0.456787109375, -0.386627197265625, -0.31646728515625, -0.246307373046875, -0.1761474609375, -0.105987548828125, -0.03582763671875, 0.034332275390625, 0.1044921875, 0.174652099609375, 0.24481201171875, 0.314971923828125, 0.3851318359375, 0.455291748046875, 0.52545166015625, 0.595611572265625, 0.665771484375, 0.735931396484375, 0.80609130859375, 0.876251220703125, 0.9464111328125, 1.016571044921875, 1.08673095703125, 1.156890869140625, 1.22705078125, 1.297210693359375, 1.36737060546875, 1.437530517578125, 1.5076904296875, 1.577850341796875, 1.64801025390625, 1.718170166015625, 1.788330078125, 1.858489990234375, 1.92864990234375, 1.998809814453125, 2.0689697265625, 2.139129638671875, 2.20928955078125, 2.279449462890625, 2.349609375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 5.0, 5.0, 10.0, 22.0, 18.0, 41.0, 60.0, 101.0, 125.0, 209.0, 337.0, 533.0, 921.0, 1533.0, 2631.0, 4345.0, 7707.0, 13837.0, 24416.0, 45091.0, 85555.0, 166151.0, 1307196.0, 203635.0, 107578.0, 55908.0, 29741.0, 16629.0, 9448.0, 5511.0, 3094.0, 1856.0, 1139.0, 646.0, 405.0, 255.0, 151.0, 95.0, 68.0, 43.0, 21.0, 22.0, 16.0, 9.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.462890625, -0.4491424560546875, -0.435394287109375, -0.4216461181640625, -0.40789794921875, -0.3941497802734375, -0.380401611328125, -0.3666534423828125, -0.3529052734375, -0.3391571044921875, -0.325408935546875, -0.3116607666015625, -0.29791259765625, -0.2841644287109375, -0.270416259765625, -0.2566680908203125, -0.242919921875, -0.2291717529296875, -0.215423583984375, -0.2016754150390625, -0.18792724609375, -0.1741790771484375, -0.160430908203125, -0.1466827392578125, -0.1329345703125, -0.1191864013671875, -0.105438232421875, -0.0916900634765625, -0.07794189453125, -0.0641937255859375, -0.050445556640625, -0.0366973876953125, -0.02294921875, -0.0092010498046875, 0.004547119140625, 0.0182952880859375, 0.03204345703125, 0.0457916259765625, 0.059539794921875, 0.0732879638671875, 0.0870361328125, 0.1007843017578125, 0.114532470703125, 0.1282806396484375, 0.14202880859375, 0.1557769775390625, 0.169525146484375, 0.1832733154296875, 0.197021484375, 0.2107696533203125, 0.224517822265625, 0.2382659912109375, 0.25201416015625, 0.2657623291015625, 0.279510498046875, 0.2932586669921875, 0.3070068359375, 0.3207550048828125, 0.334503173828125, 0.3482513427734375, 0.36199951171875, 0.3757476806640625, 0.389495849609375, 0.4032440185546875, 0.4169921875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 14.0, 10.0, 17.0, 13.0, 24.0, 20.0, 42.0, 35.0, 49.0, 58.0, 101.0, 94.0, 98.0, 93.0, 76.0, 62.0, 41.0, 21.0, 22.0, 19.0, 18.0, 11.0, 8.0, 12.0, 3.0, 5.0, 4.0, 8.0, 0.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0033397674560546875, -0.0032536983489990234, -0.0031676292419433594, -0.0030815601348876953, -0.0029954910278320312, -0.002909421920776367, -0.002823352813720703, -0.002737283706665039, -0.002651214599609375, -0.002565145492553711, -0.002479076385498047, -0.002393007278442383, -0.0023069381713867188, -0.0022208690643310547, -0.0021347999572753906, -0.0020487308502197266, -0.0019626617431640625, -0.0018765926361083984, -0.0017905235290527344, -0.0017044544219970703, -0.0016183853149414062, -0.0015323162078857422, -0.0014462471008300781, -0.001360177993774414, -0.00127410888671875, -0.001188039779663086, -0.0011019706726074219, -0.0010159015655517578, -0.0009298324584960938, -0.0008437633514404297, -0.0007576942443847656, -0.0006716251373291016, -0.0005855560302734375, -0.0004994869232177734, -0.0004134178161621094, -0.0003273487091064453, -0.00024127960205078125, -0.0001552104949951172, -6.914138793945312e-05, 1.6927719116210938e-05, 0.000102996826171875, 0.00018906593322753906, 0.0002751350402832031, 0.0003612041473388672, 0.00044727325439453125, 0.0005333423614501953, 0.0006194114685058594, 0.0007054805755615234, 0.0007915496826171875, 0.0008776187896728516, 0.0009636878967285156, 0.0010497570037841797, 0.0011358261108398438, 0.0012218952178955078, 0.0013079643249511719, 0.001394033432006836, 0.0014801025390625, 0.001566171646118164, 0.0016522407531738281, 0.0017383098602294922, 0.0018243789672851562, 0.0019104480743408203, 0.0019965171813964844, 0.0020825862884521484, 0.0021686553955078125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 9.0, 11.0, 9.0, 20.0, 15.0, 21.0, 27.0, 35.0, 67.0, 104.0, 215.0, 367.0, 1204.0, 1042886.0, 2535.0, 474.0, 175.0, 102.0, 67.0, 46.0, 30.0, 28.0, 13.0, 15.0, 18.0, 10.0, 8.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05743408203125, -0.05527687072753906, -0.053119659423828125, -0.05096244812011719, -0.04880523681640625, -0.04664802551269531, -0.044490814208984375, -0.04233360290527344, -0.0401763916015625, -0.03801918029785156, -0.035861968994140625, -0.03370475769042969, -0.03154754638671875, -0.029390335083007812, -0.027233123779296875, -0.025075912475585938, -0.022918701171875, -0.020761489868164062, -0.018604278564453125, -0.016447067260742188, -0.01428985595703125, -0.012132644653320312, -0.009975433349609375, -0.007818222045898438, -0.0056610107421875, -0.0035037994384765625, -0.001346588134765625, 0.0008106231689453125, 0.00296783447265625, 0.0051250457763671875, 0.007282257080078125, 0.009439468383789062, 0.0115966796875, 0.013753890991210938, 0.015911102294921875, 0.018068313598632812, 0.02022552490234375, 0.022382736206054688, 0.024539947509765625, 0.026697158813476562, 0.0288543701171875, 0.031011581420898438, 0.033168792724609375, 0.03532600402832031, 0.03748321533203125, 0.03964042663574219, 0.041797637939453125, 0.04395484924316406, 0.046112060546875, 0.04826927185058594, 0.050426483154296875, 0.05258369445800781, 0.05474090576171875, 0.05689811706542969, 0.059055328369140625, 0.06121253967285156, 0.0633697509765625, 0.06552696228027344, 0.06768417358398438, 0.06984138488769531, 0.07199859619140625, 0.07415580749511719, 0.07631301879882812, 0.07847023010253906, 0.08062744140625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1018.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006074903532862663, -0.0038381684571504593, -0.0016014333814382553, 0.0006353016942739487, 0.0028720367699861526, 0.005108771845698357, 0.007345506921410561, 0.009582241997122765, 0.011818977072834969, 0.014055712148547173, 0.016292447224259377, 0.01852918229997158, 0.020765917375683784, 0.02300265245139599, 0.025239387527108192, 0.027476122602820396, 0.0297128576785326, 0.031949594616889954, 0.03418632596731186, 0.03642306476831436, 0.03865979611873627, 0.04089653491973877, 0.043133266270160675, 0.04537000507116318, 0.04760673642158508, 0.04984347149729729, 0.05208020657300949, 0.054316941648721695, 0.0565536767244339, 0.0587904118001461, 0.06102714687585831, 0.06326387822628021, 0.06550061702728271, 0.06773735582828522, 0.06997408717870712, 0.07221081852912903, 0.07444755733013153, 0.07668429613113403, 0.07892102748155594, 0.08115775883197784, 0.08339449763298035, 0.08563123643398285, 0.08786796778440475, 0.09010469913482666, 0.09234143793582916, 0.09457817673683167, 0.09681490808725357, 0.09905163943767548, 0.10128837823867798, 0.10352511703968048, 0.10576184839010239, 0.10799857974052429, 0.1102353185415268, 0.1124720573425293, 0.1147087886929512, 0.11694552004337311, 0.11918225884437561, 0.12141899764537811, 0.12365572899580002, 0.12589246034622192, 0.12812919914722443, 0.13036593794822693, 0.13260266184806824, 0.13483940064907074, 0.13707613945007324]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 18.0, 24.0, 39.0, 46.0, 55.0, 53.0, 75.0, 91.0, 92.0, 85.0, 77.0, 86.0, 82.0, 57.0, 41.0, 39.0, 18.0, 13.0, 7.0, 6.0, 2.0, 2.0], "bins": [-0.0042359232902526855, -0.0041525838896632195, -0.004069244489073753, -0.003985905088484287, -0.003902565687894821, -0.003819226287305355, -0.003735886886715889, -0.003652547486126423, -0.003569208085536957, -0.0034858686849474907, -0.0034025292843580246, -0.0033191898837685585, -0.0032358504831790924, -0.0031525110825896263, -0.0030691716820001602, -0.002985832281410694, -0.002902492880821228, -0.002819153480231762, -0.002735814079642296, -0.0026524746790528297, -0.0025691352784633636, -0.0024857958778738976, -0.0024024564772844315, -0.0023191170766949654, -0.0022357776761054993, -0.002152438275516033, -0.002069098874926567, -0.001985759474337101, -0.0019024200737476349, -0.0018190806731581688, -0.0017357412725687027, -0.0016524018719792366, -0.0015690624713897705, -0.0014857230708003044, -0.0014023836702108383, -0.0013190442696213722, -0.0012357048690319061, -0.00115236546844244, -0.001069026067852974, -0.0009856866672635078, -0.0009023472666740417, -0.0008190078660845757, -0.0007356684654951096, -0.0006523290649056435, -0.0005689896643161774, -0.0004856502637267113, -0.0004023108631372452, -0.0003189714625477791, -0.000235632061958313, -0.0001522926613688469, -6.89532607793808e-05, 1.4386139810085297e-05, 9.772554039955139e-05, 0.0001810649409890175, 0.0002644043415784836, 0.0003477437421679497, 0.00043108314275741577, 0.0005144225433468819, 0.000597761943936348, 0.0006811013445258141, 0.0007644407451152802, 0.0008477801457047462, 0.0009311195462942123, 0.0010144589468836784, 0.0010977983474731445]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 7.0, 6.0, 6.0, 15.0, 15.0, 10.0, 22.0, 25.0, 17.0, 36.0, 39.0, 36.0, 26.0, 42.0, 44.0, 50.0, 46.0, 54.0, 47.0, 55.0, 52.0, 44.0, 60.0, 34.0, 35.0, 22.0, 29.0, 21.0, 23.0, 13.0, 14.0, 12.0, 5.0, 7.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1640625, -4.0396728515625, -3.915283203125, -3.7908935546875, -3.66650390625, -3.5421142578125, -3.417724609375, -3.2933349609375, -3.1689453125, -3.0445556640625, -2.920166015625, -2.7957763671875, -2.67138671875, -2.5469970703125, -2.422607421875, -2.2982177734375, -2.173828125, -2.0494384765625, -1.925048828125, -1.8006591796875, -1.67626953125, -1.5518798828125, -1.427490234375, -1.3031005859375, -1.1787109375, -1.0543212890625, -0.929931640625, -0.8055419921875, -0.68115234375, -0.5567626953125, -0.432373046875, -0.3079833984375, -0.18359375, -0.0592041015625, 0.065185546875, 0.1895751953125, 0.31396484375, 0.4383544921875, 0.562744140625, 0.6871337890625, 0.8115234375, 0.9359130859375, 1.060302734375, 1.1846923828125, 1.30908203125, 1.4334716796875, 1.557861328125, 1.6822509765625, 1.806640625, 1.9310302734375, 2.055419921875, 2.1798095703125, 2.30419921875, 2.4285888671875, 2.552978515625, 2.6773681640625, 2.8017578125, 2.9261474609375, 3.050537109375, 3.1749267578125, 3.29931640625, 3.4237060546875, 3.548095703125, 3.6724853515625, 3.796875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 12.0, 11.0, 11.0, 28.0, 33.0, 42.0, 60.0, 86.0, 133.0, 215.0, 288.0, 488.0, 705.0, 1101.0, 1927.0, 3386.0, 6268.0, 12189.0, 25005.0, 59744.0, 172050.0, 439991.0, 199976.0, 67673.0, 27935.0, 13191.0, 6851.0, 3643.0, 2068.0, 1201.0, 792.0, 476.0, 313.0, 194.0, 147.0, 78.0, 76.0, 58.0, 32.0, 25.0, 16.0, 12.0, 1.0, 3.0, 1.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.830078125, -2.74041748046875, -2.6507568359375, -2.56109619140625, -2.471435546875, -2.38177490234375, -2.2921142578125, -2.20245361328125, -2.11279296875, -2.02313232421875, -1.9334716796875, -1.84381103515625, -1.754150390625, -1.66448974609375, -1.5748291015625, -1.48516845703125, -1.3955078125, -1.30584716796875, -1.2161865234375, -1.12652587890625, -1.036865234375, -0.94720458984375, -0.8575439453125, -0.76788330078125, -0.67822265625, -0.58856201171875, -0.4989013671875, -0.40924072265625, -0.319580078125, -0.22991943359375, -0.1402587890625, -0.05059814453125, 0.0390625, 0.12872314453125, 0.2183837890625, 0.30804443359375, 0.397705078125, 0.48736572265625, 0.5770263671875, 0.66668701171875, 0.75634765625, 0.84600830078125, 0.9356689453125, 1.02532958984375, 1.114990234375, 1.20465087890625, 1.2943115234375, 1.38397216796875, 1.4736328125, 1.56329345703125, 1.6529541015625, 1.74261474609375, 1.832275390625, 1.92193603515625, 2.0115966796875, 2.10125732421875, 2.19091796875, 2.28057861328125, 2.3702392578125, 2.45989990234375, 2.549560546875, 2.63922119140625, 2.7288818359375, 2.81854248046875, 2.908203125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 5.0, 2.0, 10.0, 6.0, 17.0, 6.0, 7.0, 13.0, 24.0, 24.0, 22.0, 25.0, 36.0, 33.0, 34.0, 43.0, 47.0, 61.0, 64.0, 137.0, 1769.0, 167.0, 68.0, 59.0, 44.0, 43.0, 46.0, 40.0, 31.0, 25.0, 25.0, 25.0, 20.0, 23.0, 12.0, 6.0, 9.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.9193115234375, -11.502685546875, -11.0860595703125, -10.66943359375, -10.2528076171875, -9.836181640625, -9.4195556640625, -9.0029296875, -8.5863037109375, -8.169677734375, -7.7530517578125, -7.33642578125, -6.9197998046875, -6.503173828125, -6.0865478515625, -5.669921875, -5.2532958984375, -4.836669921875, -4.4200439453125, -4.00341796875, -3.5867919921875, -3.170166015625, -2.7535400390625, -2.3369140625, -1.9202880859375, -1.503662109375, -1.0870361328125, -0.67041015625, -0.2537841796875, 0.162841796875, 0.5794677734375, 0.99609375, 1.4127197265625, 1.829345703125, 2.2459716796875, 2.66259765625, 3.0792236328125, 3.495849609375, 3.9124755859375, 4.3291015625, 4.7457275390625, 5.162353515625, 5.5789794921875, 5.99560546875, 6.4122314453125, 6.828857421875, 7.2454833984375, 7.662109375, 8.0787353515625, 8.495361328125, 8.9119873046875, 9.32861328125, 9.7452392578125, 10.161865234375, 10.5784912109375, 10.9951171875, 11.4117431640625, 11.828369140625, 12.2449951171875, 12.66162109375, 13.0782470703125, 13.494873046875, 13.9114990234375, 14.328125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 7.0, 8.0, 5.0, 7.0, 9.0, 14.0, 24.0, 29.0, 40.0, 32.0, 41.0, 60.0, 78.0, 94.0, 199.0, 380.0, 1075.0, 7280.0, 840275.0, 2284413.0, 9270.0, 1228.0, 424.0, 197.0, 118.0, 91.0, 62.0, 47.0, 41.0, 33.0, 21.0, 22.0, 13.0, 13.0, 12.0, 13.0, 7.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-24.28125, -23.58837890625, -22.8955078125, -22.20263671875, -21.509765625, -20.81689453125, -20.1240234375, -19.43115234375, -18.73828125, -18.04541015625, -17.3525390625, -16.65966796875, -15.966796875, -15.27392578125, -14.5810546875, -13.88818359375, -13.1953125, -12.50244140625, -11.8095703125, -11.11669921875, -10.423828125, -9.73095703125, -9.0380859375, -8.34521484375, -7.65234375, -6.95947265625, -6.2666015625, -5.57373046875, -4.880859375, -4.18798828125, -3.4951171875, -2.80224609375, -2.109375, -1.41650390625, -0.7236328125, -0.03076171875, 0.662109375, 1.35498046875, 2.0478515625, 2.74072265625, 3.43359375, 4.12646484375, 4.8193359375, 5.51220703125, 6.205078125, 6.89794921875, 7.5908203125, 8.28369140625, 8.9765625, 9.66943359375, 10.3623046875, 11.05517578125, 11.748046875, 12.44091796875, 13.1337890625, 13.82666015625, 14.51953125, 15.21240234375, 15.9052734375, 16.59814453125, 17.291015625, 17.98388671875, 18.6767578125, 19.36962890625, 20.0625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 12.0, 37.0, 132.0, 280.0, 288.0, 177.0, 58.0, 23.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.660255432128906, -35.67465591430664, -34.68905258178711, -33.703453063964844, -32.71785354614258, -31.73225212097168, -30.74665069580078, -29.761051177978516, -28.775449752807617, -27.78984832763672, -26.804248809814453, -25.818647384643555, -24.833045959472656, -23.84744644165039, -22.861845016479492, -21.876243591308594, -20.890644073486328, -19.90504264831543, -18.919443130493164, -17.933841705322266, -16.948240280151367, -15.962640762329102, -14.977039337158203, -13.991438865661621, -13.005836486816406, -12.020236015319824, -11.034634590148926, -10.049034118652344, -9.063433647155762, -8.07783317565918, -7.092231750488281, -6.106631278991699, -5.121030807495117, -4.135429859161377, -3.149829387664795, -2.1642284393310547, -1.1786277294158936, -0.19302701950073242, 0.7925739288330078, 1.7781744003295898, 2.76377534866333, 3.749376058578491, 4.734976768493652, 5.720577716827393, 6.706178665161133, 7.691779136657715, 8.677379608154297, 9.662981033325195, 10.648581504821777, 11.63418197631836, 12.619783401489258, 13.60538387298584, 14.590984344482422, 15.57658576965332, 16.56218719482422, 17.547786712646484, 18.533388137817383, 19.51898956298828, 20.504589080810547, 21.490190505981445, 22.475791931152344, 23.46139144897461, 24.446992874145508, 25.432594299316406, 26.418193817138672]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 7.0, 3.0, 4.0, 7.0, 11.0, 17.0, 14.0, 18.0, 28.0, 38.0, 42.0, 36.0, 39.0, 46.0, 52.0, 47.0, 51.0, 49.0, 40.0, 44.0, 41.0, 39.0, 36.0, 41.0, 32.0, 33.0, 22.0, 24.0, 30.0, 17.0, 24.0, 8.0, 12.0, 9.0, 10.0, 11.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.41718673706055, -43.99454879760742, -42.5719108581543, -41.14927291870117, -39.72663116455078, -38.303993225097656, -36.88135528564453, -35.458717346191406, -34.03607940673828, -32.613441467285156, -31.19080352783203, -29.768163681030273, -28.34552574157715, -26.922887802124023, -25.500247955322266, -24.07761001586914, -22.654972076416016, -21.23233413696289, -19.809696197509766, -18.387056350708008, -16.964418411254883, -15.541780471801758, -14.119141578674316, -12.696502685546875, -11.27386474609375, -9.851226806640625, -8.428587913513184, -7.0059494972229, -5.583311080932617, -4.160672664642334, -2.738034248352051, -1.3153953552246094, 0.10724639892578125, 1.5298848152160645, 2.9525232315063477, 4.375161647796631, 5.797800064086914, 7.220438480377197, 8.64307689666748, 10.065715789794922, 11.488353729248047, 12.910991668701172, 14.333630561828613, 15.756269454956055, 17.17890739440918, 18.601545333862305, 20.024185180664062, 21.446823120117188, 22.869461059570312, 24.292098999023438, 25.714736938476562, 27.13737678527832, 28.560014724731445, 29.98265266418457, 31.405292510986328, 32.82793045043945, 34.25056838989258, 35.6732063293457, 37.09584426879883, 38.51848220825195, 39.941123962402344, 41.36376190185547, 42.786399841308594, 44.20903778076172, 45.631675720214844]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 2.0, 8.0, 4.0, 6.0, 6.0, 10.0, 10.0, 11.0, 20.0, 20.0, 20.0, 19.0, 32.0, 35.0, 35.0, 31.0, 41.0, 45.0, 52.0, 44.0, 58.0, 45.0, 55.0, 61.0, 40.0, 42.0, 49.0, 37.0, 22.0, 26.0, 20.0, 20.0, 14.0, 24.0, 7.0, 7.0, 5.0, 7.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.0550537109375, -3.926513671875, -3.7979736328125, -3.66943359375, -3.5408935546875, -3.412353515625, -3.2838134765625, -3.1552734375, -3.0267333984375, -2.898193359375, -2.7696533203125, -2.64111328125, -2.5125732421875, -2.384033203125, -2.2554931640625, -2.126953125, -1.9984130859375, -1.869873046875, -1.7413330078125, -1.61279296875, -1.4842529296875, -1.355712890625, -1.2271728515625, -1.0986328125, -0.9700927734375, -0.841552734375, -0.7130126953125, -0.58447265625, -0.4559326171875, -0.327392578125, -0.1988525390625, -0.0703125, 0.0582275390625, 0.186767578125, 0.3153076171875, 0.44384765625, 0.5723876953125, 0.700927734375, 0.8294677734375, 0.9580078125, 1.0865478515625, 1.215087890625, 1.3436279296875, 1.47216796875, 1.6007080078125, 1.729248046875, 1.8577880859375, 1.986328125, 2.1148681640625, 2.243408203125, 2.3719482421875, 2.50048828125, 2.6290283203125, 2.757568359375, 2.8861083984375, 3.0146484375, 3.1431884765625, 3.271728515625, 3.4002685546875, 3.52880859375, 3.6573486328125, 3.785888671875, 3.9144287109375, 4.04296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 5.0, 6.0, 6.0, 9.0, 14.0, 16.0, 19.0, 20.0, 14.0, 31.0, 27.0, 23.0, 28.0, 43.0, 54.0, 162.0, 665.0, 4494.0, 87891.0, 3497458.0, 587731.0, 13508.0, 1348.0, 298.0, 102.0, 46.0, 46.0, 22.0, 21.0, 27.0, 27.0, 20.0, 21.0, 13.0, 11.0, 11.0, 10.0, 7.0, 9.0, 1.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.359375, -17.719970703125, -17.08056640625, -16.441162109375, -15.8017578125, -15.162353515625, -14.52294921875, -13.883544921875, -13.244140625, -12.604736328125, -11.96533203125, -11.325927734375, -10.6865234375, -10.047119140625, -9.40771484375, -8.768310546875, -8.12890625, -7.489501953125, -6.85009765625, -6.210693359375, -5.5712890625, -4.931884765625, -4.29248046875, -3.653076171875, -3.013671875, -2.374267578125, -1.73486328125, -1.095458984375, -0.4560546875, 0.183349609375, 0.82275390625, 1.462158203125, 2.1015625, 2.740966796875, 3.38037109375, 4.019775390625, 4.6591796875, 5.298583984375, 5.93798828125, 6.577392578125, 7.216796875, 7.856201171875, 8.49560546875, 9.135009765625, 9.7744140625, 10.413818359375, 11.05322265625, 11.692626953125, 12.33203125, 12.971435546875, 13.61083984375, 14.250244140625, 14.8896484375, 15.529052734375, 16.16845703125, 16.807861328125, 17.447265625, 18.086669921875, 18.72607421875, 19.365478515625, 20.0048828125, 20.644287109375, 21.28369140625, 21.923095703125, 22.5625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 7.0, 11.0, 15.0, 15.0, 25.0, 39.0, 37.0, 70.0, 99.0, 163.0, 211.0, 302.0, 452.0, 590.0, 595.0, 467.0, 306.0, 216.0, 138.0, 103.0, 75.0, 46.0, 28.0, 23.0, 13.0, 9.0, 9.0, 5.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-18.890625, -18.4508056640625, -18.010986328125, -17.5711669921875, -17.13134765625, -16.6915283203125, -16.251708984375, -15.8118896484375, -15.3720703125, -14.9322509765625, -14.492431640625, -14.0526123046875, -13.61279296875, -13.1729736328125, -12.733154296875, -12.2933349609375, -11.853515625, -11.4136962890625, -10.973876953125, -10.5340576171875, -10.09423828125, -9.6544189453125, -9.214599609375, -8.7747802734375, -8.3349609375, -7.8951416015625, -7.455322265625, -7.0155029296875, -6.57568359375, -6.1358642578125, -5.696044921875, -5.2562255859375, -4.81640625, -4.3765869140625, -3.936767578125, -3.4969482421875, -3.05712890625, -2.6173095703125, -2.177490234375, -1.7376708984375, -1.2978515625, -0.8580322265625, -0.418212890625, 0.0216064453125, 0.46142578125, 0.9012451171875, 1.341064453125, 1.7808837890625, 2.220703125, 2.6605224609375, 3.100341796875, 3.5401611328125, 3.97998046875, 4.4197998046875, 4.859619140625, 5.2994384765625, 5.7392578125, 6.1790771484375, 6.618896484375, 7.0587158203125, 7.49853515625, 7.9383544921875, 8.378173828125, 8.8179931640625, 9.2578125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 18.0, 26.0, 44.0, 59.0, 105.0, 175.0, 312.0, 570.0, 2230.0, 105036.0, 4047379.0, 35649.0, 1552.0, 472.0, 259.0, 134.0, 105.0, 58.0, 34.0, 12.0, 13.0, 12.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.71875, -37.94580078125, -36.1728515625, -34.39990234375, -32.626953125, -30.85400390625, -29.0810546875, -27.30810546875, -25.53515625, -23.76220703125, -21.9892578125, -20.21630859375, -18.443359375, -16.67041015625, -14.8974609375, -13.12451171875, -11.3515625, -9.57861328125, -7.8056640625, -6.03271484375, -4.259765625, -2.48681640625, -0.7138671875, 1.05908203125, 2.83203125, 4.60498046875, 6.3779296875, 8.15087890625, 9.923828125, 11.69677734375, 13.4697265625, 15.24267578125, 17.015625, 18.78857421875, 20.5615234375, 22.33447265625, 24.107421875, 25.88037109375, 27.6533203125, 29.42626953125, 31.19921875, 32.97216796875, 34.7451171875, 36.51806640625, 38.291015625, 40.06396484375, 41.8369140625, 43.60986328125, 45.3828125, 47.15576171875, 48.9287109375, 50.70166015625, 52.474609375, 54.24755859375, 56.0205078125, 57.79345703125, 59.56640625, 61.33935546875, 63.1123046875, 64.88525390625, 66.658203125, 68.43115234375, 70.2041015625, 71.97705078125, 73.75]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 38.0, 120.0, 311.0, 316.0, 167.0, 49.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-227.37490844726562, -223.09507751464844, -218.81524658203125, -214.53543090820312, -210.25559997558594, -205.97576904296875, -201.69595336914062, -197.41612243652344, -193.13629150390625, -188.85646057128906, -184.57662963867188, -180.29681396484375, -176.01698303222656, -171.73715209960938, -167.45733642578125, -163.17750549316406, -158.89767456054688, -154.6178436279297, -150.3380126953125, -146.05819702148438, -141.7783660888672, -137.49853515625, -133.21871948242188, -128.9388885498047, -124.6590576171875, -120.37922668457031, -116.09940338134766, -111.819580078125, -107.53974914550781, -103.25991821289062, -98.98009490966797, -94.70027160644531, -90.42044067382812, -86.14060974121094, -81.86078643798828, -77.58096313476562, -73.30113220214844, -69.02130126953125, -64.7414779663086, -60.46165084838867, -56.18182373046875, -51.90199661254883, -47.622169494628906, -43.342342376708984, -39.06251525878906, -34.78268814086914, -30.50286102294922, -26.223033905029297, -21.943206787109375, -17.663379669189453, -13.383552551269531, -9.10372543334961, -4.8238983154296875, -0.5440711975097656, 3.7357559204101562, 8.015583038330078, 12.29541015625, 16.575237274169922, 20.855064392089844, 25.134891510009766, 29.414718627929688, 33.69454574584961, 37.97437286376953, 42.25419998168945, 46.534027099609375]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 3.0, 7.0, 6.0, 6.0, 8.0, 10.0, 10.0, 14.0, 19.0, 12.0, 23.0, 30.0, 26.0, 27.0, 42.0, 25.0, 39.0, 41.0, 42.0, 43.0, 47.0, 49.0, 36.0, 46.0, 41.0, 37.0, 42.0, 26.0, 31.0, 28.0, 35.0, 33.0, 10.0, 18.0, 19.0, 15.0, 14.0, 7.0, 9.0, 7.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.37052917480469, -35.0737419128418, -33.77695083618164, -32.48016357421875, -31.183374404907227, -29.886585235595703, -28.589797973632812, -27.29300880432129, -25.996219635009766, -24.699430465698242, -23.40264129638672, -22.105854034423828, -20.809064865112305, -19.51227569580078, -18.21548843383789, -16.918699264526367, -15.621910095214844, -14.32512092590332, -13.028332710266113, -11.731544494628906, -10.434755325317383, -9.13796615600586, -7.841177940368652, -6.544389724731445, -5.247600555419922, -3.9508118629455566, -2.6540231704711914, -1.3572344779968262, -0.06044578552246094, 1.2363429069519043, 2.5331315994262695, 3.8299198150634766, 5.126708984375, 6.423497676849365, 7.7202863693237305, 9.017074584960938, 10.313863754272461, 11.610652923583984, 12.907441139221191, 14.204229354858398, 15.501018524169922, 16.797807693481445, 18.09459686279297, 19.39138412475586, 20.688173294067383, 21.984962463378906, 23.281749725341797, 24.57853889465332, 25.875328063964844, 27.172117233276367, 28.46890640258789, 29.76569366455078, 31.062482833862305, 32.35927200317383, 33.65605926513672, 34.952850341796875, 36.249637603759766, 37.546424865722656, 38.84321594238281, 40.1400032043457, 41.436790466308594, 42.73358154296875, 44.03036880493164, 45.32715606689453, 46.62394714355469]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 6.0, 8.0, 11.0, 16.0, 18.0, 19.0, 15.0, 22.0, 23.0, 29.0, 34.0, 28.0, 28.0, 33.0, 54.0, 56.0, 47.0, 55.0, 50.0, 47.0, 44.0, 46.0, 51.0, 35.0, 32.0, 29.0, 27.0, 23.0, 25.0, 11.0, 13.0, 12.0, 14.0, 7.0, 9.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.0997314453125, -3.968994140625, -3.8382568359375, -3.70751953125, -3.5767822265625, -3.446044921875, -3.3153076171875, -3.1845703125, -3.0538330078125, -2.923095703125, -2.7923583984375, -2.66162109375, -2.5308837890625, -2.400146484375, -2.2694091796875, -2.138671875, -2.0079345703125, -1.877197265625, -1.7464599609375, -1.61572265625, -1.4849853515625, -1.354248046875, -1.2235107421875, -1.0927734375, -0.9620361328125, -0.831298828125, -0.7005615234375, -0.56982421875, -0.4390869140625, -0.308349609375, -0.1776123046875, -0.046875, 0.0838623046875, 0.214599609375, 0.3453369140625, 0.47607421875, 0.6068115234375, 0.737548828125, 0.8682861328125, 0.9990234375, 1.1297607421875, 1.260498046875, 1.3912353515625, 1.52197265625, 1.6527099609375, 1.783447265625, 1.9141845703125, 2.044921875, 2.1756591796875, 2.306396484375, 2.4371337890625, 2.56787109375, 2.6986083984375, 2.829345703125, 2.9600830078125, 3.0908203125, 3.2215576171875, 3.352294921875, 3.4830322265625, 3.61376953125, 3.7445068359375, 3.875244140625, 4.0059814453125, 4.13671875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 10.0, 20.0, 16.0, 24.0, 42.0, 58.0, 80.0, 117.0, 157.0, 241.0, 380.0, 570.0, 886.0, 1497.0, 2306.0, 3804.0, 6510.0, 11031.0, 18570.0, 32690.0, 59946.0, 117934.0, 232594.0, 260700.0, 139127.0, 69405.0, 37405.0, 21189.0, 12323.0, 7416.0, 4449.0, 2522.0, 1635.0, 1036.0, 680.0, 384.0, 258.0, 170.0, 117.0, 70.0, 54.0, 36.0, 28.0, 16.0, 9.0, 9.0, 5.0, 7.0, 6.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.626953125, -0.6068038940429688, -0.5866546630859375, -0.5665054321289062, -0.546356201171875, -0.5262069702148438, -0.5060577392578125, -0.48590850830078125, -0.46575927734375, -0.44561004638671875, -0.4254608154296875, -0.40531158447265625, -0.385162353515625, -0.36501312255859375, -0.3448638916015625, -0.32471466064453125, -0.3045654296875, -0.28441619873046875, -0.2642669677734375, -0.24411773681640625, -0.223968505859375, -0.20381927490234375, -0.1836700439453125, -0.16352081298828125, -0.14337158203125, -0.12322235107421875, -0.1030731201171875, -0.08292388916015625, -0.062774658203125, -0.04262542724609375, -0.0224761962890625, -0.00232696533203125, 0.017822265625, 0.03797149658203125, 0.0581207275390625, 0.07826995849609375, 0.098419189453125, 0.11856842041015625, 0.1387176513671875, 0.15886688232421875, 0.17901611328125, 0.19916534423828125, 0.2193145751953125, 0.23946380615234375, 0.259613037109375, 0.27976226806640625, 0.2999114990234375, 0.32006072998046875, 0.3402099609375, 0.36035919189453125, 0.3805084228515625, 0.40065765380859375, 0.420806884765625, 0.44095611572265625, 0.4611053466796875, 0.48125457763671875, 0.50140380859375, 0.5215530395507812, 0.5417022705078125, 0.5618515014648438, 0.582000732421875, 0.6021499633789062, 0.6222991943359375, 0.6424484252929688, 0.66259765625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 1.0, 3.0, 6.0, 7.0, 11.0, 7.0, 10.0, 11.0, 16.0, 21.0, 17.0, 30.0, 31.0, 29.0, 36.0, 38.0, 30.0, 32.0, 44.0, 49.0, 32.0, 40.0, 1054.0, 45.0, 39.0, 37.0, 32.0, 36.0, 26.0, 34.0, 22.0, 24.0, 27.0, 23.0, 20.0, 13.0, 13.0, 20.0, 15.0, 8.0, 6.0, 5.0, 2.0, 6.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.205078125, -2.135955810546875, -2.06683349609375, -1.997711181640625, -1.9285888671875, -1.859466552734375, -1.79034423828125, -1.721221923828125, -1.652099609375, -1.582977294921875, -1.51385498046875, -1.444732666015625, -1.3756103515625, -1.306488037109375, -1.23736572265625, -1.168243408203125, -1.09912109375, -1.029998779296875, -0.96087646484375, -0.891754150390625, -0.8226318359375, -0.753509521484375, -0.68438720703125, -0.615264892578125, -0.546142578125, -0.477020263671875, -0.40789794921875, -0.338775634765625, -0.2696533203125, -0.200531005859375, -0.13140869140625, -0.062286376953125, 0.0068359375, 0.075958251953125, 0.14508056640625, 0.214202880859375, 0.2833251953125, 0.352447509765625, 0.42156982421875, 0.490692138671875, 0.559814453125, 0.628936767578125, 0.69805908203125, 0.767181396484375, 0.8363037109375, 0.905426025390625, 0.97454833984375, 1.043670654296875, 1.11279296875, 1.181915283203125, 1.25103759765625, 1.320159912109375, 1.3892822265625, 1.458404541015625, 1.52752685546875, 1.596649169921875, 1.665771484375, 1.734893798828125, 1.80401611328125, 1.873138427734375, 1.9422607421875, 2.011383056640625, 2.08050537109375, 2.149627685546875, 2.21875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 10.0, 7.0, 14.0, 20.0, 41.0, 42.0, 63.0, 117.0, 156.0, 262.0, 413.0, 754.0, 1091.0, 1867.0, 2972.0, 4949.0, 8411.0, 14433.0, 25282.0, 44767.0, 83069.0, 152201.0, 1284045.0, 206615.0, 118675.0, 63547.0, 34871.0, 19980.0, 11375.0, 6682.0, 3941.0, 2445.0, 1468.0, 913.0, 627.0, 349.0, 224.0, 138.0, 106.0, 62.0, 53.0, 19.0, 20.0, 16.0, 12.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.4443359375, -0.4307861328125, -0.417236328125, -0.4036865234375, -0.39013671875, -0.3765869140625, -0.363037109375, -0.3494873046875, -0.3359375, -0.3223876953125, -0.308837890625, -0.2952880859375, -0.28173828125, -0.2681884765625, -0.254638671875, -0.2410888671875, -0.2275390625, -0.2139892578125, -0.200439453125, -0.1868896484375, -0.17333984375, -0.1597900390625, -0.146240234375, -0.1326904296875, -0.119140625, -0.1055908203125, -0.092041015625, -0.0784912109375, -0.06494140625, -0.0513916015625, -0.037841796875, -0.0242919921875, -0.0107421875, 0.0028076171875, 0.016357421875, 0.0299072265625, 0.04345703125, 0.0570068359375, 0.070556640625, 0.0841064453125, 0.09765625, 0.1112060546875, 0.124755859375, 0.1383056640625, 0.15185546875, 0.1654052734375, 0.178955078125, 0.1925048828125, 0.2060546875, 0.2196044921875, 0.233154296875, 0.2467041015625, 0.26025390625, 0.2738037109375, 0.287353515625, 0.3009033203125, 0.314453125, 0.3280029296875, 0.341552734375, 0.3551025390625, 0.36865234375, 0.3822021484375, 0.395751953125, 0.4093017578125, 0.4228515625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 4.0, 5.0, 7.0, 13.0, 14.0, 7.0, 26.0, 29.0, 25.0, 43.0, 41.0, 51.0, 74.0, 64.0, 71.0, 62.0, 61.0, 69.0, 52.0, 51.0, 46.0, 34.0, 35.0, 19.0, 17.0, 11.0, 17.0, 8.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0017118453979492188, -0.0016632080078125, -0.0016145706176757812, -0.0015659332275390625, -0.0015172958374023438, -0.001468658447265625, -0.0014200210571289062, -0.0013713836669921875, -0.0013227462768554688, -0.00127410888671875, -0.0012254714965820312, -0.0011768341064453125, -0.0011281967163085938, -0.001079559326171875, -0.0010309219360351562, -0.0009822845458984375, -0.0009336471557617188, -0.000885009765625, -0.0008363723754882812, -0.0007877349853515625, -0.0007390975952148438, -0.000690460205078125, -0.0006418228149414062, -0.0005931854248046875, -0.0005445480346679688, -0.00049591064453125, -0.00044727325439453125, -0.0003986358642578125, -0.00034999847412109375, -0.000301361083984375, -0.00025272369384765625, -0.0002040863037109375, -0.00015544891357421875, -0.0001068115234375, -5.817413330078125e-05, -9.5367431640625e-06, 3.910064697265625e-05, 8.7738037109375e-05, 0.00013637542724609375, 0.0001850128173828125, 0.00023365020751953125, 0.00028228759765625, 0.00033092498779296875, 0.0003795623779296875, 0.00042819976806640625, 0.000476837158203125, 0.0005254745483398438, 0.0005741119384765625, 0.0006227493286132812, 0.00067138671875, 0.0007200241088867188, 0.0007686614990234375, 0.0008172988891601562, 0.000865936279296875, 0.0009145736694335938, 0.0009632110595703125, 0.0010118484497070312, 0.00106048583984375, 0.0011091232299804688, 0.0011577606201171875, 0.0012063980102539062, 0.001255035400390625, 0.0013036727905273438, 0.0013523101806640625, 0.0014009475708007812]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 4.0, 6.0, 11.0, 13.0, 12.0, 17.0, 27.0, 24.0, 37.0, 64.0, 67.0, 114.0, 161.0, 369.0, 909.0, 533945.0, 510902.0, 898.0, 395.0, 163.0, 97.0, 74.0, 43.0, 41.0, 36.0, 21.0, 8.0, 10.0, 12.0, 18.0, 9.0, 9.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.04388427734375, -0.04246854782104492, -0.041052818298339844, -0.039637088775634766, -0.03822135925292969, -0.03680562973022461, -0.03538990020751953, -0.03397417068481445, -0.032558441162109375, -0.031142711639404297, -0.02972698211669922, -0.02831125259399414, -0.026895523071289062, -0.025479793548583984, -0.024064064025878906, -0.022648334503173828, -0.02123260498046875, -0.019816875457763672, -0.018401145935058594, -0.016985416412353516, -0.015569686889648438, -0.01415395736694336, -0.012738227844238281, -0.011322498321533203, -0.009906768798828125, -0.008491039276123047, -0.007075309753417969, -0.005659580230712891, -0.0042438507080078125, -0.0028281211853027344, -0.0014123916625976562, 3.337860107421875e-06, 0.0014190673828125, 0.002834796905517578, 0.004250526428222656, 0.005666255950927734, 0.0070819854736328125, 0.00849771499633789, 0.009913444519042969, 0.011329174041748047, 0.012744903564453125, 0.014160633087158203, 0.015576362609863281, 0.01699209213256836, 0.018407821655273438, 0.019823551177978516, 0.021239280700683594, 0.022655010223388672, 0.02407073974609375, 0.025486469268798828, 0.026902198791503906, 0.028317928314208984, 0.029733657836914062, 0.03114938735961914, 0.03256511688232422, 0.0339808464050293, 0.035396575927734375, 0.03681230545043945, 0.03822803497314453, 0.03964376449584961, 0.04105949401855469, 0.042475223541259766, 0.043890953063964844, 0.04530668258666992, 0.046722412109375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1018.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007014077622443438, -0.00571267819032073, -0.0044112782925367355, -0.003109878860414028, -0.0018084794282913208, -0.0005070799961686134, 0.0007943199016153812, 0.0020957193337380886, 0.003397118765860796, 0.004698518197983503, 0.005999918095767498, 0.007301317527890205, 0.008602716960012913, 0.00990411639213562, 0.011205516755580902, 0.012506915256381035, 0.013808315619826317, 0.015109715051949024, 0.01641111448407173, 0.017712514847517014, 0.019013913348317146, 0.02031531371176243, 0.02161671221256256, 0.022918112576007843, 0.024219511076807976, 0.025520911440253258, 0.02682230994105339, 0.028123710304498672, 0.029425108805298805, 0.030726509168744087, 0.03202790766954422, 0.0333293080329895, 0.034630704671144485, 0.03593210503458977, 0.03723350539803505, 0.03853490203619003, 0.039836302399635315, 0.0411377027630806, 0.04243910312652588, 0.04374050348997116, 0.045041900128126144, 0.046343300491571426, 0.04764470085501671, 0.04894609749317169, 0.050247497856616974, 0.051548898220062256, 0.05285029858350754, 0.05415169894695282, 0.0554530993103981, 0.056754499673843384, 0.058055900037288666, 0.05935729667544365, 0.06065869703888893, 0.06196009740233421, 0.0632614940404892, 0.06456289440393448, 0.06586429476737976, 0.06716569513082504, 0.06846709549427032, 0.0697684958577156, 0.07106989622116089, 0.07237128913402557, 0.07367268949747086, 0.07497408986091614, 0.07627549022436142]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 9.0, 7.0, 9.0, 15.0, 15.0, 22.0, 24.0, 19.0, 29.0, 45.0, 45.0, 47.0, 67.0, 62.0, 70.0, 53.0, 61.0, 47.0, 60.0, 52.0, 42.0, 45.0, 29.0, 27.0, 34.0, 19.0, 16.0, 13.0, 13.0, 12.0, 5.0, 2.0, 3.0], "bins": [-0.0016615986824035645, -0.0016258619725704193, -0.0015901252627372742, -0.001554388552904129, -0.0015186518430709839, -0.0014829151332378387, -0.0014471784234046936, -0.0014114417135715485, -0.0013757050037384033, -0.0013399682939052582, -0.001304231584072113, -0.001268494874238968, -0.0012327581644058228, -0.0011970214545726776, -0.0011612847447395325, -0.0011255480349063873, -0.0010898113250732422, -0.001054074615240097, -0.001018337905406952, -0.0009826011955738068, -0.0009468644857406616, -0.0009111277759075165, -0.0008753910660743713, -0.0008396543562412262, -0.0008039176464080811, -0.0007681809365749359, -0.0007324442267417908, -0.0006967075169086456, -0.0006609708070755005, -0.0006252340972423553, -0.0005894973874092102, -0.0005537606775760651, -0.0005180239677429199, -0.0004822872579097748, -0.00044655054807662964, -0.0004108138382434845, -0.00037507712841033936, -0.0003393404185771942, -0.00030360370874404907, -0.00026786699891090393, -0.0002321302890777588, -0.00019639357924461365, -0.0001606568694114685, -0.00012492015957832336, -8.918344974517822e-05, -5.344673991203308e-05, -1.771003007888794e-05, 1.8026679754257202e-05, 5.3763389587402344e-05, 8.950009942054749e-05, 0.00012523680925369263, 0.00016097351908683777, 0.0001967102289199829, 0.00023244693875312805, 0.0002681836485862732, 0.00030392035841941833, 0.0003396570682525635, 0.0003753937780857086, 0.00041113048791885376, 0.0004468671977519989, 0.00048260390758514404, 0.0005183406174182892, 0.0005540773272514343, 0.0005898140370845795, 0.0006255507469177246]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 6.0, 8.0, 11.0, 16.0, 18.0, 19.0, 15.0, 22.0, 23.0, 29.0, 34.0, 28.0, 28.0, 33.0, 54.0, 56.0, 47.0, 55.0, 50.0, 47.0, 44.0, 46.0, 51.0, 35.0, 32.0, 29.0, 27.0, 23.0, 25.0, 11.0, 13.0, 12.0, 14.0, 7.0, 9.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.0997314453125, -3.968994140625, -3.8382568359375, -3.70751953125, -3.5767822265625, -3.446044921875, -3.3153076171875, -3.1845703125, -3.0538330078125, -2.923095703125, -2.7923583984375, -2.66162109375, -2.5308837890625, -2.400146484375, -2.2694091796875, -2.138671875, -2.0079345703125, -1.877197265625, -1.7464599609375, -1.61572265625, -1.4849853515625, -1.354248046875, -1.2235107421875, -1.0927734375, -0.9620361328125, -0.831298828125, -0.7005615234375, -0.56982421875, -0.4390869140625, -0.308349609375, -0.1776123046875, -0.046875, 0.0838623046875, 0.214599609375, 0.3453369140625, 0.47607421875, 0.6068115234375, 0.737548828125, 0.8682861328125, 0.9990234375, 1.1297607421875, 1.260498046875, 1.3912353515625, 1.52197265625, 1.6527099609375, 1.783447265625, 1.9141845703125, 2.044921875, 2.1756591796875, 2.306396484375, 2.4371337890625, 2.56787109375, 2.6986083984375, 2.829345703125, 2.9600830078125, 3.0908203125, 3.2215576171875, 3.352294921875, 3.4830322265625, 3.61376953125, 3.7445068359375, 3.875244140625, 4.0059814453125, 4.13671875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 14.0, 10.0, 13.0, 19.0, 24.0, 35.0, 57.0, 65.0, 110.0, 160.0, 246.0, 429.0, 722.0, 1277.0, 2468.0, 5173.0, 12257.0, 35204.0, 122409.0, 521154.0, 251345.0, 60355.0, 19652.0, 7634.0, 3519.0, 1754.0, 950.0, 529.0, 338.0, 213.0, 109.0, 93.0, 53.0, 39.0, 33.0, 27.0, 17.0, 14.0, 5.0, 3.0, 3.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.59375, -3.487213134765625, -3.38067626953125, -3.274139404296875, -3.1676025390625, -3.061065673828125, -2.95452880859375, -2.847991943359375, -2.741455078125, -2.634918212890625, -2.52838134765625, -2.421844482421875, -2.3153076171875, -2.208770751953125, -2.10223388671875, -1.995697021484375, -1.88916015625, -1.782623291015625, -1.67608642578125, -1.569549560546875, -1.4630126953125, -1.356475830078125, -1.24993896484375, -1.143402099609375, -1.036865234375, -0.930328369140625, -0.82379150390625, -0.717254638671875, -0.6107177734375, -0.504180908203125, -0.39764404296875, -0.291107177734375, -0.1845703125, -0.078033447265625, 0.02850341796875, 0.135040283203125, 0.2415771484375, 0.348114013671875, 0.45465087890625, 0.561187744140625, 0.667724609375, 0.774261474609375, 0.88079833984375, 0.987335205078125, 1.0938720703125, 1.200408935546875, 1.30694580078125, 1.413482666015625, 1.52001953125, 1.626556396484375, 1.73309326171875, 1.839630126953125, 1.9461669921875, 2.052703857421875, 2.15924072265625, 2.265777587890625, 2.372314453125, 2.478851318359375, 2.58538818359375, 2.691925048828125, 2.7984619140625, 2.904998779296875, 3.01153564453125, 3.118072509765625, 3.224609375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 8.0, 6.0, 11.0, 7.0, 17.0, 17.0, 24.0, 27.0, 35.0, 43.0, 39.0, 41.0, 44.0, 73.0, 95.0, 1734.0, 322.0, 84.0, 66.0, 43.0, 51.0, 40.0, 44.0, 30.0, 30.0, 17.0, 23.0, 15.0, 8.0, 13.0, 8.0, 3.0, 10.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-18.53125, -18.028076171875, -17.52490234375, -17.021728515625, -16.5185546875, -16.015380859375, -15.51220703125, -15.009033203125, -14.505859375, -14.002685546875, -13.49951171875, -12.996337890625, -12.4931640625, -11.989990234375, -11.48681640625, -10.983642578125, -10.48046875, -9.977294921875, -9.47412109375, -8.970947265625, -8.4677734375, -7.964599609375, -7.46142578125, -6.958251953125, -6.455078125, -5.951904296875, -5.44873046875, -4.945556640625, -4.4423828125, -3.939208984375, -3.43603515625, -2.932861328125, -2.4296875, -1.926513671875, -1.42333984375, -0.920166015625, -0.4169921875, 0.086181640625, 0.58935546875, 1.092529296875, 1.595703125, 2.098876953125, 2.60205078125, 3.105224609375, 3.6083984375, 4.111572265625, 4.61474609375, 5.117919921875, 5.62109375, 6.124267578125, 6.62744140625, 7.130615234375, 7.6337890625, 8.136962890625, 8.64013671875, 9.143310546875, 9.646484375, 10.149658203125, 10.65283203125, 11.156005859375, 11.6591796875, 12.162353515625, 12.66552734375, 13.168701171875, 13.671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 3.0, 6.0, 7.0, 3.0, 13.0, 13.0, 19.0, 24.0, 15.0, 33.0, 45.0, 55.0, 81.0, 108.0, 180.0, 342.0, 883.0, 8215.0, 3018011.0, 114333.0, 2089.0, 519.0, 228.0, 124.0, 95.0, 66.0, 48.0, 23.0, 21.0, 28.0, 16.0, 10.0, 12.0, 6.0, 7.0, 6.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.3125, -20.544921875, -19.77734375, -19.009765625, -18.2421875, -17.474609375, -16.70703125, -15.939453125, -15.171875, -14.404296875, -13.63671875, -12.869140625, -12.1015625, -11.333984375, -10.56640625, -9.798828125, -9.03125, -8.263671875, -7.49609375, -6.728515625, -5.9609375, -5.193359375, -4.42578125, -3.658203125, -2.890625, -2.123046875, -1.35546875, -0.587890625, 0.1796875, 0.947265625, 1.71484375, 2.482421875, 3.25, 4.017578125, 4.78515625, 5.552734375, 6.3203125, 7.087890625, 7.85546875, 8.623046875, 9.390625, 10.158203125, 10.92578125, 11.693359375, 12.4609375, 13.228515625, 13.99609375, 14.763671875, 15.53125, 16.298828125, 17.06640625, 17.833984375, 18.6015625, 19.369140625, 20.13671875, 20.904296875, 21.671875, 22.439453125, 23.20703125, 23.974609375, 24.7421875, 25.509765625, 26.27734375, 27.044921875, 27.8125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 47.0, 233.0, 381.0, 273.0, 60.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.573726654052734, -48.43610382080078, -47.29848098754883, -46.16085433959961, -45.023231506347656, -43.8856086730957, -42.74798583984375, -41.61035919189453, -40.47273635864258, -39.335113525390625, -38.19749069213867, -37.05986404418945, -35.9222412109375, -34.78461837768555, -33.646995544433594, -32.509368896484375, -31.371747970581055, -30.2341251373291, -29.096500396728516, -27.958877563476562, -26.821252822875977, -25.683629989624023, -24.546005249023438, -23.408382415771484, -22.27075958251953, -21.133136749267578, -19.995512008666992, -18.85788917541504, -17.720264434814453, -16.5826416015625, -15.44501781463623, -14.307394027709961, -13.169767379760742, -12.032143592834473, -10.894519805908203, -9.75689697265625, -8.619272232055664, -7.481648921966553, -6.344025611877441, -5.206401824951172, -4.068778038024902, -2.931154251098633, -1.7935307025909424, -0.655907154083252, 0.4817166328430176, 1.619340419769287, 2.7569637298583984, 3.894587516784668, 5.0322113037109375, 6.169835090637207, 7.307458877563477, 8.44508171081543, 9.582706451416016, 10.720329284667969, 11.857953071594238, 12.995576858520508, 14.133200645446777, 15.270824432373047, 16.408447265625, 17.546072006225586, 18.68369483947754, 19.821319580078125, 20.958942413330078, 22.09656524658203, 23.234189987182617]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 9.0, 6.0, 15.0, 11.0, 15.0, 14.0, 24.0, 27.0, 34.0, 29.0, 37.0, 31.0, 32.0, 34.0, 33.0, 44.0, 41.0, 27.0, 33.0, 46.0, 26.0, 43.0, 36.0, 31.0, 44.0, 38.0, 22.0, 22.0, 18.0, 19.0, 12.0, 21.0, 21.0, 19.0, 13.0, 8.0, 6.0, 13.0, 9.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.89753723144531, -34.700870513916016, -33.50420379638672, -32.30754089355469, -31.11087417602539, -29.914207458496094, -28.717540740966797, -27.520875930786133, -26.32421112060547, -25.127544403076172, -23.930879592895508, -22.73421287536621, -21.537548065185547, -20.34088134765625, -19.144214630126953, -17.94754981994629, -16.750883102416992, -15.554217338562012, -14.357551574707031, -13.160884857177734, -11.96422004699707, -10.767553329467773, -9.570887565612793, -8.374221801757812, -7.177556037902832, -5.980890274047852, -4.784224510192871, -3.5875582695007324, -2.390892505645752, -1.1942267417907715, 0.0024394989013671875, 1.1991052627563477, 2.395771026611328, 3.5924367904663086, 4.789102554321289, 5.985768795013428, 7.182434558868408, 8.379100799560547, 9.575766563415527, 10.772432327270508, 11.969098091125488, 13.165763854980469, 14.36242961883545, 15.55909538269043, 16.755762100219727, 17.95242691040039, 19.149093627929688, 20.345760345458984, 21.54242515563965, 22.739091873168945, 23.93575668334961, 25.132423400878906, 26.32908821105957, 27.525754928588867, 28.72241973876953, 29.919086456298828, 31.115753173828125, 32.31241989135742, 33.50908660888672, 34.70574951171875, 35.90241622924805, 37.099082946777344, 38.29574966430664, 39.49241638183594, 40.68907928466797]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 5.0, 7.0, 7.0, 8.0, 11.0, 12.0, 19.0, 14.0, 19.0, 22.0, 25.0, 23.0, 30.0, 31.0, 33.0, 37.0, 49.0, 52.0, 40.0, 66.0, 51.0, 42.0, 37.0, 50.0, 52.0, 45.0, 28.0, 27.0, 33.0, 30.0, 21.0, 10.0, 15.0, 10.0, 13.0, 8.0, 8.0, 5.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.38671875, -4.25201416015625, -4.1173095703125, -3.98260498046875, -3.847900390625, -3.71319580078125, -3.5784912109375, -3.44378662109375, -3.30908203125, -3.17437744140625, -3.0396728515625, -2.90496826171875, -2.770263671875, -2.63555908203125, -2.5008544921875, -2.36614990234375, -2.2314453125, -2.09674072265625, -1.9620361328125, -1.82733154296875, -1.692626953125, -1.55792236328125, -1.4232177734375, -1.28851318359375, -1.15380859375, -1.01910400390625, -0.8843994140625, -0.74969482421875, -0.614990234375, -0.48028564453125, -0.3455810546875, -0.21087646484375, -0.076171875, 0.05853271484375, 0.1932373046875, 0.32794189453125, 0.462646484375, 0.59735107421875, 0.7320556640625, 0.86676025390625, 1.00146484375, 1.13616943359375, 1.2708740234375, 1.40557861328125, 1.540283203125, 1.67498779296875, 1.8096923828125, 1.94439697265625, 2.0791015625, 2.21380615234375, 2.3485107421875, 2.48321533203125, 2.617919921875, 2.75262451171875, 2.8873291015625, 3.02203369140625, 3.15673828125, 3.29144287109375, 3.4261474609375, 3.56085205078125, 3.695556640625, 3.83026123046875, 3.9649658203125, 4.09967041015625, 4.234375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 8.0, 7.0, 12.0, 11.0, 13.0, 11.0, 19.0, 32.0, 27.0, 70.0, 87.0, 168.0, 344.0, 946.0, 2709.0, 9599.0, 39473.0, 248779.0, 1945804.0, 1687099.0, 211583.0, 34633.0, 8597.0, 2537.0, 862.0, 372.0, 170.0, 89.0, 62.0, 44.0, 25.0, 11.0, 16.0, 15.0, 5.0, 10.0, 9.0, 8.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-9.9765625, -9.691162109375, -9.40576171875, -9.120361328125, -8.8349609375, -8.549560546875, -8.26416015625, -7.978759765625, -7.693359375, -7.407958984375, -7.12255859375, -6.837158203125, -6.5517578125, -6.266357421875, -5.98095703125, -5.695556640625, -5.41015625, -5.124755859375, -4.83935546875, -4.553955078125, -4.2685546875, -3.983154296875, -3.69775390625, -3.412353515625, -3.126953125, -2.841552734375, -2.55615234375, -2.270751953125, -1.9853515625, -1.699951171875, -1.41455078125, -1.129150390625, -0.84375, -0.558349609375, -0.27294921875, 0.012451171875, 0.2978515625, 0.583251953125, 0.86865234375, 1.154052734375, 1.439453125, 1.724853515625, 2.01025390625, 2.295654296875, 2.5810546875, 2.866455078125, 3.15185546875, 3.437255859375, 3.72265625, 4.008056640625, 4.29345703125, 4.578857421875, 4.8642578125, 5.149658203125, 5.43505859375, 5.720458984375, 6.005859375, 6.291259765625, 6.57666015625, 6.862060546875, 7.1474609375, 7.432861328125, 7.71826171875, 8.003662109375, 8.2890625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 8.0, 5.0, 6.0, 23.0, 30.0, 32.0, 81.0, 96.0, 130.0, 257.0, 360.0, 543.0, 687.0, 599.0, 424.0, 291.0, 194.0, 100.0, 72.0, 50.0, 34.0, 19.0, 15.0, 3.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.796875, -18.2841796875, -17.771484375, -17.2587890625, -16.74609375, -16.2333984375, -15.720703125, -15.2080078125, -14.6953125, -14.1826171875, -13.669921875, -13.1572265625, -12.64453125, -12.1318359375, -11.619140625, -11.1064453125, -10.59375, -10.0810546875, -9.568359375, -9.0556640625, -8.54296875, -8.0302734375, -7.517578125, -7.0048828125, -6.4921875, -5.9794921875, -5.466796875, -4.9541015625, -4.44140625, -3.9287109375, -3.416015625, -2.9033203125, -2.390625, -1.8779296875, -1.365234375, -0.8525390625, -0.33984375, 0.1728515625, 0.685546875, 1.1982421875, 1.7109375, 2.2236328125, 2.736328125, 3.2490234375, 3.76171875, 4.2744140625, 4.787109375, 5.2998046875, 5.8125, 6.3251953125, 6.837890625, 7.3505859375, 7.86328125, 8.3759765625, 8.888671875, 9.4013671875, 9.9140625, 10.4267578125, 10.939453125, 11.4521484375, 11.96484375, 12.4775390625, 12.990234375, 13.5029296875, 14.015625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 12.0, 12.0, 18.0, 28.0, 42.0, 65.0, 99.0, 177.0, 398.0, 1761.0, 64863.0, 4070773.0, 53575.0, 1639.0, 336.0, 189.0, 103.0, 57.0, 41.0, 29.0, 24.0, 15.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.375, -51.6240234375, -49.873046875, -48.1220703125, -46.37109375, -44.6201171875, -42.869140625, -41.1181640625, -39.3671875, -37.6162109375, -35.865234375, -34.1142578125, -32.36328125, -30.6123046875, -28.861328125, -27.1103515625, -25.359375, -23.6083984375, -21.857421875, -20.1064453125, -18.35546875, -16.6044921875, -14.853515625, -13.1025390625, -11.3515625, -9.6005859375, -7.849609375, -6.0986328125, -4.34765625, -2.5966796875, -0.845703125, 0.9052734375, 2.65625, 4.4072265625, 6.158203125, 7.9091796875, 9.66015625, 11.4111328125, 13.162109375, 14.9130859375, 16.6640625, 18.4150390625, 20.166015625, 21.9169921875, 23.66796875, 25.4189453125, 27.169921875, 28.9208984375, 30.671875, 32.4228515625, 34.173828125, 35.9248046875, 37.67578125, 39.4267578125, 41.177734375, 42.9287109375, 44.6796875, 46.4306640625, 48.181640625, 49.9326171875, 51.68359375, 53.4345703125, 55.185546875, 56.9365234375, 58.6875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 9.0, 27.0, 66.0, 154.0, 232.0, 251.0, 140.0, 102.0, 24.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.12625122070312, -67.08890533447266, -64.05156707763672, -61.01422119140625, -57.97688293457031, -54.939537048339844, -51.90219497680664, -48.86485290527344, -45.827510833740234, -42.79016876220703, -39.75282669067383, -36.715484619140625, -33.678138732910156, -30.640798568725586, -27.60345458984375, -24.566112518310547, -21.528770446777344, -18.49142837524414, -15.454085350036621, -12.416742324829102, -9.379400253295898, -6.342058181762695, -3.3047142028808594, -0.26737213134765625, 2.769969940185547, 5.807312488555908, 8.84465503692627, 11.881998062133789, 14.919340133666992, 17.956682205200195, 20.99402618408203, 24.031368255615234, 27.068702697753906, 30.10604476928711, 33.14338684082031, 36.18073272705078, 39.21807098388672, 42.25541687011719, 45.29275894165039, 48.330101013183594, 51.3674430847168, 54.40478515625, 57.4421272277832, 60.479469299316406, 63.516815185546875, 66.55415344238281, 69.59149932861328, 72.62884521484375, 75.66618347167969, 78.70352935791016, 81.7408676147461, 84.77821350097656, 87.8155517578125, 90.85289764404297, 93.89024353027344, 96.92758178710938, 99.96492004394531, 103.00226593017578, 106.03960418701172, 109.07695007324219, 112.11428833007812, 115.1516342163086, 118.18898010253906, 121.226318359375, 124.26366424560547]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 6.0, 5.0, 5.0, 7.0, 9.0, 5.0, 14.0, 13.0, 18.0, 25.0, 33.0, 24.0, 24.0, 41.0, 28.0, 39.0, 32.0, 40.0, 42.0, 38.0, 34.0, 37.0, 43.0, 42.0, 35.0, 32.0, 32.0, 35.0, 34.0, 26.0, 28.0, 27.0, 24.0, 17.0, 13.0, 9.0, 15.0, 18.0, 16.0, 7.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-40.74736022949219, -39.589813232421875, -38.4322624206543, -37.27471160888672, -36.117164611816406, -34.959617614746094, -33.802066802978516, -32.64451599121094, -31.486968994140625, -30.32942008972168, -29.171871185302734, -28.01432228088379, -26.856773376464844, -25.6992244720459, -24.541675567626953, -23.384126663208008, -22.226577758789062, -21.069028854370117, -19.911479949951172, -18.753931045532227, -17.59638214111328, -16.438833236694336, -15.28128433227539, -14.123735427856445, -12.9661865234375, -11.808637619018555, -10.65108871459961, -9.493539810180664, -8.335990905761719, -7.178442001342773, -6.020893096923828, -4.863344192504883, -3.705791473388672, -2.5482425689697266, -1.3906936645507812, -0.23314476013183594, 0.9244041442871094, 2.0819530487060547, 3.239501953125, 4.397050857543945, 5.554599761962891, 6.712148666381836, 7.869697570800781, 9.027246475219727, 10.184795379638672, 11.342344284057617, 12.499893188476562, 13.657442092895508, 14.814990997314453, 15.972539901733398, 17.130088806152344, 18.28763771057129, 19.445186614990234, 20.60273551940918, 21.760284423828125, 22.91783332824707, 24.075382232666016, 25.23293113708496, 26.390480041503906, 27.54802894592285, 28.705577850341797, 29.863126754760742, 31.020675659179688, 32.17822265625, 33.33577346801758]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 2.0, 6.0, 5.0, 5.0, 6.0, 8.0, 13.0, 14.0, 18.0, 19.0, 13.0, 17.0, 27.0, 23.0, 40.0, 31.0, 29.0, 32.0, 52.0, 44.0, 49.0, 49.0, 38.0, 49.0, 50.0, 41.0, 38.0, 40.0, 31.0, 34.0, 29.0, 33.0, 17.0, 22.0, 6.0, 18.0, 8.0, 14.0, 13.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.0625, -3.93463134765625, -3.8067626953125, -3.67889404296875, -3.551025390625, -3.42315673828125, -3.2952880859375, -3.16741943359375, -3.03955078125, -2.91168212890625, -2.7838134765625, -2.65594482421875, -2.528076171875, -2.40020751953125, -2.2723388671875, -2.14447021484375, -2.0166015625, -1.88873291015625, -1.7608642578125, -1.63299560546875, -1.505126953125, -1.37725830078125, -1.2493896484375, -1.12152099609375, -0.99365234375, -0.86578369140625, -0.7379150390625, -0.61004638671875, -0.482177734375, -0.35430908203125, -0.2264404296875, -0.09857177734375, 0.029296875, 0.15716552734375, 0.2850341796875, 0.41290283203125, 0.540771484375, 0.66864013671875, 0.7965087890625, 0.92437744140625, 1.05224609375, 1.18011474609375, 1.3079833984375, 1.43585205078125, 1.563720703125, 1.69158935546875, 1.8194580078125, 1.94732666015625, 2.0751953125, 2.20306396484375, 2.3309326171875, 2.45880126953125, 2.586669921875, 2.71453857421875, 2.8424072265625, 2.97027587890625, 3.09814453125, 3.22601318359375, 3.3538818359375, 3.48175048828125, 3.609619140625, 3.73748779296875, 3.8653564453125, 3.99322509765625, 4.12109375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 9.0, 11.0, 24.0, 19.0, 43.0, 54.0, 95.0, 123.0, 180.0, 267.0, 423.0, 668.0, 1121.0, 1766.0, 3096.0, 5136.0, 8884.0, 15481.0, 27102.0, 50508.0, 98507.0, 201509.0, 283850.0, 168604.0, 82436.0, 43016.0, 23261.0, 13201.0, 7738.0, 4427.0, 2608.0, 1640.0, 1004.0, 643.0, 386.0, 234.0, 170.0, 95.0, 69.0, 43.0, 32.0, 26.0, 9.0, 9.0, 9.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.68115234375, -0.6594390869140625, -0.637725830078125, -0.6160125732421875, -0.59429931640625, -0.5725860595703125, -0.550872802734375, -0.5291595458984375, -0.5074462890625, -0.4857330322265625, -0.464019775390625, -0.4423065185546875, -0.42059326171875, -0.3988800048828125, -0.377166748046875, -0.3554534912109375, -0.333740234375, -0.3120269775390625, -0.290313720703125, -0.2686004638671875, -0.24688720703125, -0.2251739501953125, -0.203460693359375, -0.1817474365234375, -0.1600341796875, -0.1383209228515625, -0.116607666015625, -0.0948944091796875, -0.07318115234375, -0.0514678955078125, -0.029754638671875, -0.0080413818359375, 0.013671875, 0.0353851318359375, 0.057098388671875, 0.0788116455078125, 0.10052490234375, 0.1222381591796875, 0.143951416015625, 0.1656646728515625, 0.1873779296875, 0.2090911865234375, 0.230804443359375, 0.2525177001953125, 0.27423095703125, 0.2959442138671875, 0.317657470703125, 0.3393707275390625, 0.361083984375, 0.3827972412109375, 0.404510498046875, 0.4262237548828125, 0.44793701171875, 0.4696502685546875, 0.491363525390625, 0.5130767822265625, 0.5347900390625, 0.5565032958984375, 0.578216552734375, 0.5999298095703125, 0.62164306640625, 0.6433563232421875, 0.665069580078125, 0.6867828369140625, 0.70849609375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 8.0, 5.0, 6.0, 8.0, 7.0, 20.0, 15.0, 15.0, 16.0, 20.0, 26.0, 28.0, 28.0, 38.0, 25.0, 30.0, 37.0, 50.0, 42.0, 40.0, 34.0, 1046.0, 31.0, 33.0, 35.0, 37.0, 43.0, 31.0, 45.0, 33.0, 26.0, 25.0, 15.0, 17.0, 17.0, 17.0, 15.0, 12.0, 10.0, 10.0, 6.0, 8.0, 6.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0], "bins": [-2.57421875, -2.503326416015625, -2.43243408203125, -2.361541748046875, -2.2906494140625, -2.219757080078125, -2.14886474609375, -2.077972412109375, -2.007080078125, -1.936187744140625, -1.86529541015625, -1.794403076171875, -1.7235107421875, -1.652618408203125, -1.58172607421875, -1.510833740234375, -1.43994140625, -1.369049072265625, -1.29815673828125, -1.227264404296875, -1.1563720703125, -1.085479736328125, -1.01458740234375, -0.943695068359375, -0.872802734375, -0.801910400390625, -0.73101806640625, -0.660125732421875, -0.5892333984375, -0.518341064453125, -0.44744873046875, -0.376556396484375, -0.3056640625, -0.234771728515625, -0.16387939453125, -0.092987060546875, -0.0220947265625, 0.048797607421875, 0.11968994140625, 0.190582275390625, 0.261474609375, 0.332366943359375, 0.40325927734375, 0.474151611328125, 0.5450439453125, 0.615936279296875, 0.68682861328125, 0.757720947265625, 0.82861328125, 0.899505615234375, 0.97039794921875, 1.041290283203125, 1.1121826171875, 1.183074951171875, 1.25396728515625, 1.324859619140625, 1.395751953125, 1.466644287109375, 1.53753662109375, 1.608428955078125, 1.6793212890625, 1.750213623046875, 1.82110595703125, 1.891998291015625, 1.962890625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 5.0, 5.0, 8.0, 12.0, 21.0, 35.0, 55.0, 77.0, 107.0, 175.0, 326.0, 504.0, 779.0, 1194.0, 2080.0, 3282.0, 5545.0, 9419.0, 16180.0, 28295.0, 50109.0, 91348.0, 169611.0, 1292761.0, 188776.0, 103721.0, 56629.0, 31849.0, 17954.0, 10456.0, 6228.0, 3785.0, 2150.0, 1350.0, 824.0, 509.0, 350.0, 216.0, 138.0, 81.0, 69.0, 41.0, 28.0, 14.0, 12.0, 7.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.471923828125, -0.45787811279296875, -0.4438323974609375, -0.42978668212890625, -0.415740966796875, -0.40169525146484375, -0.3876495361328125, -0.37360382080078125, -0.35955810546875, -0.34551239013671875, -0.3314666748046875, -0.31742095947265625, -0.303375244140625, -0.28932952880859375, -0.2752838134765625, -0.26123809814453125, -0.2471923828125, -0.23314666748046875, -0.2191009521484375, -0.20505523681640625, -0.191009521484375, -0.17696380615234375, -0.1629180908203125, -0.14887237548828125, -0.13482666015625, -0.12078094482421875, -0.1067352294921875, -0.09268951416015625, -0.078643798828125, -0.06459808349609375, -0.0505523681640625, -0.03650665283203125, -0.0224609375, -0.00841522216796875, 0.0056304931640625, 0.01967620849609375, 0.033721923828125, 0.04776763916015625, 0.0618133544921875, 0.07585906982421875, 0.08990478515625, 0.10395050048828125, 0.1179962158203125, 0.13204193115234375, 0.146087646484375, 0.16013336181640625, 0.1741790771484375, 0.18822479248046875, 0.2022705078125, 0.21631622314453125, 0.2303619384765625, 0.24440765380859375, 0.258453369140625, 0.27249908447265625, 0.2865447998046875, 0.30059051513671875, 0.31463623046875, 0.32868194580078125, 0.3427276611328125, 0.35677337646484375, 0.370819091796875, 0.38486480712890625, 0.3989105224609375, 0.41295623779296875, 0.427001953125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 7.0, 4.0, 6.0, 9.0, 14.0, 9.0, 12.0, 18.0, 12.0, 25.0, 31.0, 37.0, 45.0, 55.0, 70.0, 69.0, 78.0, 79.0, 77.0, 64.0, 57.0, 39.0, 38.0, 35.0, 20.0, 18.0, 17.0, 10.0, 4.0, 5.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021152496337890625, -0.002048969268798828, -0.0019826889038085938, -0.0019164085388183594, -0.001850128173828125, -0.0017838478088378906, -0.0017175674438476562, -0.0016512870788574219, -0.0015850067138671875, -0.0015187263488769531, -0.0014524459838867188, -0.0013861656188964844, -0.00131988525390625, -0.0012536048889160156, -0.0011873245239257812, -0.0011210441589355469, -0.0010547637939453125, -0.0009884834289550781, -0.0009222030639648438, -0.0008559226989746094, -0.000789642333984375, -0.0007233619689941406, -0.0006570816040039062, -0.0005908012390136719, -0.0005245208740234375, -0.0004582405090332031, -0.00039196014404296875, -0.0003256797790527344, -0.0002593994140625, -0.00019311904907226562, -0.00012683868408203125, -6.0558319091796875e-05, 5.7220458984375e-06, 7.200241088867188e-05, 0.00013828277587890625, 0.00020456314086914062, 0.000270843505859375, 0.0003371238708496094, 0.00040340423583984375, 0.0004696846008300781, 0.0005359649658203125, 0.0006022453308105469, 0.0006685256958007812, 0.0007348060607910156, 0.00080108642578125, 0.0008673667907714844, 0.0009336471557617188, 0.0009999275207519531, 0.0010662078857421875, 0.0011324882507324219, 0.0011987686157226562, 0.0012650489807128906, 0.001331329345703125, 0.0013976097106933594, 0.0014638900756835938, 0.0015301704406738281, 0.0015964508056640625, 0.0016627311706542969, 0.0017290115356445312, 0.0017952919006347656, 0.001861572265625, 0.0019278526306152344, 0.0019941329956054688, 0.002060413360595703, 0.0021266937255859375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 7.0, 10.0, 10.0, 13.0, 17.0, 16.0, 27.0, 49.0, 84.0, 125.0, 227.0, 542.0, 3579.0, 1039957.0, 2735.0, 486.0, 257.0, 133.0, 73.0, 41.0, 28.0, 27.0, 16.0, 8.0, 13.0, 11.0, 14.0, 3.0, 12.0, 5.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059326171875, -0.05749940872192383, -0.055672645568847656, -0.053845882415771484, -0.05201911926269531, -0.05019235610961914, -0.04836559295654297, -0.0465388298034668, -0.044712066650390625, -0.04288530349731445, -0.04105854034423828, -0.03923177719116211, -0.03740501403808594, -0.035578250885009766, -0.033751487731933594, -0.03192472457885742, -0.03009796142578125, -0.028271198272705078, -0.026444435119628906, -0.024617671966552734, -0.022790908813476562, -0.02096414566040039, -0.01913738250732422, -0.017310619354248047, -0.015483856201171875, -0.013657093048095703, -0.011830329895019531, -0.01000356674194336, -0.008176803588867188, -0.006350040435791016, -0.004523277282714844, -0.002696514129638672, -0.0008697509765625, 0.0009570121765136719, 0.0027837753295898438, 0.004610538482666016, 0.0064373016357421875, 0.00826406478881836, 0.010090827941894531, 0.011917591094970703, 0.013744354248046875, 0.015571117401123047, 0.01739788055419922, 0.01922464370727539, 0.021051406860351562, 0.022878170013427734, 0.024704933166503906, 0.026531696319580078, 0.02835845947265625, 0.030185222625732422, 0.032011985778808594, 0.033838748931884766, 0.03566551208496094, 0.03749227523803711, 0.03931903839111328, 0.04114580154418945, 0.042972564697265625, 0.0447993278503418, 0.04662609100341797, 0.04845285415649414, 0.05027961730957031, 0.052106380462646484, 0.053933143615722656, 0.05575990676879883, 0.057586669921875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 80.0, 939.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005784960929304361, -0.004382389597594738, -0.002979818033054471, -0.001577246468514204, -0.0001746751368045807, 0.0012278961949050426, 0.0026304679922759533, 0.004033038858324289, 0.0054356106556952, 0.006838181987404823, 0.008240753784775734, 0.009643325582146645, 0.01104589644819498, 0.012448467314243317, 0.013851039111614227, 0.015253610908985138, 0.01665618270635605, 0.01805875450372696, 0.01946132630109787, 0.02086389809846878, 0.022266468033194542, 0.023669039830565453, 0.025071611627936363, 0.026474181562662125, 0.027876753360033035, 0.029279325157403946, 0.030681896954774857, 0.03208446875214577, 0.03348704054951668, 0.03488960862159729, 0.0362921804189682, 0.03769475221633911, 0.03909732773900032, 0.04049989953637123, 0.04190247133374214, 0.04330504313111305, 0.04470761492848396, 0.046110183000564575, 0.047512754797935486, 0.048915326595306396, 0.05031789839267731, 0.05172047019004822, 0.05312304198741913, 0.05452561378479004, 0.05592818558216095, 0.05733075737953186, 0.05873332917690277, 0.06013589724898338, 0.06153847277164459, 0.0629410445690155, 0.06434361636638641, 0.06574618816375732, 0.06714875996112823, 0.06855133175849915, 0.06995390355587006, 0.07135647535324097, 0.07275903970003128, 0.07416161149740219, 0.0755641832947731, 0.07696675509214401, 0.07836932688951492, 0.07977189868688583, 0.08117447048425674, 0.08257704228162766, 0.08397961407899857]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 11.0, 9.0, 11.0, 13.0, 26.0, 32.0, 42.0, 39.0, 47.0, 48.0, 55.0, 65.0, 66.0, 67.0, 72.0, 77.0, 62.0, 63.0, 42.0, 26.0, 27.0, 31.0, 19.0, 17.0, 9.0, 14.0, 7.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0022071003913879395, -0.0021561840549111366, -0.002105267718434334, -0.002054351381957531, -0.002003435045480728, -0.0019525187090039253, -0.0019016023725271225, -0.0018506860360503197, -0.0017997696995735168, -0.001748853363096714, -0.0016979370266199112, -0.0016470206901431084, -0.0015961043536663055, -0.0015451880171895027, -0.0014942716807126999, -0.001443355344235897, -0.0013924390077590942, -0.0013415226712822914, -0.0012906063348054886, -0.0012396899983286858, -0.001188773661851883, -0.0011378573253750801, -0.0010869409888982773, -0.0010360246524214745, -0.0009851083159446716, -0.0009341919794678688, -0.000883275642991066, -0.0008323593065142632, -0.0007814429700374603, -0.0007305266335606575, -0.0006796102970838547, -0.0006286939606070518, -0.000577777624130249, -0.0005268612876534462, -0.00047594495117664337, -0.00042502861469984055, -0.0003741122782230377, -0.0003231959417462349, -0.00027227960526943207, -0.00022136326879262924, -0.00017044693231582642, -0.00011953059583902359, -6.861425936222076e-05, -1.7697922885417938e-05, 3.321841359138489e-05, 8.413475006818771e-05, 0.00013505108654499054, 0.00018596742302179337, 0.0002368837594985962, 0.000287800095975399, 0.00033871643245220184, 0.00038963276892900467, 0.0004405491054058075, 0.0004914654418826103, 0.0005423817783594131, 0.000593298114836216, 0.0006442144513130188, 0.0006951307877898216, 0.0007460471242666245, 0.0007969634607434273, 0.0008478797972202301, 0.0008987961336970329, 0.0009497124701738358, 0.0010006288066506386, 0.0010515451431274414]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 2.0, 6.0, 5.0, 5.0, 6.0, 8.0, 13.0, 14.0, 18.0, 19.0, 13.0, 17.0, 27.0, 23.0, 40.0, 31.0, 29.0, 32.0, 52.0, 44.0, 49.0, 49.0, 38.0, 49.0, 50.0, 41.0, 38.0, 40.0, 31.0, 34.0, 29.0, 33.0, 17.0, 22.0, 6.0, 18.0, 8.0, 14.0, 13.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.0625, -3.93463134765625, -3.8067626953125, -3.67889404296875, -3.551025390625, -3.42315673828125, -3.2952880859375, -3.16741943359375, -3.03955078125, -2.91168212890625, -2.7838134765625, -2.65594482421875, -2.528076171875, -2.40020751953125, -2.2723388671875, -2.14447021484375, -2.0166015625, -1.88873291015625, -1.7608642578125, -1.63299560546875, -1.505126953125, -1.37725830078125, -1.2493896484375, -1.12152099609375, -0.99365234375, -0.86578369140625, -0.7379150390625, -0.61004638671875, -0.482177734375, -0.35430908203125, -0.2264404296875, -0.09857177734375, 0.029296875, 0.15716552734375, 0.2850341796875, 0.41290283203125, 0.540771484375, 0.66864013671875, 0.7965087890625, 0.92437744140625, 1.05224609375, 1.18011474609375, 1.3079833984375, 1.43585205078125, 1.563720703125, 1.69158935546875, 1.8194580078125, 1.94732666015625, 2.0751953125, 2.20306396484375, 2.3309326171875, 2.45880126953125, 2.586669921875, 2.71453857421875, 2.8424072265625, 2.97027587890625, 3.09814453125, 3.22601318359375, 3.3538818359375, 3.48175048828125, 3.609619140625, 3.73748779296875, 3.8653564453125, 3.99322509765625, 4.12109375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 9.0, 2.0, 12.0, 7.0, 15.0, 18.0, 35.0, 24.0, 54.0, 78.0, 135.0, 183.0, 356.0, 539.0, 909.0, 1592.0, 2904.0, 5377.0, 9890.0, 21155.0, 47447.0, 122927.0, 320665.0, 309943.0, 116403.0, 45790.0, 20528.0, 9983.0, 4999.0, 2728.0, 1513.0, 920.0, 508.0, 303.0, 198.0, 140.0, 76.0, 61.0, 37.0, 34.0, 15.0, 14.0, 6.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.5546875, -2.47479248046875, -2.3948974609375, -2.31500244140625, -2.235107421875, -2.15521240234375, -2.0753173828125, -1.99542236328125, -1.91552734375, -1.83563232421875, -1.7557373046875, -1.67584228515625, -1.595947265625, -1.51605224609375, -1.4361572265625, -1.35626220703125, -1.2763671875, -1.19647216796875, -1.1165771484375, -1.03668212890625, -0.956787109375, -0.87689208984375, -0.7969970703125, -0.71710205078125, -0.63720703125, -0.55731201171875, -0.4774169921875, -0.39752197265625, -0.317626953125, -0.23773193359375, -0.1578369140625, -0.07794189453125, 0.001953125, 0.08184814453125, 0.1617431640625, 0.24163818359375, 0.321533203125, 0.40142822265625, 0.4813232421875, 0.56121826171875, 0.64111328125, 0.72100830078125, 0.8009033203125, 0.88079833984375, 0.960693359375, 1.04058837890625, 1.1204833984375, 1.20037841796875, 1.2802734375, 1.36016845703125, 1.4400634765625, 1.51995849609375, 1.599853515625, 1.67974853515625, 1.7596435546875, 1.83953857421875, 1.91943359375, 1.99932861328125, 2.0792236328125, 2.15911865234375, 2.239013671875, 2.31890869140625, 2.3988037109375, 2.47869873046875, 2.55859375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 1.0, 5.0, 5.0, 9.0, 19.0, 12.0, 18.0, 22.0, 30.0, 27.0, 28.0, 37.0, 39.0, 44.0, 37.0, 44.0, 53.0, 73.0, 236.0, 1699.0, 140.0, 63.0, 60.0, 54.0, 41.0, 36.0, 32.0, 22.0, 24.0, 21.0, 20.0, 25.0, 16.0, 14.0, 6.0, 6.0, 10.0, 10.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.421875, -13.9615478515625, -13.501220703125, -13.0408935546875, -12.58056640625, -12.1202392578125, -11.659912109375, -11.1995849609375, -10.7392578125, -10.2789306640625, -9.818603515625, -9.3582763671875, -8.89794921875, -8.4376220703125, -7.977294921875, -7.5169677734375, -7.056640625, -6.5963134765625, -6.135986328125, -5.6756591796875, -5.21533203125, -4.7550048828125, -4.294677734375, -3.8343505859375, -3.3740234375, -2.9136962890625, -2.453369140625, -1.9930419921875, -1.53271484375, -1.0723876953125, -0.612060546875, -0.1517333984375, 0.30859375, 0.7689208984375, 1.229248046875, 1.6895751953125, 2.14990234375, 2.6102294921875, 3.070556640625, 3.5308837890625, 3.9912109375, 4.4515380859375, 4.911865234375, 5.3721923828125, 5.83251953125, 6.2928466796875, 6.753173828125, 7.2135009765625, 7.673828125, 8.1341552734375, 8.594482421875, 9.0548095703125, 9.51513671875, 9.9754638671875, 10.435791015625, 10.8961181640625, 11.3564453125, 11.8167724609375, 12.277099609375, 12.7374267578125, 13.19775390625, 13.6580810546875, 14.118408203125, 14.5787353515625, 15.0390625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 11.0, 5.0, 12.0, 13.0, 24.0, 25.0, 21.0, 34.0, 31.0, 50.0, 83.0, 132.0, 185.0, 299.0, 672.0, 3459.0, 207884.0, 2920189.0, 10299.0, 1104.0, 402.0, 210.0, 151.0, 87.0, 62.0, 53.0, 27.0, 47.0, 23.0, 25.0, 17.0, 17.0, 12.0, 11.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.65625, -23.890380859375, -23.12451171875, -22.358642578125, -21.5927734375, -20.826904296875, -20.06103515625, -19.295166015625, -18.529296875, -17.763427734375, -16.99755859375, -16.231689453125, -15.4658203125, -14.699951171875, -13.93408203125, -13.168212890625, -12.40234375, -11.636474609375, -10.87060546875, -10.104736328125, -9.3388671875, -8.572998046875, -7.80712890625, -7.041259765625, -6.275390625, -5.509521484375, -4.74365234375, -3.977783203125, -3.2119140625, -2.446044921875, -1.68017578125, -0.914306640625, -0.1484375, 0.617431640625, 1.38330078125, 2.149169921875, 2.9150390625, 3.680908203125, 4.44677734375, 5.212646484375, 5.978515625, 6.744384765625, 7.51025390625, 8.276123046875, 9.0419921875, 9.807861328125, 10.57373046875, 11.339599609375, 12.10546875, 12.871337890625, 13.63720703125, 14.403076171875, 15.1689453125, 15.934814453125, 16.70068359375, 17.466552734375, 18.232421875, 18.998291015625, 19.76416015625, 20.530029296875, 21.2958984375, 22.061767578125, 22.82763671875, 23.593505859375, 24.359375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 7.0, 330.0, 642.0, 35.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.857102394104004, -7.4332780838012695, -4.009453773498535, -0.5856294631958008, 2.8381948471069336, 6.262019157409668, 9.685843467712402, 13.109667778015137, 16.533493041992188, 19.957317352294922, 23.381141662597656, 26.80496597290039, 30.228790283203125, 33.65261459350586, 37.076438903808594, 40.50026321411133, 43.92408752441406, 47.3479118347168, 50.77173614501953, 54.195560455322266, 57.619384765625, 61.043209075927734, 64.46703338623047, 67.89085388183594, 71.31468200683594, 74.73851013183594, 78.1623306274414, 81.58615112304688, 85.00997924804688, 88.43380737304688, 91.85762786865234, 95.28144836425781, 98.70527648925781, 102.12910461425781, 105.55292510986328, 108.97674560546875, 112.40057373046875, 115.82440185546875, 119.24822235107422, 122.67204284667969, 126.09587097167969, 129.5196990966797, 132.94351196289062, 136.36734008789062, 139.79116821289062, 143.21499633789062, 146.63882446289062, 150.06263732910156, 153.48646545410156, 156.91029357910156, 160.3341064453125, 163.7579345703125, 167.1817626953125, 170.6055908203125, 174.0294189453125, 177.45323181152344, 180.87705993652344, 184.30088806152344, 187.72470092773438, 191.14852905273438, 194.57235717773438, 197.99618530273438, 201.42001342773438, 204.8438262939453, 208.2676544189453]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 10.0, 7.0, 11.0, 13.0, 11.0, 12.0, 17.0, 23.0, 14.0, 27.0, 22.0, 21.0, 41.0, 27.0, 36.0, 39.0, 43.0, 42.0, 41.0, 45.0, 35.0, 48.0, 33.0, 42.0, 31.0, 36.0, 26.0, 34.0, 26.0, 29.0, 29.0, 15.0, 14.0, 12.0, 14.0, 15.0, 12.0, 7.0, 10.0, 6.0, 9.0, 5.0, 3.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.402992248535156, -45.00642395019531, -43.6098518371582, -42.21328353881836, -40.816715240478516, -39.420143127441406, -38.02357482910156, -36.62700653076172, -35.230438232421875, -33.83386993408203, -32.43729782104492, -31.040729522705078, -29.644161224365234, -28.247591018676758, -26.85102081298828, -25.454452514648438, -24.057880401611328, -22.66131019592285, -21.264741897583008, -19.86817169189453, -18.471603393554688, -17.07503318786621, -15.678462982177734, -14.281893730163574, -12.885324478149414, -11.488755226135254, -10.092185974121094, -8.695615768432617, -7.299046516418457, -5.902477264404297, -4.50590705871582, -3.10933780670166, -1.7127685546875, -0.31619906425476074, 1.0803704261779785, 2.476940155029297, 3.873509407043457, 5.270078659057617, 6.666648864746094, 8.063218116760254, 9.459787368774414, 10.856356620788574, 12.252925872802734, 13.649496078491211, 15.046065330505371, 16.44263458251953, 17.839204788208008, 19.235774993896484, 20.632343292236328, 22.028913497924805, 23.42548179626465, 24.822052001953125, 26.21862030029297, 27.615190505981445, 29.011760711669922, 30.408329010009766, 31.804899215698242, 33.20146942138672, 34.59803771972656, 35.994606018066406, 37.391178131103516, 38.78774642944336, 40.18431854248047, 41.58088684082031, 42.977455139160156]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 6.0, 5.0, 7.0, 6.0, 10.0, 7.0, 12.0, 21.0, 14.0, 23.0, 22.0, 21.0, 24.0, 26.0, 31.0, 43.0, 40.0, 34.0, 38.0, 47.0, 42.0, 49.0, 42.0, 48.0, 35.0, 39.0, 44.0, 29.0, 40.0, 36.0, 29.0, 18.0, 19.0, 15.0, 17.0, 11.0, 9.0, 15.0, 5.0, 6.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.984375, -3.8560791015625, -3.727783203125, -3.5994873046875, -3.47119140625, -3.3428955078125, -3.214599609375, -3.0863037109375, -2.9580078125, -2.8297119140625, -2.701416015625, -2.5731201171875, -2.44482421875, -2.3165283203125, -2.188232421875, -2.0599365234375, -1.931640625, -1.8033447265625, -1.675048828125, -1.5467529296875, -1.41845703125, -1.2901611328125, -1.161865234375, -1.0335693359375, -0.9052734375, -0.7769775390625, -0.648681640625, -0.5203857421875, -0.39208984375, -0.2637939453125, -0.135498046875, -0.0072021484375, 0.12109375, 0.2493896484375, 0.377685546875, 0.5059814453125, 0.63427734375, 0.7625732421875, 0.890869140625, 1.0191650390625, 1.1474609375, 1.2757568359375, 1.404052734375, 1.5323486328125, 1.66064453125, 1.7889404296875, 1.917236328125, 2.0455322265625, 2.173828125, 2.3021240234375, 2.430419921875, 2.5587158203125, 2.68701171875, 2.8153076171875, 2.943603515625, 3.0718994140625, 3.2001953125, 3.3284912109375, 3.456787109375, 3.5850830078125, 3.71337890625, 3.8416748046875, 3.969970703125, 4.0982666015625, 4.2265625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 9.0, 7.0, 8.0, 6.0, 11.0, 12.0, 20.0, 18.0, 28.0, 36.0, 42.0, 48.0, 96.0, 196.0, 458.0, 1461.0, 6701.0, 40312.0, 499362.0, 3050256.0, 543206.0, 42409.0, 6941.0, 1546.0, 508.0, 205.0, 96.0, 74.0, 38.0, 35.0, 34.0, 28.0, 17.0, 13.0, 7.0, 8.0, 8.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.890625, -12.494140625, -12.09765625, -11.701171875, -11.3046875, -10.908203125, -10.51171875, -10.115234375, -9.71875, -9.322265625, -8.92578125, -8.529296875, -8.1328125, -7.736328125, -7.33984375, -6.943359375, -6.546875, -6.150390625, -5.75390625, -5.357421875, -4.9609375, -4.564453125, -4.16796875, -3.771484375, -3.375, -2.978515625, -2.58203125, -2.185546875, -1.7890625, -1.392578125, -0.99609375, -0.599609375, -0.203125, 0.193359375, 0.58984375, 0.986328125, 1.3828125, 1.779296875, 2.17578125, 2.572265625, 2.96875, 3.365234375, 3.76171875, 4.158203125, 4.5546875, 4.951171875, 5.34765625, 5.744140625, 6.140625, 6.537109375, 6.93359375, 7.330078125, 7.7265625, 8.123046875, 8.51953125, 8.916015625, 9.3125, 9.708984375, 10.10546875, 10.501953125, 10.8984375, 11.294921875, 11.69140625, 12.087890625, 12.484375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 3.0, 10.0, 16.0, 15.0, 41.0, 54.0, 85.0, 121.0, 185.0, 301.0, 388.0, 592.0, 662.0, 529.0, 366.0, 248.0, 166.0, 110.0, 55.0, 47.0, 28.0, 15.0, 14.0, 9.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.46875, -13.974365234375, -13.47998046875, -12.985595703125, -12.4912109375, -11.996826171875, -11.50244140625, -11.008056640625, -10.513671875, -10.019287109375, -9.52490234375, -9.030517578125, -8.5361328125, -8.041748046875, -7.54736328125, -7.052978515625, -6.55859375, -6.064208984375, -5.56982421875, -5.075439453125, -4.5810546875, -4.086669921875, -3.59228515625, -3.097900390625, -2.603515625, -2.109130859375, -1.61474609375, -1.120361328125, -0.6259765625, -0.131591796875, 0.36279296875, 0.857177734375, 1.3515625, 1.845947265625, 2.34033203125, 2.834716796875, 3.3291015625, 3.823486328125, 4.31787109375, 4.812255859375, 5.306640625, 5.801025390625, 6.29541015625, 6.789794921875, 7.2841796875, 7.778564453125, 8.27294921875, 8.767333984375, 9.26171875, 9.756103515625, 10.25048828125, 10.744873046875, 11.2392578125, 11.733642578125, 12.22802734375, 12.722412109375, 13.216796875, 13.711181640625, 14.20556640625, 14.699951171875, 15.1943359375, 15.688720703125, 16.18310546875, 16.677490234375, 17.171875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 4.0, 14.0, 11.0, 18.0, 25.0, 31.0, 40.0, 65.0, 81.0, 109.0, 152.0, 281.0, 484.0, 1401.0, 9460.0, 355110.0, 3735260.0, 85421.0, 4204.0, 959.0, 402.0, 204.0, 145.0, 100.0, 86.0, 49.0, 40.0, 30.0, 20.0, 15.0, 10.0, 10.0, 10.0, 10.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.03125, -31.9052734375, -30.779296875, -29.6533203125, -28.52734375, -27.4013671875, -26.275390625, -25.1494140625, -24.0234375, -22.8974609375, -21.771484375, -20.6455078125, -19.51953125, -18.3935546875, -17.267578125, -16.1416015625, -15.015625, -13.8896484375, -12.763671875, -11.6376953125, -10.51171875, -9.3857421875, -8.259765625, -7.1337890625, -6.0078125, -4.8818359375, -3.755859375, -2.6298828125, -1.50390625, -0.3779296875, 0.748046875, 1.8740234375, 3.0, 4.1259765625, 5.251953125, 6.3779296875, 7.50390625, 8.6298828125, 9.755859375, 10.8818359375, 12.0078125, 13.1337890625, 14.259765625, 15.3857421875, 16.51171875, 17.6376953125, 18.763671875, 19.8896484375, 21.015625, 22.1416015625, 23.267578125, 24.3935546875, 25.51953125, 26.6455078125, 27.771484375, 28.8974609375, 30.0234375, 31.1494140625, 32.275390625, 33.4013671875, 34.52734375, 35.6533203125, 36.779296875, 37.9052734375, 39.03125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 15.0, 21.0, 48.0, 80.0, 110.0, 127.0, 148.0, 139.0, 104.0, 91.0, 49.0, 32.0, 22.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.87782287597656, -66.0169448852539, -64.15605926513672, -62.29518127441406, -60.43429946899414, -58.57341766357422, -56.71253967285156, -54.85165786743164, -52.99077606201172, -51.1298942565918, -49.269012451171875, -47.40813446044922, -45.5472526550293, -43.686370849609375, -41.82549285888672, -39.9646110534668, -38.103729248046875, -36.24284744262695, -34.38196563720703, -32.521087646484375, -30.660205841064453, -28.79932403564453, -26.938444137573242, -25.077564239501953, -23.21668243408203, -21.35580062866211, -19.49492073059082, -17.63404083251953, -15.77315902709961, -13.912278175354004, -12.051397323608398, -10.190516471862793, -8.329639434814453, -6.468758583068848, -4.607877731323242, -2.7469968795776367, -0.8861160278320312, 0.9747648239135742, 2.8356456756591797, 4.696526527404785, 6.557407379150391, 8.418288230895996, 10.279169082641602, 12.140049934387207, 14.000930786132812, 15.861811637878418, 17.722692489624023, 19.583572387695312, 21.444454193115234, 23.305335998535156, 25.166215896606445, 27.027095794677734, 28.887977600097656, 30.748859405517578, 32.6097412109375, 34.470619201660156, 36.33150100708008, 38.1923828125, 40.053260803222656, 41.91414260864258, 43.7750244140625, 45.63590621948242, 47.496788024902344, 49.357666015625, 51.21854782104492]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 11.0, 2.0, 9.0, 5.0, 7.0, 7.0, 10.0, 13.0, 13.0, 25.0, 20.0, 24.0, 18.0, 26.0, 34.0, 35.0, 34.0, 32.0, 34.0, 45.0, 45.0, 42.0, 36.0, 32.0, 37.0, 37.0, 40.0, 45.0, 38.0, 34.0, 26.0, 28.0, 25.0, 24.0, 19.0, 10.0, 14.0, 12.0, 6.0, 12.0, 6.0, 9.0, 4.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-37.75487518310547, -36.618038177490234, -35.481201171875, -34.344364166259766, -33.20752716064453, -32.07068634033203, -30.933849334716797, -29.797012329101562, -28.660175323486328, -27.523338317871094, -26.38650131225586, -25.249662399291992, -24.112825393676758, -22.975988388061523, -21.839149475097656, -20.702312469482422, -19.565475463867188, -18.428638458251953, -17.29180145263672, -16.15496253967285, -15.018125534057617, -13.881288528442383, -12.744450569152832, -11.607612609863281, -10.470775604248047, -9.333938598632812, -8.197100639343262, -7.060263156890869, -5.923425674438477, -4.786588191986084, -3.6497507095336914, -2.512913227081299, -1.3760719299316406, -0.23923444747924805, 0.8976030349731445, 2.034440517425537, 3.1712779998779297, 4.308115482330322, 5.444952964782715, 6.581790447235107, 7.7186279296875, 8.855464935302734, 9.992302894592285, 11.129140853881836, 12.26597785949707, 13.402814865112305, 14.539652824401855, 15.676490783691406, 16.81332778930664, 17.950164794921875, 19.08700180053711, 20.223840713500977, 21.36067771911621, 22.497514724731445, 23.634353637695312, 24.771190643310547, 25.90802764892578, 27.044864654541016, 28.18170166015625, 29.318540573120117, 30.45537757873535, 31.592214584350586, 32.72905349731445, 33.86589050292969, 35.00272750854492]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 2.0, 3.0, 9.0, 7.0, 3.0, 14.0, 12.0, 13.0, 15.0, 16.0, 27.0, 30.0, 37.0, 18.0, 31.0, 31.0, 38.0, 36.0, 49.0, 32.0, 24.0, 44.0, 39.0, 41.0, 44.0, 39.0, 42.0, 35.0, 35.0, 25.0, 27.0, 32.0, 14.0, 18.0, 21.0, 15.0, 17.0, 14.0, 9.0, 7.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-3.7734375, -3.6500244140625, -3.526611328125, -3.4031982421875, -3.27978515625, -3.1563720703125, -3.032958984375, -2.9095458984375, -2.7861328125, -2.6627197265625, -2.539306640625, -2.4158935546875, -2.29248046875, -2.1690673828125, -2.045654296875, -1.9222412109375, -1.798828125, -1.6754150390625, -1.552001953125, -1.4285888671875, -1.30517578125, -1.1817626953125, -1.058349609375, -0.9349365234375, -0.8115234375, -0.6881103515625, -0.564697265625, -0.4412841796875, -0.31787109375, -0.1944580078125, -0.071044921875, 0.0523681640625, 0.17578125, 0.2991943359375, 0.422607421875, 0.5460205078125, 0.66943359375, 0.7928466796875, 0.916259765625, 1.0396728515625, 1.1630859375, 1.2864990234375, 1.409912109375, 1.5333251953125, 1.65673828125, 1.7801513671875, 1.903564453125, 2.0269775390625, 2.150390625, 2.2738037109375, 2.397216796875, 2.5206298828125, 2.64404296875, 2.7674560546875, 2.890869140625, 3.0142822265625, 3.1376953125, 3.2611083984375, 3.384521484375, 3.5079345703125, 3.63134765625, 3.7547607421875, 3.878173828125, 4.0015869140625, 4.125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 7.0, 9.0, 7.0, 17.0, 18.0, 32.0, 50.0, 61.0, 95.0, 157.0, 211.0, 340.0, 504.0, 783.0, 1251.0, 2034.0, 3090.0, 4983.0, 8004.0, 12731.0, 20690.0, 34590.0, 60725.0, 116437.0, 220953.0, 247929.0, 138780.0, 71922.0, 39796.0, 23511.0, 14461.0, 9010.0, 5564.0, 3608.0, 2277.0, 1375.0, 909.0, 558.0, 351.0, 243.0, 155.0, 102.0, 66.0, 62.0, 35.0, 17.0, 16.0, 11.0, 9.0, 9.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0], "bins": [-0.6591796875, -0.6386642456054688, -0.6181488037109375, -0.5976333618164062, -0.577117919921875, -0.5566024780273438, -0.5360870361328125, -0.5155715942382812, -0.49505615234375, -0.47454071044921875, -0.4540252685546875, -0.43350982666015625, -0.412994384765625, -0.39247894287109375, -0.3719635009765625, -0.35144805908203125, -0.3309326171875, -0.31041717529296875, -0.2899017333984375, -0.26938629150390625, -0.248870849609375, -0.22835540771484375, -0.2078399658203125, -0.18732452392578125, -0.16680908203125, -0.14629364013671875, -0.1257781982421875, -0.10526275634765625, -0.084747314453125, -0.06423187255859375, -0.0437164306640625, -0.02320098876953125, -0.002685546875, 0.01782989501953125, 0.0383453369140625, 0.05886077880859375, 0.079376220703125, 0.09989166259765625, 0.1204071044921875, 0.14092254638671875, 0.16143798828125, 0.18195343017578125, 0.2024688720703125, 0.22298431396484375, 0.243499755859375, 0.26401519775390625, 0.2845306396484375, 0.30504608154296875, 0.3255615234375, 0.34607696533203125, 0.3665924072265625, 0.38710784912109375, 0.407623291015625, 0.42813873291015625, 0.4486541748046875, 0.46916961669921875, 0.48968505859375, 0.5102005004882812, 0.5307159423828125, 0.5512313842773438, 0.571746826171875, 0.5922622680664062, 0.6127777099609375, 0.6332931518554688, 0.65380859375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 12.0, 10.0, 14.0, 15.0, 22.0, 20.0, 27.0, 35.0, 29.0, 25.0, 36.0, 35.0, 32.0, 47.0, 38.0, 46.0, 44.0, 1074.0, 51.0, 40.0, 38.0, 30.0, 32.0, 39.0, 24.0, 24.0, 24.0, 23.0, 22.0, 17.0, 21.0, 18.0, 12.0, 7.0, 14.0, 10.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.703125, -2.61761474609375, -2.5321044921875, -2.44659423828125, -2.361083984375, -2.27557373046875, -2.1900634765625, -2.10455322265625, -2.01904296875, -1.93353271484375, -1.8480224609375, -1.76251220703125, -1.677001953125, -1.59149169921875, -1.5059814453125, -1.42047119140625, -1.3349609375, -1.24945068359375, -1.1639404296875, -1.07843017578125, -0.992919921875, -0.90740966796875, -0.8218994140625, -0.73638916015625, -0.65087890625, -0.56536865234375, -0.4798583984375, -0.39434814453125, -0.308837890625, -0.22332763671875, -0.1378173828125, -0.05230712890625, 0.033203125, 0.11871337890625, 0.2042236328125, 0.28973388671875, 0.375244140625, 0.46075439453125, 0.5462646484375, 0.63177490234375, 0.71728515625, 0.80279541015625, 0.8883056640625, 0.97381591796875, 1.059326171875, 1.14483642578125, 1.2303466796875, 1.31585693359375, 1.4013671875, 1.48687744140625, 1.5723876953125, 1.65789794921875, 1.743408203125, 1.82891845703125, 1.9144287109375, 1.99993896484375, 2.08544921875, 2.17095947265625, 2.2564697265625, 2.34197998046875, 2.427490234375, 2.51300048828125, 2.5985107421875, 2.68402099609375, 2.76953125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 14.0, 17.0, 15.0, 23.0, 50.0, 88.0, 123.0, 186.0, 260.0, 460.0, 639.0, 1136.0, 1865.0, 2957.0, 4740.0, 8229.0, 14020.0, 24567.0, 44494.0, 82109.0, 150275.0, 1280807.0, 208124.0, 120739.0, 66204.0, 36189.0, 20022.0, 11507.0, 6784.0, 3896.0, 2558.0, 1496.0, 970.0, 566.0, 355.0, 241.0, 150.0, 86.0, 49.0, 47.0, 31.0, 18.0, 6.0, 7.0, 6.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.47607421875, -0.46111297607421875, -0.4461517333984375, -0.43119049072265625, -0.416229248046875, -0.40126800537109375, -0.3863067626953125, -0.37134552001953125, -0.35638427734375, -0.34142303466796875, -0.3264617919921875, -0.31150054931640625, -0.296539306640625, -0.28157806396484375, -0.2666168212890625, -0.25165557861328125, -0.2366943359375, -0.22173309326171875, -0.2067718505859375, -0.19181060791015625, -0.176849365234375, -0.16188812255859375, -0.1469268798828125, -0.13196563720703125, -0.11700439453125, -0.10204315185546875, -0.0870819091796875, -0.07212066650390625, -0.057159423828125, -0.04219818115234375, -0.0272369384765625, -0.01227569580078125, 0.002685546875, 0.01764678955078125, 0.0326080322265625, 0.04756927490234375, 0.062530517578125, 0.07749176025390625, 0.0924530029296875, 0.10741424560546875, 0.12237548828125, 0.13733673095703125, 0.1522979736328125, 0.16725921630859375, 0.182220458984375, 0.19718170166015625, 0.2121429443359375, 0.22710418701171875, 0.2420654296875, 0.25702667236328125, 0.2719879150390625, 0.28694915771484375, 0.301910400390625, 0.31687164306640625, 0.3318328857421875, 0.34679412841796875, 0.36175537109375, 0.37671661376953125, 0.3916778564453125, 0.40663909912109375, 0.421600341796875, 0.43656158447265625, 0.4515228271484375, 0.46648406982421875, 0.4814453125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 2.0, 6.0, 11.0, 13.0, 10.0, 10.0, 19.0, 19.0, 19.0, 26.0, 27.0, 27.0, 35.0, 26.0, 52.0, 49.0, 46.0, 57.0, 48.0, 59.0, 50.0, 57.0, 37.0, 48.0, 47.0, 29.0, 32.0, 23.0, 23.0, 22.0, 14.0, 12.0, 9.0, 7.0, 5.0, 11.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001453399658203125, -0.0014071613550186157, -0.0013609230518341064, -0.0013146847486495972, -0.0012684464454650879, -0.0012222081422805786, -0.0011759698390960693, -0.00112973153591156, -0.0010834932327270508, -0.0010372549295425415, -0.0009910166263580322, -0.000944778323173523, -0.0008985400199890137, -0.0008523017168045044, -0.0008060634136199951, -0.0007598251104354858, -0.0007135868072509766, -0.0006673485040664673, -0.000621110200881958, -0.0005748718976974487, -0.0005286335945129395, -0.0004823952913284302, -0.0004361569881439209, -0.0003899186849594116, -0.00034368038177490234, -0.00029744207859039307, -0.0002512037754058838, -0.0002049654722213745, -0.00015872716903686523, -0.00011248886585235596, -6.625056266784668e-05, -2.0012259483337402e-05, 2.6226043701171875e-05, 7.246434688568115e-05, 0.00011870265007019043, 0.0001649409532546997, 0.00021117925643920898, 0.00025741755962371826, 0.00030365586280822754, 0.0003498941659927368, 0.0003961324691772461, 0.00044237077236175537, 0.0004886090755462646, 0.0005348473787307739, 0.0005810856819152832, 0.0006273239850997925, 0.0006735622882843018, 0.000719800591468811, 0.0007660388946533203, 0.0008122771978378296, 0.0008585155010223389, 0.0009047538042068481, 0.0009509921073913574, 0.0009972304105758667, 0.001043468713760376, 0.0010897070169448853, 0.0011359453201293945, 0.0011821836233139038, 0.001228421926498413, 0.0012746602296829224, 0.0013208985328674316, 0.001367136836051941, 0.0014133751392364502, 0.0014596134424209595, 0.0015058517456054688]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 1.0, 7.0, 9.0, 14.0, 18.0, 17.0, 21.0, 40.0, 53.0, 75.0, 121.0, 251.0, 613.0, 7625.0, 1035418.0, 3174.0, 521.0, 217.0, 105.0, 62.0, 50.0, 36.0, 18.0, 15.0, 20.0, 11.0, 10.0, 12.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05255126953125, -0.05087900161743164, -0.04920673370361328, -0.04753446578979492, -0.04586219787597656, -0.0441899299621582, -0.042517662048339844, -0.040845394134521484, -0.039173126220703125, -0.037500858306884766, -0.035828590393066406, -0.03415632247924805, -0.03248405456542969, -0.030811786651611328, -0.02913951873779297, -0.02746725082397461, -0.02579498291015625, -0.02412271499633789, -0.02245044708251953, -0.020778179168701172, -0.019105911254882812, -0.017433643341064453, -0.015761375427246094, -0.014089107513427734, -0.012416839599609375, -0.010744571685791016, -0.009072303771972656, -0.007400035858154297, -0.0057277679443359375, -0.004055500030517578, -0.0023832321166992188, -0.0007109642028808594, 0.0009613037109375, 0.0026335716247558594, 0.004305839538574219, 0.005978107452392578, 0.0076503753662109375, 0.009322643280029297, 0.010994911193847656, 0.012667179107666016, 0.014339447021484375, 0.016011714935302734, 0.017683982849121094, 0.019356250762939453, 0.021028518676757812, 0.022700786590576172, 0.02437305450439453, 0.02604532241821289, 0.02771759033203125, 0.02938985824584961, 0.03106212615966797, 0.03273439407348633, 0.03440666198730469, 0.03607892990112305, 0.037751197814941406, 0.039423465728759766, 0.041095733642578125, 0.042768001556396484, 0.044440269470214844, 0.0461125373840332, 0.04778480529785156, 0.04945707321166992, 0.05112934112548828, 0.05280160903930664, 0.054473876953125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1017.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0044039469212293625, -0.003146381815895438, -0.001888816710561514, -0.0006312516052275896, 0.0006263135001063347, 0.0018838783726096153, 0.0031414437107741833, 0.004399009048938751, 0.005656573921442032, 0.0069141387939453125, 0.008171703666448593, 0.009429269470274448, 0.010686834342777729, 0.01194439921528101, 0.013201965019106865, 0.014459529891610146, 0.015717094764113426, 0.016974659636616707, 0.018232224509119987, 0.019489789381623268, 0.020747356116771698, 0.02200492098927498, 0.02326248586177826, 0.02452005073428154, 0.02577761560678482, 0.0270351804792881, 0.028292745351791382, 0.029550310224294662, 0.030807875096797943, 0.032065439969301224, 0.033323004841804504, 0.034580573439598083, 0.035838134586811066, 0.037095699459314346, 0.03835326433181763, 0.03961082920432091, 0.04086839407682419, 0.04212595894932747, 0.04338352382183075, 0.04464109241962433, 0.04589865356683731, 0.04715621843934059, 0.04841378331184387, 0.04967134818434715, 0.05092891305685043, 0.052186477929353714, 0.053444042801856995, 0.054701611399650574, 0.055959176272153854, 0.057216741144657135, 0.058474306017160416, 0.059731870889663696, 0.06098943576216698, 0.06224700063467026, 0.06350456923246384, 0.06476213037967682, 0.0660196989774704, 0.06727726757526398, 0.06853482872247696, 0.06979239732027054, 0.07104995846748352, 0.0723075270652771, 0.07356508821249008, 0.07482265681028366, 0.07608021795749664]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 20.0, 24.0, 28.0, 35.0, 44.0, 62.0, 61.0, 63.0, 74.0, 73.0, 73.0, 78.0, 61.0, 64.0, 58.0, 43.0, 40.0, 22.0, 25.0, 21.0, 9.0, 3.0, 11.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019169449806213379, -0.0018700174987316132, -0.0018230900168418884, -0.0017761625349521637, -0.001729235053062439, -0.0016823075711727142, -0.0016353800892829895, -0.0015884526073932648, -0.00154152512550354, -0.0014945976436138153, -0.0014476701617240906, -0.0014007426798343658, -0.0013538151979446411, -0.0013068877160549164, -0.0012599602341651917, -0.001213032752275467, -0.0011661052703857422, -0.0011191777884960175, -0.0010722503066062927, -0.001025322824716568, -0.0009783953428268433, -0.0009314678609371185, -0.0008845403790473938, -0.0008376128971576691, -0.0007906854152679443, -0.0007437579333782196, -0.0006968304514884949, -0.0006499029695987701, -0.0006029754877090454, -0.0005560480058193207, -0.000509120523929596, -0.0004621930420398712, -0.0004152655601501465, -0.00036833807826042175, -0.000321410596370697, -0.0002744831144809723, -0.00022755563259124756, -0.00018062815070152283, -0.0001337006688117981, -8.677318692207336e-05, -3.984570503234863e-05, 7.081776857376099e-06, 5.400925874710083e-05, 0.00010093674063682556, 0.0001478642225265503, 0.00019479170441627502, 0.00024171918630599976, 0.0002886466681957245, 0.0003355741500854492, 0.00038250163197517395, 0.0004294291138648987, 0.0004763565957546234, 0.0005232840776443481, 0.0005702115595340729, 0.0006171390414237976, 0.0006640665233135223, 0.0007109940052032471, 0.0007579214870929718, 0.0008048489689826965, 0.0008517764508724213, 0.000898703932762146, 0.0009456314146518707, 0.0009925588965415955, 0.0010394863784313202, 0.001086413860321045]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 2.0, 3.0, 9.0, 7.0, 3.0, 14.0, 12.0, 13.0, 15.0, 16.0, 27.0, 30.0, 37.0, 18.0, 31.0, 31.0, 38.0, 36.0, 49.0, 32.0, 24.0, 44.0, 39.0, 41.0, 44.0, 39.0, 42.0, 35.0, 35.0, 25.0, 27.0, 32.0, 14.0, 17.0, 22.0, 15.0, 17.0, 14.0, 9.0, 7.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-3.7734375, -3.6500244140625, -3.526611328125, -3.4031982421875, -3.27978515625, -3.1563720703125, -3.032958984375, -2.9095458984375, -2.7861328125, -2.6627197265625, -2.539306640625, -2.4158935546875, -2.29248046875, -2.1690673828125, -2.045654296875, -1.9222412109375, -1.798828125, -1.6754150390625, -1.552001953125, -1.4285888671875, -1.30517578125, -1.1817626953125, -1.058349609375, -0.9349365234375, -0.8115234375, -0.6881103515625, -0.564697265625, -0.4412841796875, -0.31787109375, -0.1944580078125, -0.071044921875, 0.0523681640625, 0.17578125, 0.2991943359375, 0.422607421875, 0.5460205078125, 0.66943359375, 0.7928466796875, 0.916259765625, 1.0396728515625, 1.1630859375, 1.2864990234375, 1.409912109375, 1.5333251953125, 1.65673828125, 1.7801513671875, 1.903564453125, 2.0269775390625, 2.150390625, 2.2738037109375, 2.397216796875, 2.5206298828125, 2.64404296875, 2.7674560546875, 2.890869140625, 3.0142822265625, 3.1376953125, 3.2611083984375, 3.384521484375, 3.5079345703125, 3.63134765625, 3.7547607421875, 3.878173828125, 4.0015869140625, 4.125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 6.0, 16.0, 21.0, 23.0, 43.0, 55.0, 91.0, 141.0, 214.0, 255.0, 449.0, 705.0, 1098.0, 1946.0, 3126.0, 5928.0, 11776.0, 26368.0, 71488.0, 283443.0, 472455.0, 102319.0, 34697.0, 14904.0, 7298.0, 3746.0, 2153.0, 1305.0, 834.0, 558.0, 362.0, 214.0, 167.0, 94.0, 75.0, 58.0, 27.0, 22.0, 24.0, 9.0, 13.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.6015625, -4.4627685546875, -4.323974609375, -4.1851806640625, -4.04638671875, -3.9075927734375, -3.768798828125, -3.6300048828125, -3.4912109375, -3.3524169921875, -3.213623046875, -3.0748291015625, -2.93603515625, -2.7972412109375, -2.658447265625, -2.5196533203125, -2.380859375, -2.2420654296875, -2.103271484375, -1.9644775390625, -1.82568359375, -1.6868896484375, -1.548095703125, -1.4093017578125, -1.2705078125, -1.1317138671875, -0.992919921875, -0.8541259765625, -0.71533203125, -0.5765380859375, -0.437744140625, -0.2989501953125, -0.16015625, -0.0213623046875, 0.117431640625, 0.2562255859375, 0.39501953125, 0.5338134765625, 0.672607421875, 0.8114013671875, 0.9501953125, 1.0889892578125, 1.227783203125, 1.3665771484375, 1.50537109375, 1.6441650390625, 1.782958984375, 1.9217529296875, 2.060546875, 2.1993408203125, 2.338134765625, 2.4769287109375, 2.61572265625, 2.7545166015625, 2.893310546875, 3.0321044921875, 3.1708984375, 3.3096923828125, 3.448486328125, 3.5872802734375, 3.72607421875, 3.8648681640625, 4.003662109375, 4.1424560546875, 4.28125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 3.0, 7.0, 9.0, 10.0, 8.0, 14.0, 10.0, 18.0, 21.0, 24.0, 30.0, 36.0, 38.0, 43.0, 42.0, 43.0, 66.0, 106.0, 426.0, 1516.0, 112.0, 65.0, 51.0, 41.0, 40.0, 38.0, 38.0, 28.0, 22.0, 20.0, 15.0, 21.0, 16.0, 17.0, 8.0, 11.0, 8.0, 7.0, 8.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4375, -14.9842529296875, -14.531005859375, -14.0777587890625, -13.62451171875, -13.1712646484375, -12.718017578125, -12.2647705078125, -11.8115234375, -11.3582763671875, -10.905029296875, -10.4517822265625, -9.99853515625, -9.5452880859375, -9.092041015625, -8.6387939453125, -8.185546875, -7.7322998046875, -7.279052734375, -6.8258056640625, -6.37255859375, -5.9193115234375, -5.466064453125, -5.0128173828125, -4.5595703125, -4.1063232421875, -3.653076171875, -3.1998291015625, -2.74658203125, -2.2933349609375, -1.840087890625, -1.3868408203125, -0.93359375, -0.4803466796875, -0.027099609375, 0.4261474609375, 0.87939453125, 1.3326416015625, 1.785888671875, 2.2391357421875, 2.6923828125, 3.1456298828125, 3.598876953125, 4.0521240234375, 4.50537109375, 4.9586181640625, 5.411865234375, 5.8651123046875, 6.318359375, 6.7716064453125, 7.224853515625, 7.6781005859375, 8.13134765625, 8.5845947265625, 9.037841796875, 9.4910888671875, 9.9443359375, 10.3975830078125, 10.850830078125, 11.3040771484375, 11.75732421875, 12.2105712890625, 12.663818359375, 13.1170654296875, 13.5703125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 6.0, 13.0, 15.0, 18.0, 18.0, 34.0, 35.0, 34.0, 60.0, 106.0, 183.0, 296.0, 663.0, 5228.0, 2771982.0, 362797.0, 2875.0, 590.0, 282.0, 140.0, 112.0, 62.0, 42.0, 22.0, 28.0, 17.0, 13.0, 10.0, 9.0, 3.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.1875, -31.998046875, -30.80859375, -29.619140625, -28.4296875, -27.240234375, -26.05078125, -24.861328125, -23.671875, -22.482421875, -21.29296875, -20.103515625, -18.9140625, -17.724609375, -16.53515625, -15.345703125, -14.15625, -12.966796875, -11.77734375, -10.587890625, -9.3984375, -8.208984375, -7.01953125, -5.830078125, -4.640625, -3.451171875, -2.26171875, -1.072265625, 0.1171875, 1.306640625, 2.49609375, 3.685546875, 4.875, 6.064453125, 7.25390625, 8.443359375, 9.6328125, 10.822265625, 12.01171875, 13.201171875, 14.390625, 15.580078125, 16.76953125, 17.958984375, 19.1484375, 20.337890625, 21.52734375, 22.716796875, 23.90625, 25.095703125, 26.28515625, 27.474609375, 28.6640625, 29.853515625, 31.04296875, 32.232421875, 33.421875, 34.611328125, 35.80078125, 36.990234375, 38.1796875, 39.369140625, 40.55859375, 41.748046875, 42.9375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 11.0, 108.0, 326.0, 384.0, 154.0, 25.0, 6.0], "bins": [-116.4489974975586, -114.5123062133789, -112.57561492919922, -110.63893127441406, -108.70223999023438, -106.76554870605469, -104.828857421875, -102.89217376708984, -100.95548248291016, -99.01879119873047, -97.08209991455078, -95.14541625976562, -93.20872497558594, -91.27203369140625, -89.33534240722656, -87.3986587524414, -85.46196746826172, -83.52527618408203, -81.58858489990234, -79.65190124511719, -77.7152099609375, -75.77851867675781, -73.84182739257812, -71.90514373779297, -69.96845245361328, -68.0317611694336, -66.0950698852539, -64.15838623046875, -62.22169494628906, -60.285003662109375, -58.34831619262695, -56.411624908447266, -54.474937438964844, -52.538246154785156, -50.601558685302734, -48.66486740112305, -46.728179931640625, -44.79148864746094, -42.854801177978516, -40.91810989379883, -38.98141860961914, -37.04472732543945, -35.10803985595703, -33.171348571777344, -31.234661102294922, -29.297969818115234, -27.361282348632812, -25.424591064453125, -23.487903594970703, -21.55121421813965, -19.614524841308594, -17.67783546447754, -15.741146087646484, -13.804455757141113, -11.867766380310059, -9.931077003479004, -7.994387626647949, -6.0576982498168945, -4.12100887298584, -2.184319019317627, -0.24762964248657227, 1.6890602111816406, 3.6257495880126953, 5.56243896484375, 7.499128341674805]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 3.0, 10.0, 8.0, 12.0, 14.0, 13.0, 14.0, 21.0, 23.0, 18.0, 24.0, 19.0, 28.0, 34.0, 38.0, 39.0, 31.0, 27.0, 44.0, 30.0, 42.0, 47.0, 37.0, 41.0, 26.0, 36.0, 42.0, 27.0, 25.0, 27.0, 26.0, 19.0, 17.0, 18.0, 21.0, 13.0, 14.0, 13.0, 10.0, 10.0, 11.0, 7.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-38.564788818359375, -37.33913040161133, -36.113468170166016, -34.88780975341797, -33.66215133666992, -32.436492919921875, -31.210830688476562, -29.985172271728516, -28.759511947631836, -27.533851623535156, -26.30819320678711, -25.08253288269043, -23.85687255859375, -22.631214141845703, -21.405553817749023, -20.179893493652344, -18.954235076904297, -17.728574752807617, -16.50291633605957, -15.27725601196289, -14.051596641540527, -12.825937271118164, -11.600276947021484, -10.374617576599121, -9.148958206176758, -7.9232988357543945, -6.697638988494873, -5.471979141235352, -4.246319770812988, -3.020660400390625, -1.7950005531311035, -0.569340705871582, 0.6563224792480469, 1.8819820880889893, 3.1076416969299316, 4.333301544189453, 5.558960914611816, 6.78462028503418, 8.01028060913086, 9.235939979553223, 10.461599349975586, 11.68725872039795, 12.912918090820312, 14.138578414916992, 15.364237785339355, 16.58989715576172, 17.8155574798584, 19.041217803955078, 20.266876220703125, 21.492536544799805, 22.71819496154785, 23.94385528564453, 25.169513702392578, 26.395174026489258, 27.620834350585938, 28.846492767333984, 30.072153091430664, 31.297813415527344, 32.52347183227539, 33.74913024902344, 34.97479248046875, 36.2004508972168, 37.426109313964844, 38.651771545410156, 39.8774299621582]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 9.0, 5.0, 10.0, 16.0, 19.0, 15.0, 26.0, 23.0, 29.0, 31.0, 30.0, 30.0, 26.0, 44.0, 40.0, 47.0, 32.0, 31.0, 39.0, 34.0, 48.0, 45.0, 41.0, 34.0, 30.0, 32.0, 27.0, 30.0, 27.0, 16.0, 15.0, 18.0, 18.0, 9.0, 11.0, 9.0, 8.0, 5.0, 8.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.828125, -3.7001953125, -3.572265625, -3.4443359375, -3.31640625, -3.1884765625, -3.060546875, -2.9326171875, -2.8046875, -2.6767578125, -2.548828125, -2.4208984375, -2.29296875, -2.1650390625, -2.037109375, -1.9091796875, -1.78125, -1.6533203125, -1.525390625, -1.3974609375, -1.26953125, -1.1416015625, -1.013671875, -0.8857421875, -0.7578125, -0.6298828125, -0.501953125, -0.3740234375, -0.24609375, -0.1181640625, 0.009765625, 0.1376953125, 0.265625, 0.3935546875, 0.521484375, 0.6494140625, 0.77734375, 0.9052734375, 1.033203125, 1.1611328125, 1.2890625, 1.4169921875, 1.544921875, 1.6728515625, 1.80078125, 1.9287109375, 2.056640625, 2.1845703125, 2.3125, 2.4404296875, 2.568359375, 2.6962890625, 2.82421875, 2.9521484375, 3.080078125, 3.2080078125, 3.3359375, 3.4638671875, 3.591796875, 3.7197265625, 3.84765625, 3.9755859375, 4.103515625, 4.2314453125, 4.359375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 5.0, 14.0, 12.0, 22.0, 33.0, 36.0, 60.0, 94.0, 122.0, 233.0, 357.0, 623.0, 1166.0, 2037.0, 3913.0, 7713.0, 16157.0, 38373.0, 105833.0, 350384.0, 1036272.0, 1471909.0, 778856.0, 246066.0, 77810.0, 29637.0, 13104.0, 6232.0, 3157.0, 1617.0, 977.0, 513.0, 364.0, 188.0, 119.0, 82.0, 54.0, 45.0, 29.0, 21.0, 8.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4921875, -4.333740234375, -4.17529296875, -4.016845703125, -3.8583984375, -3.699951171875, -3.54150390625, -3.383056640625, -3.224609375, -3.066162109375, -2.90771484375, -2.749267578125, -2.5908203125, -2.432373046875, -2.27392578125, -2.115478515625, -1.95703125, -1.798583984375, -1.64013671875, -1.481689453125, -1.3232421875, -1.164794921875, -1.00634765625, -0.847900390625, -0.689453125, -0.531005859375, -0.37255859375, -0.214111328125, -0.0556640625, 0.102783203125, 0.26123046875, 0.419677734375, 0.578125, 0.736572265625, 0.89501953125, 1.053466796875, 1.2119140625, 1.370361328125, 1.52880859375, 1.687255859375, 1.845703125, 2.004150390625, 2.16259765625, 2.321044921875, 2.4794921875, 2.637939453125, 2.79638671875, 2.954833984375, 3.11328125, 3.271728515625, 3.43017578125, 3.588623046875, 3.7470703125, 3.905517578125, 4.06396484375, 4.222412109375, 4.380859375, 4.539306640625, 4.69775390625, 4.856201171875, 5.0146484375, 5.173095703125, 5.33154296875, 5.489990234375, 5.6484375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 6.0, 4.0, 11.0, 19.0, 7.0, 22.0, 32.0, 32.0, 49.0, 82.0, 86.0, 111.0, 180.0, 217.0, 270.0, 346.0, 433.0, 439.0, 428.0, 327.0, 231.0, 196.0, 133.0, 104.0, 102.0, 64.0, 29.0, 38.0, 19.0, 19.0, 11.0, 10.0, 7.0, 7.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-14.53125, -14.1788330078125, -13.826416015625, -13.4739990234375, -13.12158203125, -12.7691650390625, -12.416748046875, -12.0643310546875, -11.7119140625, -11.3594970703125, -11.007080078125, -10.6546630859375, -10.30224609375, -9.9498291015625, -9.597412109375, -9.2449951171875, -8.892578125, -8.5401611328125, -8.187744140625, -7.8353271484375, -7.48291015625, -7.1304931640625, -6.778076171875, -6.4256591796875, -6.0732421875, -5.7208251953125, -5.368408203125, -5.0159912109375, -4.66357421875, -4.3111572265625, -3.958740234375, -3.6063232421875, -3.25390625, -2.9014892578125, -2.549072265625, -2.1966552734375, -1.84423828125, -1.4918212890625, -1.139404296875, -0.7869873046875, -0.4345703125, -0.0821533203125, 0.270263671875, 0.6226806640625, 0.97509765625, 1.3275146484375, 1.679931640625, 2.0323486328125, 2.384765625, 2.7371826171875, 3.089599609375, 3.4420166015625, 3.79443359375, 4.1468505859375, 4.499267578125, 4.8516845703125, 5.2041015625, 5.5565185546875, 5.908935546875, 6.2613525390625, 6.61376953125, 6.9661865234375, 7.318603515625, 7.6710205078125, 8.0234375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 6.0, 15.0, 8.0, 15.0, 30.0, 36.0, 56.0, 53.0, 92.0, 132.0, 179.0, 394.0, 1002.0, 7275.0, 362465.0, 3756325.0, 61857.0, 2802.0, 673.0, 287.0, 157.0, 95.0, 88.0, 50.0, 42.0, 31.0, 26.0, 16.0, 18.0, 15.0, 10.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.5, -29.294921875, -28.08984375, -26.884765625, -25.6796875, -24.474609375, -23.26953125, -22.064453125, -20.859375, -19.654296875, -18.44921875, -17.244140625, -16.0390625, -14.833984375, -13.62890625, -12.423828125, -11.21875, -10.013671875, -8.80859375, -7.603515625, -6.3984375, -5.193359375, -3.98828125, -2.783203125, -1.578125, -0.373046875, 0.83203125, 2.037109375, 3.2421875, 4.447265625, 5.65234375, 6.857421875, 8.0625, 9.267578125, 10.47265625, 11.677734375, 12.8828125, 14.087890625, 15.29296875, 16.498046875, 17.703125, 18.908203125, 20.11328125, 21.318359375, 22.5234375, 23.728515625, 24.93359375, 26.138671875, 27.34375, 28.548828125, 29.75390625, 30.958984375, 32.1640625, 33.369140625, 34.57421875, 35.779296875, 36.984375, 38.189453125, 39.39453125, 40.599609375, 41.8046875, 43.009765625, 44.21484375, 45.419921875, 46.625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 14.0, 43.0, 101.0, 140.0, 186.0, 222.0, 157.0, 86.0, 32.0, 18.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.33330535888672, -121.43858337402344, -118.54386901855469, -115.6491470336914, -112.75443267822266, -109.85971069335938, -106.96499633789062, -104.07027435302734, -101.17555236816406, -98.28083038330078, -95.38611602783203, -92.49139404296875, -89.5966796875, -86.70195770263672, -83.80723571777344, -80.91252136230469, -78.01780700683594, -75.12308502197266, -72.2283706665039, -69.33364868164062, -66.43893432617188, -63.544212341308594, -60.64949417114258, -57.75477600097656, -54.86005783081055, -51.96533966064453, -49.070621490478516, -46.1759033203125, -43.28118133544922, -40.38646697998047, -37.49174499511719, -34.59702682495117, -31.702301025390625, -28.80758285522461, -25.912864685058594, -23.018144607543945, -20.12342643737793, -17.228708267211914, -14.333988189697266, -11.43927001953125, -8.544551849365234, -5.6498332023620605, -2.7551145553588867, 0.1396045684814453, 3.034322738647461, 5.929040908813477, 8.823760986328125, 11.71847915649414, 14.613197326660156, 17.507915496826172, 20.402633666992188, 23.297353744506836, 26.19207191467285, 29.086790084838867, 31.981510162353516, 34.87622833251953, 37.77094650268555, 40.66566467285156, 43.56038284301758, 46.455101013183594, 49.349822998046875, 52.244537353515625, 55.139259338378906, 58.03397750854492, 60.92869567871094]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 3.0, 6.0, 7.0, 3.0, 7.0, 9.0, 21.0, 13.0, 25.0, 21.0, 19.0, 28.0, 27.0, 27.0, 34.0, 28.0, 52.0, 51.0, 43.0, 34.0, 45.0, 36.0, 39.0, 52.0, 43.0, 29.0, 31.0, 23.0, 28.0, 27.0, 23.0, 23.0, 21.0, 20.0, 19.0, 13.0, 12.0, 10.0, 9.0, 14.0, 9.0, 2.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-40.26957702636719, -39.09467315673828, -37.91977310180664, -36.744869232177734, -35.56996536254883, -34.39506530761719, -33.22016143798828, -32.045257568359375, -30.870357513427734, -29.69545555114746, -28.520551681518555, -27.34564971923828, -26.170747756958008, -24.995845794677734, -23.820941925048828, -22.646039962768555, -21.47113609313965, -20.296234130859375, -19.12133026123047, -17.946428298950195, -16.771526336669922, -15.596623420715332, -14.421720504760742, -13.246818542480469, -12.071915626525879, -10.897012710571289, -9.722110748291016, -8.547207832336426, -7.372305393218994, -6.1974029541015625, -5.022500038146973, -3.847598075866699, -2.6726951599121094, -1.4977926015853882, -0.322890043258667, 0.8520126342773438, 2.0269150733947754, 3.201817512512207, 4.376720428466797, 5.55162239074707, 6.72652530670166, 7.901427745819092, 9.076330184936523, 10.251233100891113, 11.426136016845703, 12.601037979125977, 13.775940895080566, 14.95084285736084, 16.12574577331543, 17.300647735595703, 18.47555160522461, 19.650453567504883, 20.825355529785156, 22.000259399414062, 23.175161361694336, 24.35006332397461, 25.524967193603516, 26.69986915588379, 27.874773025512695, 29.04967498779297, 30.224576950073242, 31.399478912353516, 32.57438278198242, 33.74928283691406, 34.92418670654297]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 6.0, 6.0, 8.0, 10.0, 13.0, 13.0, 23.0, 21.0, 16.0, 32.0, 31.0, 39.0, 37.0, 32.0, 41.0, 41.0, 36.0, 41.0, 36.0, 40.0, 53.0, 48.0, 46.0, 35.0, 39.0, 26.0, 29.0, 28.0, 25.0, 27.0, 23.0, 12.0, 18.0, 13.0, 13.0, 9.0, 7.0, 3.0, 1.0, 5.0, 4.0, 8.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.6328125, -4.49237060546875, -4.3519287109375, -4.21148681640625, -4.071044921875, -3.93060302734375, -3.7901611328125, -3.64971923828125, -3.50927734375, -3.36883544921875, -3.2283935546875, -3.08795166015625, -2.947509765625, -2.80706787109375, -2.6666259765625, -2.52618408203125, -2.3857421875, -2.24530029296875, -2.1048583984375, -1.96441650390625, -1.823974609375, -1.68353271484375, -1.5430908203125, -1.40264892578125, -1.26220703125, -1.12176513671875, -0.9813232421875, -0.84088134765625, -0.700439453125, -0.55999755859375, -0.4195556640625, -0.27911376953125, -0.138671875, 0.00177001953125, 0.1422119140625, 0.28265380859375, 0.423095703125, 0.56353759765625, 0.7039794921875, 0.84442138671875, 0.98486328125, 1.12530517578125, 1.2657470703125, 1.40618896484375, 1.546630859375, 1.68707275390625, 1.8275146484375, 1.96795654296875, 2.1083984375, 2.24884033203125, 2.3892822265625, 2.52972412109375, 2.670166015625, 2.81060791015625, 2.9510498046875, 3.09149169921875, 3.23193359375, 3.37237548828125, 3.5128173828125, 3.65325927734375, 3.793701171875, 3.93414306640625, 4.0745849609375, 4.21502685546875, 4.35546875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 9.0, 19.0, 18.0, 26.0, 55.0, 57.0, 90.0, 145.0, 196.0, 284.0, 420.0, 642.0, 963.0, 1486.0, 2241.0, 3466.0, 5306.0, 8558.0, 13740.0, 22919.0, 39726.0, 73817.0, 147739.0, 262486.0, 217486.0, 109624.0, 56075.0, 31518.0, 18610.0, 10879.0, 7126.0, 4385.0, 2860.0, 1918.0, 1204.0, 795.0, 536.0, 344.0, 246.0, 174.0, 126.0, 62.0, 62.0, 35.0, 25.0, 19.0, 9.0, 9.0, 5.0, 5.0, 5.0, 3.0, 0.0, 3.0], "bins": [-0.77490234375, -0.7519683837890625, -0.729034423828125, -0.7061004638671875, -0.68316650390625, -0.6602325439453125, -0.637298583984375, -0.6143646240234375, -0.5914306640625, -0.5684967041015625, -0.545562744140625, -0.5226287841796875, -0.49969482421875, -0.4767608642578125, -0.453826904296875, -0.4308929443359375, -0.407958984375, -0.3850250244140625, -0.362091064453125, -0.3391571044921875, -0.31622314453125, -0.2932891845703125, -0.270355224609375, -0.2474212646484375, -0.2244873046875, -0.2015533447265625, -0.178619384765625, -0.1556854248046875, -0.13275146484375, -0.1098175048828125, -0.086883544921875, -0.0639495849609375, -0.041015625, -0.0180816650390625, 0.004852294921875, 0.0277862548828125, 0.05072021484375, 0.0736541748046875, 0.096588134765625, 0.1195220947265625, 0.1424560546875, 0.1653900146484375, 0.188323974609375, 0.2112579345703125, 0.23419189453125, 0.2571258544921875, 0.280059814453125, 0.3029937744140625, 0.325927734375, 0.3488616943359375, 0.371795654296875, 0.3947296142578125, 0.41766357421875, 0.4405975341796875, 0.463531494140625, 0.4864654541015625, 0.5093994140625, 0.5323333740234375, 0.555267333984375, 0.5782012939453125, 0.60113525390625, 0.6240692138671875, 0.647003173828125, 0.6699371337890625, 0.69287109375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 11.0, 11.0, 7.0, 10.0, 13.0, 16.0, 15.0, 18.0, 22.0, 30.0, 35.0, 29.0, 36.0, 34.0, 36.0, 49.0, 41.0, 45.0, 1080.0, 40.0, 38.0, 47.0, 27.0, 30.0, 46.0, 33.0, 25.0, 37.0, 34.0, 17.0, 15.0, 21.0, 8.0, 19.0, 10.0, 8.0, 7.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.982421875, -2.89306640625, -2.8037109375, -2.71435546875, -2.625, -2.53564453125, -2.4462890625, -2.35693359375, -2.267578125, -2.17822265625, -2.0888671875, -1.99951171875, -1.91015625, -1.82080078125, -1.7314453125, -1.64208984375, -1.552734375, -1.46337890625, -1.3740234375, -1.28466796875, -1.1953125, -1.10595703125, -1.0166015625, -0.92724609375, -0.837890625, -0.74853515625, -0.6591796875, -0.56982421875, -0.48046875, -0.39111328125, -0.3017578125, -0.21240234375, -0.123046875, -0.03369140625, 0.0556640625, 0.14501953125, 0.234375, 0.32373046875, 0.4130859375, 0.50244140625, 0.591796875, 0.68115234375, 0.7705078125, 0.85986328125, 0.94921875, 1.03857421875, 1.1279296875, 1.21728515625, 1.306640625, 1.39599609375, 1.4853515625, 1.57470703125, 1.6640625, 1.75341796875, 1.8427734375, 1.93212890625, 2.021484375, 2.11083984375, 2.2001953125, 2.28955078125, 2.37890625, 2.46826171875, 2.5576171875, 2.64697265625, 2.736328125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 6.0, 5.0, 8.0, 13.0, 19.0, 52.0, 65.0, 92.0, 154.0, 238.0, 422.0, 658.0, 1061.0, 1618.0, 2671.0, 4369.0, 7124.0, 11835.0, 20940.0, 36303.0, 65758.0, 124433.0, 218374.0, 1279643.0, 144616.0, 76684.0, 41656.0, 23772.0, 13642.0, 8091.0, 4941.0, 2977.0, 1839.0, 1120.0, 732.0, 443.0, 272.0, 172.0, 117.0, 70.0, 60.0, 19.0, 20.0, 10.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5224609375, -0.506195068359375, -0.48992919921875, -0.473663330078125, -0.4573974609375, -0.441131591796875, -0.42486572265625, -0.408599853515625, -0.392333984375, -0.376068115234375, -0.35980224609375, -0.343536376953125, -0.3272705078125, -0.311004638671875, -0.29473876953125, -0.278472900390625, -0.26220703125, -0.245941162109375, -0.22967529296875, -0.213409423828125, -0.1971435546875, -0.180877685546875, -0.16461181640625, -0.148345947265625, -0.132080078125, -0.115814208984375, -0.09954833984375, -0.083282470703125, -0.0670166015625, -0.050750732421875, -0.03448486328125, -0.018218994140625, -0.001953125, 0.014312744140625, 0.03057861328125, 0.046844482421875, 0.0631103515625, 0.079376220703125, 0.09564208984375, 0.111907958984375, 0.128173828125, 0.144439697265625, 0.16070556640625, 0.176971435546875, 0.1932373046875, 0.209503173828125, 0.22576904296875, 0.242034912109375, 0.25830078125, 0.274566650390625, 0.29083251953125, 0.307098388671875, 0.3233642578125, 0.339630126953125, 0.35589599609375, 0.372161865234375, 0.388427734375, 0.404693603515625, 0.42095947265625, 0.437225341796875, 0.4534912109375, 0.469757080078125, 0.48602294921875, 0.502288818359375, 0.5185546875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 8.0, 2.0, 7.0, 10.0, 15.0, 15.0, 23.0, 27.0, 38.0, 46.0, 50.0, 77.0, 76.0, 73.0, 71.0, 82.0, 65.0, 71.0, 52.0, 32.0, 38.0, 24.0, 30.0, 15.0, 14.0, 10.0, 2.0, 8.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00278472900390625, -0.002713307738304138, -0.0026418864727020264, -0.0025704652070999146, -0.0024990439414978027, -0.002427622675895691, -0.002356201410293579, -0.0022847801446914673, -0.0022133588790893555, -0.0021419376134872437, -0.002070516347885132, -0.00199909508228302, -0.0019276738166809082, -0.0018562525510787964, -0.0017848312854766846, -0.0017134100198745728, -0.001641988754272461, -0.0015705674886703491, -0.0014991462230682373, -0.0014277249574661255, -0.0013563036918640137, -0.0012848824262619019, -0.00121346116065979, -0.0011420398950576782, -0.0010706186294555664, -0.0009991973638534546, -0.0009277760982513428, -0.000856354832649231, -0.0007849335670471191, -0.0007135123014450073, -0.0006420910358428955, -0.0005706697702407837, -0.0004992485046386719, -0.00042782723903656006, -0.00035640597343444824, -0.0002849847078323364, -0.0002135634422302246, -0.0001421421766281128, -7.072091102600098e-05, 7.003545761108398e-07, 7.212162017822266e-05, 0.00014354288578033447, 0.0002149641513824463, 0.0002863854169845581, 0.0003578066825866699, 0.00042922794818878174, 0.0005006492137908936, 0.0005720704793930054, 0.0006434917449951172, 0.000714913010597229, 0.0007863342761993408, 0.0008577555418014526, 0.0009291768074035645, 0.0010005980730056763, 0.001072019338607788, 0.0011434406042099, 0.0012148618698120117, 0.0012862831354141235, 0.0013577044010162354, 0.0014291256666183472, 0.001500546932220459, 0.0015719681978225708, 0.0016433894634246826, 0.0017148107290267944, 0.0017862319946289062]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 8.0, 6.0, 1.0, 16.0, 16.0, 27.0, 39.0, 56.0, 65.0, 135.0, 298.0, 935.0, 413221.0, 632027.0, 1023.0, 316.0, 133.0, 79.0, 46.0, 28.0, 22.0, 18.0, 8.0, 6.0, 6.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055633544921875, -0.05341005325317383, -0.051186561584472656, -0.048963069915771484, -0.04673957824707031, -0.04451608657836914, -0.04229259490966797, -0.0400691032409668, -0.037845611572265625, -0.03562211990356445, -0.03339862823486328, -0.03117513656616211, -0.028951644897460938, -0.026728153228759766, -0.024504661560058594, -0.022281169891357422, -0.02005767822265625, -0.017834186553955078, -0.015610694885253906, -0.013387203216552734, -0.011163711547851562, -0.00894021987915039, -0.006716728210449219, -0.004493236541748047, -0.002269744873046875, -4.6253204345703125e-05, 0.0021772384643554688, 0.004400730133056641, 0.0066242218017578125, 0.008847713470458984, 0.011071205139160156, 0.013294696807861328, 0.0155181884765625, 0.017741680145263672, 0.019965171813964844, 0.022188663482666016, 0.024412155151367188, 0.02663564682006836, 0.02885913848876953, 0.031082630157470703, 0.033306121826171875, 0.03552961349487305, 0.03775310516357422, 0.03997659683227539, 0.04220008850097656, 0.044423580169677734, 0.046647071838378906, 0.04887056350708008, 0.05109405517578125, 0.05331754684448242, 0.055541038513183594, 0.057764530181884766, 0.05998802185058594, 0.06221151351928711, 0.06443500518798828, 0.06665849685668945, 0.06888198852539062, 0.0711054801940918, 0.07332897186279297, 0.07555246353149414, 0.07777595520019531, 0.07999944686889648, 0.08222293853759766, 0.08444643020629883, 0.086669921875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 12.0, 1007.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009045690298080444, -0.007335582748055458, -0.005625475198030472, -0.0039153676480054855, -0.0022052600979804993, -0.000495152547955513, 0.0012149550020694733, 0.0029250625520944595, 0.004635170102119446, 0.006345277652144432, 0.008055385202169418, 0.009765492752194405, 0.011475600302219391, 0.013185707852244377, 0.014895815402269363, 0.01660592295229435, 0.018316030502319336, 0.020026138052344322, 0.02173624560236931, 0.023446353152394295, 0.02515646070241928, 0.026866568252444267, 0.028576675802469254, 0.03028678335249424, 0.031996890902519226, 0.03370700031518936, 0.0354171060025692, 0.037127211689949036, 0.03883732110261917, 0.04054743051528931, 0.042257536202669144, 0.04396764189004898, 0.045677751302719116, 0.04738786071538925, 0.04909796640276909, 0.050808072090148926, 0.05251818150281906, 0.0542282909154892, 0.055938396602869034, 0.05764850229024887, 0.059358611702919006, 0.06106872111558914, 0.06277883052825928, 0.06448893249034882, 0.06619904190301895, 0.06790915131568909, 0.06961925327777863, 0.07132936269044876, 0.0730394721031189, 0.07474958151578903, 0.07645969092845917, 0.0781697928905487, 0.07987990230321884, 0.08159001171588898, 0.08330011367797852, 0.08501022309064865, 0.08672033250331879, 0.08843044191598892, 0.09014055132865906, 0.0918506532907486, 0.09356076270341873, 0.09527087211608887, 0.0969809740781784, 0.09869108349084854, 0.10040119290351868]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 8.0, 4.0, 9.0, 14.0, 21.0, 39.0, 34.0, 55.0, 72.0, 63.0, 80.0, 76.0, 71.0, 87.0, 80.0, 68.0, 58.0, 43.0, 45.0, 19.0, 19.0, 23.0, 8.0, 8.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0025292038917541504, -0.0024705110117793083, -0.0024118181318044662, -0.002353125251829624, -0.002294432371854782, -0.00223573949187994, -0.002177046611905098, -0.002118353731930256, -0.002059660851955414, -0.0020009679719805717, -0.0019422750920057297, -0.0018835822120308876, -0.0018248893320560455, -0.0017661964520812035, -0.0017075035721063614, -0.0016488106921315193, -0.0015901178121566772, -0.0015314249321818352, -0.001472732052206993, -0.001414039172232151, -0.001355346292257309, -0.0012966534122824669, -0.0012379605323076248, -0.0011792676523327827, -0.0011205747723579407, -0.0010618818923830986, -0.0010031890124082565, -0.0009444961324334145, -0.0008858032524585724, -0.0008271103724837303, -0.0007684174925088882, -0.0007097246125340462, -0.0006510317325592041, -0.000592338852584362, -0.00053364597260952, -0.0004749530926346779, -0.0004162602126598358, -0.00035756733268499374, -0.00029887445271015167, -0.0002401815727353096, -0.00018148869276046753, -0.00012279581278562546, -6.410293281078339e-05, -5.410052835941315e-06, 5.328282713890076e-05, 0.00011197570711374283, 0.0001706685870885849, 0.00022936146706342697, 0.00028805434703826904, 0.0003467472270131111, 0.0004054401069879532, 0.00046413298696279526, 0.0005228258669376373, 0.0005815187469124794, 0.0006402116268873215, 0.0006989045068621635, 0.0007575973868370056, 0.0008162902668118477, 0.0008749831467866898, 0.0009336760267615318, 0.000992368906736374, 0.001051061786711216, 0.001109754666686058, 0.0011684475466609001, 0.0012271404266357422]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 6.0, 6.0, 8.0, 10.0, 13.0, 13.0, 23.0, 21.0, 16.0, 32.0, 31.0, 39.0, 37.0, 32.0, 41.0, 41.0, 36.0, 41.0, 36.0, 40.0, 53.0, 48.0, 46.0, 35.0, 39.0, 26.0, 29.0, 28.0, 25.0, 27.0, 23.0, 12.0, 18.0, 13.0, 13.0, 9.0, 7.0, 3.0, 1.0, 5.0, 4.0, 8.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.6328125, -4.49237060546875, -4.3519287109375, -4.21148681640625, -4.071044921875, -3.93060302734375, -3.7901611328125, -3.64971923828125, -3.50927734375, -3.36883544921875, -3.2283935546875, -3.08795166015625, -2.947509765625, -2.80706787109375, -2.6666259765625, -2.52618408203125, -2.3857421875, -2.24530029296875, -2.1048583984375, -1.96441650390625, -1.823974609375, -1.68353271484375, -1.5430908203125, -1.40264892578125, -1.26220703125, -1.12176513671875, -0.9813232421875, -0.84088134765625, -0.700439453125, -0.55999755859375, -0.4195556640625, -0.27911376953125, -0.138671875, 0.00177001953125, 0.1422119140625, 0.28265380859375, 0.423095703125, 0.56353759765625, 0.7039794921875, 0.84442138671875, 0.98486328125, 1.12530517578125, 1.2657470703125, 1.40618896484375, 1.546630859375, 1.68707275390625, 1.8275146484375, 1.96795654296875, 2.1083984375, 2.24884033203125, 2.3892822265625, 2.52972412109375, 2.670166015625, 2.81060791015625, 2.9510498046875, 3.09149169921875, 3.23193359375, 3.37237548828125, 3.5128173828125, 3.65325927734375, 3.793701171875, 3.93414306640625, 4.0745849609375, 4.21502685546875, 4.35546875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 8.0, 6.0, 17.0, 22.0, 34.0, 39.0, 77.0, 92.0, 137.0, 245.0, 358.0, 546.0, 913.0, 1488.0, 2511.0, 4113.0, 7532.0, 15574.0, 37017.0, 110044.0, 404714.0, 317147.0, 86416.0, 30234.0, 13097.0, 6696.0, 3677.0, 2143.0, 1346.0, 807.0, 522.0, 310.0, 210.0, 172.0, 92.0, 79.0, 30.0, 18.0, 22.0, 7.0, 12.0, 10.0, 10.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.884765625, -3.762969970703125, -3.64117431640625, -3.519378662109375, -3.3975830078125, -3.275787353515625, -3.15399169921875, -3.032196044921875, -2.910400390625, -2.788604736328125, -2.66680908203125, -2.545013427734375, -2.4232177734375, -2.301422119140625, -2.17962646484375, -2.057830810546875, -1.93603515625, -1.814239501953125, -1.69244384765625, -1.570648193359375, -1.4488525390625, -1.327056884765625, -1.20526123046875, -1.083465576171875, -0.961669921875, -0.839874267578125, -0.71807861328125, -0.596282958984375, -0.4744873046875, -0.352691650390625, -0.23089599609375, -0.109100341796875, 0.0126953125, 0.134490966796875, 0.25628662109375, 0.378082275390625, 0.4998779296875, 0.621673583984375, 0.74346923828125, 0.865264892578125, 0.987060546875, 1.108856201171875, 1.23065185546875, 1.352447509765625, 1.4742431640625, 1.596038818359375, 1.71783447265625, 1.839630126953125, 1.96142578125, 2.083221435546875, 2.20501708984375, 2.326812744140625, 2.4486083984375, 2.570404052734375, 2.69219970703125, 2.813995361328125, 2.935791015625, 3.057586669921875, 3.17938232421875, 3.301177978515625, 3.4229736328125, 3.544769287109375, 3.66656494140625, 3.788360595703125, 3.91015625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 7.0, 9.0, 13.0, 15.0, 11.0, 22.0, 23.0, 23.0, 31.0, 40.0, 34.0, 33.0, 47.0, 43.0, 66.0, 83.0, 275.0, 1651.0, 167.0, 60.0, 68.0, 41.0, 37.0, 28.0, 28.0, 32.0, 27.0, 22.0, 23.0, 16.0, 15.0, 12.0, 12.0, 3.0, 0.0, 7.0, 5.0, 6.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.40625, -17.88525390625, -17.3642578125, -16.84326171875, -16.322265625, -15.80126953125, -15.2802734375, -14.75927734375, -14.23828125, -13.71728515625, -13.1962890625, -12.67529296875, -12.154296875, -11.63330078125, -11.1123046875, -10.59130859375, -10.0703125, -9.54931640625, -9.0283203125, -8.50732421875, -7.986328125, -7.46533203125, -6.9443359375, -6.42333984375, -5.90234375, -5.38134765625, -4.8603515625, -4.33935546875, -3.818359375, -3.29736328125, -2.7763671875, -2.25537109375, -1.734375, -1.21337890625, -0.6923828125, -0.17138671875, 0.349609375, 0.87060546875, 1.3916015625, 1.91259765625, 2.43359375, 2.95458984375, 3.4755859375, 3.99658203125, 4.517578125, 5.03857421875, 5.5595703125, 6.08056640625, 6.6015625, 7.12255859375, 7.6435546875, 8.16455078125, 8.685546875, 9.20654296875, 9.7275390625, 10.24853515625, 10.76953125, 11.29052734375, 11.8115234375, 12.33251953125, 12.853515625, 13.37451171875, 13.8955078125, 14.41650390625, 14.9375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 4.0, 12.0, 14.0, 15.0, 25.0, 30.0, 25.0, 30.0, 64.0, 49.0, 103.0, 123.0, 175.0, 291.0, 501.0, 2820.0, 341875.0, 2792083.0, 5631.0, 688.0, 333.0, 185.0, 149.0, 115.0, 81.0, 52.0, 46.0, 33.0, 32.0, 18.0, 21.0, 21.0, 9.0, 11.0, 9.0, 4.0, 4.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.5, -28.45068359375, -27.4013671875, -26.35205078125, -25.302734375, -24.25341796875, -23.2041015625, -22.15478515625, -21.10546875, -20.05615234375, -19.0068359375, -17.95751953125, -16.908203125, -15.85888671875, -14.8095703125, -13.76025390625, -12.7109375, -11.66162109375, -10.6123046875, -9.56298828125, -8.513671875, -7.46435546875, -6.4150390625, -5.36572265625, -4.31640625, -3.26708984375, -2.2177734375, -1.16845703125, -0.119140625, 0.93017578125, 1.9794921875, 3.02880859375, 4.078125, 5.12744140625, 6.1767578125, 7.22607421875, 8.275390625, 9.32470703125, 10.3740234375, 11.42333984375, 12.47265625, 13.52197265625, 14.5712890625, 15.62060546875, 16.669921875, 17.71923828125, 18.7685546875, 19.81787109375, 20.8671875, 21.91650390625, 22.9658203125, 24.01513671875, 25.064453125, 26.11376953125, 27.1630859375, 28.21240234375, 29.26171875, 30.31103515625, 31.3603515625, 32.40966796875, 33.458984375, 34.50830078125, 35.5576171875, 36.60693359375, 37.65625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 13.0, 26.0, 100.0, 220.0, 286.0, 234.0, 99.0, 20.0, 7.0, 3.0, 2.0, 1.0], "bins": [-62.753448486328125, -61.642967224121094, -60.5324821472168, -59.422000885009766, -58.31151580810547, -57.20103454589844, -56.090553283691406, -54.98006820678711, -53.86958694458008, -52.75910568237305, -51.64862060546875, -50.53813934326172, -49.42765808105469, -48.31717300415039, -47.20669174194336, -46.09620666503906, -44.98572540283203, -43.875244140625, -42.7647590637207, -41.65427780151367, -40.543792724609375, -39.433311462402344, -38.32283020019531, -37.212345123291016, -36.101863861083984, -34.99138259887695, -33.880897521972656, -32.770416259765625, -31.65993309020996, -30.549449920654297, -29.438968658447266, -28.3284854888916, -27.218006134033203, -26.10752296447754, -24.997039794921875, -23.886558532714844, -22.77607536315918, -21.665592193603516, -20.555110931396484, -19.44462776184082, -18.334144592285156, -17.223661422729492, -16.113178253173828, -15.002696990966797, -13.892213821411133, -12.781730651855469, -11.671248435974121, -10.560766220092773, -9.450282096862793, -8.339799880981445, -7.229316711425781, -6.118834018707275, -5.0083513259887695, -3.8978686332702637, -2.787385940551758, -1.676903247833252, -0.5664205551147461, 0.5440621376037598, 1.6545448303222656, 2.7650275230407715, 3.8755102157592773, 4.985992908477783, 6.096475601196289, 7.206958293914795, 8.3174409866333]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 2.0, 9.0, 14.0, 5.0, 14.0, 20.0, 20.0, 24.0, 18.0, 26.0, 25.0, 29.0, 42.0, 50.0, 53.0, 60.0, 47.0, 46.0, 48.0, 55.0, 48.0, 50.0, 40.0, 33.0, 40.0, 37.0, 24.0, 23.0, 19.0, 21.0, 20.0, 10.0, 7.0, 10.0, 3.0, 2.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.25403594970703, -49.77967834472656, -48.305320739746094, -46.830963134765625, -45.356605529785156, -43.88224792480469, -42.40789031982422, -40.93353271484375, -39.45917510986328, -37.98481750488281, -36.510459899902344, -35.036102294921875, -33.561744689941406, -32.08738708496094, -30.6130313873291, -29.138673782348633, -27.664318084716797, -26.189960479736328, -24.71560287475586, -23.24124526977539, -21.766887664794922, -20.292530059814453, -18.818174362182617, -17.34381675720215, -15.86945915222168, -14.395101547241211, -12.920743942260742, -11.44638729095459, -9.972029685974121, -8.497672080993652, -7.0233154296875, -5.548957824707031, -4.074604034423828, -2.6002466678619385, -1.1258893013000488, 0.3484678268432617, 1.8228254318237305, 3.297183036804199, 4.771539688110352, 6.24589729309082, 7.720254898071289, 9.194612503051758, 10.668970108032227, 12.143326759338379, 13.617684364318848, 15.092041969299316, 16.56639862060547, 18.040756225585938, 19.515113830566406, 20.989471435546875, 22.463829040527344, 23.938186645507812, 25.41254425048828, 26.88690185546875, 28.361257553100586, 29.835615158081055, 31.309972763061523, 32.78432846069336, 34.25868606567383, 35.7330436706543, 37.207401275634766, 38.681758880615234, 40.1561164855957, 41.63047409057617, 43.10483169555664]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 5.0, 5.0, 7.0, 8.0, 11.0, 12.0, 19.0, 13.0, 18.0, 21.0, 30.0, 40.0, 29.0, 44.0, 35.0, 27.0, 38.0, 28.0, 44.0, 46.0, 40.0, 37.0, 49.0, 48.0, 43.0, 30.0, 25.0, 36.0, 28.0, 24.0, 20.0, 22.0, 24.0, 13.0, 14.0, 15.0, 13.0, 12.0, 4.0, 2.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.6484375, -4.50909423828125, -4.3697509765625, -4.23040771484375, -4.091064453125, -3.95172119140625, -3.8123779296875, -3.67303466796875, -3.53369140625, -3.39434814453125, -3.2550048828125, -3.11566162109375, -2.976318359375, -2.83697509765625, -2.6976318359375, -2.55828857421875, -2.4189453125, -2.27960205078125, -2.1402587890625, -2.00091552734375, -1.861572265625, -1.72222900390625, -1.5828857421875, -1.44354248046875, -1.30419921875, -1.16485595703125, -1.0255126953125, -0.88616943359375, -0.746826171875, -0.60748291015625, -0.4681396484375, -0.32879638671875, -0.189453125, -0.05010986328125, 0.0892333984375, 0.22857666015625, 0.367919921875, 0.50726318359375, 0.6466064453125, 0.78594970703125, 0.92529296875, 1.06463623046875, 1.2039794921875, 1.34332275390625, 1.482666015625, 1.62200927734375, 1.7613525390625, 1.90069580078125, 2.0400390625, 2.17938232421875, 2.3187255859375, 2.45806884765625, 2.597412109375, 2.73675537109375, 2.8760986328125, 3.01544189453125, 3.15478515625, 3.29412841796875, 3.4334716796875, 3.57281494140625, 3.712158203125, 3.85150146484375, 3.9908447265625, 4.13018798828125, 4.26953125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 4.0, 7.0, 14.0, 14.0, 16.0, 21.0, 21.0, 27.0, 31.0, 52.0, 54.0, 75.0, 84.0, 116.0, 278.0, 1116.0, 12152.0, 774895.0, 3346999.0, 54178.0, 2957.0, 511.0, 177.0, 97.0, 69.0, 56.0, 39.0, 36.0, 38.0, 27.0, 23.0, 18.0, 11.0, 15.0, 11.0, 6.0, 8.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-25.875, -25.118896484375, -24.36279296875, -23.606689453125, -22.8505859375, -22.094482421875, -21.33837890625, -20.582275390625, -19.826171875, -19.070068359375, -18.31396484375, -17.557861328125, -16.8017578125, -16.045654296875, -15.28955078125, -14.533447265625, -13.77734375, -13.021240234375, -12.26513671875, -11.509033203125, -10.7529296875, -9.996826171875, -9.24072265625, -8.484619140625, -7.728515625, -6.972412109375, -6.21630859375, -5.460205078125, -4.7041015625, -3.947998046875, -3.19189453125, -2.435791015625, -1.6796875, -0.923583984375, -0.16748046875, 0.588623046875, 1.3447265625, 2.100830078125, 2.85693359375, 3.613037109375, 4.369140625, 5.125244140625, 5.88134765625, 6.637451171875, 7.3935546875, 8.149658203125, 8.90576171875, 9.661865234375, 10.41796875, 11.174072265625, 11.93017578125, 12.686279296875, 13.4423828125, 14.198486328125, 14.95458984375, 15.710693359375, 16.466796875, 17.222900390625, 17.97900390625, 18.735107421875, 19.4912109375, 20.247314453125, 21.00341796875, 21.759521484375, 22.515625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 5.0, 15.0, 19.0, 7.0, 24.0, 33.0, 43.0, 40.0, 57.0, 76.0, 121.0, 140.0, 156.0, 217.0, 297.0, 347.0, 423.0, 375.0, 365.0, 303.0, 204.0, 193.0, 141.0, 99.0, 80.0, 73.0, 49.0, 39.0, 29.0, 24.0, 17.0, 17.0, 10.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.9442138671875, -8.646240234375, -8.3482666015625, -8.05029296875, -7.7523193359375, -7.454345703125, -7.1563720703125, -6.8583984375, -6.5604248046875, -6.262451171875, -5.9644775390625, -5.66650390625, -5.3685302734375, -5.070556640625, -4.7725830078125, -4.474609375, -4.1766357421875, -3.878662109375, -3.5806884765625, -3.28271484375, -2.9847412109375, -2.686767578125, -2.3887939453125, -2.0908203125, -1.7928466796875, -1.494873046875, -1.1968994140625, -0.89892578125, -0.6009521484375, -0.302978515625, -0.0050048828125, 0.29296875, 0.5909423828125, 0.888916015625, 1.1868896484375, 1.48486328125, 1.7828369140625, 2.080810546875, 2.3787841796875, 2.6767578125, 2.9747314453125, 3.272705078125, 3.5706787109375, 3.86865234375, 4.1666259765625, 4.464599609375, 4.7625732421875, 5.060546875, 5.3585205078125, 5.656494140625, 5.9544677734375, 6.25244140625, 6.5504150390625, 6.848388671875, 7.1463623046875, 7.4443359375, 7.7423095703125, 8.040283203125, 8.3382568359375, 8.63623046875, 8.9342041015625, 9.232177734375, 9.5301513671875, 9.828125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 10.0, 9.0, 4.0, 13.0, 15.0, 29.0, 25.0, 48.0, 52.0, 64.0, 71.0, 95.0, 116.0, 143.0, 194.0, 283.0, 493.0, 1464.0, 13647.0, 749132.0, 3371453.0, 52091.0, 2865.0, 674.0, 340.0, 239.0, 157.0, 111.0, 101.0, 76.0, 59.0, 52.0, 45.0, 14.0, 24.0, 20.0, 13.0, 18.0, 7.0, 6.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.90625, -27.84326171875, -26.7802734375, -25.71728515625, -24.654296875, -23.59130859375, -22.5283203125, -21.46533203125, -20.40234375, -19.33935546875, -18.2763671875, -17.21337890625, -16.150390625, -15.08740234375, -14.0244140625, -12.96142578125, -11.8984375, -10.83544921875, -9.7724609375, -8.70947265625, -7.646484375, -6.58349609375, -5.5205078125, -4.45751953125, -3.39453125, -2.33154296875, -1.2685546875, -0.20556640625, 0.857421875, 1.92041015625, 2.9833984375, 4.04638671875, 5.109375, 6.17236328125, 7.2353515625, 8.29833984375, 9.361328125, 10.42431640625, 11.4873046875, 12.55029296875, 13.61328125, 14.67626953125, 15.7392578125, 16.80224609375, 17.865234375, 18.92822265625, 19.9912109375, 21.05419921875, 22.1171875, 23.18017578125, 24.2431640625, 25.30615234375, 26.369140625, 27.43212890625, 28.4951171875, 29.55810546875, 30.62109375, 31.68408203125, 32.7470703125, 33.81005859375, 34.873046875, 35.93603515625, 36.9990234375, 38.06201171875, 39.125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 6.0, 13.0, 40.0, 76.0, 140.0, 218.0, 217.0, 154.0, 83.0, 44.0, 12.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.778566360473633, -25.900775909423828, -23.022987365722656, -20.145198822021484, -17.26740837097168, -14.389618873596191, -11.511829376220703, -8.634038925170898, -5.756250381469727, -2.8784608840942383, -0.00067138671875, 2.8771181106567383, 5.754907608032227, 8.632697105407715, 11.510486602783203, 14.388277053833008, 17.26606559753418, 20.143856048583984, 23.021644592285156, 25.899433135986328, 28.777223587036133, 31.655014038085938, 34.53280258178711, 37.41059112548828, 40.28838348388672, 43.16617202758789, 46.04396057128906, 48.9217529296875, 51.79954147338867, 54.677330017089844, 57.55512237548828, 60.43291091918945, 63.310699462890625, 66.18849182128906, 69.06627655029297, 71.9440689086914, 74.82185363769531, 77.69964599609375, 80.57743835449219, 83.45523071289062, 86.33301544189453, 89.21080780029297, 92.08859252929688, 94.96638488769531, 97.84417724609375, 100.72196197509766, 103.5997543334961, 106.4775390625, 109.35533142089844, 112.23312377929688, 115.11090850830078, 117.98870086669922, 120.86648559570312, 123.74427795410156, 126.6220703125, 129.49986267089844, 132.37765502929688, 135.2554473876953, 138.13323974609375, 141.01101684570312, 143.88880920410156, 146.7666015625, 149.64439392089844, 152.52218627929688, 155.39996337890625]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 11.0, 6.0, 9.0, 12.0, 14.0, 16.0, 15.0, 14.0, 14.0, 17.0, 16.0, 30.0, 23.0, 29.0, 27.0, 33.0, 43.0, 40.0, 42.0, 34.0, 39.0, 48.0, 35.0, 28.0, 45.0, 35.0, 30.0, 33.0, 26.0, 25.0, 20.0, 25.0, 21.0, 17.0, 22.0, 13.0, 14.0, 13.0, 11.0, 6.0, 10.0, 8.0, 6.0, 5.0, 2.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.614334106445312, -28.640439987182617, -27.666547775268555, -26.69265365600586, -25.718761444091797, -24.7448673248291, -23.770973205566406, -22.797080993652344, -21.82318687438965, -20.849292755126953, -19.87540054321289, -18.901506423950195, -17.9276123046875, -16.953720092773438, -15.979825973510742, -15.005932807922363, -14.032039642333984, -13.058146476745605, -12.084253311157227, -11.110359191894531, -10.136466026306152, -9.162572860717773, -8.188678741455078, -7.214785575866699, -6.24089241027832, -5.266999244689941, -4.293105602264404, -3.3192121982574463, -2.3453187942504883, -1.3714256286621094, -0.39753198623657227, 0.5763616561889648, 1.5502548217773438, 2.5241482257843018, 3.4980416297912598, 4.471935272216797, 5.445828437805176, 6.419721603393555, 7.393615245819092, 8.367508888244629, 9.341402053833008, 10.315295219421387, 11.289188385009766, 12.263082504272461, 13.23697566986084, 14.210868835449219, 15.184762954711914, 16.15865707397461, 17.132549285888672, 18.106443405151367, 19.08033561706543, 20.054229736328125, 21.028121948242188, 22.002016067504883, 22.975910186767578, 23.94980239868164, 24.923696517944336, 25.89759063720703, 26.871482849121094, 27.84537696838379, 28.819271087646484, 29.793163299560547, 30.767057418823242, 31.740951538085938, 32.71484375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 5.0, 6.0, 14.0, 18.0, 13.0, 19.0, 30.0, 20.0, 26.0, 36.0, 31.0, 34.0, 44.0, 34.0, 42.0, 36.0, 28.0, 32.0, 37.0, 44.0, 36.0, 40.0, 34.0, 35.0, 33.0, 29.0, 29.0, 27.0, 26.0, 14.0, 23.0, 17.0, 26.0, 10.0, 12.0, 6.0, 5.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-4.5234375, -4.3868408203125, -4.250244140625, -4.1136474609375, -3.97705078125, -3.8404541015625, -3.703857421875, -3.5672607421875, -3.4306640625, -3.2940673828125, -3.157470703125, -3.0208740234375, -2.88427734375, -2.7476806640625, -2.611083984375, -2.4744873046875, -2.337890625, -2.2012939453125, -2.064697265625, -1.9281005859375, -1.79150390625, -1.6549072265625, -1.518310546875, -1.3817138671875, -1.2451171875, -1.1085205078125, -0.971923828125, -0.8353271484375, -0.69873046875, -0.5621337890625, -0.425537109375, -0.2889404296875, -0.15234375, -0.0157470703125, 0.120849609375, 0.2574462890625, 0.39404296875, 0.5306396484375, 0.667236328125, 0.8038330078125, 0.9404296875, 1.0770263671875, 1.213623046875, 1.3502197265625, 1.48681640625, 1.6234130859375, 1.760009765625, 1.8966064453125, 2.033203125, 2.1697998046875, 2.306396484375, 2.4429931640625, 2.57958984375, 2.7161865234375, 2.852783203125, 2.9893798828125, 3.1259765625, 3.2625732421875, 3.399169921875, 3.5357666015625, 3.67236328125, 3.8089599609375, 3.945556640625, 4.0821533203125, 4.21875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 9.0, 10.0, 16.0, 25.0, 20.0, 49.0, 77.0, 112.0, 158.0, 262.0, 393.0, 610.0, 898.0, 1466.0, 2260.0, 3491.0, 5534.0, 8680.0, 13908.0, 23463.0, 40485.0, 75046.0, 147212.0, 256414.0, 215325.0, 111782.0, 57901.0, 32297.0, 18997.0, 11660.0, 7238.0, 4590.0, 2811.0, 1815.0, 1235.0, 781.0, 517.0, 342.0, 224.0, 148.0, 112.0, 60.0, 43.0, 34.0, 20.0, 7.0, 8.0, 3.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7509765625, -0.726593017578125, -0.70220947265625, -0.677825927734375, -0.6534423828125, -0.629058837890625, -0.60467529296875, -0.580291748046875, -0.555908203125, -0.531524658203125, -0.50714111328125, -0.482757568359375, -0.4583740234375, -0.433990478515625, -0.40960693359375, -0.385223388671875, -0.36083984375, -0.336456298828125, -0.31207275390625, -0.287689208984375, -0.2633056640625, -0.238922119140625, -0.21453857421875, -0.190155029296875, -0.165771484375, -0.141387939453125, -0.11700439453125, -0.092620849609375, -0.0682373046875, -0.043853759765625, -0.01947021484375, 0.004913330078125, 0.029296875, 0.053680419921875, 0.07806396484375, 0.102447509765625, 0.1268310546875, 0.151214599609375, 0.17559814453125, 0.199981689453125, 0.224365234375, 0.248748779296875, 0.27313232421875, 0.297515869140625, 0.3218994140625, 0.346282958984375, 0.37066650390625, 0.395050048828125, 0.41943359375, 0.443817138671875, 0.46820068359375, 0.492584228515625, 0.5169677734375, 0.541351318359375, 0.56573486328125, 0.590118408203125, 0.614501953125, 0.638885498046875, 0.66326904296875, 0.687652587890625, 0.7120361328125, 0.736419677734375, 0.76080322265625, 0.785186767578125, 0.8095703125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 5.0, 3.0, 7.0, 9.0, 11.0, 16.0, 14.0, 17.0, 14.0, 17.0, 32.0, 20.0, 28.0, 33.0, 35.0, 40.0, 38.0, 38.0, 47.0, 50.0, 1069.0, 52.0, 34.0, 31.0, 37.0, 36.0, 37.0, 35.0, 27.0, 26.0, 29.0, 18.0, 11.0, 16.0, 11.0, 13.0, 7.0, 17.0, 9.0, 5.0, 4.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0], "bins": [-3.076171875, -2.988128662109375, -2.90008544921875, -2.812042236328125, -2.7239990234375, -2.635955810546875, -2.54791259765625, -2.459869384765625, -2.371826171875, -2.283782958984375, -2.19573974609375, -2.107696533203125, -2.0196533203125, -1.931610107421875, -1.84356689453125, -1.755523681640625, -1.66748046875, -1.579437255859375, -1.49139404296875, -1.403350830078125, -1.3153076171875, -1.227264404296875, -1.13922119140625, -1.051177978515625, -0.963134765625, -0.875091552734375, -0.78704833984375, -0.699005126953125, -0.6109619140625, -0.522918701171875, -0.43487548828125, -0.346832275390625, -0.2587890625, -0.170745849609375, -0.08270263671875, 0.005340576171875, 0.0933837890625, 0.181427001953125, 0.26947021484375, 0.357513427734375, 0.445556640625, 0.533599853515625, 0.62164306640625, 0.709686279296875, 0.7977294921875, 0.885772705078125, 0.97381591796875, 1.061859130859375, 1.14990234375, 1.237945556640625, 1.32598876953125, 1.414031982421875, 1.5020751953125, 1.590118408203125, 1.67816162109375, 1.766204833984375, 1.854248046875, 1.942291259765625, 2.03033447265625, 2.118377685546875, 2.2064208984375, 2.294464111328125, 2.38250732421875, 2.470550537109375, 2.55859375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 9.0, 18.0, 23.0, 45.0, 52.0, 77.0, 130.0, 165.0, 260.0, 439.0, 595.0, 1008.0, 1606.0, 2525.0, 4139.0, 6757.0, 11422.0, 19449.0, 34005.0, 61358.0, 112590.0, 195856.0, 1282080.0, 159925.0, 87398.0, 48065.0, 27553.0, 15593.0, 9251.0, 5595.0, 3432.0, 2061.0, 1257.0, 836.0, 539.0, 358.0, 214.0, 140.0, 97.0, 64.0, 39.0, 32.0, 13.0, 23.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.53076171875, -0.5143280029296875, -0.497894287109375, -0.4814605712890625, -0.46502685546875, -0.4485931396484375, -0.432159423828125, -0.4157257080078125, -0.3992919921875, -0.3828582763671875, -0.366424560546875, -0.3499908447265625, -0.33355712890625, -0.3171234130859375, -0.300689697265625, -0.2842559814453125, -0.267822265625, -0.2513885498046875, -0.234954833984375, -0.2185211181640625, -0.20208740234375, -0.1856536865234375, -0.169219970703125, -0.1527862548828125, -0.1363525390625, -0.1199188232421875, -0.103485107421875, -0.0870513916015625, -0.07061767578125, -0.0541839599609375, -0.037750244140625, -0.0213165283203125, -0.0048828125, 0.0115509033203125, 0.027984619140625, 0.0444183349609375, 0.06085205078125, 0.0772857666015625, 0.093719482421875, 0.1101531982421875, 0.1265869140625, 0.1430206298828125, 0.159454345703125, 0.1758880615234375, 0.19232177734375, 0.2087554931640625, 0.225189208984375, 0.2416229248046875, 0.258056640625, 0.2744903564453125, 0.290924072265625, 0.3073577880859375, 0.32379150390625, 0.3402252197265625, 0.356658935546875, 0.3730926513671875, 0.3895263671875, 0.4059600830078125, 0.422393798828125, 0.4388275146484375, 0.45526123046875, 0.4716949462890625, 0.488128662109375, 0.5045623779296875, 0.52099609375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 5.0, 6.0, 7.0, 12.0, 20.0, 14.0, 18.0, 19.0, 18.0, 18.0, 25.0, 25.0, 32.0, 50.0, 34.0, 45.0, 47.0, 43.0, 57.0, 51.0, 41.0, 46.0, 33.0, 36.0, 39.0, 36.0, 34.0, 22.0, 30.0, 21.0, 19.0, 18.0, 16.0, 11.0, 4.0, 7.0, 8.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.00141143798828125, -0.0013677775859832764, -0.0013241171836853027, -0.001280456781387329, -0.0012367963790893555, -0.0011931359767913818, -0.0011494755744934082, -0.0011058151721954346, -0.001062154769897461, -0.0010184943675994873, -0.0009748339653015137, -0.00093117356300354, -0.0008875131607055664, -0.0008438527584075928, -0.0008001923561096191, -0.0007565319538116455, -0.0007128715515136719, -0.0006692111492156982, -0.0006255507469177246, -0.000581890344619751, -0.0005382299423217773, -0.0004945695400238037, -0.0004509091377258301, -0.00040724873542785645, -0.0003635883331298828, -0.0003199279308319092, -0.00027626752853393555, -0.00023260712623596191, -0.00018894672393798828, -0.00014528632164001465, -0.00010162591934204102, -5.796551704406738e-05, -1.430511474609375e-05, 2.9355287551879883e-05, 7.301568984985352e-05, 0.00011667609214782715, 0.00016033649444580078, 0.00020399689674377441, 0.00024765729904174805, 0.0002913177013397217, 0.0003349781036376953, 0.00037863850593566895, 0.0004222989082336426, 0.0004659593105316162, 0.0005096197128295898, 0.0005532801151275635, 0.0005969405174255371, 0.0006406009197235107, 0.0006842613220214844, 0.000727921724319458, 0.0007715821266174316, 0.0008152425289154053, 0.0008589029312133789, 0.0009025633335113525, 0.0009462237358093262, 0.0009898841381072998, 0.0010335445404052734, 0.001077204942703247, 0.0011208653450012207, 0.0011645257472991943, 0.001208186149597168, 0.0012518465518951416, 0.0012955069541931152, 0.0013391673564910889, 0.0013828277587890625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 6.0, 5.0, 8.0, 8.0, 11.0, 27.0, 23.0, 24.0, 37.0, 52.0, 72.0, 104.0, 134.0, 231.0, 401.0, 772.0, 7304.0, 932237.0, 103894.0, 1785.0, 534.0, 283.0, 176.0, 129.0, 66.0, 53.0, 33.0, 36.0, 25.0, 14.0, 18.0, 9.0, 10.0, 8.0, 8.0, 5.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0401611328125, -0.03889656066894531, -0.037631988525390625, -0.03636741638183594, -0.03510284423828125, -0.03383827209472656, -0.032573699951171875, -0.03130912780761719, -0.0300445556640625, -0.028779983520507812, -0.027515411376953125, -0.026250839233398438, -0.02498626708984375, -0.023721694946289062, -0.022457122802734375, -0.021192550659179688, -0.019927978515625, -0.018663406372070312, -0.017398834228515625, -0.016134262084960938, -0.01486968994140625, -0.013605117797851562, -0.012340545654296875, -0.011075973510742188, -0.0098114013671875, -0.008546829223632812, -0.007282257080078125, -0.0060176849365234375, -0.00475311279296875, -0.0034885406494140625, -0.002223968505859375, -0.0009593963623046875, 0.00030517578125, 0.0015697479248046875, 0.002834320068359375, 0.0040988922119140625, 0.00536346435546875, 0.0066280364990234375, 0.007892608642578125, 0.009157180786132812, 0.0104217529296875, 0.011686325073242188, 0.012950897216796875, 0.014215469360351562, 0.01548004150390625, 0.016744613647460938, 0.018009185791015625, 0.019273757934570312, 0.020538330078125, 0.021802902221679688, 0.023067474365234375, 0.024332046508789062, 0.02559661865234375, 0.026861190795898438, 0.028125762939453125, 0.029390335083007812, 0.0306549072265625, 0.03191947937011719, 0.033184051513671875, 0.03444862365722656, 0.03571319580078125, 0.03697776794433594, 0.038242340087890625, 0.03950691223144531, 0.040771484375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 364.0, 642.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007213766220957041, -0.006619041319936514, -0.006024316884577274, -0.0054295919835567474, -0.0048348670825362206, -0.004240142181515694, -0.0036454175133258104, -0.003050692845135927, -0.0024559679441154003, -0.0018612431595101953, -0.0012665183749049902, -0.0006717935902997851, -7.706880569458008e-05, 0.0005176560953259468, 0.00111238076351583, 0.0017071054317057133, 0.00230183033272624, 0.002896555233746767, 0.0034912799019366503, 0.0040860045701265335, 0.00468072947114706, 0.005275454372167587, 0.005870179273188114, 0.006464903708547354, 0.007059628609567881, 0.0076543535105884075, 0.008249077945947647, 0.008843802846968174, 0.0094385277479887, 0.010033252649009228, 0.010627977550029755, 0.011222701519727707, 0.011817427352070808, 0.012412152253091335, 0.013006877154111862, 0.013601602055132389, 0.014196326956152916, 0.014791050925850868, 0.015385775826871395, 0.015980500727891922, 0.016575224697589874, 0.017169948667287827, 0.017764674499630928, 0.01835939846932888, 0.018954124301671982, 0.019548848271369934, 0.020143574103713036, 0.020738298073410988, 0.02133302390575409, 0.02192774787545204, 0.022522473707795143, 0.023117197677493095, 0.023711923509836197, 0.02430664747953415, 0.02490137331187725, 0.025496097281575203, 0.026090823113918304, 0.026685547083616257, 0.027280272915959358, 0.02787499688565731, 0.028469722718000412, 0.029064446687698364, 0.029659172520041466, 0.030253896489739418, 0.03084862045943737]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 8.0, 6.0, 3.0, 8.0, 7.0, 14.0, 12.0, 17.0, 15.0, 25.0, 29.0, 20.0, 32.0, 28.0, 38.0, 41.0, 40.0, 46.0, 48.0, 52.0, 56.0, 48.0, 48.0, 47.0, 49.0, 37.0, 40.0, 35.0, 18.0, 21.0, 19.0, 16.0, 15.0, 15.0, 16.0, 3.0, 3.0, 11.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0009328126907348633, -0.0009030187502503395, -0.0008732248097658157, -0.000843430869281292, -0.0008136369287967682, -0.0007838429883122444, -0.0007540490478277206, -0.0007242551073431969, -0.0006944611668586731, -0.0006646672263741493, -0.0006348732858896255, -0.0006050793454051018, -0.000575285404920578, -0.0005454914644360542, -0.0005156975239515305, -0.0004859035834670067, -0.0004561096429824829, -0.00042631570249795914, -0.00039652176201343536, -0.0003667278215289116, -0.0003369338810443878, -0.00030713994055986404, -0.00027734600007534027, -0.0002475520595908165, -0.00021775811910629272, -0.00018796417862176895, -0.00015817023813724518, -0.0001283762976527214, -9.858235716819763e-05, -6.878841668367386e-05, -3.8994476199150085e-05, -9.200535714626312e-06, 2.059340476989746e-05, 5.0387345254421234e-05, 8.018128573894501e-05, 0.00010997522622346878, 0.00013976916670799255, 0.00016956310719251633, 0.0001993570476770401, 0.00022915098816156387, 0.00025894492864608765, 0.0002887388691306114, 0.0003185328096151352, 0.00034832675009965897, 0.00037812069058418274, 0.0004079146310687065, 0.0004377085715532303, 0.00046750251203775406, 0.0004972964525222778, 0.0005270903930068016, 0.0005568843334913254, 0.0005866782739758492, 0.0006164722144603729, 0.0006462661549448967, 0.0006760600954294205, 0.0007058540359139442, 0.000735647976398468, 0.0007654419168829918, 0.0007952358573675156, 0.0008250297978520393, 0.0008548237383365631, 0.0008846176788210869, 0.0009144116193056107, 0.0009442055597901344, 0.0009739995002746582]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 5.0, 6.0, 14.0, 18.0, 13.0, 19.0, 30.0, 20.0, 26.0, 36.0, 31.0, 34.0, 44.0, 34.0, 42.0, 36.0, 28.0, 32.0, 37.0, 44.0, 36.0, 40.0, 34.0, 35.0, 33.0, 29.0, 29.0, 27.0, 26.0, 14.0, 23.0, 17.0, 26.0, 10.0, 12.0, 6.0, 5.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-4.5234375, -4.3868408203125, -4.250244140625, -4.1136474609375, -3.97705078125, -3.8404541015625, -3.703857421875, -3.5672607421875, -3.4306640625, -3.2940673828125, -3.157470703125, -3.0208740234375, -2.88427734375, -2.7476806640625, -2.611083984375, -2.4744873046875, -2.337890625, -2.2012939453125, -2.064697265625, -1.9281005859375, -1.79150390625, -1.6549072265625, -1.518310546875, -1.3817138671875, -1.2451171875, -1.1085205078125, -0.971923828125, -0.8353271484375, -0.69873046875, -0.5621337890625, -0.425537109375, -0.2889404296875, -0.15234375, -0.0157470703125, 0.120849609375, 0.2574462890625, 0.39404296875, 0.5306396484375, 0.667236328125, 0.8038330078125, 0.9404296875, 1.0770263671875, 1.213623046875, 1.3502197265625, 1.48681640625, 1.6234130859375, 1.760009765625, 1.8966064453125, 2.033203125, 2.1697998046875, 2.306396484375, 2.4429931640625, 2.57958984375, 2.7161865234375, 2.852783203125, 2.9893798828125, 3.1259765625, 3.2625732421875, 3.399169921875, 3.5357666015625, 3.67236328125, 3.8089599609375, 3.945556640625, 4.0821533203125, 4.21875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 10.0, 13.0, 9.0, 26.0, 27.0, 34.0, 52.0, 64.0, 125.0, 164.0, 269.0, 419.0, 715.0, 1185.0, 2142.0, 3516.0, 6099.0, 10663.0, 19423.0, 38587.0, 86865.0, 270870.0, 384790.0, 119545.0, 48566.0, 23858.0, 12763.0, 7380.0, 4211.0, 2430.0, 1497.0, 858.0, 493.0, 284.0, 190.0, 139.0, 76.0, 58.0, 43.0, 31.0, 19.0, 11.0, 13.0, 14.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.1875, -3.09136962890625, -2.9952392578125, -2.89910888671875, -2.802978515625, -2.70684814453125, -2.6107177734375, -2.51458740234375, -2.41845703125, -2.32232666015625, -2.2261962890625, -2.13006591796875, -2.033935546875, -1.93780517578125, -1.8416748046875, -1.74554443359375, -1.6494140625, -1.55328369140625, -1.4571533203125, -1.36102294921875, -1.264892578125, -1.16876220703125, -1.0726318359375, -0.97650146484375, -0.88037109375, -0.78424072265625, -0.6881103515625, -0.59197998046875, -0.495849609375, -0.39971923828125, -0.3035888671875, -0.20745849609375, -0.111328125, -0.01519775390625, 0.0809326171875, 0.17706298828125, 0.273193359375, 0.36932373046875, 0.4654541015625, 0.56158447265625, 0.65771484375, 0.75384521484375, 0.8499755859375, 0.94610595703125, 1.042236328125, 1.13836669921875, 1.2344970703125, 1.33062744140625, 1.4267578125, 1.52288818359375, 1.6190185546875, 1.71514892578125, 1.811279296875, 1.90740966796875, 2.0035400390625, 2.09967041015625, 2.19580078125, 2.29193115234375, 2.3880615234375, 2.48419189453125, 2.580322265625, 2.67645263671875, 2.7725830078125, 2.86871337890625, 2.96484375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 5.0, 10.0, 11.0, 7.0, 11.0, 23.0, 18.0, 20.0, 22.0, 22.0, 29.0, 35.0, 43.0, 38.0, 37.0, 72.0, 179.0, 1693.0, 225.0, 81.0, 65.0, 44.0, 45.0, 40.0, 32.0, 33.0, 28.0, 24.0, 20.0, 31.0, 22.0, 13.0, 12.0, 10.0, 7.0, 9.0, 3.0, 4.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.8046875, -13.2845458984375, -12.764404296875, -12.2442626953125, -11.72412109375, -11.2039794921875, -10.683837890625, -10.1636962890625, -9.6435546875, -9.1234130859375, -8.603271484375, -8.0831298828125, -7.56298828125, -7.0428466796875, -6.522705078125, -6.0025634765625, -5.482421875, -4.9622802734375, -4.442138671875, -3.9219970703125, -3.40185546875, -2.8817138671875, -2.361572265625, -1.8414306640625, -1.3212890625, -0.8011474609375, -0.281005859375, 0.2391357421875, 0.75927734375, 1.2794189453125, 1.799560546875, 2.3197021484375, 2.83984375, 3.3599853515625, 3.880126953125, 4.4002685546875, 4.92041015625, 5.4405517578125, 5.960693359375, 6.4808349609375, 7.0009765625, 7.5211181640625, 8.041259765625, 8.5614013671875, 9.08154296875, 9.6016845703125, 10.121826171875, 10.6419677734375, 11.162109375, 11.6822509765625, 12.202392578125, 12.7225341796875, 13.24267578125, 13.7628173828125, 14.282958984375, 14.8031005859375, 15.3232421875, 15.8433837890625, 16.363525390625, 16.8836669921875, 17.40380859375, 17.9239501953125, 18.444091796875, 18.9642333984375, 19.484375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 13.0, 13.0, 10.0, 21.0, 32.0, 40.0, 56.0, 72.0, 97.0, 179.0, 279.0, 556.0, 2920.0, 2910897.0, 227915.0, 1542.0, 423.0, 230.0, 128.0, 76.0, 61.0, 38.0, 19.0, 26.0, 14.0, 12.0, 5.0, 7.0, 9.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.09375, -46.53662109375, -44.9794921875, -43.42236328125, -41.865234375, -40.30810546875, -38.7509765625, -37.19384765625, -35.63671875, -34.07958984375, -32.5224609375, -30.96533203125, -29.408203125, -27.85107421875, -26.2939453125, -24.73681640625, -23.1796875, -21.62255859375, -20.0654296875, -18.50830078125, -16.951171875, -15.39404296875, -13.8369140625, -12.27978515625, -10.72265625, -9.16552734375, -7.6083984375, -6.05126953125, -4.494140625, -2.93701171875, -1.3798828125, 0.17724609375, 1.734375, 3.29150390625, 4.8486328125, 6.40576171875, 7.962890625, 9.52001953125, 11.0771484375, 12.63427734375, 14.19140625, 15.74853515625, 17.3056640625, 18.86279296875, 20.419921875, 21.97705078125, 23.5341796875, 25.09130859375, 26.6484375, 28.20556640625, 29.7626953125, 31.31982421875, 32.876953125, 34.43408203125, 35.9912109375, 37.54833984375, 39.10546875, 40.66259765625, 42.2197265625, 43.77685546875, 45.333984375, 46.89111328125, 48.4482421875, 50.00537109375, 51.5625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 187.0, 759.0, 69.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.774166107177734, -20.15549087524414, -15.53681468963623, -10.91813850402832, -6.299463272094727, -1.6807880401611328, 2.9378890991210938, 7.5565643310546875, 12.175239562988281, 16.793914794921875, 21.41259002685547, 26.031267166137695, 30.64994239807129, 35.26861572265625, 39.88729476928711, 44.5059700012207, 49.1246452331543, 53.74332046508789, 58.361995697021484, 62.980674743652344, 67.59934997558594, 72.21802520751953, 76.83670043945312, 81.45537567138672, 86.07405090332031, 90.6927261352539, 95.3114013671875, 99.9300765991211, 104.54875183105469, 109.16742706298828, 113.78610229492188, 118.40478515625, 123.02345275878906, 127.64212799072266, 132.26080322265625, 136.87948608398438, 141.49815368652344, 146.11683654785156, 150.73550415039062, 155.35418701171875, 159.9728546142578, 164.59153747558594, 169.210205078125, 173.82888793945312, 178.4475555419922, 183.0662384033203, 187.68490600585938, 192.3035888671875, 196.92227172851562, 201.54095458984375, 206.1596221923828, 210.77830505371094, 215.39697265625, 220.01565551757812, 224.6343231201172, 229.2530059814453, 233.87167358398438, 238.4903564453125, 243.10902404785156, 247.7277069091797, 252.34637451171875, 256.9650573730469, 261.583740234375, 266.202392578125, 270.8210754394531]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 8.0, 5.0, 14.0, 5.0, 5.0, 19.0, 18.0, 16.0, 18.0, 19.0, 26.0, 24.0, 27.0, 31.0, 37.0, 37.0, 40.0, 46.0, 35.0, 36.0, 40.0, 42.0, 44.0, 34.0, 37.0, 39.0, 30.0, 31.0, 33.0, 33.0, 37.0, 22.0, 19.0, 18.0, 18.0, 15.0, 6.0, 1.0, 13.0, 6.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.74343490600586, -43.338130950927734, -41.932823181152344, -40.52751922607422, -39.12221145629883, -37.7169075012207, -36.31159973144531, -34.90629577636719, -33.5009880065918, -32.09568405151367, -30.69037628173828, -29.285070419311523, -27.879764556884766, -26.474458694458008, -25.06915283203125, -23.663848876953125, -22.258543014526367, -20.85323715209961, -19.44793128967285, -18.042625427246094, -16.637319564819336, -15.232013702392578, -13.826708793640137, -12.421402931213379, -11.016097068786621, -9.610791206359863, -8.205485343933105, -6.800179958343506, -5.394874095916748, -3.9895682334899902, -2.5842628479003906, -1.1789569854736328, 0.226348876953125, 1.6316546201705933, 3.0369603633880615, 4.44226598739624, 5.847571849822998, 7.252877712249756, 8.658183097839355, 10.063488960266113, 11.468794822692871, 12.874100685119629, 14.279406547546387, 15.684711456298828, 17.090017318725586, 18.495323181152344, 19.9006290435791, 21.30593490600586, 22.711240768432617, 24.116546630859375, 25.521852493286133, 26.92715835571289, 28.33246421813965, 29.737770080566406, 31.14307403564453, 32.54838180541992, 33.95368576049805, 35.35898971557617, 36.76429748535156, 38.16960144042969, 39.57490921020508, 40.9802131652832, 42.385520935058594, 43.79082489013672, 45.19613265991211]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 2.0, 4.0, 1.0, 5.0, 10.0, 10.0, 11.0, 9.0, 17.0, 18.0, 14.0, 30.0, 30.0, 32.0, 30.0, 34.0, 38.0, 38.0, 29.0, 43.0, 39.0, 39.0, 32.0, 34.0, 48.0, 50.0, 35.0, 27.0, 30.0, 23.0, 30.0, 30.0, 26.0, 25.0, 21.0, 22.0, 16.0, 14.0, 13.0, 5.0, 10.0, 5.0, 6.0, 6.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.69921875, -4.55474853515625, -4.4102783203125, -4.26580810546875, -4.121337890625, -3.97686767578125, -3.8323974609375, -3.68792724609375, -3.54345703125, -3.39898681640625, -3.2545166015625, -3.11004638671875, -2.965576171875, -2.82110595703125, -2.6766357421875, -2.53216552734375, -2.3876953125, -2.24322509765625, -2.0987548828125, -1.95428466796875, -1.809814453125, -1.66534423828125, -1.5208740234375, -1.37640380859375, -1.23193359375, -1.08746337890625, -0.9429931640625, -0.79852294921875, -0.654052734375, -0.50958251953125, -0.3651123046875, -0.22064208984375, -0.076171875, 0.06829833984375, 0.2127685546875, 0.35723876953125, 0.501708984375, 0.64617919921875, 0.7906494140625, 0.93511962890625, 1.07958984375, 1.22406005859375, 1.3685302734375, 1.51300048828125, 1.657470703125, 1.80194091796875, 1.9464111328125, 2.09088134765625, 2.2353515625, 2.37982177734375, 2.5242919921875, 2.66876220703125, 2.813232421875, 2.95770263671875, 3.1021728515625, 3.24664306640625, 3.39111328125, 3.53558349609375, 3.6800537109375, 3.82452392578125, 3.968994140625, 4.11346435546875, 4.2579345703125, 4.40240478515625, 4.546875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 10.0, 14.0, 22.0, 20.0, 26.0, 45.0, 59.0, 72.0, 102.0, 149.0, 222.0, 322.0, 541.0, 1027.0, 1993.0, 4663.0, 13065.0, 48782.0, 262994.0, 1251775.0, 1857373.0, 607925.0, 104905.0, 23947.0, 7720.0, 2978.0, 1409.0, 725.0, 432.0, 266.0, 192.0, 146.0, 94.0, 64.0, 37.0, 49.0, 21.0, 18.0, 12.0, 14.0, 12.0, 5.0, 10.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.56640625, -6.32537841796875, -6.0843505859375, -5.84332275390625, -5.602294921875, -5.36126708984375, -5.1202392578125, -4.87921142578125, -4.63818359375, -4.39715576171875, -4.1561279296875, -3.91510009765625, -3.674072265625, -3.43304443359375, -3.1920166015625, -2.95098876953125, -2.7099609375, -2.46893310546875, -2.2279052734375, -1.98687744140625, -1.745849609375, -1.50482177734375, -1.2637939453125, -1.02276611328125, -0.78173828125, -0.54071044921875, -0.2996826171875, -0.05865478515625, 0.182373046875, 0.42340087890625, 0.6644287109375, 0.90545654296875, 1.146484375, 1.38751220703125, 1.6285400390625, 1.86956787109375, 2.110595703125, 2.35162353515625, 2.5926513671875, 2.83367919921875, 3.07470703125, 3.31573486328125, 3.5567626953125, 3.79779052734375, 4.038818359375, 4.27984619140625, 4.5208740234375, 4.76190185546875, 5.0029296875, 5.24395751953125, 5.4849853515625, 5.72601318359375, 5.967041015625, 6.20806884765625, 6.4490966796875, 6.69012451171875, 6.93115234375, 7.17218017578125, 7.4132080078125, 7.65423583984375, 7.895263671875, 8.13629150390625, 8.3773193359375, 8.61834716796875, 8.859375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 5.0, 8.0, 9.0, 7.0, 15.0, 25.0, 36.0, 52.0, 84.0, 98.0, 145.0, 191.0, 235.0, 361.0, 412.0, 448.0, 507.0, 375.0, 301.0, 218.0, 154.0, 112.0, 74.0, 58.0, 40.0, 33.0, 24.0, 18.0, 10.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3359375, -10.96728515625, -10.5986328125, -10.22998046875, -9.861328125, -9.49267578125, -9.1240234375, -8.75537109375, -8.38671875, -8.01806640625, -7.6494140625, -7.28076171875, -6.912109375, -6.54345703125, -6.1748046875, -5.80615234375, -5.4375, -5.06884765625, -4.7001953125, -4.33154296875, -3.962890625, -3.59423828125, -3.2255859375, -2.85693359375, -2.48828125, -2.11962890625, -1.7509765625, -1.38232421875, -1.013671875, -0.64501953125, -0.2763671875, 0.09228515625, 0.4609375, 0.82958984375, 1.1982421875, 1.56689453125, 1.935546875, 2.30419921875, 2.6728515625, 3.04150390625, 3.41015625, 3.77880859375, 4.1474609375, 4.51611328125, 4.884765625, 5.25341796875, 5.6220703125, 5.99072265625, 6.359375, 6.72802734375, 7.0966796875, 7.46533203125, 7.833984375, 8.20263671875, 8.5712890625, 8.93994140625, 9.30859375, 9.67724609375, 10.0458984375, 10.41455078125, 10.783203125, 11.15185546875, 11.5205078125, 11.88916015625, 12.2578125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 5.0, 7.0, 6.0, 12.0, 9.0, 21.0, 24.0, 41.0, 42.0, 52.0, 97.0, 112.0, 169.0, 223.0, 550.0, 1685.0, 37444.0, 3770563.0, 376571.0, 4780.0, 796.0, 347.0, 216.0, 150.0, 95.0, 68.0, 47.0, 39.0, 33.0, 25.0, 11.0, 11.0, 16.0, 3.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.875, -32.607421875, -31.33984375, -30.072265625, -28.8046875, -27.537109375, -26.26953125, -25.001953125, -23.734375, -22.466796875, -21.19921875, -19.931640625, -18.6640625, -17.396484375, -16.12890625, -14.861328125, -13.59375, -12.326171875, -11.05859375, -9.791015625, -8.5234375, -7.255859375, -5.98828125, -4.720703125, -3.453125, -2.185546875, -0.91796875, 0.349609375, 1.6171875, 2.884765625, 4.15234375, 5.419921875, 6.6875, 7.955078125, 9.22265625, 10.490234375, 11.7578125, 13.025390625, 14.29296875, 15.560546875, 16.828125, 18.095703125, 19.36328125, 20.630859375, 21.8984375, 23.166015625, 24.43359375, 25.701171875, 26.96875, 28.236328125, 29.50390625, 30.771484375, 32.0390625, 33.306640625, 34.57421875, 35.841796875, 37.109375, 38.376953125, 39.64453125, 40.912109375, 42.1796875, 43.447265625, 44.71484375, 45.982421875, 47.25]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 8.0, 74.0, 270.0, 376.0, 226.0, 44.0, 11.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.75665283203125, -65.4729232788086, -60.18919372558594, -54.905460357666016, -49.62173080444336, -44.3380012512207, -39.05426788330078, -33.770538330078125, -28.48680877685547, -23.203079223632812, -17.919347763061523, -12.63561725616455, -7.351886749267578, -2.068157196044922, 3.215574264526367, 8.499305725097656, 13.783035278320312, 19.06676483154297, 24.350496292114258, 29.634227752685547, 34.9179573059082, 40.20168685913086, 45.48542022705078, 50.76914978027344, 56.052879333496094, 61.33660888671875, 66.6203384399414, 71.90406799316406, 77.18780517578125, 82.47152709960938, 87.75526428222656, 93.03899383544922, 98.32272338867188, 103.60645294189453, 108.89018249511719, 114.17391204833984, 119.4576416015625, 124.74137878417969, 130.0251007080078, 135.308837890625, 140.59255981445312, 145.8762969970703, 151.16001892089844, 156.44375610351562, 161.72747802734375, 167.01121520996094, 172.29493713378906, 177.57867431640625, 182.86241149902344, 188.14614868164062, 193.42987060546875, 198.71360778808594, 203.99732971191406, 209.28106689453125, 214.56478881835938, 219.84852600097656, 225.13226318359375, 230.41600036621094, 235.69972229003906, 240.98345947265625, 246.26718139648438, 251.55091857910156, 256.83465576171875, 262.1183776855469, 267.402099609375]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 6.0, 5.0, 11.0, 9.0, 18.0, 9.0, 20.0, 15.0, 19.0, 19.0, 22.0, 24.0, 28.0, 26.0, 46.0, 31.0, 45.0, 38.0, 41.0, 32.0, 43.0, 48.0, 37.0, 34.0, 38.0, 36.0, 26.0, 29.0, 34.0, 17.0, 24.0, 22.0, 23.0, 23.0, 18.0, 14.0, 20.0, 6.0, 12.0, 6.0, 5.0, 6.0, 0.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.296630859375, -32.26353454589844, -31.23044204711914, -30.19734764099121, -29.16425323486328, -28.13115882873535, -27.098064422607422, -26.064970016479492, -25.031875610351562, -23.998781204223633, -22.965686798095703, -21.932592391967773, -20.899497985839844, -19.866403579711914, -18.833309173583984, -17.800214767456055, -16.767120361328125, -15.734025955200195, -14.700931549072266, -13.667837142944336, -12.634742736816406, -11.601648330688477, -10.568553924560547, -9.535459518432617, -8.502365112304688, -7.469270706176758, -6.436176300048828, -5.403081893920898, -4.369987487792969, -3.336893081665039, -2.3037986755371094, -1.2707042694091797, -0.23760986328125, 0.7954845428466797, 1.8285789489746094, 2.861673355102539, 3.8947677612304688, 4.927862167358398, 5.960956573486328, 6.994050979614258, 8.027145385742188, 9.060239791870117, 10.093334197998047, 11.126428604125977, 12.159523010253906, 13.192617416381836, 14.225711822509766, 15.258806228637695, 16.291900634765625, 17.324995040893555, 18.358089447021484, 19.391183853149414, 20.424278259277344, 21.457372665405273, 22.490467071533203, 23.523561477661133, 24.556655883789062, 25.589750289916992, 26.622844696044922, 27.65593910217285, 28.68903350830078, 29.72212791442871, 30.75522232055664, 31.78831672668457, 32.8214111328125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 7.0, 10.0, 15.0, 17.0, 17.0, 21.0, 29.0, 33.0, 32.0, 32.0, 40.0, 38.0, 46.0, 44.0, 42.0, 42.0, 51.0, 42.0, 46.0, 40.0, 44.0, 40.0, 35.0, 38.0, 38.0, 26.0, 26.0, 19.0, 15.0, 17.0, 15.0, 13.0, 10.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.99505615234375, -4.8260498046875, -4.65704345703125, -4.488037109375, -4.31903076171875, -4.1500244140625, -3.98101806640625, -3.81201171875, -3.64300537109375, -3.4739990234375, -3.30499267578125, -3.135986328125, -2.96697998046875, -2.7979736328125, -2.62896728515625, -2.4599609375, -2.29095458984375, -2.1219482421875, -1.95294189453125, -1.783935546875, -1.61492919921875, -1.4459228515625, -1.27691650390625, -1.10791015625, -0.93890380859375, -0.7698974609375, -0.60089111328125, -0.431884765625, -0.26287841796875, -0.0938720703125, 0.07513427734375, 0.244140625, 0.41314697265625, 0.5821533203125, 0.75115966796875, 0.920166015625, 1.08917236328125, 1.2581787109375, 1.42718505859375, 1.59619140625, 1.76519775390625, 1.9342041015625, 2.10321044921875, 2.272216796875, 2.44122314453125, 2.6102294921875, 2.77923583984375, 2.9482421875, 3.11724853515625, 3.2862548828125, 3.45526123046875, 3.624267578125, 3.79327392578125, 3.9622802734375, 4.13128662109375, 4.30029296875, 4.46929931640625, 4.6383056640625, 4.80731201171875, 4.976318359375, 5.14532470703125, 5.3143310546875, 5.48333740234375, 5.65234375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 11.0, 13.0, 21.0, 34.0, 49.0, 56.0, 79.0, 107.0, 136.0, 200.0, 303.0, 424.0, 646.0, 907.0, 1370.0, 2016.0, 2831.0, 4187.0, 6236.0, 9394.0, 14321.0, 22065.0, 34259.0, 55022.0, 89569.0, 148893.0, 207474.0, 168601.0, 103533.0, 63244.0, 39051.0, 24920.0, 15895.0, 10536.0, 7142.0, 4708.0, 3257.0, 2242.0, 1520.0, 1053.0, 676.0, 495.0, 341.0, 210.0, 149.0, 115.0, 71.0, 53.0, 38.0, 32.0, 23.0, 8.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 3.0, 3.0], "bins": [-0.572265625, -0.5535888671875, -0.534912109375, -0.5162353515625, -0.49755859375, -0.4788818359375, -0.460205078125, -0.4415283203125, -0.4228515625, -0.4041748046875, -0.385498046875, -0.3668212890625, -0.34814453125, -0.3294677734375, -0.310791015625, -0.2921142578125, -0.2734375, -0.2547607421875, -0.236083984375, -0.2174072265625, -0.19873046875, -0.1800537109375, -0.161376953125, -0.1427001953125, -0.1240234375, -0.1053466796875, -0.086669921875, -0.0679931640625, -0.04931640625, -0.0306396484375, -0.011962890625, 0.0067138671875, 0.025390625, 0.0440673828125, 0.062744140625, 0.0814208984375, 0.10009765625, 0.1187744140625, 0.137451171875, 0.1561279296875, 0.1748046875, 0.1934814453125, 0.212158203125, 0.2308349609375, 0.24951171875, 0.2681884765625, 0.286865234375, 0.3055419921875, 0.32421875, 0.3428955078125, 0.361572265625, 0.3802490234375, 0.39892578125, 0.4176025390625, 0.436279296875, 0.4549560546875, 0.4736328125, 0.4923095703125, 0.510986328125, 0.5296630859375, 0.54833984375, 0.5670166015625, 0.585693359375, 0.6043701171875, 0.623046875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 12.0, 7.0, 11.0, 11.0, 12.0, 17.0, 31.0, 36.0, 40.0, 31.0, 39.0, 51.0, 43.0, 37.0, 58.0, 1092.0, 59.0, 54.0, 48.0, 43.0, 44.0, 28.0, 42.0, 21.0, 34.0, 16.0, 28.0, 21.0, 14.0, 12.0, 8.0, 1.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.16015625, -3.04095458984375, -2.9217529296875, -2.80255126953125, -2.683349609375, -2.56414794921875, -2.4449462890625, -2.32574462890625, -2.20654296875, -2.08734130859375, -1.9681396484375, -1.84893798828125, -1.729736328125, -1.61053466796875, -1.4913330078125, -1.37213134765625, -1.2529296875, -1.13372802734375, -1.0145263671875, -0.89532470703125, -0.776123046875, -0.65692138671875, -0.5377197265625, -0.41851806640625, -0.29931640625, -0.18011474609375, -0.0609130859375, 0.05828857421875, 0.177490234375, 0.29669189453125, 0.4158935546875, 0.53509521484375, 0.654296875, 0.77349853515625, 0.8927001953125, 1.01190185546875, 1.131103515625, 1.25030517578125, 1.3695068359375, 1.48870849609375, 1.60791015625, 1.72711181640625, 1.8463134765625, 1.96551513671875, 2.084716796875, 2.20391845703125, 2.3231201171875, 2.44232177734375, 2.5615234375, 2.68072509765625, 2.7999267578125, 2.91912841796875, 3.038330078125, 3.15753173828125, 3.2767333984375, 3.39593505859375, 3.51513671875, 3.63433837890625, 3.7535400390625, 3.87274169921875, 3.991943359375, 4.11114501953125, 4.2303466796875, 4.34954833984375, 4.46875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 14.0, 9.0, 33.0, 47.0, 59.0, 116.0, 184.0, 317.0, 507.0, 972.0, 1786.0, 3371.0, 6347.0, 12190.0, 24481.0, 51877.0, 113925.0, 243317.0, 1343093.0, 156745.0, 70913.0, 33023.0, 16154.0, 8192.0, 4359.0, 2259.0, 1234.0, 682.0, 374.0, 222.0, 108.0, 78.0, 52.0, 36.0, 16.0, 17.0, 10.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79248046875, -0.7693099975585938, -0.7461395263671875, -0.7229690551757812, -0.699798583984375, -0.6766281127929688, -0.6534576416015625, -0.6302871704101562, -0.60711669921875, -0.5839462280273438, -0.5607757568359375, -0.5376052856445312, -0.514434814453125, -0.49126434326171875, -0.4680938720703125, -0.44492340087890625, -0.4217529296875, -0.39858245849609375, -0.3754119873046875, -0.35224151611328125, -0.329071044921875, -0.30590057373046875, -0.2827301025390625, -0.25955963134765625, -0.23638916015625, -0.21321868896484375, -0.1900482177734375, -0.16687774658203125, -0.143707275390625, -0.12053680419921875, -0.0973663330078125, -0.07419586181640625, -0.051025390625, -0.02785491943359375, -0.0046844482421875, 0.01848602294921875, 0.041656494140625, 0.06482696533203125, 0.0879974365234375, 0.11116790771484375, 0.13433837890625, 0.15750885009765625, 0.1806793212890625, 0.20384979248046875, 0.227020263671875, 0.25019073486328125, 0.2733612060546875, 0.29653167724609375, 0.3197021484375, 0.34287261962890625, 0.3660430908203125, 0.38921356201171875, 0.412384033203125, 0.43555450439453125, 0.4587249755859375, 0.48189544677734375, 0.50506591796875, 0.5282363891601562, 0.5514068603515625, 0.5745773315429688, 0.597747802734375, 0.6209182739257812, 0.6440887451171875, 0.6672592163085938, 0.6904296875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 8.0, 3.0, 6.0, 11.0, 15.0, 19.0, 19.0, 22.0, 30.0, 33.0, 34.0, 37.0, 56.0, 63.0, 49.0, 68.0, 62.0, 66.0, 60.0, 67.0, 39.0, 49.0, 38.0, 39.0, 26.0, 24.0, 15.0, 9.0, 9.0, 6.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0017576217651367188, -0.0016979724168777466, -0.0016383230686187744, -0.0015786737203598022, -0.00151902437210083, -0.001459375023841858, -0.0013997256755828857, -0.0013400763273239136, -0.0012804269790649414, -0.0012207776308059692, -0.001161128282546997, -0.001101478934288025, -0.0010418295860290527, -0.0009821802377700806, -0.0009225308895111084, -0.0008628815412521362, -0.0008032321929931641, -0.0007435828447341919, -0.0006839334964752197, -0.0006242841482162476, -0.0005646347999572754, -0.0005049854516983032, -0.00044533610343933105, -0.0003856867551803589, -0.0003260374069213867, -0.00026638805866241455, -0.00020673871040344238, -0.00014708936214447021, -8.744001388549805e-05, -2.779066562652588e-05, 3.185868263244629e-05, 9.150803089141846e-05, 0.00015115737915039062, 0.0002108067274093628, 0.00027045607566833496, 0.00033010542392730713, 0.0003897547721862793, 0.00044940412044525146, 0.0005090534687042236, 0.0005687028169631958, 0.000628352165222168, 0.0006880015134811401, 0.0007476508617401123, 0.0008073002099990845, 0.0008669495582580566, 0.0009265989065170288, 0.000986248254776001, 0.0010458976030349731, 0.0011055469512939453, 0.0011651962995529175, 0.0012248456478118896, 0.0012844949960708618, 0.001344144344329834, 0.0014037936925888062, 0.0014634430408477783, 0.0015230923891067505, 0.0015827417373657227, 0.0016423910856246948, 0.001702040433883667, 0.0017616897821426392, 0.0018213391304016113, 0.0018809884786605835, 0.0019406378269195557, 0.002000287175178528, 0.0020599365234375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 6.0, 9.0, 13.0, 18.0, 18.0, 19.0, 31.0, 41.0, 60.0, 71.0, 116.0, 191.0, 360.0, 677.0, 3511.0, 663000.0, 376312.0, 2525.0, 646.0, 280.0, 192.0, 117.0, 73.0, 59.0, 34.0, 38.0, 29.0, 21.0, 17.0, 16.0, 13.0, 5.0, 8.0, 3.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0394287109375, -0.03826713562011719, -0.037105560302734375, -0.03594398498535156, -0.03478240966796875, -0.03362083435058594, -0.032459259033203125, -0.03129768371582031, -0.0301361083984375, -0.028974533081054688, -0.027812957763671875, -0.026651382446289062, -0.02548980712890625, -0.024328231811523438, -0.023166656494140625, -0.022005081176757812, -0.020843505859375, -0.019681930541992188, -0.018520355224609375, -0.017358779907226562, -0.01619720458984375, -0.015035629272460938, -0.013874053955078125, -0.012712478637695312, -0.0115509033203125, -0.010389328002929688, -0.009227752685546875, -0.008066177368164062, -0.00690460205078125, -0.0057430267333984375, -0.004581451416015625, -0.0034198760986328125, -0.00225830078125, -0.0010967254638671875, 6.4849853515625e-05, 0.0012264251708984375, 0.00238800048828125, 0.0035495758056640625, 0.004711151123046875, 0.0058727264404296875, 0.0070343017578125, 0.008195877075195312, 0.009357452392578125, 0.010519027709960938, 0.01168060302734375, 0.012842178344726562, 0.014003753662109375, 0.015165328979492188, 0.016326904296875, 0.017488479614257812, 0.018650054931640625, 0.019811630249023438, 0.02097320556640625, 0.022134780883789062, 0.023296356201171875, 0.024457931518554688, 0.0256195068359375, 0.026781082153320312, 0.027942657470703125, 0.029104232788085938, 0.03026580810546875, 0.03142738342285156, 0.032588958740234375, 0.03375053405761719, 0.034912109375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 22.0, 93.0, 270.0, 350.0, 191.0, 66.0, 13.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006533139385282993, -0.006395274773240089, -0.0062574101611971855, -0.006119545549154282, -0.00598168047145009, -0.0058438158594071865, -0.005705951247364283, -0.005568086635321379, -0.005430222023278475, -0.005292357411235571, -0.005154492799192667, -0.005016627721488476, -0.004878763109445572, -0.004740898497402668, -0.004603033885359764, -0.00446516927331686, -0.004327304661273956, -0.004189440049231052, -0.0040515754371881485, -0.003913710825145245, -0.003775845980271697, -0.0036379811353981495, -0.0035001165233552456, -0.0033622519113123417, -0.0032243868336081505, -0.0030865222215652466, -0.002948657376691699, -0.002810792764648795, -0.0026729281526058912, -0.0025350633077323437, -0.0023971986956894398, -0.002259334083646536, -0.0021214692387729883, -0.0019836046267300844, -0.0018457398982718587, -0.001707875169813633, -0.001570010557770729, -0.0014321458293125033, -0.0012942811008542776, -0.0011564164888113737, -0.001018551760353148, -0.0008806870901025832, -0.0007428224198520184, -0.0006049576913937926, -0.0004670930211432278, -0.000329228350892663, -0.00019136362243443727, -5.349895218387246e-05, 8.436571806669235e-05, 0.0002222304028691724, 0.00036009508767165244, 0.0004979597870260477, 0.0006358244572766125, 0.0007736891275271773, 0.0009115538559854031, 0.001049418468028307, 0.0011872831964865327, 0.0013251479249447584, 0.0014630125369876623, 0.001600877265445888, 0.0017387419939041138, 0.0018766066059470177, 0.0020144712179899216, 0.002152336062863469, 0.002290200674906373]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 9.0, 6.0, 13.0, 15.0, 19.0, 18.0, 25.0, 27.0, 33.0, 37.0, 38.0, 36.0, 50.0, 37.0, 46.0, 44.0, 60.0, 48.0, 60.0, 48.0, 36.0, 37.0, 31.0, 36.0, 42.0, 27.0, 29.0, 23.0, 14.0, 12.0, 14.0, 3.0, 4.0, 6.0, 4.0, 3.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0012736916542053223, -0.0012402180582284927, -0.0012067444622516632, -0.0011732708662748337, -0.0011397972702980042, -0.0011063236743211746, -0.001072850078344345, -0.0010393764823675156, -0.001005902886390686, -0.0009724292904138565, -0.000938955694437027, -0.0009054820984601974, -0.0008720085024833679, -0.0008385349065065384, -0.0008050613105297089, -0.0007715877145528793, -0.0007381141185760498, -0.0007046405225992203, -0.0006711669266223907, -0.0006376933306455612, -0.0006042197346687317, -0.0005707461386919022, -0.0005372725427150726, -0.0005037989467382431, -0.0004703253507614136, -0.00043685175478458405, -0.0004033781588077545, -0.000369904562830925, -0.00033643096685409546, -0.00030295737087726593, -0.0002694837749004364, -0.00023601017892360687, -0.00020253658294677734, -0.00016906298696994781, -0.00013558939099311829, -0.00010211579501628876, -6.864219903945923e-05, -3.51686030626297e-05, -1.695007085800171e-06, 3.177858889102936e-05, 6.525218486785889e-05, 9.872578084468842e-05, 0.00013219937682151794, 0.00016567297279834747, 0.000199146568775177, 0.00023262016475200653, 0.00026609376072883606, 0.0002995673567056656, 0.0003330409526824951, 0.00036651454865932465, 0.0003999881446361542, 0.0004334617406129837, 0.00046693533658981323, 0.0005004089325666428, 0.0005338825285434723, 0.0005673561245203018, 0.0006008297204971313, 0.0006343033164739609, 0.0006677769124507904, 0.0007012505084276199, 0.0007347241044044495, 0.000768197700381279, 0.0008016712963581085, 0.000835144892334938, 0.0008686184883117676]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 7.0, 10.0, 15.0, 17.0, 17.0, 21.0, 29.0, 33.0, 32.0, 32.0, 40.0, 38.0, 46.0, 44.0, 42.0, 42.0, 51.0, 42.0, 46.0, 40.0, 44.0, 40.0, 35.0, 38.0, 38.0, 26.0, 26.0, 19.0, 15.0, 17.0, 15.0, 13.0, 10.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.99505615234375, -4.8260498046875, -4.65704345703125, -4.488037109375, -4.31903076171875, -4.1500244140625, -3.98101806640625, -3.81201171875, -3.64300537109375, -3.4739990234375, -3.30499267578125, -3.135986328125, -2.96697998046875, -2.7979736328125, -2.62896728515625, -2.4599609375, -2.29095458984375, -2.1219482421875, -1.95294189453125, -1.783935546875, -1.61492919921875, -1.4459228515625, -1.27691650390625, -1.10791015625, -0.93890380859375, -0.7698974609375, -0.60089111328125, -0.431884765625, -0.26287841796875, -0.0938720703125, 0.07513427734375, 0.244140625, 0.41314697265625, 0.5821533203125, 0.75115966796875, 0.920166015625, 1.08917236328125, 1.2581787109375, 1.42718505859375, 1.59619140625, 1.76519775390625, 1.9342041015625, 2.10321044921875, 2.272216796875, 2.44122314453125, 2.6102294921875, 2.77923583984375, 2.9482421875, 3.11724853515625, 3.2862548828125, 3.45526123046875, 3.624267578125, 3.79327392578125, 3.9622802734375, 4.13128662109375, 4.30029296875, 4.46929931640625, 4.6383056640625, 4.80731201171875, 4.976318359375, 5.14532470703125, 5.3143310546875, 5.48333740234375, 5.65234375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 8.0, 4.0, 17.0, 14.0, 29.0, 22.0, 60.0, 68.0, 124.0, 150.0, 259.0, 430.0, 723.0, 1161.0, 2214.0, 4652.0, 9282.0, 19245.0, 39847.0, 85007.0, 197958.0, 350414.0, 182708.0, 80820.0, 37225.0, 17993.0, 8699.0, 4274.0, 2160.0, 1161.0, 638.0, 401.0, 253.0, 148.0, 127.0, 94.0, 61.0, 29.0, 18.0, 17.0, 15.0, 10.0, 2.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-3.40625, -3.304443359375, -3.20263671875, -3.100830078125, -2.9990234375, -2.897216796875, -2.79541015625, -2.693603515625, -2.591796875, -2.489990234375, -2.38818359375, -2.286376953125, -2.1845703125, -2.082763671875, -1.98095703125, -1.879150390625, -1.77734375, -1.675537109375, -1.57373046875, -1.471923828125, -1.3701171875, -1.268310546875, -1.16650390625, -1.064697265625, -0.962890625, -0.861083984375, -0.75927734375, -0.657470703125, -0.5556640625, -0.453857421875, -0.35205078125, -0.250244140625, -0.1484375, -0.046630859375, 0.05517578125, 0.156982421875, 0.2587890625, 0.360595703125, 0.46240234375, 0.564208984375, 0.666015625, 0.767822265625, 0.86962890625, 0.971435546875, 1.0732421875, 1.175048828125, 1.27685546875, 1.378662109375, 1.48046875, 1.582275390625, 1.68408203125, 1.785888671875, 1.8876953125, 1.989501953125, 2.09130859375, 2.193115234375, 2.294921875, 2.396728515625, 2.49853515625, 2.600341796875, 2.7021484375, 2.803955078125, 2.90576171875, 3.007568359375, 3.109375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 2.0, 4.0, 9.0, 8.0, 10.0, 8.0, 16.0, 18.0, 23.0, 24.0, 25.0, 31.0, 38.0, 37.0, 49.0, 51.0, 66.0, 101.0, 354.0, 1598.0, 142.0, 69.0, 54.0, 44.0, 32.0, 40.0, 34.0, 29.0, 22.0, 22.0, 15.0, 11.0, 8.0, 12.0, 12.0, 11.0, 7.0, 6.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.96875, -20.35546875, -19.7421875, -19.12890625, -18.515625, -17.90234375, -17.2890625, -16.67578125, -16.0625, -15.44921875, -14.8359375, -14.22265625, -13.609375, -12.99609375, -12.3828125, -11.76953125, -11.15625, -10.54296875, -9.9296875, -9.31640625, -8.703125, -8.08984375, -7.4765625, -6.86328125, -6.25, -5.63671875, -5.0234375, -4.41015625, -3.796875, -3.18359375, -2.5703125, -1.95703125, -1.34375, -0.73046875, -0.1171875, 0.49609375, 1.109375, 1.72265625, 2.3359375, 2.94921875, 3.5625, 4.17578125, 4.7890625, 5.40234375, 6.015625, 6.62890625, 7.2421875, 7.85546875, 8.46875, 9.08203125, 9.6953125, 10.30859375, 10.921875, 11.53515625, 12.1484375, 12.76171875, 13.375, 13.98828125, 14.6015625, 15.21484375, 15.828125, 16.44140625, 17.0546875, 17.66796875, 18.28125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 10.0, 11.0, 15.0, 12.0, 14.0, 17.0, 17.0, 37.0, 41.0, 67.0, 83.0, 125.0, 148.0, 212.0, 343.0, 922.0, 6851.0, 2998578.0, 134317.0, 2278.0, 538.0, 320.0, 206.0, 124.0, 95.0, 66.0, 60.0, 53.0, 30.0, 18.0, 25.0, 11.0, 14.0, 9.0, 11.0, 6.0, 6.0, 6.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.25, -39.865234375, -38.48046875, -37.095703125, -35.7109375, -34.326171875, -32.94140625, -31.556640625, -30.171875, -28.787109375, -27.40234375, -26.017578125, -24.6328125, -23.248046875, -21.86328125, -20.478515625, -19.09375, -17.708984375, -16.32421875, -14.939453125, -13.5546875, -12.169921875, -10.78515625, -9.400390625, -8.015625, -6.630859375, -5.24609375, -3.861328125, -2.4765625, -1.091796875, 0.29296875, 1.677734375, 3.0625, 4.447265625, 5.83203125, 7.216796875, 8.6015625, 9.986328125, 11.37109375, 12.755859375, 14.140625, 15.525390625, 16.91015625, 18.294921875, 19.6796875, 21.064453125, 22.44921875, 23.833984375, 25.21875, 26.603515625, 27.98828125, 29.373046875, 30.7578125, 32.142578125, 33.52734375, 34.912109375, 36.296875, 37.681640625, 39.06640625, 40.451171875, 41.8359375, 43.220703125, 44.60546875, 45.990234375, 47.375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 3.0, 8.0, 15.0, 24.0, 31.0, 40.0, 65.0, 98.0, 115.0, 121.0, 111.0, 103.0, 85.0, 70.0, 43.0, 29.0, 12.0, 14.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.285987854003906, -13.757482528686523, -13.22897720336914, -12.700471878051758, -12.171966552734375, -11.643461227416992, -11.114956855773926, -10.586451530456543, -10.05794620513916, -9.529440879821777, -9.000935554504395, -8.472430229187012, -7.943925380706787, -7.415420055389404, -6.88691520690918, -6.358409881591797, -5.829904556274414, -5.301399230957031, -4.772893905639648, -4.244389057159424, -3.715883731842041, -3.187378406524658, -2.6588733196258545, -2.130368232727051, -1.601862907409668, -1.0733577013015747, -0.5448524951934814, -0.016347289085388184, 0.5121579170227051, 1.040663242340088, 1.5691683292388916, 2.0976734161376953, 2.6261768341064453, 3.154682159423828, 3.683187246322632, 4.2116923332214355, 4.740197658538818, 5.268702983856201, 5.797207832336426, 6.325713157653809, 6.854218482971191, 7.382723808288574, 7.911229133605957, 8.43973445892334, 8.968238830566406, 9.496744155883789, 10.025249481201172, 10.553754806518555, 11.082260131835938, 11.61076545715332, 12.139270782470703, 12.667776107788086, 13.196281433105469, 13.724786758422852, 14.253291130065918, 14.7817964553833, 15.310301780700684, 15.838807106018066, 16.367311477661133, 16.895816802978516, 17.4243221282959, 17.95282745361328, 18.481332778930664, 19.009838104248047, 19.53834342956543]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 13.0, 16.0, 21.0, 16.0, 28.0, 27.0, 34.0, 36.0, 36.0, 39.0, 52.0, 50.0, 33.0, 47.0, 47.0, 51.0, 42.0, 48.0, 56.0, 42.0, 42.0, 36.0, 37.0, 22.0, 18.0, 28.0, 23.0, 7.0, 12.0, 8.0, 4.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.11354064941406, -41.5509033203125, -39.98826599121094, -38.425628662109375, -36.86299133300781, -35.30035400390625, -33.73771667480469, -32.175079345703125, -30.612443923950195, -29.049806594848633, -27.48716926574707, -25.92453384399414, -24.361896514892578, -22.799259185791016, -21.236621856689453, -19.67398452758789, -18.111347198486328, -16.548709869384766, -14.986072540283203, -13.423436164855957, -11.860798835754395, -10.298161506652832, -8.735525131225586, -7.172887802124023, -5.610250473022461, -4.047613143920898, -2.484976291656494, -0.9223394393920898, 0.6402978897094727, 2.202935218811035, 3.7655715942382812, 5.328208923339844, 6.890850067138672, 8.453487396240234, 10.016124725341797, 11.578761100769043, 13.141398429870605, 14.704035758972168, 16.266672134399414, 17.829309463500977, 19.39194679260254, 20.9545841217041, 22.517221450805664, 24.079856872558594, 25.642494201660156, 27.20513153076172, 28.76776885986328, 30.330406188964844, 31.893043518066406, 33.45568084716797, 35.01831817626953, 36.580955505371094, 38.143592834472656, 39.70623016357422, 41.26886749267578, 42.831504821777344, 44.394142150878906, 45.95677947998047, 47.51941680908203, 49.082054138183594, 50.644691467285156, 52.20732879638672, 53.76996612548828, 55.332603454589844, 56.89523696899414]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 13.0, 16.0, 19.0, 25.0, 22.0, 30.0, 33.0, 39.0, 36.0, 38.0, 37.0, 38.0, 53.0, 44.0, 40.0, 49.0, 45.0, 45.0, 37.0, 50.0, 36.0, 39.0, 40.0, 24.0, 25.0, 20.0, 18.0, 15.0, 18.0, 10.0, 13.0, 5.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.27734375, -5.10015869140625, -4.9229736328125, -4.74578857421875, -4.568603515625, -4.39141845703125, -4.2142333984375, -4.03704833984375, -3.85986328125, -3.68267822265625, -3.5054931640625, -3.32830810546875, -3.151123046875, -2.97393798828125, -2.7967529296875, -2.61956787109375, -2.4423828125, -2.26519775390625, -2.0880126953125, -1.91082763671875, -1.733642578125, -1.55645751953125, -1.3792724609375, -1.20208740234375, -1.02490234375, -0.84771728515625, -0.6705322265625, -0.49334716796875, -0.316162109375, -0.13897705078125, 0.0382080078125, 0.21539306640625, 0.392578125, 0.56976318359375, 0.7469482421875, 0.92413330078125, 1.101318359375, 1.27850341796875, 1.4556884765625, 1.63287353515625, 1.81005859375, 1.98724365234375, 2.1644287109375, 2.34161376953125, 2.518798828125, 2.69598388671875, 2.8731689453125, 3.05035400390625, 3.2275390625, 3.40472412109375, 3.5819091796875, 3.75909423828125, 3.936279296875, 4.11346435546875, 4.2906494140625, 4.46783447265625, 4.64501953125, 4.82220458984375, 4.9993896484375, 5.17657470703125, 5.353759765625, 5.53094482421875, 5.7081298828125, 5.88531494140625, 6.0625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 9.0, 9.0, 19.0, 15.0, 18.0, 30.0, 20.0, 22.0, 35.0, 38.0, 36.0, 48.0, 102.0, 472.0, 4020.0, 104376.0, 3497289.0, 575300.0, 10971.0, 974.0, 139.0, 56.0, 45.0, 36.0, 37.0, 32.0, 30.0, 17.0, 19.0, 9.0, 14.0, 17.0, 12.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.46875, -18.765380859375, -18.06201171875, -17.358642578125, -16.6552734375, -15.951904296875, -15.24853515625, -14.545166015625, -13.841796875, -13.138427734375, -12.43505859375, -11.731689453125, -11.0283203125, -10.324951171875, -9.62158203125, -8.918212890625, -8.21484375, -7.511474609375, -6.80810546875, -6.104736328125, -5.4013671875, -4.697998046875, -3.99462890625, -3.291259765625, -2.587890625, -1.884521484375, -1.18115234375, -0.477783203125, 0.2255859375, 0.928955078125, 1.63232421875, 2.335693359375, 3.0390625, 3.742431640625, 4.44580078125, 5.149169921875, 5.8525390625, 6.555908203125, 7.25927734375, 7.962646484375, 8.666015625, 9.369384765625, 10.07275390625, 10.776123046875, 11.4794921875, 12.182861328125, 12.88623046875, 13.589599609375, 14.29296875, 14.996337890625, 15.69970703125, 16.403076171875, 17.1064453125, 17.809814453125, 18.51318359375, 19.216552734375, 19.919921875, 20.623291015625, 21.32666015625, 22.030029296875, 22.7333984375, 23.436767578125, 24.14013671875, 24.843505859375, 25.546875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 6.0, 5.0, 5.0, 13.0, 28.0, 32.0, 36.0, 59.0, 65.0, 88.0, 101.0, 118.0, 185.0, 232.0, 276.0, 334.0, 418.0, 407.0, 384.0, 276.0, 233.0, 173.0, 121.0, 111.0, 97.0, 69.0, 58.0, 36.0, 20.0, 16.0, 16.0, 15.0, 12.0, 3.0, 2.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.90625, -10.6041259765625, -10.302001953125, -9.9998779296875, -9.69775390625, -9.3956298828125, -9.093505859375, -8.7913818359375, -8.4892578125, -8.1871337890625, -7.885009765625, -7.5828857421875, -7.28076171875, -6.9786376953125, -6.676513671875, -6.3743896484375, -6.072265625, -5.7701416015625, -5.468017578125, -5.1658935546875, -4.86376953125, -4.5616455078125, -4.259521484375, -3.9573974609375, -3.6552734375, -3.3531494140625, -3.051025390625, -2.7489013671875, -2.44677734375, -2.1446533203125, -1.842529296875, -1.5404052734375, -1.23828125, -0.9361572265625, -0.634033203125, -0.3319091796875, -0.02978515625, 0.2723388671875, 0.574462890625, 0.8765869140625, 1.1787109375, 1.4808349609375, 1.782958984375, 2.0850830078125, 2.38720703125, 2.6893310546875, 2.991455078125, 3.2935791015625, 3.595703125, 3.8978271484375, 4.199951171875, 4.5020751953125, 4.80419921875, 5.1063232421875, 5.408447265625, 5.7105712890625, 6.0126953125, 6.3148193359375, 6.616943359375, 6.9190673828125, 7.22119140625, 7.5233154296875, 7.825439453125, 8.1275634765625, 8.4296875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 7.0, 12.0, 13.0, 19.0, 31.0, 40.0, 32.0, 44.0, 61.0, 85.0, 121.0, 167.0, 239.0, 366.0, 1059.0, 10728.0, 1523143.0, 2639264.0, 16213.0, 1192.0, 444.0, 256.0, 190.0, 133.0, 112.0, 69.0, 54.0, 34.0, 26.0, 20.0, 23.0, 15.0, 12.0, 12.0, 6.0, 7.0, 5.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.6875, -33.49365234375, -32.2998046875, -31.10595703125, -29.912109375, -28.71826171875, -27.5244140625, -26.33056640625, -25.13671875, -23.94287109375, -22.7490234375, -21.55517578125, -20.361328125, -19.16748046875, -17.9736328125, -16.77978515625, -15.5859375, -14.39208984375, -13.1982421875, -12.00439453125, -10.810546875, -9.61669921875, -8.4228515625, -7.22900390625, -6.03515625, -4.84130859375, -3.6474609375, -2.45361328125, -1.259765625, -0.06591796875, 1.1279296875, 2.32177734375, 3.515625, 4.70947265625, 5.9033203125, 7.09716796875, 8.291015625, 9.48486328125, 10.6787109375, 11.87255859375, 13.06640625, 14.26025390625, 15.4541015625, 16.64794921875, 17.841796875, 19.03564453125, 20.2294921875, 21.42333984375, 22.6171875, 23.81103515625, 25.0048828125, 26.19873046875, 27.392578125, 28.58642578125, 29.7802734375, 30.97412109375, 32.16796875, 33.36181640625, 34.5556640625, 35.74951171875, 36.943359375, 38.13720703125, 39.3310546875, 40.52490234375, 41.71875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 136.0, 400.0, 387.0, 84.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.9327507019043, -54.79733657836914, -48.66192626953125, -42.526512145996094, -36.39109802246094, -30.255687713623047, -24.12027359008789, -17.98486328125, -11.849449157714844, -5.714036464691162, 0.42137622833251953, 6.556789398193359, 12.692201614379883, 18.827613830566406, 24.963027954101562, 31.098438262939453, 37.23385238647461, 43.369266510009766, 49.504676818847656, 55.64009094238281, 61.77550506591797, 67.91091918945312, 74.04632568359375, 80.1817398071289, 86.31715393066406, 92.45256805419922, 98.58798217773438, 104.723388671875, 110.85880279541016, 116.99421691894531, 123.12963104248047, 129.26504516601562, 135.4004669189453, 141.53587341308594, 147.67129516601562, 153.80670166015625, 159.94212341308594, 166.07752990722656, 172.21295166015625, 178.34835815429688, 184.4837646484375, 190.61917114257812, 196.7545928955078, 202.88999938964844, 209.02542114257812, 215.16082763671875, 221.29623413085938, 227.43165588378906, 233.56707763671875, 239.70248413085938, 245.83790588378906, 251.9733123779297, 258.1087341308594, 264.244140625, 270.3795471191406, 276.51495361328125, 282.6503601074219, 288.7857666015625, 294.9211730957031, 301.0566101074219, 307.1920166015625, 313.3274230957031, 319.46282958984375, 325.5982360839844, 331.7336730957031]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 2.0, 8.0, 7.0, 8.0, 13.0, 9.0, 12.0, 19.0, 27.0, 22.0, 22.0, 29.0, 33.0, 27.0, 29.0, 32.0, 45.0, 45.0, 45.0, 50.0, 50.0, 43.0, 34.0, 40.0, 39.0, 31.0, 39.0, 35.0, 21.0, 19.0, 23.0, 24.0, 18.0, 15.0, 17.0, 15.0, 13.0, 11.0, 7.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-35.31499481201172, -34.24851608276367, -33.18203353881836, -32.11555480957031, -31.049074172973633, -29.982593536376953, -28.916114807128906, -27.849634170532227, -26.783153533935547, -25.716672897338867, -24.65019416809082, -23.58371353149414, -22.51723289489746, -21.45075225830078, -20.384273529052734, -19.317792892456055, -18.251314163208008, -17.184833526611328, -16.11835479736328, -15.051874160766602, -13.985393524169922, -12.918913841247559, -11.852434158325195, -10.785953521728516, -9.719473838806152, -8.652994155883789, -7.586513519287109, -6.520033836364746, -5.453553676605225, -4.387073516845703, -3.32059383392334, -2.2541136741638184, -1.1876335144042969, -0.12115347385406494, 0.945326566696167, 2.0118064880371094, 3.078286647796631, 4.144766807556152, 5.211246490478516, 6.277726650238037, 7.344206809997559, 8.410686492919922, 9.477167129516602, 10.543646812438965, 11.610126495361328, 12.676607131958008, 13.743086814880371, 14.809566497802734, 15.876047134399414, 16.942527770996094, 18.00900650024414, 19.07548713684082, 20.1419677734375, 21.208446502685547, 22.274927139282227, 23.341407775878906, 24.407886505126953, 25.474367141723633, 26.54084587097168, 27.60732650756836, 28.67380714416504, 29.74028778076172, 30.806766510009766, 31.873247146606445, 32.939727783203125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 4.0, 11.0, 10.0, 18.0, 25.0, 17.0, 20.0, 30.0, 36.0, 31.0, 47.0, 30.0, 35.0, 52.0, 51.0, 48.0, 40.0, 46.0, 38.0, 42.0, 44.0, 53.0, 35.0, 28.0, 28.0, 36.0, 30.0, 24.0, 20.0, 18.0, 12.0, 14.0, 9.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.69134521484375, -5.5115966796875, -5.33184814453125, -5.152099609375, -4.97235107421875, -4.7926025390625, -4.61285400390625, -4.43310546875, -4.25335693359375, -4.0736083984375, -3.89385986328125, -3.714111328125, -3.53436279296875, -3.3546142578125, -3.17486572265625, -2.9951171875, -2.81536865234375, -2.6356201171875, -2.45587158203125, -2.276123046875, -2.09637451171875, -1.9166259765625, -1.73687744140625, -1.55712890625, -1.37738037109375, -1.1976318359375, -1.01788330078125, -0.838134765625, -0.65838623046875, -0.4786376953125, -0.29888916015625, -0.119140625, 0.06060791015625, 0.2403564453125, 0.42010498046875, 0.599853515625, 0.77960205078125, 0.9593505859375, 1.13909912109375, 1.31884765625, 1.49859619140625, 1.6783447265625, 1.85809326171875, 2.037841796875, 2.21759033203125, 2.3973388671875, 2.57708740234375, 2.7568359375, 2.93658447265625, 3.1163330078125, 3.29608154296875, 3.475830078125, 3.65557861328125, 3.8353271484375, 4.01507568359375, 4.19482421875, 4.37457275390625, 4.5543212890625, 4.73406982421875, 4.913818359375, 5.09356689453125, 5.2733154296875, 5.45306396484375, 5.6328125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 9.0, 15.0, 20.0, 23.0, 23.0, 52.0, 72.0, 111.0, 153.0, 238.0, 294.0, 480.0, 648.0, 986.0, 1384.0, 2024.0, 2940.0, 4248.0, 6210.0, 8900.0, 12948.0, 19150.0, 28483.0, 43178.0, 68363.0, 109443.0, 166293.0, 186960.0, 136546.0, 86206.0, 53897.0, 34797.0, 23162.0, 15783.0, 10860.0, 7272.0, 5048.0, 3519.0, 2399.0, 1699.0, 1132.0, 802.0, 553.0, 382.0, 269.0, 192.0, 126.0, 92.0, 48.0, 38.0, 33.0, 29.0, 10.0, 9.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.57666015625, -0.5582046508789062, -0.5397491455078125, -0.5212936401367188, -0.502838134765625, -0.48438262939453125, -0.4659271240234375, -0.44747161865234375, -0.42901611328125, -0.41056060791015625, -0.3921051025390625, -0.37364959716796875, -0.355194091796875, -0.33673858642578125, -0.3182830810546875, -0.29982757568359375, -0.2813720703125, -0.26291656494140625, -0.2444610595703125, -0.22600555419921875, -0.207550048828125, -0.18909454345703125, -0.1706390380859375, -0.15218353271484375, -0.13372802734375, -0.11527252197265625, -0.0968170166015625, -0.07836151123046875, -0.059906005859375, -0.04145050048828125, -0.0229949951171875, -0.00453948974609375, 0.013916015625, 0.03237152099609375, 0.0508270263671875, 0.06928253173828125, 0.087738037109375, 0.10619354248046875, 0.1246490478515625, 0.14310455322265625, 0.16156005859375, 0.18001556396484375, 0.1984710693359375, 0.21692657470703125, 0.235382080078125, 0.25383758544921875, 0.2722930908203125, 0.29074859619140625, 0.3092041015625, 0.32765960693359375, 0.3461151123046875, 0.36457061767578125, 0.383026123046875, 0.40148162841796875, 0.4199371337890625, 0.43839263916015625, 0.45684814453125, 0.47530364990234375, 0.4937591552734375, 0.5122146606445312, 0.530670166015625, 0.5491256713867188, 0.5675811767578125, 0.5860366821289062, 0.6044921875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 11.0, 9.0, 8.0, 11.0, 15.0, 23.0, 14.0, 19.0, 20.0, 29.0, 19.0, 27.0, 32.0, 49.0, 24.0, 38.0, 45.0, 47.0, 1066.0, 50.0, 43.0, 49.0, 45.0, 39.0, 30.0, 33.0, 29.0, 29.0, 23.0, 30.0, 19.0, 19.0, 8.0, 8.0, 13.0, 8.0, 12.0, 6.0, 8.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.08984375, -2.986602783203125, -2.88336181640625, -2.780120849609375, -2.6768798828125, -2.573638916015625, -2.47039794921875, -2.367156982421875, -2.263916015625, -2.160675048828125, -2.05743408203125, -1.954193115234375, -1.8509521484375, -1.747711181640625, -1.64447021484375, -1.541229248046875, -1.43798828125, -1.334747314453125, -1.23150634765625, -1.128265380859375, -1.0250244140625, -0.921783447265625, -0.81854248046875, -0.715301513671875, -0.612060546875, -0.508819580078125, -0.40557861328125, -0.302337646484375, -0.1990966796875, -0.095855712890625, 0.00738525390625, 0.110626220703125, 0.2138671875, 0.317108154296875, 0.42034912109375, 0.523590087890625, 0.6268310546875, 0.730072021484375, 0.83331298828125, 0.936553955078125, 1.039794921875, 1.143035888671875, 1.24627685546875, 1.349517822265625, 1.4527587890625, 1.555999755859375, 1.65924072265625, 1.762481689453125, 1.86572265625, 1.968963623046875, 2.07220458984375, 2.175445556640625, 2.2786865234375, 2.381927490234375, 2.48516845703125, 2.588409423828125, 2.691650390625, 2.794891357421875, 2.89813232421875, 3.001373291015625, 3.1046142578125, 3.207855224609375, 3.31109619140625, 3.414337158203125, 3.517578125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 7.0, 10.0, 24.0, 28.0, 42.0, 68.0, 102.0, 140.0, 208.0, 330.0, 495.0, 800.0, 1201.0, 1952.0, 3057.0, 4865.0, 7992.0, 12920.0, 21750.0, 38247.0, 68320.0, 126175.0, 213037.0, 1271163.0, 142384.0, 77031.0, 42312.0, 24680.0, 14365.0, 8763.0, 5327.0, 3283.0, 2164.0, 1379.0, 870.0, 562.0, 362.0, 250.0, 160.0, 91.0, 80.0, 36.0, 29.0, 16.0, 13.0, 11.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5576171875, -0.5402450561523438, -0.5228729248046875, -0.5055007934570312, -0.488128662109375, -0.47075653076171875, -0.4533843994140625, -0.43601226806640625, -0.41864013671875, -0.40126800537109375, -0.3838958740234375, -0.36652374267578125, -0.349151611328125, -0.33177947998046875, -0.3144073486328125, -0.29703521728515625, -0.2796630859375, -0.26229095458984375, -0.2449188232421875, -0.22754669189453125, -0.210174560546875, -0.19280242919921875, -0.1754302978515625, -0.15805816650390625, -0.14068603515625, -0.12331390380859375, -0.1059417724609375, -0.08856964111328125, -0.071197509765625, -0.05382537841796875, -0.0364532470703125, -0.01908111572265625, -0.001708984375, 0.01566314697265625, 0.0330352783203125, 0.05040740966796875, 0.067779541015625, 0.08515167236328125, 0.1025238037109375, 0.11989593505859375, 0.13726806640625, 0.15464019775390625, 0.1720123291015625, 0.18938446044921875, 0.206756591796875, 0.22412872314453125, 0.2415008544921875, 0.25887298583984375, 0.2762451171875, 0.29361724853515625, 0.3109893798828125, 0.32836151123046875, 0.345733642578125, 0.36310577392578125, 0.3804779052734375, 0.39785003662109375, 0.41522216796875, 0.43259429931640625, 0.4499664306640625, 0.46733856201171875, 0.484710693359375, 0.5020828247070312, 0.5194549560546875, 0.5368270874023438, 0.55419921875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 0.0, 4.0, 3.0, 2.0, 1.0, 10.0, 10.0, 8.0, 14.0, 23.0, 26.0, 38.0, 46.0, 45.0, 63.0, 54.0, 57.0, 83.0, 80.0, 65.0, 75.0, 68.0, 53.0, 37.0, 24.0, 23.0, 18.0, 13.0, 9.0, 13.0, 10.0, 9.0, 3.0, 3.0, 2.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001983642578125, -0.0019269287586212158, -0.0018702149391174316, -0.0018135011196136475, -0.0017567873001098633, -0.001700073480606079, -0.001643359661102295, -0.0015866458415985107, -0.0015299320220947266, -0.0014732182025909424, -0.0014165043830871582, -0.001359790563583374, -0.0013030767440795898, -0.0012463629245758057, -0.0011896491050720215, -0.0011329352855682373, -0.0010762214660644531, -0.001019507646560669, -0.0009627938270568848, -0.0009060800075531006, -0.0008493661880493164, -0.0007926523685455322, -0.000735938549041748, -0.0006792247295379639, -0.0006225109100341797, -0.0005657970905303955, -0.0005090832710266113, -0.00045236945152282715, -0.00039565563201904297, -0.0003389418125152588, -0.0002822279930114746, -0.00022551417350769043, -0.00016880035400390625, -0.00011208653450012207, -5.537271499633789e-05, 1.341104507446289e-06, 5.805492401123047e-05, 0.00011476874351501465, 0.00017148256301879883, 0.000228196382522583, 0.0002849102020263672, 0.00034162402153015137, 0.00039833784103393555, 0.0004550516605377197, 0.0005117654800415039, 0.0005684792995452881, 0.0006251931190490723, 0.0006819069385528564, 0.0007386207580566406, 0.0007953345775604248, 0.000852048397064209, 0.0009087622165679932, 0.0009654760360717773, 0.0010221898555755615, 0.0010789036750793457, 0.0011356174945831299, 0.001192331314086914, 0.0012490451335906982, 0.0013057589530944824, 0.0013624727725982666, 0.0014191865921020508, 0.001475900411605835, 0.0015326142311096191, 0.0015893280506134033, 0.0016460418701171875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 6.0, 13.0, 15.0, 6.0, 18.0, 17.0, 29.0, 32.0, 52.0, 72.0, 90.0, 161.0, 239.0, 447.0, 1373.0, 48974.0, 986823.0, 8276.0, 842.0, 370.0, 220.0, 137.0, 100.0, 59.0, 49.0, 30.0, 31.0, 15.0, 10.0, 13.0, 8.0, 4.0, 8.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.036773681640625, -0.03563642501831055, -0.034499168395996094, -0.03336191177368164, -0.03222465515136719, -0.031087398529052734, -0.02995014190673828, -0.028812885284423828, -0.027675628662109375, -0.026538372039794922, -0.02540111541748047, -0.024263858795166016, -0.023126602172851562, -0.02198934555053711, -0.020852088928222656, -0.019714832305908203, -0.01857757568359375, -0.017440319061279297, -0.016303062438964844, -0.01516580581665039, -0.014028549194335938, -0.012891292572021484, -0.011754035949707031, -0.010616779327392578, -0.009479522705078125, -0.008342266082763672, -0.007205009460449219, -0.006067752838134766, -0.0049304962158203125, -0.0037932395935058594, -0.0026559829711914062, -0.0015187263488769531, -0.0003814697265625, 0.0007557868957519531, 0.0018930435180664062, 0.0030303001403808594, 0.0041675567626953125, 0.005304813385009766, 0.006442070007324219, 0.007579326629638672, 0.008716583251953125, 0.009853839874267578, 0.010991096496582031, 0.012128353118896484, 0.013265609741210938, 0.01440286636352539, 0.015540122985839844, 0.016677379608154297, 0.01781463623046875, 0.018951892852783203, 0.020089149475097656, 0.02122640609741211, 0.022363662719726562, 0.023500919342041016, 0.02463817596435547, 0.025775432586669922, 0.026912689208984375, 0.028049945831298828, 0.02918720245361328, 0.030324459075927734, 0.03146171569824219, 0.03259897232055664, 0.033736228942871094, 0.03487348556518555, 0.0360107421875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 461.0, 539.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02173800580203533, -0.021312225610017776, -0.02088644541800022, -0.020460665225982666, -0.02003488503396511, -0.019609104841947556, -0.01918332278728485, -0.018757542595267296, -0.01833176240324974, -0.017905982211232185, -0.01748020201921463, -0.017054421827197075, -0.01662864163517952, -0.016202859580516815, -0.01577708125114441, -0.01535130012780428, -0.014925519935786724, -0.014499739743769169, -0.014073959551751614, -0.013648178428411484, -0.013222398236393929, -0.012796618044376373, -0.012370837852358818, -0.011945057660341263, -0.011519277468323708, -0.011093497276306152, -0.010667717084288597, -0.010241936892271042, -0.009816155768930912, -0.009390375576913357, -0.008964595384895802, -0.008538815192878246, -0.008113034069538116, -0.007687253877520561, -0.007261473219841719, -0.0068356930278241634, -0.006409912370145321, -0.005984132178127766, -0.00555835198611021, -0.005132571794092655, -0.004706791136413813, -0.004281010944396257, -0.003855230286717415, -0.0034294500946998596, -0.0030036696698516607, -0.002577889245003462, -0.0021521090529859066, -0.0017263286281377077, -0.0013005482032895088, -0.0008747678366489708, -0.00044898747000843287, -2.32071615755558e-05, 0.0004025732632726431, 0.000828353688120842, 0.0012541338801383972, 0.001679914304986596, 0.002105694729834795, 0.002531475154682994, 0.0029572555795311928, 0.003383035771548748, 0.003808816196396947, 0.004234596621245146, 0.004660376813262701, 0.005086157470941544, 0.005511937662959099]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 3.0, 4.0, 10.0, 10.0, 10.0, 14.0, 22.0, 33.0, 31.0, 36.0, 35.0, 48.0, 49.0, 62.0, 61.0, 48.0, 68.0, 53.0, 54.0, 51.0, 62.0, 44.0, 45.0, 35.0, 25.0, 19.0, 19.0, 18.0, 10.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000890195369720459, -0.0008535804226994514, -0.0008169654756784439, -0.0007803505286574364, -0.0007437355816364288, -0.0007071206346154213, -0.0006705056875944138, -0.0006338907405734062, -0.0005972757935523987, -0.0005606608465313911, -0.0005240458995103836, -0.00048743095248937607, -0.00045081600546836853, -0.000414201058447361, -0.00037758611142635345, -0.0003409711644053459, -0.0003043562173843384, -0.00026774127036333084, -0.0002311263233423233, -0.00019451137632131577, -0.00015789642930030823, -0.00012128148227930069, -8.466653525829315e-05, -4.8051588237285614e-05, -1.1436641216278076e-05, 2.517830580472946e-05, 6.1793252825737e-05, 9.840819984674454e-05, 0.00013502314686775208, 0.0001716380938887596, 0.00020825304090976715, 0.0002448679879307747, 0.0002814829349517822, 0.00031809788197278976, 0.0003547128289937973, 0.00039132777601480484, 0.0004279427230358124, 0.0004645576700568199, 0.0005011726170778275, 0.000537787564098835, 0.0005744025111198425, 0.0006110174581408501, 0.0006476324051618576, 0.0006842473521828651, 0.0007208622992038727, 0.0007574772462248802, 0.0007940921932458878, 0.0008307071402668953, 0.0008673220872879028, 0.0009039370343089104, 0.0009405519813299179, 0.0009771669283509254, 0.001013781875371933, 0.0010503968223929405, 0.001087011769413948, 0.0011236267164349556, 0.0011602416634559631, 0.0011968566104769707, 0.0012334715574979782, 0.0012700865045189857, 0.0013067014515399933, 0.0013433163985610008, 0.0013799313455820084, 0.001416546292603016, 0.0014531612396240234]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 4.0, 11.0, 10.0, 18.0, 25.0, 17.0, 20.0, 30.0, 36.0, 31.0, 47.0, 30.0, 35.0, 52.0, 51.0, 48.0, 40.0, 46.0, 38.0, 42.0, 44.0, 53.0, 35.0, 28.0, 28.0, 36.0, 30.0, 24.0, 20.0, 18.0, 12.0, 14.0, 9.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.69134521484375, -5.5115966796875, -5.33184814453125, -5.152099609375, -4.97235107421875, -4.7926025390625, -4.61285400390625, -4.43310546875, -4.25335693359375, -4.0736083984375, -3.89385986328125, -3.714111328125, -3.53436279296875, -3.3546142578125, -3.17486572265625, -2.9951171875, -2.81536865234375, -2.6356201171875, -2.45587158203125, -2.276123046875, -2.09637451171875, -1.9166259765625, -1.73687744140625, -1.55712890625, -1.37738037109375, -1.1976318359375, -1.01788330078125, -0.838134765625, -0.65838623046875, -0.4786376953125, -0.29888916015625, -0.119140625, 0.06060791015625, 0.2403564453125, 0.42010498046875, 0.599853515625, 0.77960205078125, 0.9593505859375, 1.13909912109375, 1.31884765625, 1.49859619140625, 1.6783447265625, 1.85809326171875, 2.037841796875, 2.21759033203125, 2.3973388671875, 2.57708740234375, 2.7568359375, 2.93658447265625, 3.1163330078125, 3.29608154296875, 3.475830078125, 3.65557861328125, 3.8353271484375, 4.01507568359375, 4.19482421875, 4.37457275390625, 4.5543212890625, 4.73406982421875, 4.913818359375, 5.09356689453125, 5.2733154296875, 5.45306396484375, 5.6328125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 9.0, 9.0, 12.0, 16.0, 21.0, 32.0, 41.0, 71.0, 90.0, 124.0, 179.0, 326.0, 624.0, 1071.0, 1961.0, 4085.0, 8629.0, 18704.0, 42999.0, 98098.0, 236251.0, 372985.0, 145431.0, 64077.0, 28148.0, 12520.0, 5856.0, 2826.0, 1405.0, 717.0, 444.0, 276.0, 143.0, 111.0, 74.0, 48.0, 39.0, 32.0, 23.0, 16.0, 17.0, 11.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.359375, -3.248291015625, -3.13720703125, -3.026123046875, -2.9150390625, -2.803955078125, -2.69287109375, -2.581787109375, -2.470703125, -2.359619140625, -2.24853515625, -2.137451171875, -2.0263671875, -1.915283203125, -1.80419921875, -1.693115234375, -1.58203125, -1.470947265625, -1.35986328125, -1.248779296875, -1.1376953125, -1.026611328125, -0.91552734375, -0.804443359375, -0.693359375, -0.582275390625, -0.47119140625, -0.360107421875, -0.2490234375, -0.137939453125, -0.02685546875, 0.084228515625, 0.1953125, 0.306396484375, 0.41748046875, 0.528564453125, 0.6396484375, 0.750732421875, 0.86181640625, 0.972900390625, 1.083984375, 1.195068359375, 1.30615234375, 1.417236328125, 1.5283203125, 1.639404296875, 1.75048828125, 1.861572265625, 1.97265625, 2.083740234375, 2.19482421875, 2.305908203125, 2.4169921875, 2.528076171875, 2.63916015625, 2.750244140625, 2.861328125, 2.972412109375, 3.08349609375, 3.194580078125, 3.3056640625, 3.416748046875, 3.52783203125, 3.638916015625, 3.75]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 4.0, 3.0, 3.0, 7.0, 3.0, 12.0, 8.0, 8.0, 7.0, 12.0, 13.0, 22.0, 18.0, 20.0, 25.0, 29.0, 26.0, 31.0, 33.0, 41.0, 39.0, 51.0, 86.0, 213.0, 1619.0, 215.0, 85.0, 55.0, 39.0, 44.0, 40.0, 43.0, 32.0, 31.0, 22.0, 19.0, 20.0, 11.0, 11.0, 14.0, 13.0, 4.0, 8.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-19.34375, -18.82763671875, -18.3115234375, -17.79541015625, -17.279296875, -16.76318359375, -16.2470703125, -15.73095703125, -15.21484375, -14.69873046875, -14.1826171875, -13.66650390625, -13.150390625, -12.63427734375, -12.1181640625, -11.60205078125, -11.0859375, -10.56982421875, -10.0537109375, -9.53759765625, -9.021484375, -8.50537109375, -7.9892578125, -7.47314453125, -6.95703125, -6.44091796875, -5.9248046875, -5.40869140625, -4.892578125, -4.37646484375, -3.8603515625, -3.34423828125, -2.828125, -2.31201171875, -1.7958984375, -1.27978515625, -0.763671875, -0.24755859375, 0.2685546875, 0.78466796875, 1.30078125, 1.81689453125, 2.3330078125, 2.84912109375, 3.365234375, 3.88134765625, 4.3974609375, 4.91357421875, 5.4296875, 5.94580078125, 6.4619140625, 6.97802734375, 7.494140625, 8.01025390625, 8.5263671875, 9.04248046875, 9.55859375, 10.07470703125, 10.5908203125, 11.10693359375, 11.623046875, 12.13916015625, 12.6552734375, 13.17138671875, 13.6875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 5.0, 7.0, 6.0, 9.0, 15.0, 11.0, 25.0, 24.0, 24.0, 44.0, 43.0, 75.0, 99.0, 122.0, 174.0, 214.0, 283.0, 591.0, 2575.0, 341800.0, 2792408.0, 5004.0, 764.0, 343.0, 249.0, 171.0, 121.0, 102.0, 80.0, 57.0, 51.0, 31.0, 37.0, 30.0, 20.0, 10.0, 21.0, 15.0, 9.0, 6.0, 5.0, 5.0, 5.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-33.875, -32.7119140625, -31.548828125, -30.3857421875, -29.22265625, -28.0595703125, -26.896484375, -25.7333984375, -24.5703125, -23.4072265625, -22.244140625, -21.0810546875, -19.91796875, -18.7548828125, -17.591796875, -16.4287109375, -15.265625, -14.1025390625, -12.939453125, -11.7763671875, -10.61328125, -9.4501953125, -8.287109375, -7.1240234375, -5.9609375, -4.7978515625, -3.634765625, -2.4716796875, -1.30859375, -0.1455078125, 1.017578125, 2.1806640625, 3.34375, 4.5068359375, 5.669921875, 6.8330078125, 7.99609375, 9.1591796875, 10.322265625, 11.4853515625, 12.6484375, 13.8115234375, 14.974609375, 16.1376953125, 17.30078125, 18.4638671875, 19.626953125, 20.7900390625, 21.953125, 23.1162109375, 24.279296875, 25.4423828125, 26.60546875, 27.7685546875, 28.931640625, 30.0947265625, 31.2578125, 32.4208984375, 33.583984375, 34.7470703125, 35.91015625, 37.0732421875, 38.236328125, 39.3994140625, 40.5625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 11.0, 338.0, 623.0, 44.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.69039916992188, -188.60650634765625, -184.5226287841797, -180.43873596191406, -176.3548583984375, -172.27096557617188, -168.1870880126953, -164.1031951904297, -160.01931762695312, -155.9354248046875, -151.85154724121094, -147.7676544189453, -143.68377685546875, -139.59988403320312, -135.51600646972656, -131.43211364746094, -127.34822845458984, -123.26434326171875, -119.18045806884766, -115.09657287597656, -111.01268768310547, -106.92880249023438, -102.84490966796875, -98.76103210449219, -94.67713928222656, -90.59325408935547, -86.50936889648438, -82.42548370361328, -78.34159851074219, -74.2577133178711, -70.173828125, -66.08993530273438, -62.00605010986328, -57.92216491699219, -53.838279724121094, -49.75439453125, -45.670509338378906, -41.58662414550781, -37.50273513793945, -33.41884994506836, -29.334964752197266, -25.251079559326172, -21.167194366455078, -17.08330726623535, -12.999422073364258, -8.915536880493164, -4.8316497802734375, -0.7477645874023438, 3.33612060546875, 7.420006275177002, 11.503891944885254, 15.587778091430664, 19.671663284301758, 23.75554847717285, 27.839435577392578, 31.923320770263672, 36.007205963134766, 40.09109115600586, 44.17497634887695, 48.25886535644531, 52.342750549316406, 56.4266357421875, 60.510520935058594, 64.59440612792969, 68.67829132080078]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 13.0, 6.0, 8.0, 9.0, 14.0, 15.0, 21.0, 28.0, 28.0, 26.0, 35.0, 27.0, 39.0, 27.0, 36.0, 45.0, 35.0, 53.0, 53.0, 31.0, 51.0, 47.0, 36.0, 34.0, 38.0, 22.0, 23.0, 22.0, 28.0, 20.0, 23.0, 13.0, 13.0, 13.0, 14.0, 10.0, 5.0, 4.0, 4.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0], "bins": [-52.956687927246094, -51.42449188232422, -49.892295837402344, -48.36009979248047, -46.82790756225586, -45.295711517333984, -43.76351547241211, -42.231319427490234, -40.699127197265625, -39.16693115234375, -37.634735107421875, -36.1025390625, -34.57034683227539, -33.038150787353516, -31.50595474243164, -29.973758697509766, -28.44156265258789, -26.909366607666016, -25.377172470092773, -23.8449764251709, -22.312782287597656, -20.78058624267578, -19.248390197753906, -17.71619415283203, -16.18400001525879, -14.65180492401123, -13.119609832763672, -11.587413787841797, -10.055218696594238, -8.52302360534668, -6.990827560424805, -5.458632469177246, -3.926433563232422, -2.394238233566284, -0.8620429039001465, 0.6701526641845703, 2.202347755432129, 3.7345428466796875, 5.2667388916015625, 6.798933982849121, 8.33112907409668, 9.863324165344238, 11.395519256591797, 12.927715301513672, 14.45991039276123, 15.992105484008789, 17.524301528930664, 19.056495666503906, 20.58869171142578, 22.120887756347656, 23.6530818939209, 25.185277938842773, 26.717472076416016, 28.24966812133789, 29.781864166259766, 31.31406021118164, 32.84625244140625, 34.378448486328125, 35.91064453125, 37.442840576171875, 38.975032806396484, 40.50722885131836, 42.039424896240234, 43.57162094116211, 45.103816986083984]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 4.0, 1.0, 11.0, 5.0, 10.0, 13.0, 15.0, 22.0, 21.0, 27.0, 26.0, 37.0, 27.0, 37.0, 36.0, 43.0, 54.0, 46.0, 41.0, 41.0, 39.0, 35.0, 39.0, 42.0, 50.0, 36.0, 23.0, 30.0, 38.0, 27.0, 18.0, 25.0, 16.0, 16.0, 16.0, 12.0, 11.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90234375, -5.72216796875, -5.5419921875, -5.36181640625, -5.181640625, -5.00146484375, -4.8212890625, -4.64111328125, -4.4609375, -4.28076171875, -4.1005859375, -3.92041015625, -3.740234375, -3.56005859375, -3.3798828125, -3.19970703125, -3.01953125, -2.83935546875, -2.6591796875, -2.47900390625, -2.298828125, -2.11865234375, -1.9384765625, -1.75830078125, -1.578125, -1.39794921875, -1.2177734375, -1.03759765625, -0.857421875, -0.67724609375, -0.4970703125, -0.31689453125, -0.13671875, 0.04345703125, 0.2236328125, 0.40380859375, 0.583984375, 0.76416015625, 0.9443359375, 1.12451171875, 1.3046875, 1.48486328125, 1.6650390625, 1.84521484375, 2.025390625, 2.20556640625, 2.3857421875, 2.56591796875, 2.74609375, 2.92626953125, 3.1064453125, 3.28662109375, 3.466796875, 3.64697265625, 3.8271484375, 4.00732421875, 4.1875, 4.36767578125, 4.5478515625, 4.72802734375, 4.908203125, 5.08837890625, 5.2685546875, 5.44873046875, 5.62890625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 3.0, 9.0, 12.0, 12.0, 8.0, 19.0, 24.0, 21.0, 24.0, 28.0, 34.0, 47.0, 71.0, 107.0, 326.0, 1133.0, 7504.0, 179030.0, 3376288.0, 611000.0, 15817.0, 1806.0, 452.0, 166.0, 64.0, 44.0, 39.0, 28.0, 18.0, 27.0, 20.0, 21.0, 15.0, 22.0, 12.0, 6.0, 7.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.40625, -18.77294921875, -18.1396484375, -17.50634765625, -16.873046875, -16.23974609375, -15.6064453125, -14.97314453125, -14.33984375, -13.70654296875, -13.0732421875, -12.43994140625, -11.806640625, -11.17333984375, -10.5400390625, -9.90673828125, -9.2734375, -8.64013671875, -8.0068359375, -7.37353515625, -6.740234375, -6.10693359375, -5.4736328125, -4.84033203125, -4.20703125, -3.57373046875, -2.9404296875, -2.30712890625, -1.673828125, -1.04052734375, -0.4072265625, 0.22607421875, 0.859375, 1.49267578125, 2.1259765625, 2.75927734375, 3.392578125, 4.02587890625, 4.6591796875, 5.29248046875, 5.92578125, 6.55908203125, 7.1923828125, 7.82568359375, 8.458984375, 9.09228515625, 9.7255859375, 10.35888671875, 10.9921875, 11.62548828125, 12.2587890625, 12.89208984375, 13.525390625, 14.15869140625, 14.7919921875, 15.42529296875, 16.05859375, 16.69189453125, 17.3251953125, 17.95849609375, 18.591796875, 19.22509765625, 19.8583984375, 20.49169921875, 21.125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 7.0, 9.0, 19.0, 13.0, 21.0, 20.0, 29.0, 38.0, 64.0, 77.0, 84.0, 110.0, 173.0, 207.0, 249.0, 318.0, 399.0, 409.0, 371.0, 342.0, 302.0, 192.0, 136.0, 118.0, 89.0, 72.0, 44.0, 29.0, 26.0, 28.0, 17.0, 19.0, 7.0, 4.0, 4.0, 9.0, 8.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.765625, -8.45703125, -8.1484375, -7.83984375, -7.53125, -7.22265625, -6.9140625, -6.60546875, -6.296875, -5.98828125, -5.6796875, -5.37109375, -5.0625, -4.75390625, -4.4453125, -4.13671875, -3.828125, -3.51953125, -3.2109375, -2.90234375, -2.59375, -2.28515625, -1.9765625, -1.66796875, -1.359375, -1.05078125, -0.7421875, -0.43359375, -0.125, 0.18359375, 0.4921875, 0.80078125, 1.109375, 1.41796875, 1.7265625, 2.03515625, 2.34375, 2.65234375, 2.9609375, 3.26953125, 3.578125, 3.88671875, 4.1953125, 4.50390625, 4.8125, 5.12109375, 5.4296875, 5.73828125, 6.046875, 6.35546875, 6.6640625, 6.97265625, 7.28125, 7.58984375, 7.8984375, 8.20703125, 8.515625, 8.82421875, 9.1328125, 9.44140625, 9.75, 10.05859375, 10.3671875, 10.67578125, 10.984375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 3.0, 8.0, 11.0, 8.0, 11.0, 12.0, 20.0, 35.0, 41.0, 45.0, 68.0, 76.0, 106.0, 130.0, 160.0, 233.0, 285.0, 502.0, 1429.0, 37221.0, 3746124.0, 401274.0, 4369.0, 610.0, 374.0, 242.0, 179.0, 148.0, 118.0, 107.0, 59.0, 51.0, 49.0, 34.0, 26.0, 28.0, 19.0, 17.0, 10.0, 9.0, 9.0, 6.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-38.1875, -36.98388671875, -35.7802734375, -34.57666015625, -33.373046875, -32.16943359375, -30.9658203125, -29.76220703125, -28.55859375, -27.35498046875, -26.1513671875, -24.94775390625, -23.744140625, -22.54052734375, -21.3369140625, -20.13330078125, -18.9296875, -17.72607421875, -16.5224609375, -15.31884765625, -14.115234375, -12.91162109375, -11.7080078125, -10.50439453125, -9.30078125, -8.09716796875, -6.8935546875, -5.68994140625, -4.486328125, -3.28271484375, -2.0791015625, -0.87548828125, 0.328125, 1.53173828125, 2.7353515625, 3.93896484375, 5.142578125, 6.34619140625, 7.5498046875, 8.75341796875, 9.95703125, 11.16064453125, 12.3642578125, 13.56787109375, 14.771484375, 15.97509765625, 17.1787109375, 18.38232421875, 19.5859375, 20.78955078125, 21.9931640625, 23.19677734375, 24.400390625, 25.60400390625, 26.8076171875, 28.01123046875, 29.21484375, 30.41845703125, 31.6220703125, 32.82568359375, 34.029296875, 35.23291015625, 36.4365234375, 37.64013671875, 38.84375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 58.0, 220.0, 378.0, 259.0, 80.0, 12.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.08834075927734, -69.35191345214844, -64.61548614501953, -59.87905502319336, -55.14262771606445, -50.40620040893555, -45.669769287109375, -40.93334197998047, -36.19691467285156, -31.460487365722656, -26.724058151245117, -21.987628936767578, -17.251201629638672, -12.514774322509766, -7.778345108032227, -3.0419158935546875, 1.6945114135742188, 6.430939674377441, 11.167367935180664, 15.903796195983887, 20.64022445678711, 25.376651763916016, 30.113080978393555, 34.849510192871094, 39.5859375, 44.322364807128906, 49.05879211425781, 53.795223236083984, 58.53165054321289, 63.2680778503418, 68.00450897216797, 72.74093627929688, 77.47737121582031, 82.21379852294922, 86.95022583007812, 91.68665313720703, 96.42308044433594, 101.15951538085938, 105.89594268798828, 110.63236999511719, 115.3687973022461, 120.105224609375, 124.8416519165039, 129.5780792236328, 134.31451416015625, 139.05093383789062, 143.78736877441406, 148.5238037109375, 153.26022338867188, 157.9966583251953, 162.7330780029297, 167.46951293945312, 172.2059326171875, 176.94236755371094, 181.6787872314453, 186.41522216796875, 191.15164184570312, 195.88807678222656, 200.62449645996094, 205.36093139648438, 210.09735107421875, 214.8337860107422, 219.57020568847656, 224.306640625, 229.04307556152344]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 6.0, 9.0, 6.0, 7.0, 6.0, 5.0, 13.0, 13.0, 18.0, 9.0, 22.0, 21.0, 16.0, 41.0, 28.0, 34.0, 20.0, 35.0, 31.0, 30.0, 32.0, 35.0, 30.0, 44.0, 33.0, 35.0, 35.0, 39.0, 36.0, 27.0, 37.0, 35.0, 25.0, 27.0, 31.0, 17.0, 10.0, 15.0, 19.0, 10.0, 11.0, 9.0, 13.0, 7.0, 5.0, 6.0, 1.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-31.401290893554688, -30.431167602539062, -29.461044311523438, -28.49091911315918, -27.520795822143555, -26.55067253112793, -25.580547332763672, -24.610424041748047, -23.640300750732422, -22.670177459716797, -21.700054168701172, -20.729928970336914, -19.75980567932129, -18.789682388305664, -17.819557189941406, -16.84943389892578, -15.879310607910156, -14.909187316894531, -13.93906307220459, -12.968938827514648, -11.998815536499023, -11.028692245483398, -10.058568000793457, -9.088443756103516, -8.11832046508789, -7.148196697235107, -6.178072929382324, -5.207949161529541, -4.237825393676758, -3.2677016258239746, -2.2975778579711914, -1.3274540901184082, -0.357330322265625, 0.6127934455871582, 1.5829172134399414, 2.5530409812927246, 3.523164749145508, 4.493288516998291, 5.463412284851074, 6.433536052703857, 7.403659820556641, 8.373783111572266, 9.343907356262207, 10.314031600952148, 11.284154891967773, 12.254278182983398, 13.22440242767334, 14.194526672363281, 15.164649963378906, 16.13477325439453, 17.104896545410156, 18.075021743774414, 19.04514503479004, 20.015268325805664, 20.985393524169922, 21.955516815185547, 22.925640106201172, 23.895763397216797, 24.865886688232422, 25.83601188659668, 26.806135177612305, 27.77625846862793, 28.746383666992188, 29.716506958007812, 30.686630249023438]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 3.0, 5.0, 8.0, 10.0, 20.0, 17.0, 21.0, 21.0, 16.0, 34.0, 31.0, 30.0, 31.0, 26.0, 45.0, 47.0, 19.0, 41.0, 33.0, 47.0, 37.0, 40.0, 41.0, 37.0, 48.0, 37.0, 24.0, 31.0, 33.0, 28.0, 21.0, 24.0, 14.0, 14.0, 14.0, 6.0, 14.0, 6.0, 4.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.6484375, -5.484619140625, -5.32080078125, -5.156982421875, -4.9931640625, -4.829345703125, -4.66552734375, -4.501708984375, -4.337890625, -4.174072265625, -4.01025390625, -3.846435546875, -3.6826171875, -3.518798828125, -3.35498046875, -3.191162109375, -3.02734375, -2.863525390625, -2.69970703125, -2.535888671875, -2.3720703125, -2.208251953125, -2.04443359375, -1.880615234375, -1.716796875, -1.552978515625, -1.38916015625, -1.225341796875, -1.0615234375, -0.897705078125, -0.73388671875, -0.570068359375, -0.40625, -0.242431640625, -0.07861328125, 0.085205078125, 0.2490234375, 0.412841796875, 0.57666015625, 0.740478515625, 0.904296875, 1.068115234375, 1.23193359375, 1.395751953125, 1.5595703125, 1.723388671875, 1.88720703125, 2.051025390625, 2.21484375, 2.378662109375, 2.54248046875, 2.706298828125, 2.8701171875, 3.033935546875, 3.19775390625, 3.361572265625, 3.525390625, 3.689208984375, 3.85302734375, 4.016845703125, 4.1806640625, 4.344482421875, 4.50830078125, 4.672119140625, 4.8359375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 14.0, 13.0, 16.0, 28.0, 52.0, 77.0, 92.0, 140.0, 199.0, 250.0, 422.0, 546.0, 808.0, 1147.0, 1677.0, 2347.0, 3419.0, 5043.0, 7320.0, 10772.0, 15927.0, 24085.0, 36531.0, 56099.0, 88171.0, 140902.0, 190416.0, 163541.0, 104650.0, 65748.0, 42165.0, 27911.0, 18479.0, 12405.0, 8348.0, 5761.0, 4086.0, 2781.0, 1896.0, 1310.0, 873.0, 613.0, 402.0, 324.0, 239.0, 151.0, 132.0, 82.0, 56.0, 39.0, 19.0, 14.0, 11.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.58984375, -0.57061767578125, -0.5513916015625, -0.53216552734375, -0.512939453125, -0.49371337890625, -0.4744873046875, -0.45526123046875, -0.43603515625, -0.41680908203125, -0.3975830078125, -0.37835693359375, -0.359130859375, -0.33990478515625, -0.3206787109375, -0.30145263671875, -0.2822265625, -0.26300048828125, -0.2437744140625, -0.22454833984375, -0.205322265625, -0.18609619140625, -0.1668701171875, -0.14764404296875, -0.12841796875, -0.10919189453125, -0.0899658203125, -0.07073974609375, -0.051513671875, -0.03228759765625, -0.0130615234375, 0.00616455078125, 0.025390625, 0.04461669921875, 0.0638427734375, 0.08306884765625, 0.102294921875, 0.12152099609375, 0.1407470703125, 0.15997314453125, 0.17919921875, 0.19842529296875, 0.2176513671875, 0.23687744140625, 0.256103515625, 0.27532958984375, 0.2945556640625, 0.31378173828125, 0.3330078125, 0.35223388671875, 0.3714599609375, 0.39068603515625, 0.409912109375, 0.42913818359375, 0.4483642578125, 0.46759033203125, 0.48681640625, 0.50604248046875, 0.5252685546875, 0.54449462890625, 0.563720703125, 0.58294677734375, 0.6021728515625, 0.62139892578125, 0.640625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 2.0, 9.0, 6.0, 11.0, 12.0, 9.0, 8.0, 14.0, 19.0, 26.0, 25.0, 19.0, 22.0, 30.0, 35.0, 37.0, 26.0, 35.0, 30.0, 35.0, 42.0, 39.0, 1053.0, 31.0, 27.0, 37.0, 34.0, 34.0, 37.0, 31.0, 22.0, 22.0, 27.0, 17.0, 27.0, 20.0, 21.0, 12.0, 15.0, 10.0, 12.0, 5.0, 8.0, 8.0, 1.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.8046875, -2.712890625, -2.62109375, -2.529296875, -2.4375, -2.345703125, -2.25390625, -2.162109375, -2.0703125, -1.978515625, -1.88671875, -1.794921875, -1.703125, -1.611328125, -1.51953125, -1.427734375, -1.3359375, -1.244140625, -1.15234375, -1.060546875, -0.96875, -0.876953125, -0.78515625, -0.693359375, -0.6015625, -0.509765625, -0.41796875, -0.326171875, -0.234375, -0.142578125, -0.05078125, 0.041015625, 0.1328125, 0.224609375, 0.31640625, 0.408203125, 0.5, 0.591796875, 0.68359375, 0.775390625, 0.8671875, 0.958984375, 1.05078125, 1.142578125, 1.234375, 1.326171875, 1.41796875, 1.509765625, 1.6015625, 1.693359375, 1.78515625, 1.876953125, 1.96875, 2.060546875, 2.15234375, 2.244140625, 2.3359375, 2.427734375, 2.51953125, 2.611328125, 2.703125, 2.794921875, 2.88671875, 2.978515625, 3.0703125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 14.0, 18.0, 26.0, 38.0, 68.0, 84.0, 164.0, 285.0, 460.0, 729.0, 1334.0, 2289.0, 4040.0, 7042.0, 12588.0, 23941.0, 45058.0, 91186.0, 185327.0, 1320255.0, 197367.0, 98680.0, 49290.0, 25191.0, 13798.0, 7491.0, 4278.0, 2468.0, 1443.0, 886.0, 476.0, 314.0, 184.0, 109.0, 72.0, 43.0, 31.0, 12.0, 16.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.810546875, -0.7889633178710938, -0.7673797607421875, -0.7457962036132812, -0.724212646484375, -0.7026290893554688, -0.6810455322265625, -0.6594619750976562, -0.63787841796875, -0.6162948608398438, -0.5947113037109375, -0.5731277465820312, -0.551544189453125, -0.5299606323242188, -0.5083770751953125, -0.48679351806640625, -0.4652099609375, -0.44362640380859375, -0.4220428466796875, -0.40045928955078125, -0.378875732421875, -0.35729217529296875, -0.3357086181640625, -0.31412506103515625, -0.29254150390625, -0.27095794677734375, -0.2493743896484375, -0.22779083251953125, -0.206207275390625, -0.18462371826171875, -0.1630401611328125, -0.14145660400390625, -0.119873046875, -0.09828948974609375, -0.0767059326171875, -0.05512237548828125, -0.033538818359375, -0.01195526123046875, 0.0096282958984375, 0.03121185302734375, 0.05279541015625, 0.07437896728515625, 0.0959625244140625, 0.11754608154296875, 0.139129638671875, 0.16071319580078125, 0.1822967529296875, 0.20388031005859375, 0.2254638671875, 0.24704742431640625, 0.2686309814453125, 0.29021453857421875, 0.311798095703125, 0.33338165283203125, 0.3549652099609375, 0.37654876708984375, 0.39813232421875, 0.41971588134765625, 0.4412994384765625, 0.46288299560546875, 0.484466552734375, 0.5060501098632812, 0.5276336669921875, 0.5492172241210938, 0.57080078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 9.0, 10.0, 15.0, 10.0, 17.0, 22.0, 15.0, 30.0, 41.0, 33.0, 50.0, 43.0, 67.0, 61.0, 63.0, 68.0, 50.0, 56.0, 46.0, 57.0, 31.0, 29.0, 27.0, 24.0, 32.0, 18.0, 12.0, 17.0, 9.0, 6.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001987457275390625, -0.0019224882125854492, -0.0018575191497802734, -0.0017925500869750977, -0.0017275810241699219, -0.001662611961364746, -0.0015976428985595703, -0.0015326738357543945, -0.0014677047729492188, -0.001402735710144043, -0.0013377666473388672, -0.0012727975845336914, -0.0012078285217285156, -0.0011428594589233398, -0.001077890396118164, -0.0010129213333129883, -0.0009479522705078125, -0.0008829832077026367, -0.0008180141448974609, -0.0007530450820922852, -0.0006880760192871094, -0.0006231069564819336, -0.0005581378936767578, -0.000493168830871582, -0.00042819976806640625, -0.00036323070526123047, -0.0002982616424560547, -0.0002332925796508789, -0.00016832351684570312, -0.00010335445404052734, -3.838539123535156e-05, 2.658367156982422e-05, 9.1552734375e-05, 0.00015652179718017578, 0.00022149085998535156, 0.00028645992279052734, 0.0003514289855957031, 0.0004163980484008789, 0.0004813671112060547, 0.0005463361740112305, 0.0006113052368164062, 0.000676274299621582, 0.0007412433624267578, 0.0008062124252319336, 0.0008711814880371094, 0.0009361505508422852, 0.001001119613647461, 0.0010660886764526367, 0.0011310577392578125, 0.0011960268020629883, 0.001260995864868164, 0.0013259649276733398, 0.0013909339904785156, 0.0014559030532836914, 0.0015208721160888672, 0.001585841178894043, 0.0016508102416992188, 0.0017157793045043945, 0.0017807483673095703, 0.001845717430114746, 0.0019106864929199219, 0.0019756555557250977, 0.0020406246185302734, 0.0021055936813354492, 0.002170562744140625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 9.0, 2.0, 9.0, 17.0, 22.0, 24.0, 24.0, 29.0, 41.0, 68.0, 93.0, 121.0, 193.0, 383.0, 1394.0, 176131.0, 866623.0, 2189.0, 525.0, 215.0, 105.0, 71.0, 68.0, 52.0, 24.0, 23.0, 21.0, 18.0, 14.0, 18.0, 8.0, 4.0, 4.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.062347412109375, -0.060753822326660156, -0.05916023254394531, -0.05756664276123047, -0.055973052978515625, -0.05437946319580078, -0.05278587341308594, -0.051192283630371094, -0.04959869384765625, -0.048005104064941406, -0.04641151428222656, -0.04481792449951172, -0.043224334716796875, -0.04163074493408203, -0.04003715515136719, -0.038443565368652344, -0.0368499755859375, -0.035256385803222656, -0.03366279602050781, -0.03206920623779297, -0.030475616455078125, -0.02888202667236328, -0.027288436889648438, -0.025694847106933594, -0.02410125732421875, -0.022507667541503906, -0.020914077758789062, -0.01932048797607422, -0.017726898193359375, -0.01613330841064453, -0.014539718627929688, -0.012946128845214844, -0.0113525390625, -0.009758949279785156, -0.008165359497070312, -0.006571769714355469, -0.004978179931640625, -0.0033845901489257812, -0.0017910003662109375, -0.00019741058349609375, 0.00139617919921875, 0.0029897689819335938, 0.0045833587646484375, 0.006176948547363281, 0.007770538330078125, 0.009364128112792969, 0.010957717895507812, 0.012551307678222656, 0.0141448974609375, 0.015738487243652344, 0.017332077026367188, 0.01892566680908203, 0.020519256591796875, 0.02211284637451172, 0.023706436157226562, 0.025300025939941406, 0.02689361572265625, 0.028487205505371094, 0.030080795288085938, 0.03167438507080078, 0.033267974853515625, 0.03486156463623047, 0.03645515441894531, 0.038048744201660156, 0.039642333984375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 46.0, 849.0, 120.0, 1.0, 1.0], "bins": [-0.026967698708176613, -0.026522818952798843, -0.026077939197421074, -0.025633061304688454, -0.025188181549310684, -0.024743301793932915, -0.024298422038555145, -0.023853542283177376, -0.023408664390444756, -0.022963784635066986, -0.022518904879689217, -0.022074026986956596, -0.021629147231578827, -0.021184267476201057, -0.020739387720823288, -0.02029450796544552, -0.01984962821006775, -0.01940474845468998, -0.01895986869931221, -0.01851499080657959, -0.01807011105120182, -0.01762523129582405, -0.01718035154044628, -0.016735471785068512, -0.01629059389233589, -0.015845714136958122, -0.015400835312902927, -0.014955955557525158, -0.014511076733469963, -0.014066196978092194, -0.013621317222714424, -0.01317643839865923, -0.01273155864328146, -0.01228667888790369, -0.011841800063848495, -0.011396920308470726, -0.010952041484415531, -0.010507161729037762, -0.010062282904982567, -0.009617403149604797, -0.009172523394227028, -0.008727643638849258, -0.008282764814794064, -0.007837885059416294, -0.007393005769699812, -0.00694812647998333, -0.006503247190266848, -0.0060583679005503654, -0.005613488145172596, -0.005168608855456114, -0.004723729565739632, -0.004278849810361862, -0.00383397052064538, -0.003389091230928898, -0.0029442119412124157, -0.00249933241866529, -0.0020544533617794514, -0.0016095739556476474, -0.0011646945495158434, -0.0007198152597993612, -0.00027493585366755724, 0.00016994355246424675, 0.0006148228421807289, 0.0010597023647278547, 0.0015045816544443369]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 10.0, 10.0, 19.0, 23.0, 20.0, 28.0, 22.0, 43.0, 36.0, 51.0, 42.0, 47.0, 42.0, 45.0, 55.0, 35.0, 60.0, 52.0, 51.0, 52.0, 39.0, 35.0, 36.0, 27.0, 20.0, 14.0, 20.0, 17.0, 10.0, 10.0, 6.0, 2.0, 1.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001035928726196289, -0.0009940741583704948, -0.0009522195905447006, -0.0009103650227189064, -0.0008685104548931122, -0.000826655887067318, -0.0007848013192415237, -0.0007429467514157295, -0.0007010921835899353, -0.0006592376157641411, -0.0006173830479383469, -0.0005755284801125526, -0.0005336739122867584, -0.0004918193444609642, -0.00044996477663517, -0.00040811020880937576, -0.00036625564098358154, -0.0003244010731577873, -0.0002825465053319931, -0.00024069193750619888, -0.00019883736968040466, -0.00015698280185461044, -0.00011512823402881622, -7.3273666203022e-05, -3.141909837722778e-05, 1.0435469448566437e-05, 5.229003727436066e-05, 9.414460510015488e-05, 0.0001359991729259491, 0.00017785374075174332, 0.00021970830857753754, 0.00026156287640333176, 0.000303417444229126, 0.0003452720120549202, 0.0003871265798807144, 0.00042898114770650864, 0.00047083571553230286, 0.0005126902833580971, 0.0005545448511838913, 0.0005963994190096855, 0.0006382539868354797, 0.000680108554661274, 0.0007219631224870682, 0.0007638176903128624, 0.0008056722581386566, 0.0008475268259644508, 0.0008893813937902451, 0.0009312359616160393, 0.0009730905294418335, 0.0010149450972676277, 0.001056799665093422, 0.0010986542329192162, 0.0011405088007450104, 0.0011823633685708046, 0.0012242179363965988, 0.001266072504222393, 0.0013079270720481873, 0.0013497816398739815, 0.0013916362076997757, 0.00143349077552557, 0.0014753453433513641, 0.0015171999111771584, 0.0015590544790029526, 0.0016009090468287468, 0.001642763614654541]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 3.0, 5.0, 8.0, 10.0, 20.0, 17.0, 21.0, 21.0, 16.0, 34.0, 31.0, 30.0, 31.0, 26.0, 45.0, 47.0, 19.0, 41.0, 33.0, 47.0, 37.0, 40.0, 41.0, 37.0, 48.0, 37.0, 24.0, 31.0, 34.0, 27.0, 21.0, 24.0, 14.0, 14.0, 14.0, 6.0, 14.0, 6.0, 4.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.6484375, -5.484619140625, -5.32080078125, -5.156982421875, -4.9931640625, -4.829345703125, -4.66552734375, -4.501708984375, -4.337890625, -4.174072265625, -4.01025390625, -3.846435546875, -3.6826171875, -3.518798828125, -3.35498046875, -3.191162109375, -3.02734375, -2.863525390625, -2.69970703125, -2.535888671875, -2.3720703125, -2.208251953125, -2.04443359375, -1.880615234375, -1.716796875, -1.552978515625, -1.38916015625, -1.225341796875, -1.0615234375, -0.897705078125, -0.73388671875, -0.570068359375, -0.40625, -0.242431640625, -0.07861328125, 0.085205078125, 0.2490234375, 0.412841796875, 0.57666015625, 0.740478515625, 0.904296875, 1.068115234375, 1.23193359375, 1.395751953125, 1.5595703125, 1.723388671875, 1.88720703125, 2.051025390625, 2.21484375, 2.378662109375, 2.54248046875, 2.706298828125, 2.8701171875, 3.033935546875, 3.19775390625, 3.361572265625, 3.525390625, 3.689208984375, 3.85302734375, 4.016845703125, 4.1806640625, 4.344482421875, 4.50830078125, 4.672119140625, 4.8359375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 7.0, 6.0, 13.0, 15.0, 34.0, 60.0, 64.0, 85.0, 151.0, 177.0, 305.0, 478.0, 746.0, 1157.0, 1913.0, 3385.0, 5838.0, 11102.0, 21667.0, 47833.0, 115371.0, 312733.0, 314018.0, 116013.0, 47485.0, 22263.0, 11033.0, 5890.0, 3445.0, 1984.0, 1212.0, 693.0, 443.0, 315.0, 173.0, 122.0, 94.0, 74.0, 53.0, 29.0, 26.0, 15.0, 9.0, 6.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-3.86328125, -3.749664306640625, -3.63604736328125, -3.522430419921875, -3.4088134765625, -3.295196533203125, -3.18157958984375, -3.067962646484375, -2.954345703125, -2.840728759765625, -2.72711181640625, -2.613494873046875, -2.4998779296875, -2.386260986328125, -2.27264404296875, -2.159027099609375, -2.04541015625, -1.931793212890625, -1.81817626953125, -1.704559326171875, -1.5909423828125, -1.477325439453125, -1.36370849609375, -1.250091552734375, -1.136474609375, -1.022857666015625, -0.90924072265625, -0.795623779296875, -0.6820068359375, -0.568389892578125, -0.45477294921875, -0.341156005859375, -0.2275390625, -0.113922119140625, -0.00030517578125, 0.113311767578125, 0.2269287109375, 0.340545654296875, 0.45416259765625, 0.567779541015625, 0.681396484375, 0.795013427734375, 0.90863037109375, 1.022247314453125, 1.1358642578125, 1.249481201171875, 1.36309814453125, 1.476715087890625, 1.59033203125, 1.703948974609375, 1.81756591796875, 1.931182861328125, 2.0447998046875, 2.158416748046875, 2.27203369140625, 2.385650634765625, 2.499267578125, 2.612884521484375, 2.72650146484375, 2.840118408203125, 2.9537353515625, 3.067352294921875, 3.18096923828125, 3.294586181640625, 3.408203125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 6.0, 11.0, 10.0, 9.0, 14.0, 14.0, 11.0, 17.0, 26.0, 27.0, 22.0, 31.0, 43.0, 45.0, 49.0, 52.0, 82.0, 136.0, 1586.0, 268.0, 99.0, 69.0, 56.0, 37.0, 40.0, 43.0, 41.0, 31.0, 22.0, 25.0, 19.0, 23.0, 16.0, 15.0, 6.0, 9.0, 5.0, 9.0, 2.0, 2.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.5625, -18.0286865234375, -17.494873046875, -16.9610595703125, -16.42724609375, -15.8934326171875, -15.359619140625, -14.8258056640625, -14.2919921875, -13.7581787109375, -13.224365234375, -12.6905517578125, -12.15673828125, -11.6229248046875, -11.089111328125, -10.5552978515625, -10.021484375, -9.4876708984375, -8.953857421875, -8.4200439453125, -7.88623046875, -7.3524169921875, -6.818603515625, -6.2847900390625, -5.7509765625, -5.2171630859375, -4.683349609375, -4.1495361328125, -3.61572265625, -3.0819091796875, -2.548095703125, -2.0142822265625, -1.48046875, -0.9466552734375, -0.412841796875, 0.1209716796875, 0.65478515625, 1.1885986328125, 1.722412109375, 2.2562255859375, 2.7900390625, 3.3238525390625, 3.857666015625, 4.3914794921875, 4.92529296875, 5.4591064453125, 5.992919921875, 6.5267333984375, 7.060546875, 7.5943603515625, 8.128173828125, 8.6619873046875, 9.19580078125, 9.7296142578125, 10.263427734375, 10.7972412109375, 11.3310546875, 11.8648681640625, 12.398681640625, 12.9324951171875, 13.46630859375, 14.0001220703125, 14.533935546875, 15.0677490234375, 15.6015625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 11.0, 18.0, 37.0, 66.0, 119.0, 223.0, 404.0, 941.0, 2124166.0, 1018014.0, 894.0, 352.0, 197.0, 102.0, 66.0, 35.0, 28.0, 8.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.125, -115.015625, -111.90625, -108.796875, -105.6875, -102.578125, -99.46875, -96.359375, -93.25, -90.140625, -87.03125, -83.921875, -80.8125, -77.703125, -74.59375, -71.484375, -68.375, -65.265625, -62.15625, -59.046875, -55.9375, -52.828125, -49.71875, -46.609375, -43.5, -40.390625, -37.28125, -34.171875, -31.0625, -27.953125, -24.84375, -21.734375, -18.625, -15.515625, -12.40625, -9.296875, -6.1875, -3.078125, 0.03125, 3.140625, 6.25, 9.359375, 12.46875, 15.578125, 18.6875, 21.796875, 24.90625, 28.015625, 31.125, 34.234375, 37.34375, 40.453125, 43.5625, 46.671875, 49.78125, 52.890625, 56.0, 59.109375, 62.21875, 65.328125, 68.4375, 71.546875, 74.65625, 77.765625, 80.875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [912.0, 108.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.222808837890625, 2.0210132598876953, 13.264835357666016, 24.50865936279297, 35.752479553222656, 46.996299743652344, 58.24012756347656, 69.48394775390625, 80.72776794433594, 91.97158813476562, 103.21540832519531, 114.45923614501953, 125.70305633544922, 136.94686889648438, 148.19070434570312, 159.4345245361328, 170.6783447265625, 181.9221649169922, 193.16598510742188, 204.40982055664062, 215.65362548828125, 226.8974609375, 238.1412811279297, 249.38510131835938, 260.62890625, 271.87274169921875, 283.1165466308594, 294.3603820800781, 305.60418701171875, 316.8480224609375, 328.09185791015625, 339.3356628417969, 350.57952880859375, 361.8233642578125, 373.0671691894531, 384.3110046386719, 395.5548095703125, 406.79864501953125, 418.04248046875, 429.2862854003906, 440.53009033203125, 451.77392578125, 463.0177307128906, 474.2615661621094, 485.50537109375, 496.74920654296875, 507.9930419921875, 519.23681640625, 530.480712890625, 541.7245483398438, 552.9683837890625, 564.212158203125, 575.4559936523438, 586.6998291015625, 597.9436645507812, 609.1875, 620.4312744140625, 631.6751098632812, 642.9189453125, 654.1627197265625, 665.4065551757812, 676.650390625, 687.8942260742188, 699.1380615234375, 710.3818359375]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 6.0, 3.0, 4.0, 5.0, 14.0, 10.0, 7.0, 14.0, 19.0, 20.0, 25.0, 25.0, 19.0, 29.0, 26.0, 34.0, 31.0, 30.0, 45.0, 45.0, 49.0, 49.0, 43.0, 37.0, 42.0, 44.0, 44.0, 37.0, 27.0, 35.0, 32.0, 18.0, 29.0, 19.0, 29.0, 7.0, 16.0, 10.0, 12.0, 2.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.857139587402344, -52.239131927490234, -50.621124267578125, -49.003116607666016, -47.385108947753906, -45.7671012878418, -44.14909362792969, -42.531089782714844, -40.91307830810547, -39.29507064819336, -37.67706298828125, -36.05905532836914, -34.44104766845703, -32.82304000854492, -31.205034255981445, -29.587026596069336, -27.96902084350586, -26.35101318359375, -24.73300552368164, -23.11499786376953, -21.496990203857422, -19.878982543945312, -18.260976791381836, -16.642969131469727, -15.024961471557617, -13.406953811645508, -11.788946151733398, -10.170939445495605, -8.552931785583496, -6.934924125671387, -5.316917419433594, -3.6989097595214844, -2.080902099609375, -0.4628946781158447, 1.1551127433776855, 2.7731199264526367, 4.391127586364746, 6.0091352462768555, 7.627141952514648, 9.245149612426758, 10.863157272338867, 12.481164932250977, 14.099172592163086, 15.717179298400879, 17.335186004638672, 18.95319366455078, 20.57120132446289, 22.189208984375, 23.80721664428711, 25.42522430419922, 27.043231964111328, 28.661239624023438, 30.279247283935547, 31.897254943847656, 33.5152587890625, 35.133270263671875, 36.75127410888672, 38.36928176879883, 39.98728942871094, 41.60529708862305, 43.223304748535156, 44.841312408447266, 46.459320068359375, 48.07732391357422, 49.695335388183594]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 4.0, 11.0, 10.0, 13.0, 14.0, 14.0, 24.0, 30.0, 26.0, 25.0, 33.0, 28.0, 28.0, 34.0, 36.0, 46.0, 34.0, 37.0, 38.0, 46.0, 42.0, 38.0, 33.0, 48.0, 32.0, 29.0, 28.0, 24.0, 30.0, 31.0, 14.0, 20.0, 20.0, 16.0, 10.0, 11.0, 7.0, 5.0, 3.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-5.87109375, -5.7021484375, -5.533203125, -5.3642578125, -5.1953125, -5.0263671875, -4.857421875, -4.6884765625, -4.51953125, -4.3505859375, -4.181640625, -4.0126953125, -3.84375, -3.6748046875, -3.505859375, -3.3369140625, -3.16796875, -2.9990234375, -2.830078125, -2.6611328125, -2.4921875, -2.3232421875, -2.154296875, -1.9853515625, -1.81640625, -1.6474609375, -1.478515625, -1.3095703125, -1.140625, -0.9716796875, -0.802734375, -0.6337890625, -0.46484375, -0.2958984375, -0.126953125, 0.0419921875, 0.2109375, 0.3798828125, 0.548828125, 0.7177734375, 0.88671875, 1.0556640625, 1.224609375, 1.3935546875, 1.5625, 1.7314453125, 1.900390625, 2.0693359375, 2.23828125, 2.4072265625, 2.576171875, 2.7451171875, 2.9140625, 3.0830078125, 3.251953125, 3.4208984375, 3.58984375, 3.7587890625, 3.927734375, 4.0966796875, 4.265625, 4.4345703125, 4.603515625, 4.7724609375, 4.94140625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 8.0, 4.0, 7.0, 7.0, 8.0, 19.0, 11.0, 15.0, 22.0, 27.0, 19.0, 29.0, 37.0, 89.0, 105.0, 207.0, 482.0, 1284.0, 4806.0, 34978.0, 632244.0, 2877699.0, 601026.0, 33970.0, 4794.0, 1275.0, 506.0, 192.0, 110.0, 60.0, 35.0, 39.0, 21.0, 28.0, 21.0, 13.0, 19.0, 18.0, 8.0, 10.0, 10.0, 5.0, 1.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.7578125, -13.3209228515625, -12.884033203125, -12.4471435546875, -12.01025390625, -11.5733642578125, -11.136474609375, -10.6995849609375, -10.2626953125, -9.8258056640625, -9.388916015625, -8.9520263671875, -8.51513671875, -8.0782470703125, -7.641357421875, -7.2044677734375, -6.767578125, -6.3306884765625, -5.893798828125, -5.4569091796875, -5.02001953125, -4.5831298828125, -4.146240234375, -3.7093505859375, -3.2724609375, -2.8355712890625, -2.398681640625, -1.9617919921875, -1.52490234375, -1.0880126953125, -0.651123046875, -0.2142333984375, 0.22265625, 0.6595458984375, 1.096435546875, 1.5333251953125, 1.97021484375, 2.4071044921875, 2.843994140625, 3.2808837890625, 3.7177734375, 4.1546630859375, 4.591552734375, 5.0284423828125, 5.46533203125, 5.9022216796875, 6.339111328125, 6.7760009765625, 7.212890625, 7.6497802734375, 8.086669921875, 8.5235595703125, 8.96044921875, 9.3973388671875, 9.834228515625, 10.2711181640625, 10.7080078125, 11.1448974609375, 11.581787109375, 12.0186767578125, 12.45556640625, 12.8924560546875, 13.329345703125, 13.7662353515625, 14.203125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 7.0, 5.0, 12.0, 10.0, 13.0, 22.0, 34.0, 29.0, 43.0, 50.0, 69.0, 75.0, 128.0, 167.0, 189.0, 242.0, 357.0, 399.0, 373.0, 362.0, 328.0, 272.0, 221.0, 155.0, 133.0, 81.0, 70.0, 42.0, 51.0, 27.0, 32.0, 15.0, 10.0, 12.0, 9.0, 9.0, 1.0, 2.0, 6.0, 3.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.97265625, -8.6875, -8.40234375, -8.1171875, -7.83203125, -7.546875, -7.26171875, -6.9765625, -6.69140625, -6.40625, -6.12109375, -5.8359375, -5.55078125, -5.265625, -4.98046875, -4.6953125, -4.41015625, -4.125, -3.83984375, -3.5546875, -3.26953125, -2.984375, -2.69921875, -2.4140625, -2.12890625, -1.84375, -1.55859375, -1.2734375, -0.98828125, -0.703125, -0.41796875, -0.1328125, 0.15234375, 0.4375, 0.72265625, 1.0078125, 1.29296875, 1.578125, 1.86328125, 2.1484375, 2.43359375, 2.71875, 3.00390625, 3.2890625, 3.57421875, 3.859375, 4.14453125, 4.4296875, 4.71484375, 5.0, 5.28515625, 5.5703125, 5.85546875, 6.140625, 6.42578125, 6.7109375, 6.99609375, 7.28125, 7.56640625, 7.8515625, 8.13671875, 8.421875, 8.70703125, 8.9921875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 13.0, 3.0, 9.0, 13.0, 18.0, 31.0, 30.0, 39.0, 47.0, 70.0, 88.0, 129.0, 146.0, 205.0, 252.0, 384.0, 886.0, 14011.0, 3469605.0, 702230.0, 4118.0, 596.0, 332.0, 227.0, 168.0, 144.0, 95.0, 85.0, 76.0, 51.0, 34.0, 40.0, 28.0, 21.0, 16.0, 5.0, 7.0, 6.0, 2.0, 11.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.96875, -43.64013671875, -42.3115234375, -40.98291015625, -39.654296875, -38.32568359375, -36.9970703125, -35.66845703125, -34.33984375, -33.01123046875, -31.6826171875, -30.35400390625, -29.025390625, -27.69677734375, -26.3681640625, -25.03955078125, -23.7109375, -22.38232421875, -21.0537109375, -19.72509765625, -18.396484375, -17.06787109375, -15.7392578125, -14.41064453125, -13.08203125, -11.75341796875, -10.4248046875, -9.09619140625, -7.767578125, -6.43896484375, -5.1103515625, -3.78173828125, -2.453125, -1.12451171875, 0.2041015625, 1.53271484375, 2.861328125, 4.18994140625, 5.5185546875, 6.84716796875, 8.17578125, 9.50439453125, 10.8330078125, 12.16162109375, 13.490234375, 14.81884765625, 16.1474609375, 17.47607421875, 18.8046875, 20.13330078125, 21.4619140625, 22.79052734375, 24.119140625, 25.44775390625, 26.7763671875, 28.10498046875, 29.43359375, 30.76220703125, 32.0908203125, 33.41943359375, 34.748046875, 36.07666015625, 37.4052734375, 38.73388671875, 40.0625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 11.0, 18.0, 37.0, 45.0, 74.0, 104.0, 95.0, 115.0, 106.0, 118.0, 99.0, 60.0, 57.0, 28.0, 13.0, 8.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.936431884765625, -31.567873001098633, -30.199316024780273, -28.83075714111328, -27.462200164794922, -26.09364128112793, -24.725082397460938, -23.356525421142578, -21.987966537475586, -20.619407653808594, -19.250850677490234, -17.882291793823242, -16.51373291015625, -15.14517593383789, -13.776617050170898, -12.408059120178223, -11.039501190185547, -9.670943260192871, -8.302385330200195, -6.933826446533203, -5.565268516540527, -4.196710586547852, -2.8281517028808594, -1.4595937728881836, -0.09103584289550781, 1.277522325515747, 2.646080493927002, 4.014638900756836, 5.383196830749512, 6.7517547607421875, 8.12031364440918, 9.488871574401855, 10.857425689697266, 12.225983619689941, 13.594541549682617, 14.96310043334961, 16.33165740966797, 17.70021629333496, 19.068775177001953, 20.437332153320312, 21.805891036987305, 23.174449920654297, 24.543006896972656, 25.91156578063965, 27.28012466430664, 28.648681640625, 30.017240524291992, 31.385799407958984, 32.754356384277344, 34.1229133605957, 35.49147415161133, 36.86003112792969, 38.22858810424805, 39.597145080566406, 40.96570587158203, 42.33426284790039, 43.70281982421875, 45.07137680053711, 46.439937591552734, 47.808494567871094, 49.17705154418945, 50.54560852050781, 51.91416931152344, 53.2827262878418, 54.65128707885742]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 5.0, 10.0, 4.0, 5.0, 12.0, 7.0, 16.0, 20.0, 17.0, 14.0, 26.0, 19.0, 28.0, 27.0, 32.0, 29.0, 35.0, 37.0, 35.0, 48.0, 31.0, 44.0, 34.0, 36.0, 35.0, 34.0, 35.0, 41.0, 24.0, 38.0, 29.0, 27.0, 21.0, 17.0, 17.0, 19.0, 18.0, 9.0, 18.0, 9.0, 8.0, 8.0, 3.0, 3.0, 6.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.09229278564453, -31.064437866210938, -30.036582946777344, -29.00872802734375, -27.980873107910156, -26.953018188476562, -25.92516326904297, -24.897308349609375, -23.86945343017578, -22.841598510742188, -21.813743591308594, -20.785888671875, -19.758033752441406, -18.730178833007812, -17.70232391357422, -16.674468994140625, -15.646614074707031, -14.618759155273438, -13.590904235839844, -12.56304931640625, -11.535194396972656, -10.507339477539062, -9.479484558105469, -8.451629638671875, -7.423774719238281, -6.3959197998046875, -5.368064880371094, -4.3402099609375, -3.3123550415039062, -2.2845001220703125, -1.2566452026367188, -0.228790283203125, 0.7990646362304688, 1.8269195556640625, 2.8547744750976562, 3.88262939453125, 4.910484313964844, 5.9383392333984375, 6.966194152832031, 7.994049072265625, 9.021903991699219, 10.049758911132812, 11.077613830566406, 12.10546875, 13.133323669433594, 14.161178588867188, 15.189033508300781, 16.216888427734375, 17.24474334716797, 18.272598266601562, 19.300453186035156, 20.32830810546875, 21.356163024902344, 22.384017944335938, 23.41187286376953, 24.439727783203125, 25.46758270263672, 26.495437622070312, 27.523292541503906, 28.5511474609375, 29.579002380371094, 30.606857299804688, 31.63471221923828, 32.662567138671875, 33.69042205810547]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 2.0, 7.0, 10.0, 9.0, 13.0, 18.0, 15.0, 23.0, 20.0, 14.0, 29.0, 26.0, 37.0, 32.0, 24.0, 44.0, 43.0, 36.0, 43.0, 33.0, 52.0, 38.0, 47.0, 43.0, 42.0, 29.0, 32.0, 31.0, 31.0, 26.0, 14.0, 24.0, 19.0, 15.0, 16.0, 8.0, 14.0, 11.0, 8.0, 5.0, 2.0, 4.0, 1.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.703125, -5.54095458984375, -5.3787841796875, -5.21661376953125, -5.054443359375, -4.89227294921875, -4.7301025390625, -4.56793212890625, -4.40576171875, -4.24359130859375, -4.0814208984375, -3.91925048828125, -3.757080078125, -3.59490966796875, -3.4327392578125, -3.27056884765625, -3.1083984375, -2.94622802734375, -2.7840576171875, -2.62188720703125, -2.459716796875, -2.29754638671875, -2.1353759765625, -1.97320556640625, -1.81103515625, -1.64886474609375, -1.4866943359375, -1.32452392578125, -1.162353515625, -1.00018310546875, -0.8380126953125, -0.67584228515625, -0.513671875, -0.35150146484375, -0.1893310546875, -0.02716064453125, 0.135009765625, 0.29718017578125, 0.4593505859375, 0.62152099609375, 0.78369140625, 0.94586181640625, 1.1080322265625, 1.27020263671875, 1.432373046875, 1.59454345703125, 1.7567138671875, 1.91888427734375, 2.0810546875, 2.24322509765625, 2.4053955078125, 2.56756591796875, 2.729736328125, 2.89190673828125, 3.0540771484375, 3.21624755859375, 3.37841796875, 3.54058837890625, 3.7027587890625, 3.86492919921875, 4.027099609375, 4.18927001953125, 4.3514404296875, 4.51361083984375, 4.67578125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 1.0, 14.0, 5.0, 11.0, 23.0, 25.0, 54.0, 73.0, 98.0, 163.0, 280.0, 409.0, 579.0, 790.0, 1133.0, 1603.0, 2387.0, 3344.0, 4882.0, 7184.0, 10448.0, 15888.0, 24413.0, 38303.0, 60910.0, 101705.0, 169350.0, 209978.0, 150240.0, 89455.0, 54109.0, 33871.0, 21791.0, 14173.0, 9667.0, 6793.0, 4585.0, 3116.0, 2050.0, 1426.0, 999.0, 705.0, 454.0, 340.0, 222.0, 126.0, 123.0, 76.0, 67.0, 34.0, 28.0, 19.0, 22.0, 6.0, 8.0, 1.0, 2.0], "bins": [-0.69970703125, -0.679351806640625, -0.65899658203125, -0.638641357421875, -0.6182861328125, -0.597930908203125, -0.57757568359375, -0.557220458984375, -0.536865234375, -0.516510009765625, -0.49615478515625, -0.475799560546875, -0.4554443359375, -0.435089111328125, -0.41473388671875, -0.394378662109375, -0.3740234375, -0.353668212890625, -0.33331298828125, -0.312957763671875, -0.2926025390625, -0.272247314453125, -0.25189208984375, -0.231536865234375, -0.211181640625, -0.190826416015625, -0.17047119140625, -0.150115966796875, -0.1297607421875, -0.109405517578125, -0.08905029296875, -0.068695068359375, -0.04833984375, -0.027984619140625, -0.00762939453125, 0.012725830078125, 0.0330810546875, 0.053436279296875, 0.07379150390625, 0.094146728515625, 0.114501953125, 0.134857177734375, 0.15521240234375, 0.175567626953125, 0.1959228515625, 0.216278076171875, 0.23663330078125, 0.256988525390625, 0.27734375, 0.297698974609375, 0.31805419921875, 0.338409423828125, 0.3587646484375, 0.379119873046875, 0.39947509765625, 0.419830322265625, 0.440185546875, 0.460540771484375, 0.48089599609375, 0.501251220703125, 0.5216064453125, 0.541961669921875, 0.56231689453125, 0.582672119140625, 0.60302734375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 8.0, 11.0, 8.0, 14.0, 7.0, 13.0, 16.0, 22.0, 25.0, 26.0, 33.0, 27.0, 31.0, 29.0, 23.0, 29.0, 39.0, 47.0, 43.0, 43.0, 1064.0, 39.0, 37.0, 34.0, 23.0, 33.0, 39.0, 31.0, 28.0, 24.0, 24.0, 24.0, 19.0, 15.0, 14.0, 14.0, 11.0, 14.0, 8.0, 6.0, 8.0, 6.0, 2.0, 5.0, 2.0, 0.0, 3.0], "bins": [-3.62890625, -3.531341552734375, -3.43377685546875, -3.336212158203125, -3.2386474609375, -3.141082763671875, -3.04351806640625, -2.945953369140625, -2.848388671875, -2.750823974609375, -2.65325927734375, -2.555694580078125, -2.4581298828125, -2.360565185546875, -2.26300048828125, -2.165435791015625, -2.06787109375, -1.970306396484375, -1.87274169921875, -1.775177001953125, -1.6776123046875, -1.580047607421875, -1.48248291015625, -1.384918212890625, -1.287353515625, -1.189788818359375, -1.09222412109375, -0.994659423828125, -0.8970947265625, -0.799530029296875, -0.70196533203125, -0.604400634765625, -0.5068359375, -0.409271240234375, -0.31170654296875, -0.214141845703125, -0.1165771484375, -0.019012451171875, 0.07855224609375, 0.176116943359375, 0.273681640625, 0.371246337890625, 0.46881103515625, 0.566375732421875, 0.6639404296875, 0.761505126953125, 0.85906982421875, 0.956634521484375, 1.05419921875, 1.151763916015625, 1.24932861328125, 1.346893310546875, 1.4444580078125, 1.542022705078125, 1.63958740234375, 1.737152099609375, 1.834716796875, 1.932281494140625, 2.02984619140625, 2.127410888671875, 2.2249755859375, 2.322540283203125, 2.42010498046875, 2.517669677734375, 2.615234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 12.0, 8.0, 8.0, 18.0, 33.0, 50.0, 62.0, 91.0, 143.0, 220.0, 379.0, 591.0, 946.0, 1561.0, 2542.0, 4224.0, 7150.0, 12628.0, 23002.0, 42090.0, 79174.0, 151165.0, 1287787.0, 216355.0, 122861.0, 64728.0, 34763.0, 18684.0, 10523.0, 6013.0, 3559.0, 2113.0, 1290.0, 842.0, 538.0, 342.0, 244.0, 137.0, 96.0, 45.0, 38.0, 34.0, 18.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.64990234375, -0.6301116943359375, -0.610321044921875, -0.5905303955078125, -0.57073974609375, -0.5509490966796875, -0.531158447265625, -0.5113677978515625, -0.4915771484375, -0.4717864990234375, -0.451995849609375, -0.4322052001953125, -0.41241455078125, -0.3926239013671875, -0.372833251953125, -0.3530426025390625, -0.333251953125, -0.3134613037109375, -0.293670654296875, -0.2738800048828125, -0.25408935546875, -0.2342987060546875, -0.214508056640625, -0.1947174072265625, -0.1749267578125, -0.1551361083984375, -0.135345458984375, -0.1155548095703125, -0.09576416015625, -0.0759735107421875, -0.056182861328125, -0.0363922119140625, -0.0166015625, 0.0031890869140625, 0.022979736328125, 0.0427703857421875, 0.06256103515625, 0.0823516845703125, 0.102142333984375, 0.1219329833984375, 0.1417236328125, 0.1615142822265625, 0.181304931640625, 0.2010955810546875, 0.22088623046875, 0.2406768798828125, 0.260467529296875, 0.2802581787109375, 0.300048828125, 0.3198394775390625, 0.339630126953125, 0.3594207763671875, 0.37921142578125, 0.3990020751953125, 0.418792724609375, 0.4385833740234375, 0.4583740234375, 0.4781646728515625, 0.497955322265625, 0.5177459716796875, 0.53753662109375, 0.5573272705078125, 0.577117919921875, 0.5969085693359375, 0.61669921875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 11.0, 12.0, 10.0, 11.0, 13.0, 25.0, 10.0, 22.0, 27.0, 30.0, 39.0, 42.0, 38.0, 39.0, 57.0, 56.0, 48.0, 58.0, 57.0, 46.0, 41.0, 50.0, 37.0, 32.0, 35.0, 27.0, 15.0, 24.0, 14.0, 8.0, 10.0, 10.0, 12.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.002185821533203125, -0.002126649022102356, -0.002067476511001587, -0.002008303999900818, -0.0019491314888000488, -0.0018899589776992798, -0.0018307864665985107, -0.0017716139554977417, -0.0017124414443969727, -0.0016532689332962036, -0.0015940964221954346, -0.0015349239110946655, -0.0014757513999938965, -0.0014165788888931274, -0.0013574063777923584, -0.0012982338666915894, -0.0012390613555908203, -0.0011798888444900513, -0.0011207163333892822, -0.0010615438222885132, -0.0010023713111877441, -0.0009431988000869751, -0.0008840262889862061, -0.000824853777885437, -0.000765681266784668, -0.0007065087556838989, -0.0006473362445831299, -0.0005881637334823608, -0.0005289912223815918, -0.00046981871128082275, -0.0004106462001800537, -0.00035147368907928467, -0.0002923011779785156, -0.00023312866687774658, -0.00017395615577697754, -0.0001147836446762085, -5.561113357543945e-05, 3.56137752532959e-06, 6.273388862609863e-05, 0.00012190639972686768, 0.00018107891082763672, 0.00024025142192840576, 0.0002994239330291748, 0.00035859644412994385, 0.0004177689552307129, 0.00047694146633148193, 0.000536113977432251, 0.00059528648853302, 0.0006544589996337891, 0.0007136315107345581, 0.0007728040218353271, 0.0008319765329360962, 0.0008911490440368652, 0.0009503215551376343, 0.0010094940662384033, 0.0010686665773391724, 0.0011278390884399414, 0.0011870115995407104, 0.0012461841106414795, 0.0013053566217422485, 0.0013645291328430176, 0.0014237016439437866, 0.0014828741550445557, 0.0015420466661453247, 0.0016012191772460938]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 3.0, 7.0, 11.0, 21.0, 22.0, 20.0, 29.0, 29.0, 42.0, 66.0, 58.0, 85.0, 127.0, 209.0, 439.0, 1140.0, 29294.0, 1001116.0, 13762.0, 937.0, 383.0, 175.0, 128.0, 99.0, 58.0, 52.0, 51.0, 39.0, 29.0, 22.0, 19.0, 10.0, 12.0, 12.0, 9.0, 10.0, 6.0, 4.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.034637451171875, -0.033374786376953125, -0.03211212158203125, -0.030849456787109375, -0.0295867919921875, -0.028324127197265625, -0.02706146240234375, -0.025798797607421875, -0.0245361328125, -0.023273468017578125, -0.02201080322265625, -0.020748138427734375, -0.0194854736328125, -0.018222808837890625, -0.01696014404296875, -0.015697479248046875, -0.014434814453125, -0.013172149658203125, -0.01190948486328125, -0.010646820068359375, -0.0093841552734375, -0.008121490478515625, -0.00685882568359375, -0.005596160888671875, -0.00433349609375, -0.003070831298828125, -0.00180816650390625, -0.000545501708984375, 0.0007171630859375, 0.001979827880859375, 0.00324249267578125, 0.004505157470703125, 0.005767822265625, 0.007030487060546875, 0.00829315185546875, 0.009555816650390625, 0.0108184814453125, 0.012081146240234375, 0.01334381103515625, 0.014606475830078125, 0.015869140625, 0.017131805419921875, 0.01839447021484375, 0.019657135009765625, 0.0209197998046875, 0.022182464599609375, 0.02344512939453125, 0.024707794189453125, 0.025970458984375, 0.027233123779296875, 0.02849578857421875, 0.029758453369140625, 0.0310211181640625, 0.032283782958984375, 0.03354644775390625, 0.034809112548828125, 0.03607177734375, 0.037334442138671875, 0.03859710693359375, 0.039859771728515625, 0.0411224365234375, 0.042385101318359375, 0.04364776611328125, 0.044910430908203125, 0.046173095703125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 35.0, 958.0, 23.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03621470928192139, -0.03551113232970238, -0.034807559102773666, -0.03410398215055466, -0.03340040519833565, -0.03269682824611664, -0.03199325501918793, -0.03128967806696892, -0.03058610111474991, -0.02988252602517605, -0.02917894907295704, -0.02847537398338318, -0.02777179703116417, -0.02706822194159031, -0.02636464685201645, -0.02566106989979744, -0.02495749481022358, -0.02425391972064972, -0.02355034276843071, -0.02284676767885685, -0.02214319072663784, -0.02143961563706398, -0.02073603868484497, -0.02003246359527111, -0.01932888850569725, -0.01862531341612339, -0.01792173646390438, -0.01721816137433052, -0.01651458442211151, -0.01581100933253765, -0.015107433311641216, -0.014403857290744781, -0.013700282201170921, -0.012996706180274487, -0.012293130159378052, -0.011589555069804192, -0.010885978117585182, -0.010182403028011322, -0.009478827007114887, -0.008775250986218452, -0.008071674965322018, -0.007368098944425583, -0.006664522923529148, -0.005960947368294001, -0.005257371347397566, -0.004553795326501131, -0.0038502197712659836, -0.003146643750369549, -0.002443067729473114, -0.001739491824992001, -0.001035915920510888, -0.00033234013244509697, 0.0003712358884513378, 0.0010748119093477726, 0.00177838746458292, 0.002481963485479355, 0.0031855395063757896, 0.0038891155272722244, 0.004592691548168659, 0.005296267103403807, 0.0059998431243002415, 0.006703419145196676, 0.007406994700431824, 0.008110570721328259, 0.008814146742224693]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 2.0, 6.0, 2.0, 9.0, 7.0, 9.0, 15.0, 15.0, 19.0, 29.0, 32.0, 30.0, 43.0, 48.0, 41.0, 58.0, 63.0, 61.0, 48.0, 51.0, 49.0, 50.0, 55.0, 50.0, 41.0, 38.0, 23.0, 28.0, 17.0, 12.0, 14.0, 14.0, 5.0, 6.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000955045223236084, -0.0009106993675231934, -0.0008663535118103027, -0.0008220076560974121, -0.0007776618003845215, -0.0007333159446716309, -0.0006889700889587402, -0.0006446242332458496, -0.000600278377532959, -0.0005559325218200684, -0.0005115866661071777, -0.0004672408103942871, -0.0004228949546813965, -0.00037854909896850586, -0.00033420324325561523, -0.0002898573875427246, -0.000245511531829834, -0.00020116567611694336, -0.00015681982040405273, -0.00011247396469116211, -6.812810897827148e-05, -2.378225326538086e-05, 2.0563602447509766e-05, 6.490945816040039e-05, 0.00010925531387329102, 0.00015360116958618164, 0.00019794702529907227, 0.0002422928810119629, 0.0002866387367248535, 0.00033098459243774414, 0.00037533044815063477, 0.0004196763038635254, 0.000464022159576416, 0.0005083680152893066, 0.0005527138710021973, 0.0005970597267150879, 0.0006414055824279785, 0.0006857514381408691, 0.0007300972938537598, 0.0007744431495666504, 0.000818789005279541, 0.0008631348609924316, 0.0009074807167053223, 0.0009518265724182129, 0.0009961724281311035, 0.0010405182838439941, 0.0010848641395568848, 0.0011292099952697754, 0.001173555850982666, 0.0012179017066955566, 0.0012622475624084473, 0.0013065934181213379, 0.0013509392738342285, 0.0013952851295471191, 0.0014396309852600098, 0.0014839768409729004, 0.001528322696685791, 0.0015726685523986816, 0.0016170144081115723, 0.0016613602638244629, 0.0017057061195373535, 0.0017500519752502441, 0.0017943978309631348, 0.0018387436866760254, 0.001883089542388916]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 2.0, 7.0, 10.0, 9.0, 13.0, 18.0, 15.0, 23.0, 20.0, 14.0, 29.0, 26.0, 37.0, 32.0, 24.0, 44.0, 43.0, 36.0, 43.0, 33.0, 52.0, 38.0, 47.0, 43.0, 42.0, 29.0, 32.0, 31.0, 31.0, 26.0, 14.0, 24.0, 19.0, 15.0, 16.0, 8.0, 14.0, 11.0, 8.0, 5.0, 2.0, 4.0, 1.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.703125, -5.54095458984375, -5.3787841796875, -5.21661376953125, -5.054443359375, -4.89227294921875, -4.7301025390625, -4.56793212890625, -4.40576171875, -4.24359130859375, -4.0814208984375, -3.91925048828125, -3.757080078125, -3.59490966796875, -3.4327392578125, -3.27056884765625, -3.1083984375, -2.94622802734375, -2.7840576171875, -2.62188720703125, -2.459716796875, -2.29754638671875, -2.1353759765625, -1.97320556640625, -1.81103515625, -1.64886474609375, -1.4866943359375, -1.32452392578125, -1.162353515625, -1.00018310546875, -0.8380126953125, -0.67584228515625, -0.513671875, -0.35150146484375, -0.1893310546875, -0.02716064453125, 0.135009765625, 0.29718017578125, 0.4593505859375, 0.62152099609375, 0.78369140625, 0.94586181640625, 1.1080322265625, 1.27020263671875, 1.432373046875, 1.59454345703125, 1.7567138671875, 1.91888427734375, 2.0810546875, 2.24322509765625, 2.4053955078125, 2.56756591796875, 2.729736328125, 2.89190673828125, 3.0540771484375, 3.21624755859375, 3.37841796875, 3.54058837890625, 3.7027587890625, 3.86492919921875, 4.027099609375, 4.18927001953125, 4.3514404296875, 4.51361083984375, 4.67578125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 3.0, 8.0, 10.0, 15.0, 33.0, 26.0, 28.0, 62.0, 81.0, 94.0, 150.0, 274.0, 387.0, 708.0, 1530.0, 3003.0, 7127.0, 20471.0, 72841.0, 304327.0, 470563.0, 118014.0, 30724.0, 9897.0, 4008.0, 1896.0, 901.0, 512.0, 290.0, 188.0, 109.0, 76.0, 49.0, 27.0, 25.0, 20.0, 20.0, 18.0, 11.0, 6.0, 4.0, 4.0, 1.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.50390625, -5.347412109375, -5.19091796875, -5.034423828125, -4.8779296875, -4.721435546875, -4.56494140625, -4.408447265625, -4.251953125, -4.095458984375, -3.93896484375, -3.782470703125, -3.6259765625, -3.469482421875, -3.31298828125, -3.156494140625, -3.0, -2.843505859375, -2.68701171875, -2.530517578125, -2.3740234375, -2.217529296875, -2.06103515625, -1.904541015625, -1.748046875, -1.591552734375, -1.43505859375, -1.278564453125, -1.1220703125, -0.965576171875, -0.80908203125, -0.652587890625, -0.49609375, -0.339599609375, -0.18310546875, -0.026611328125, 0.1298828125, 0.286376953125, 0.44287109375, 0.599365234375, 0.755859375, 0.912353515625, 1.06884765625, 1.225341796875, 1.3818359375, 1.538330078125, 1.69482421875, 1.851318359375, 2.0078125, 2.164306640625, 2.32080078125, 2.477294921875, 2.6337890625, 2.790283203125, 2.94677734375, 3.103271484375, 3.259765625, 3.416259765625, 3.57275390625, 3.729248046875, 3.8857421875, 4.042236328125, 4.19873046875, 4.355224609375, 4.51171875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 6.0, 7.0, 4.0, 8.0, 10.0, 5.0, 14.0, 17.0, 15.0, 22.0, 21.0, 25.0, 38.0, 33.0, 38.0, 51.0, 35.0, 49.0, 73.0, 154.0, 1685.0, 263.0, 75.0, 48.0, 45.0, 35.0, 37.0, 29.0, 21.0, 27.0, 41.0, 17.0, 16.0, 23.0, 9.0, 11.0, 11.0, 10.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.578125, -18.00927734375, -17.4404296875, -16.87158203125, -16.302734375, -15.73388671875, -15.1650390625, -14.59619140625, -14.02734375, -13.45849609375, -12.8896484375, -12.32080078125, -11.751953125, -11.18310546875, -10.6142578125, -10.04541015625, -9.4765625, -8.90771484375, -8.3388671875, -7.77001953125, -7.201171875, -6.63232421875, -6.0634765625, -5.49462890625, -4.92578125, -4.35693359375, -3.7880859375, -3.21923828125, -2.650390625, -2.08154296875, -1.5126953125, -0.94384765625, -0.375, 0.19384765625, 0.7626953125, 1.33154296875, 1.900390625, 2.46923828125, 3.0380859375, 3.60693359375, 4.17578125, 4.74462890625, 5.3134765625, 5.88232421875, 6.451171875, 7.02001953125, 7.5888671875, 8.15771484375, 8.7265625, 9.29541015625, 9.8642578125, 10.43310546875, 11.001953125, 11.57080078125, 12.1396484375, 12.70849609375, 13.27734375, 13.84619140625, 14.4150390625, 14.98388671875, 15.552734375, 16.12158203125, 16.6904296875, 17.25927734375, 17.828125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 3.0, 6.0, 9.0, 14.0, 21.0, 22.0, 35.0, 34.0, 74.0, 94.0, 120.0, 209.0, 304.0, 584.0, 2475.0, 2533494.0, 604698.0, 2002.0, 559.0, 299.0, 185.0, 140.0, 97.0, 52.0, 42.0, 32.0, 24.0, 20.0, 12.0, 8.0, 7.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.46875, -47.76025390625, -46.0517578125, -44.34326171875, -42.634765625, -40.92626953125, -39.2177734375, -37.50927734375, -35.80078125, -34.09228515625, -32.3837890625, -30.67529296875, -28.966796875, -27.25830078125, -25.5498046875, -23.84130859375, -22.1328125, -20.42431640625, -18.7158203125, -17.00732421875, -15.298828125, -13.59033203125, -11.8818359375, -10.17333984375, -8.46484375, -6.75634765625, -5.0478515625, -3.33935546875, -1.630859375, 0.07763671875, 1.7861328125, 3.49462890625, 5.203125, 6.91162109375, 8.6201171875, 10.32861328125, 12.037109375, 13.74560546875, 15.4541015625, 17.16259765625, 18.87109375, 20.57958984375, 22.2880859375, 23.99658203125, 25.705078125, 27.41357421875, 29.1220703125, 30.83056640625, 32.5390625, 34.24755859375, 35.9560546875, 37.66455078125, 39.373046875, 41.08154296875, 42.7900390625, 44.49853515625, 46.20703125, 47.91552734375, 49.6240234375, 51.33251953125, 53.041015625, 54.74951171875, 56.4580078125, 58.16650390625, 59.875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 3.0, 1004.0, 11.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.21566390991211, -16.800312042236328, -6.38496208190918, 4.030387878417969, 14.44573974609375, 24.86109161376953, 35.27643966674805, 45.69179153442383, 56.10714340209961, 66.52249145507812, 76.9378433227539, 87.35319519042969, 97.76854705810547, 108.18389892578125, 118.5992431640625, 129.0146026611328, 139.42994689941406, 149.8452911376953, 160.26065063476562, 170.67599487304688, 181.0913543701172, 191.50669860839844, 201.92205810546875, 212.33740234375, 222.7527618408203, 233.16810607910156, 243.58346557617188, 253.99880981445312, 264.4141540527344, 274.82952880859375, 285.244873046875, 295.66021728515625, 306.0755920410156, 316.4909362792969, 326.9062805175781, 337.3216552734375, 347.73699951171875, 358.15234375, 368.56768798828125, 378.9830322265625, 389.3984069824219, 399.8137512207031, 410.2290954589844, 420.64447021484375, 431.059814453125, 441.47515869140625, 451.8905029296875, 462.30584716796875, 472.72119140625, 483.13653564453125, 493.5518798828125, 503.9672546386719, 514.382568359375, 524.7979736328125, 535.2133178710938, 545.628662109375, 556.0440063476562, 566.4593505859375, 576.8746948242188, 587.2900390625, 597.7053833007812, 608.1207885742188, 618.5361328125, 628.9514770507812, 639.3668212890625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 4.0, 7.0, 5.0, 6.0, 4.0, 8.0, 17.0, 16.0, 27.0, 21.0, 28.0, 17.0, 28.0, 36.0, 37.0, 45.0, 32.0, 37.0, 37.0, 44.0, 40.0, 42.0, 36.0, 41.0, 46.0, 43.0, 29.0, 35.0, 29.0, 24.0, 29.0, 29.0, 21.0, 18.0, 14.0, 17.0, 6.0, 7.0, 13.0, 9.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.68431854248047, -48.079673767089844, -46.475032806396484, -44.87038803100586, -43.2657470703125, -41.661102294921875, -40.05645751953125, -38.45181655883789, -36.847171783447266, -35.24252700805664, -33.63788604736328, -32.033241271972656, -30.428598403930664, -28.823955535888672, -27.21931266784668, -25.614669799804688, -24.010026931762695, -22.405384063720703, -20.80074119567871, -19.19609832763672, -17.591453552246094, -15.986810684204102, -14.38216781616211, -12.7775239944458, -11.172881126403809, -9.568238258361816, -7.963594436645508, -6.358951568603516, -4.754308223724365, -3.149664878845215, -1.5450220108032227, 0.05962181091308594, 1.6642646789550781, 3.2689080238342285, 4.873551368713379, 6.478194236755371, 8.08283805847168, 9.687480926513672, 11.292123794555664, 12.896767616271973, 14.501410484313965, 16.106054306030273, 17.710697174072266, 19.315340042114258, 20.91998291015625, 22.524627685546875, 24.129268646240234, 25.73391342163086, 27.33855628967285, 28.943199157714844, 30.547842025756836, 32.15248489379883, 33.75712966918945, 35.36177062988281, 36.96641540527344, 38.57106018066406, 40.17570114135742, 41.78034591674805, 43.384986877441406, 44.98963165283203, 46.59427261352539, 48.198917388916016, 49.803558349609375, 51.408203125, 53.012847900390625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 9.0, 5.0, 5.0, 5.0, 13.0, 8.0, 16.0, 24.0, 22.0, 10.0, 26.0, 20.0, 23.0, 33.0, 37.0, 33.0, 43.0, 43.0, 36.0, 38.0, 45.0, 40.0, 50.0, 47.0, 29.0, 35.0, 41.0, 34.0, 28.0, 26.0, 21.0, 18.0, 23.0, 19.0, 22.0, 10.0, 18.0, 12.0, 10.0, 2.0, 8.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.5234375, -5.3568115234375, -5.190185546875, -5.0235595703125, -4.85693359375, -4.6903076171875, -4.523681640625, -4.3570556640625, -4.1904296875, -4.0238037109375, -3.857177734375, -3.6905517578125, -3.52392578125, -3.3572998046875, -3.190673828125, -3.0240478515625, -2.857421875, -2.6907958984375, -2.524169921875, -2.3575439453125, -2.19091796875, -2.0242919921875, -1.857666015625, -1.6910400390625, -1.5244140625, -1.3577880859375, -1.191162109375, -1.0245361328125, -0.85791015625, -0.6912841796875, -0.524658203125, -0.3580322265625, -0.19140625, -0.0247802734375, 0.141845703125, 0.3084716796875, 0.47509765625, 0.6417236328125, 0.808349609375, 0.9749755859375, 1.1416015625, 1.3082275390625, 1.474853515625, 1.6414794921875, 1.80810546875, 1.9747314453125, 2.141357421875, 2.3079833984375, 2.474609375, 2.6412353515625, 2.807861328125, 2.9744873046875, 3.14111328125, 3.3077392578125, 3.474365234375, 3.6409912109375, 3.8076171875, 3.9742431640625, 4.140869140625, 4.3074951171875, 4.47412109375, 4.6407470703125, 4.807373046875, 4.9739990234375, 5.140625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 4.0, 5.0, 14.0, 8.0, 19.0, 19.0, 22.0, 25.0, 22.0, 35.0, 43.0, 46.0, 58.0, 81.0, 101.0, 158.0, 237.0, 443.0, 1048.0, 3939.0, 21826.0, 259746.0, 2247692.0, 1522723.0, 118231.0, 12930.0, 2739.0, 878.0, 354.0, 197.0, 129.0, 95.0, 73.0, 59.0, 43.0, 46.0, 24.0, 39.0, 31.0, 23.0, 16.0, 10.0, 10.0, 6.0, 8.0, 7.0, 1.0, 6.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0], "bins": [-12.7265625, -12.3271484375, -11.927734375, -11.5283203125, -11.12890625, -10.7294921875, -10.330078125, -9.9306640625, -9.53125, -9.1318359375, -8.732421875, -8.3330078125, -7.93359375, -7.5341796875, -7.134765625, -6.7353515625, -6.3359375, -5.9365234375, -5.537109375, -5.1376953125, -4.73828125, -4.3388671875, -3.939453125, -3.5400390625, -3.140625, -2.7412109375, -2.341796875, -1.9423828125, -1.54296875, -1.1435546875, -0.744140625, -0.3447265625, 0.0546875, 0.4541015625, 0.853515625, 1.2529296875, 1.65234375, 2.0517578125, 2.451171875, 2.8505859375, 3.25, 3.6494140625, 4.048828125, 4.4482421875, 4.84765625, 5.2470703125, 5.646484375, 6.0458984375, 6.4453125, 6.8447265625, 7.244140625, 7.6435546875, 8.04296875, 8.4423828125, 8.841796875, 9.2412109375, 9.640625, 10.0400390625, 10.439453125, 10.8388671875, 11.23828125, 11.6376953125, 12.037109375, 12.4365234375, 12.8359375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 8.0, 12.0, 12.0, 23.0, 31.0, 34.0, 51.0, 53.0, 96.0, 126.0, 178.0, 247.0, 345.0, 449.0, 495.0, 438.0, 393.0, 313.0, 177.0, 154.0, 134.0, 57.0, 69.0, 46.0, 30.0, 24.0, 20.0, 13.0, 7.0, 10.0, 7.0, 9.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.231689453125, -7.88525390625, -7.538818359375, -7.1923828125, -6.845947265625, -6.49951171875, -6.153076171875, -5.806640625, -5.460205078125, -5.11376953125, -4.767333984375, -4.4208984375, -4.074462890625, -3.72802734375, -3.381591796875, -3.03515625, -2.688720703125, -2.34228515625, -1.995849609375, -1.6494140625, -1.302978515625, -0.95654296875, -0.610107421875, -0.263671875, 0.082763671875, 0.42919921875, 0.775634765625, 1.1220703125, 1.468505859375, 1.81494140625, 2.161376953125, 2.5078125, 2.854248046875, 3.20068359375, 3.547119140625, 3.8935546875, 4.239990234375, 4.58642578125, 4.932861328125, 5.279296875, 5.625732421875, 5.97216796875, 6.318603515625, 6.6650390625, 7.011474609375, 7.35791015625, 7.704345703125, 8.05078125, 8.397216796875, 8.74365234375, 9.090087890625, 9.4365234375, 9.782958984375, 10.12939453125, 10.475830078125, 10.822265625, 11.168701171875, 11.51513671875, 11.861572265625, 12.2080078125, 12.554443359375, 12.90087890625, 13.247314453125, 13.59375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 6.0, 14.0, 13.0, 18.0, 17.0, 25.0, 36.0, 44.0, 61.0, 93.0, 114.0, 149.0, 199.0, 244.0, 342.0, 596.0, 6030.0, 3808409.0, 374606.0, 1519.0, 496.0, 333.0, 209.0, 163.0, 156.0, 82.0, 81.0, 46.0, 57.0, 30.0, 22.0, 26.0, 18.0, 11.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-61.71875, -60.0419921875, -58.365234375, -56.6884765625, -55.01171875, -53.3349609375, -51.658203125, -49.9814453125, -48.3046875, -46.6279296875, -44.951171875, -43.2744140625, -41.59765625, -39.9208984375, -38.244140625, -36.5673828125, -34.890625, -33.2138671875, -31.537109375, -29.8603515625, -28.18359375, -26.5068359375, -24.830078125, -23.1533203125, -21.4765625, -19.7998046875, -18.123046875, -16.4462890625, -14.76953125, -13.0927734375, -11.416015625, -9.7392578125, -8.0625, -6.3857421875, -4.708984375, -3.0322265625, -1.35546875, 0.3212890625, 1.998046875, 3.6748046875, 5.3515625, 7.0283203125, 8.705078125, 10.3818359375, 12.05859375, 13.7353515625, 15.412109375, 17.0888671875, 18.765625, 20.4423828125, 22.119140625, 23.7958984375, 25.47265625, 27.1494140625, 28.826171875, 30.5029296875, 32.1796875, 33.8564453125, 35.533203125, 37.2099609375, 38.88671875, 40.5634765625, 42.240234375, 43.9169921875, 45.59375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 19.0, 125.0, 527.0, 316.0, 30.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.33722686767578, -102.78571319580078, -96.23420715332031, -89.68269348144531, -83.13117980957031, -76.57967376708984, -70.02816009521484, -63.47665023803711, -56.925140380859375, -50.37363052368164, -43.822120666503906, -37.270606994628906, -30.719097137451172, -24.167587280273438, -17.616073608398438, -11.064563751220703, -4.513053894042969, 2.038456916809082, 8.589967727661133, 15.1414794921875, 21.692989349365234, 28.24449920654297, 34.79601287841797, 41.3475227355957, 47.89903259277344, 54.45054244995117, 61.002052307128906, 67.5535659790039, 74.10507202148438, 80.65658569335938, 87.20809936523438, 93.75961303710938, 100.31112670898438, 106.86264038085938, 113.41414642333984, 119.96566009521484, 126.51716613769531, 133.0686798095703, 139.6201934814453, 146.1717071533203, 152.72320556640625, 159.27471923828125, 165.82623291015625, 172.37774658203125, 178.9292449951172, 185.4807586669922, 192.0322723388672, 198.5837860107422, 205.1352996826172, 211.6868133544922, 218.2383270263672, 224.78982543945312, 231.34133911132812, 237.89285278320312, 244.44436645507812, 250.99588012695312, 257.5473937988281, 264.0989074707031, 270.6504211425781, 277.2019348144531, 283.7534484863281, 290.304931640625, 296.8564453125, 303.407958984375, 309.95947265625]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 2.0, 6.0, 11.0, 6.0, 16.0, 9.0, 13.0, 26.0, 14.0, 21.0, 24.0, 22.0, 23.0, 24.0, 34.0, 27.0, 39.0, 36.0, 36.0, 52.0, 56.0, 46.0, 38.0, 35.0, 45.0, 35.0, 38.0, 36.0, 24.0, 20.0, 30.0, 28.0, 25.0, 15.0, 12.0, 17.0, 14.0, 11.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-37.34490966796875, -36.23625946044922, -35.12760925292969, -34.018959045410156, -32.910308837890625, -31.80165672302246, -30.693004608154297, -29.584354400634766, -28.475704193115234, -27.367053985595703, -26.258403778076172, -25.149751663208008, -24.041101455688477, -22.932451248168945, -21.82379913330078, -20.71514892578125, -19.60649871826172, -18.497848510742188, -17.389198303222656, -16.280546188354492, -15.171895980834961, -14.06324577331543, -12.954594612121582, -11.845943450927734, -10.737293243408203, -9.628643035888672, -8.519991874694824, -7.411341190338135, -6.302690505981445, -5.194039821624756, -4.085389137268066, -2.976738452911377, -1.8680877685546875, -0.759437084197998, 0.3492136001586914, 1.4578642845153809, 2.5665149688720703, 3.6751656532287598, 4.783816337585449, 5.892467021942139, 7.001117706298828, 8.10976791381836, 9.218419075012207, 10.327070236206055, 11.435720443725586, 12.544370651245117, 13.653021812438965, 14.761672973632812, 15.870323181152344, 16.978973388671875, 18.087623596191406, 19.19627571105957, 20.3049259185791, 21.413576126098633, 22.522228240966797, 23.630878448486328, 24.73952865600586, 25.84817886352539, 26.956829071044922, 28.065481185913086, 29.174131393432617, 30.28278160095215, 31.391433715820312, 32.500083923339844, 33.608734130859375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 10.0, 6.0, 12.0, 22.0, 10.0, 15.0, 21.0, 25.0, 23.0, 18.0, 26.0, 32.0, 23.0, 29.0, 30.0, 32.0, 42.0, 40.0, 38.0, 34.0, 31.0, 43.0, 43.0, 40.0, 27.0, 16.0, 32.0, 41.0, 18.0, 26.0, 27.0, 26.0, 18.0, 15.0, 16.0, 13.0, 10.0, 9.0, 10.0, 13.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.671875, -4.526611328125, -4.38134765625, -4.236083984375, -4.0908203125, -3.945556640625, -3.80029296875, -3.655029296875, -3.509765625, -3.364501953125, -3.21923828125, -3.073974609375, -2.9287109375, -2.783447265625, -2.63818359375, -2.492919921875, -2.34765625, -2.202392578125, -2.05712890625, -1.911865234375, -1.7666015625, -1.621337890625, -1.47607421875, -1.330810546875, -1.185546875, -1.040283203125, -0.89501953125, -0.749755859375, -0.6044921875, -0.459228515625, -0.31396484375, -0.168701171875, -0.0234375, 0.121826171875, 0.26708984375, 0.412353515625, 0.5576171875, 0.702880859375, 0.84814453125, 0.993408203125, 1.138671875, 1.283935546875, 1.42919921875, 1.574462890625, 1.7197265625, 1.864990234375, 2.01025390625, 2.155517578125, 2.30078125, 2.446044921875, 2.59130859375, 2.736572265625, 2.8818359375, 3.027099609375, 3.17236328125, 3.317626953125, 3.462890625, 3.608154296875, 3.75341796875, 3.898681640625, 4.0439453125, 4.189208984375, 4.33447265625, 4.479736328125, 4.625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 4.0, 12.0, 17.0, 29.0, 40.0, 54.0, 86.0, 122.0, 194.0, 265.0, 437.0, 562.0, 895.0, 1354.0, 2100.0, 2997.0, 4568.0, 6866.0, 10777.0, 16516.0, 26236.0, 42613.0, 73164.0, 129326.0, 210061.0, 207301.0, 126241.0, 70735.0, 41969.0, 25780.0, 16534.0, 10366.0, 6884.0, 4438.0, 2972.0, 2016.0, 1304.0, 897.0, 586.0, 423.0, 266.0, 167.0, 129.0, 82.0, 63.0, 37.0, 25.0, 14.0, 13.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.68115234375, -0.6591644287109375, -0.637176513671875, -0.6151885986328125, -0.59320068359375, -0.5712127685546875, -0.549224853515625, -0.5272369384765625, -0.5052490234375, -0.4832611083984375, -0.461273193359375, -0.4392852783203125, -0.41729736328125, -0.3953094482421875, -0.373321533203125, -0.3513336181640625, -0.329345703125, -0.3073577880859375, -0.285369873046875, -0.2633819580078125, -0.24139404296875, -0.2194061279296875, -0.197418212890625, -0.1754302978515625, -0.1534423828125, -0.1314544677734375, -0.109466552734375, -0.0874786376953125, -0.06549072265625, -0.0435028076171875, -0.021514892578125, 0.0004730224609375, 0.0224609375, 0.0444488525390625, 0.066436767578125, 0.0884246826171875, 0.11041259765625, 0.1324005126953125, 0.154388427734375, 0.1763763427734375, 0.1983642578125, 0.2203521728515625, 0.242340087890625, 0.2643280029296875, 0.28631591796875, 0.3083038330078125, 0.330291748046875, 0.3522796630859375, 0.374267578125, 0.3962554931640625, 0.418243408203125, 0.4402313232421875, 0.46221923828125, 0.4842071533203125, 0.506195068359375, 0.5281829833984375, 0.5501708984375, 0.5721588134765625, 0.594146728515625, 0.6161346435546875, 0.63812255859375, 0.6601104736328125, 0.682098388671875, 0.7040863037109375, 0.72607421875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 3.0, 4.0, 11.0, 11.0, 3.0, 12.0, 8.0, 16.0, 17.0, 25.0, 24.0, 27.0, 41.0, 24.0, 34.0, 37.0, 51.0, 35.0, 51.0, 38.0, 47.0, 1066.0, 45.0, 36.0, 46.0, 42.0, 30.0, 29.0, 29.0, 29.0, 19.0, 19.0, 24.0, 17.0, 19.0, 11.0, 10.0, 7.0, 2.0, 7.0, 6.0, 8.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.198974609375, -3.08544921875, -2.971923828125, -2.8583984375, -2.744873046875, -2.63134765625, -2.517822265625, -2.404296875, -2.290771484375, -2.17724609375, -2.063720703125, -1.9501953125, -1.836669921875, -1.72314453125, -1.609619140625, -1.49609375, -1.382568359375, -1.26904296875, -1.155517578125, -1.0419921875, -0.928466796875, -0.81494140625, -0.701416015625, -0.587890625, -0.474365234375, -0.36083984375, -0.247314453125, -0.1337890625, -0.020263671875, 0.09326171875, 0.206787109375, 0.3203125, 0.433837890625, 0.54736328125, 0.660888671875, 0.7744140625, 0.887939453125, 1.00146484375, 1.114990234375, 1.228515625, 1.342041015625, 1.45556640625, 1.569091796875, 1.6826171875, 1.796142578125, 1.90966796875, 2.023193359375, 2.13671875, 2.250244140625, 2.36376953125, 2.477294921875, 2.5908203125, 2.704345703125, 2.81787109375, 2.931396484375, 3.044921875, 3.158447265625, 3.27197265625, 3.385498046875, 3.4990234375, 3.612548828125, 3.72607421875, 3.839599609375, 3.953125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 14.0, 24.0, 26.0, 36.0, 49.0, 85.0, 146.0, 221.0, 298.0, 519.0, 837.0, 1309.0, 2011.0, 3260.0, 5034.0, 8227.0, 13573.0, 21872.0, 36436.0, 60063.0, 101874.0, 166994.0, 1259746.0, 163842.0, 99929.0, 59143.0, 35438.0, 21571.0, 12990.0, 7913.0, 4995.0, 3178.0, 1939.0, 1259.0, 765.0, 537.0, 345.0, 233.0, 127.0, 97.0, 57.0, 39.0, 25.0, 15.0, 14.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.5380859375, -0.52099609375, -0.50390625, -0.48681640625, -0.4697265625, -0.45263671875, -0.435546875, -0.41845703125, -0.4013671875, -0.38427734375, -0.3671875, -0.35009765625, -0.3330078125, -0.31591796875, -0.298828125, -0.28173828125, -0.2646484375, -0.24755859375, -0.23046875, -0.21337890625, -0.1962890625, -0.17919921875, -0.162109375, -0.14501953125, -0.1279296875, -0.11083984375, -0.09375, -0.07666015625, -0.0595703125, -0.04248046875, -0.025390625, -0.00830078125, 0.0087890625, 0.02587890625, 0.04296875, 0.06005859375, 0.0771484375, 0.09423828125, 0.111328125, 0.12841796875, 0.1455078125, 0.16259765625, 0.1796875, 0.19677734375, 0.2138671875, 0.23095703125, 0.248046875, 0.26513671875, 0.2822265625, 0.29931640625, 0.31640625, 0.33349609375, 0.3505859375, 0.36767578125, 0.384765625, 0.40185546875, 0.4189453125, 0.43603515625, 0.453125, 0.47021484375, 0.4873046875, 0.50439453125, 0.521484375, 0.53857421875, 0.5556640625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 2.0, 10.0, 11.0, 16.0, 28.0, 31.0, 51.0, 61.0, 68.0, 74.0, 115.0, 118.0, 94.0, 81.0, 62.0, 52.0, 42.0, 26.0, 17.0, 11.0, 8.0, 5.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.00383758544921875, -0.0037343502044677734, -0.003631114959716797, -0.0035278797149658203, -0.0034246444702148438, -0.003321409225463867, -0.0032181739807128906, -0.003114938735961914, -0.0030117034912109375, -0.002908468246459961, -0.0028052330017089844, -0.002701997756958008, -0.0025987625122070312, -0.0024955272674560547, -0.002392292022705078, -0.0022890567779541016, -0.002185821533203125, -0.0020825862884521484, -0.001979351043701172, -0.0018761157989501953, -0.0017728805541992188, -0.0016696453094482422, -0.0015664100646972656, -0.001463174819946289, -0.0013599395751953125, -0.001256704330444336, -0.0011534690856933594, -0.0010502338409423828, -0.0009469985961914062, -0.0008437633514404297, -0.0007405281066894531, -0.0006372928619384766, -0.0005340576171875, -0.00043082237243652344, -0.0003275871276855469, -0.0002243518829345703, -0.00012111663818359375, -1.7881393432617188e-05, 8.535385131835938e-05, 0.00018858909606933594, 0.0002918243408203125, 0.00039505958557128906, 0.0004982948303222656, 0.0006015300750732422, 0.0007047653198242188, 0.0008080005645751953, 0.0009112358093261719, 0.0010144710540771484, 0.001117706298828125, 0.0012209415435791016, 0.0013241767883300781, 0.0014274120330810547, 0.0015306472778320312, 0.0016338825225830078, 0.0017371177673339844, 0.001840353012084961, 0.0019435882568359375, 0.002046823501586914, 0.0021500587463378906, 0.002253293991088867, 0.0023565292358398438, 0.0024597644805908203, 0.002562999725341797, 0.0026662349700927734, 0.00276947021484375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 13.0, 10.0, 18.0, 28.0, 26.0, 27.0, 79.0, 88.0, 105.0, 237.0, 747.0, 131584.0, 913597.0, 1223.0, 260.0, 166.0, 102.0, 51.0, 36.0, 39.0, 34.0, 16.0, 10.0, 12.0, 10.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053619384765625, -0.05156564712524414, -0.04951190948486328, -0.04745817184448242, -0.04540443420410156, -0.0433506965637207, -0.041296958923339844, -0.039243221282958984, -0.037189483642578125, -0.035135746002197266, -0.033082008361816406, -0.031028270721435547, -0.028974533081054688, -0.026920795440673828, -0.02486705780029297, -0.02281332015991211, -0.02075958251953125, -0.01870584487915039, -0.01665210723876953, -0.014598369598388672, -0.012544631958007812, -0.010490894317626953, -0.008437156677246094, -0.006383419036865234, -0.004329681396484375, -0.0022759437561035156, -0.00022220611572265625, 0.0018315315246582031, 0.0038852691650390625, 0.005939006805419922, 0.007992744445800781, 0.01004648208618164, 0.0121002197265625, 0.01415395736694336, 0.01620769500732422, 0.018261432647705078, 0.020315170288085938, 0.022368907928466797, 0.024422645568847656, 0.026476383209228516, 0.028530120849609375, 0.030583858489990234, 0.032637596130371094, 0.03469133377075195, 0.03674507141113281, 0.03879880905151367, 0.04085254669189453, 0.04290628433227539, 0.04496002197265625, 0.04701375961303711, 0.04906749725341797, 0.05112123489379883, 0.05317497253417969, 0.05522871017456055, 0.057282447814941406, 0.059336185455322266, 0.061389923095703125, 0.06344366073608398, 0.06549739837646484, 0.0675511360168457, 0.06960487365722656, 0.07165861129760742, 0.07371234893798828, 0.07576608657836914, 0.07781982421875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 17.0, 76.0, 247.0, 429.0, 196.0, 38.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020997445099055767, -0.001942525035701692, -0.0017853055614978075, -0.001628085970878601, -0.0014708664966747165, -0.0013136470224708319, -0.0011564274318516254, -0.0009992079576477408, -0.0008419884834438562, -0.0006847690092399716, -0.0005275494768284261, -0.00037032997352071106, -0.000213110470212996, -5.5890996009111404e-05, 0.00010132853640243411, 0.0002585480688139796, 0.00041576754301786423, 0.0005729870172217488, 0.0007302065496332943, 0.0008874260820448399, 0.0010446455562487245, 0.001201865030452609, 0.0013590846210718155, 0.0015163040952757, 0.0016735235694795847, 0.0018307430436834693, 0.001987962517887354, 0.0021451821085065603, 0.0023024016991257668, 0.0024596210569143295, 0.002616840647533536, 0.0027740602381527424, 0.002931279130280018, 0.0030884987208992243, 0.003245718078687787, 0.0034029376693069935, 0.0035601570270955563, 0.0037173766177147627, 0.003874596208333969, 0.004031815566122532, 0.004189034923911095, 0.0043462542816996574, 0.0045034741051495075, 0.00466069346293807, 0.004817912820726633, 0.004975132644176483, 0.005132352001965046, 0.005289571359753609, 0.005446791183203459, 0.0056040105409920216, 0.005761230364441872, 0.005918449722230434, 0.006075669080018997, 0.00623288843780756, 0.00639010826125741, 0.006547327619045973, 0.006704547442495823, 0.006861766800284386, 0.007018986623734236, 0.0071762059815227985, 0.007333425339311361, 0.007490645162761211, 0.007647864520549774, 0.007805083878338337, 0.0079623032361269]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 9.0, 5.0, 4.0, 3.0, 3.0, 7.0, 8.0, 8.0, 18.0, 13.0, 15.0, 25.0, 26.0, 28.0, 26.0, 27.0, 34.0, 35.0, 34.0, 41.0, 40.0, 38.0, 58.0, 36.0, 37.0, 61.0, 46.0, 27.0, 49.0, 34.0, 32.0, 32.0, 25.0, 21.0, 19.0, 14.0, 15.0, 6.0, 10.0, 7.0, 3.0, 7.0, 3.0, 8.0, 12.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0012882351875305176, -0.0012522926554083824, -0.0012163501232862473, -0.001180407591164112, -0.001144465059041977, -0.0011085225269198418, -0.0010725799947977066, -0.0010366374626755714, -0.0010006949305534363, -0.0009647523984313011, -0.000928809866309166, -0.0008928673341870308, -0.0008569248020648956, -0.0008209822699427605, -0.0007850397378206253, -0.0007490972056984901, -0.000713154673576355, -0.0006772121414542198, -0.0006412696093320847, -0.0006053270772099495, -0.0005693845450878143, -0.0005334420129656792, -0.000497499480843544, -0.00046155694872140884, -0.0004256144165992737, -0.0003896718844771385, -0.00035372935235500336, -0.0003177868202328682, -0.00028184428811073303, -0.00024590175598859787, -0.0002099592238664627, -0.00017401669174432755, -0.00013807415962219238, -0.00010213162750005722, -6.618909537792206e-05, -3.0246563255786896e-05, 5.695968866348267e-06, 4.163850098848343e-05, 7.758103311061859e-05, 0.00011352356523275375, 0.00014946609735488892, 0.00018540862947702408, 0.00022135116159915924, 0.0002572936937212944, 0.00029323622584342957, 0.00032917875796556473, 0.0003651212900876999, 0.00040106382220983505, 0.0004370063543319702, 0.0004729488864541054, 0.0005088914185762405, 0.0005448339506983757, 0.0005807764828205109, 0.000616719014942646, 0.0006526615470647812, 0.0006886040791869164, 0.0007245466113090515, 0.0007604891434311867, 0.0007964316755533218, 0.000832374207675457, 0.0008683167397975922, 0.0009042592719197273, 0.0009402018040418625, 0.0009761443361639977, 0.0010120868682861328]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 5.0, 9.0, 6.0, 12.0, 22.0, 10.0, 15.0, 21.0, 25.0, 23.0, 18.0, 27.0, 31.0, 23.0, 29.0, 30.0, 32.0, 42.0, 40.0, 38.0, 34.0, 31.0, 43.0, 43.0, 40.0, 27.0, 16.0, 32.0, 41.0, 18.0, 26.0, 27.0, 26.0, 18.0, 15.0, 16.0, 13.0, 10.0, 9.0, 10.0, 13.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.671875, -4.526611328125, -4.38134765625, -4.236083984375, -4.0908203125, -3.945556640625, -3.80029296875, -3.655029296875, -3.509765625, -3.364501953125, -3.21923828125, -3.073974609375, -2.9287109375, -2.783447265625, -2.63818359375, -2.492919921875, -2.34765625, -2.202392578125, -2.05712890625, -1.911865234375, -1.7666015625, -1.621337890625, -1.47607421875, -1.330810546875, -1.185546875, -1.040283203125, -0.89501953125, -0.749755859375, -0.6044921875, -0.459228515625, -0.31396484375, -0.168701171875, -0.0234375, 0.121826171875, 0.26708984375, 0.412353515625, 0.5576171875, 0.702880859375, 0.84814453125, 0.993408203125, 1.138671875, 1.283935546875, 1.42919921875, 1.574462890625, 1.7197265625, 1.864990234375, 2.01025390625, 2.155517578125, 2.30078125, 2.446044921875, 2.59130859375, 2.736572265625, 2.8818359375, 3.027099609375, 3.17236328125, 3.317626953125, 3.462890625, 3.608154296875, 3.75341796875, 3.898681640625, 4.0439453125, 4.189208984375, 4.33447265625, 4.479736328125, 4.625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 2.0, 3.0, 0.0, 5.0, 6.0, 10.0, 10.0, 12.0, 19.0, 24.0, 30.0, 43.0, 76.0, 118.0, 234.0, 391.0, 717.0, 1266.0, 2344.0, 4497.0, 8878.0, 17892.0, 39031.0, 91389.0, 229988.0, 372269.0, 158668.0, 64371.0, 28452.0, 13532.0, 6610.0, 3503.0, 1777.0, 996.0, 532.0, 342.0, 191.0, 110.0, 64.0, 48.0, 23.0, 20.0, 17.0, 9.0, 6.0, 7.0, 7.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0], "bins": [-3.458984375, -3.351898193359375, -3.24481201171875, -3.137725830078125, -3.0306396484375, -2.923553466796875, -2.81646728515625, -2.709381103515625, -2.602294921875, -2.495208740234375, -2.38812255859375, -2.281036376953125, -2.1739501953125, -2.066864013671875, -1.95977783203125, -1.852691650390625, -1.74560546875, -1.638519287109375, -1.53143310546875, -1.424346923828125, -1.3172607421875, -1.210174560546875, -1.10308837890625, -0.996002197265625, -0.888916015625, -0.781829833984375, -0.67474365234375, -0.567657470703125, -0.4605712890625, -0.353485107421875, -0.24639892578125, -0.139312744140625, -0.0322265625, 0.074859619140625, 0.18194580078125, 0.289031982421875, 0.3961181640625, 0.503204345703125, 0.61029052734375, 0.717376708984375, 0.824462890625, 0.931549072265625, 1.03863525390625, 1.145721435546875, 1.2528076171875, 1.359893798828125, 1.46697998046875, 1.574066162109375, 1.68115234375, 1.788238525390625, 1.89532470703125, 2.002410888671875, 2.1094970703125, 2.216583251953125, 2.32366943359375, 2.430755615234375, 2.537841796875, 2.644927978515625, 2.75201416015625, 2.859100341796875, 2.9661865234375, 3.073272705078125, 3.18035888671875, 3.287445068359375, 3.39453125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 8.0, 13.0, 3.0, 27.0, 19.0, 14.0, 13.0, 23.0, 35.0, 26.0, 38.0, 46.0, 50.0, 51.0, 87.0, 164.0, 1587.0, 300.0, 92.0, 59.0, 64.0, 49.0, 45.0, 25.0, 33.0, 26.0, 23.0, 31.0, 21.0, 12.0, 10.0, 7.0, 7.0, 7.0, 3.0, 4.0, 6.0, 5.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.984375, -17.417236328125, -16.85009765625, -16.282958984375, -15.7158203125, -15.148681640625, -14.58154296875, -14.014404296875, -13.447265625, -12.880126953125, -12.31298828125, -11.745849609375, -11.1787109375, -10.611572265625, -10.04443359375, -9.477294921875, -8.91015625, -8.343017578125, -7.77587890625, -7.208740234375, -6.6416015625, -6.074462890625, -5.50732421875, -4.940185546875, -4.373046875, -3.805908203125, -3.23876953125, -2.671630859375, -2.1044921875, -1.537353515625, -0.97021484375, -0.403076171875, 0.1640625, 0.731201171875, 1.29833984375, 1.865478515625, 2.4326171875, 2.999755859375, 3.56689453125, 4.134033203125, 4.701171875, 5.268310546875, 5.83544921875, 6.402587890625, 6.9697265625, 7.536865234375, 8.10400390625, 8.671142578125, 9.23828125, 9.805419921875, 10.37255859375, 10.939697265625, 11.5068359375, 12.073974609375, 12.64111328125, 13.208251953125, 13.775390625, 14.342529296875, 14.90966796875, 15.476806640625, 16.0439453125, 16.611083984375, 17.17822265625, 17.745361328125, 18.3125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 0.0, 4.0, 6.0, 6.0, 6.0, 6.0, 9.0, 9.0, 11.0, 19.0, 29.0, 37.0, 48.0, 58.0, 64.0, 72.0, 123.0, 148.0, 237.0, 341.0, 680.0, 3343.0, 2052661.0, 1082959.0, 3023.0, 625.0, 326.0, 233.0, 139.0, 131.0, 99.0, 56.0, 40.0, 22.0, 23.0, 33.0, 21.0, 8.0, 21.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.21875, -42.8779296875, -41.537109375, -40.1962890625, -38.85546875, -37.5146484375, -36.173828125, -34.8330078125, -33.4921875, -32.1513671875, -30.810546875, -29.4697265625, -28.12890625, -26.7880859375, -25.447265625, -24.1064453125, -22.765625, -21.4248046875, -20.083984375, -18.7431640625, -17.40234375, -16.0615234375, -14.720703125, -13.3798828125, -12.0390625, -10.6982421875, -9.357421875, -8.0166015625, -6.67578125, -5.3349609375, -3.994140625, -2.6533203125, -1.3125, 0.0283203125, 1.369140625, 2.7099609375, 4.05078125, 5.3916015625, 6.732421875, 8.0732421875, 9.4140625, 10.7548828125, 12.095703125, 13.4365234375, 14.77734375, 16.1181640625, 17.458984375, 18.7998046875, 20.140625, 21.4814453125, 22.822265625, 24.1630859375, 25.50390625, 26.8447265625, 28.185546875, 29.5263671875, 30.8671875, 32.2080078125, 33.548828125, 34.8896484375, 36.23046875, 37.5712890625, 38.912109375, 40.2529296875, 41.59375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 139.0, 506.0, 322.0, 38.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.318716049194336, -15.096857070922852, -12.874998092651367, -10.653138160705566, -8.431279182434082, -6.209420204162598, -3.987560272216797, -1.7657012939453125, 0.4561576843261719, 2.6780169010162354, 4.899876117706299, 7.121735572814941, 9.343594551086426, 11.56545352935791, 13.787313461303711, 16.009172439575195, 18.23103141784668, 20.452890396118164, 22.67474937438965, 24.896610260009766, 27.11846923828125, 29.340328216552734, 31.56218719482422, 33.7840461730957, 36.00590515136719, 38.22776412963867, 40.449623107910156, 42.67148208618164, 44.893341064453125, 47.11520004272461, 49.337059020996094, 51.558921813964844, 53.78077697753906, 56.00263595581055, 58.22449493408203, 60.446353912353516, 62.668212890625, 64.89007568359375, 67.11193084716797, 69.33379364013672, 71.55564880371094, 73.77751159667969, 75.9993667602539, 78.22122955322266, 80.44308471679688, 82.66494750976562, 84.88680267333984, 87.1086654663086, 89.33052062988281, 91.55238342285156, 93.77423858642578, 95.99610137939453, 98.21795654296875, 100.4398193359375, 102.66167449951172, 104.88353729248047, 107.10540008544922, 109.32726287841797, 111.54911804199219, 113.77098083496094, 115.99283599853516, 118.2146987915039, 120.43655395507812, 122.65841674804688, 124.8802719116211]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 6.0, 8.0, 6.0, 8.0, 12.0, 9.0, 12.0, 10.0, 22.0, 25.0, 33.0, 26.0, 33.0, 20.0, 24.0, 36.0, 35.0, 42.0, 38.0, 32.0, 35.0, 26.0, 30.0, 39.0, 32.0, 43.0, 38.0, 29.0, 28.0, 21.0, 23.0, 23.0, 31.0, 10.0, 20.0, 21.0, 18.0, 14.0, 15.0, 14.0, 11.0, 6.0, 7.0, 6.0, 3.0, 3.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-38.85610580444336, -37.63048553466797, -36.40486145019531, -35.17924118041992, -33.95362091064453, -32.72800064086914, -31.502378463745117, -30.276756286621094, -29.051136016845703, -27.825515747070312, -26.59989356994629, -25.374271392822266, -24.148651123046875, -22.923030853271484, -21.69740867614746, -20.471786499023438, -19.246166229248047, -18.020545959472656, -16.794923782348633, -15.569302558898926, -14.343681335449219, -13.118060111999512, -11.892438888549805, -10.666817665100098, -9.44119644165039, -8.215575218200684, -6.989953994750977, -5.7643327713012695, -4.5387115478515625, -3.3130903244018555, -2.0874691009521484, -0.8618478775024414, 0.36377716064453125, 1.5893983840942383, 2.8150196075439453, 4.040640830993652, 5.266262054443359, 6.491883277893066, 7.717504501342773, 8.94312572479248, 10.168746948242188, 11.394368171691895, 12.619989395141602, 13.845610618591309, 15.071231842041016, 16.296852111816406, 17.52247428894043, 18.748096466064453, 19.973716735839844, 21.199337005615234, 22.424959182739258, 23.65058135986328, 24.876201629638672, 26.101821899414062, 27.327444076538086, 28.55306625366211, 29.7786865234375, 31.00430679321289, 32.22992706298828, 33.45555114746094, 34.68117141723633, 35.90679168701172, 37.132415771484375, 38.358036041259766, 39.583656311035156]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 4.0, 9.0, 14.0, 10.0, 9.0, 14.0, 14.0, 19.0, 35.0, 23.0, 28.0, 19.0, 25.0, 33.0, 38.0, 41.0, 24.0, 37.0, 33.0, 40.0, 46.0, 34.0, 44.0, 31.0, 34.0, 24.0, 24.0, 37.0, 25.0, 34.0, 14.0, 29.0, 24.0, 24.0, 12.0, 10.0, 8.0, 17.0, 11.0, 14.0, 8.0, 4.0, 5.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.8828125, -4.72821044921875, -4.5736083984375, -4.41900634765625, -4.264404296875, -4.10980224609375, -3.9552001953125, -3.80059814453125, -3.64599609375, -3.49139404296875, -3.3367919921875, -3.18218994140625, -3.027587890625, -2.87298583984375, -2.7183837890625, -2.56378173828125, -2.4091796875, -2.25457763671875, -2.0999755859375, -1.94537353515625, -1.790771484375, -1.63616943359375, -1.4815673828125, -1.32696533203125, -1.17236328125, -1.01776123046875, -0.8631591796875, -0.70855712890625, -0.553955078125, -0.39935302734375, -0.2447509765625, -0.09014892578125, 0.064453125, 0.21905517578125, 0.3736572265625, 0.52825927734375, 0.682861328125, 0.83746337890625, 0.9920654296875, 1.14666748046875, 1.30126953125, 1.45587158203125, 1.6104736328125, 1.76507568359375, 1.919677734375, 2.07427978515625, 2.2288818359375, 2.38348388671875, 2.5380859375, 2.69268798828125, 2.8472900390625, 3.00189208984375, 3.156494140625, 3.31109619140625, 3.4656982421875, 3.62030029296875, 3.77490234375, 3.92950439453125, 4.0841064453125, 4.23870849609375, 4.393310546875, 4.54791259765625, 4.7025146484375, 4.85711669921875, 5.01171875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 7.0, 7.0, 9.0, 12.0, 13.0, 12.0, 11.0, 19.0, 22.0, 26.0, 31.0, 38.0, 46.0, 61.0, 133.0, 294.0, 543.0, 1902.0, 9547.0, 128996.0, 2484533.0, 1501858.0, 57332.0, 6230.0, 1378.0, 510.0, 260.0, 120.0, 61.0, 43.0, 36.0, 27.0, 14.0, 25.0, 18.0, 17.0, 12.0, 17.0, 14.0, 6.0, 7.0, 9.0, 6.0, 5.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.9453125, -15.4288330078125, -14.912353515625, -14.3958740234375, -13.87939453125, -13.3629150390625, -12.846435546875, -12.3299560546875, -11.8134765625, -11.2969970703125, -10.780517578125, -10.2640380859375, -9.74755859375, -9.2310791015625, -8.714599609375, -8.1981201171875, -7.681640625, -7.1651611328125, -6.648681640625, -6.1322021484375, -5.61572265625, -5.0992431640625, -4.582763671875, -4.0662841796875, -3.5498046875, -3.0333251953125, -2.516845703125, -2.0003662109375, -1.48388671875, -0.9674072265625, -0.450927734375, 0.0655517578125, 0.58203125, 1.0985107421875, 1.614990234375, 2.1314697265625, 2.64794921875, 3.1644287109375, 3.680908203125, 4.1973876953125, 4.7138671875, 5.2303466796875, 5.746826171875, 6.2633056640625, 6.77978515625, 7.2962646484375, 7.812744140625, 8.3292236328125, 8.845703125, 9.3621826171875, 9.878662109375, 10.3951416015625, 10.91162109375, 11.4281005859375, 11.944580078125, 12.4610595703125, 12.9775390625, 13.4940185546875, 14.010498046875, 14.5269775390625, 15.04345703125, 15.5599365234375, 16.076416015625, 16.5928955078125, 17.109375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 7.0, 13.0, 18.0, 17.0, 37.0, 51.0, 65.0, 100.0, 164.0, 212.0, 342.0, 447.0, 616.0, 559.0, 434.0, 298.0, 206.0, 158.0, 111.0, 55.0, 56.0, 31.0, 26.0, 16.0, 10.0, 8.0, 4.0, 1.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.5234375, -15.1141357421875, -14.704833984375, -14.2955322265625, -13.88623046875, -13.4769287109375, -13.067626953125, -12.6583251953125, -12.2490234375, -11.8397216796875, -11.430419921875, -11.0211181640625, -10.61181640625, -10.2025146484375, -9.793212890625, -9.3839111328125, -8.974609375, -8.5653076171875, -8.156005859375, -7.7467041015625, -7.33740234375, -6.9281005859375, -6.518798828125, -6.1094970703125, -5.7001953125, -5.2908935546875, -4.881591796875, -4.4722900390625, -4.06298828125, -3.6536865234375, -3.244384765625, -2.8350830078125, -2.42578125, -2.0164794921875, -1.607177734375, -1.1978759765625, -0.78857421875, -0.3792724609375, 0.030029296875, 0.4393310546875, 0.8486328125, 1.2579345703125, 1.667236328125, 2.0765380859375, 2.48583984375, 2.8951416015625, 3.304443359375, 3.7137451171875, 4.123046875, 4.5323486328125, 4.941650390625, 5.3509521484375, 5.76025390625, 6.1695556640625, 6.578857421875, 6.9881591796875, 7.3974609375, 7.8067626953125, 8.216064453125, 8.6253662109375, 9.03466796875, 9.4439697265625, 9.853271484375, 10.2625732421875, 10.671875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 11.0, 7.0, 17.0, 24.0, 36.0, 56.0, 76.0, 102.0, 166.0, 241.0, 325.0, 473.0, 1738.0, 2380961.0, 1806839.0, 1692.0, 495.0, 279.0, 225.0, 151.0, 122.0, 84.0, 52.0, 36.0, 28.0, 22.0, 13.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.875, -64.716796875, -62.55859375, -60.400390625, -58.2421875, -56.083984375, -53.92578125, -51.767578125, -49.609375, -47.451171875, -45.29296875, -43.134765625, -40.9765625, -38.818359375, -36.66015625, -34.501953125, -32.34375, -30.185546875, -28.02734375, -25.869140625, -23.7109375, -21.552734375, -19.39453125, -17.236328125, -15.078125, -12.919921875, -10.76171875, -8.603515625, -6.4453125, -4.287109375, -2.12890625, 0.029296875, 2.1875, 4.345703125, 6.50390625, 8.662109375, 10.8203125, 12.978515625, 15.13671875, 17.294921875, 19.453125, 21.611328125, 23.76953125, 25.927734375, 28.0859375, 30.244140625, 32.40234375, 34.560546875, 36.71875, 38.876953125, 41.03515625, 43.193359375, 45.3515625, 47.509765625, 49.66796875, 51.826171875, 53.984375, 56.142578125, 58.30078125, 60.458984375, 62.6171875, 64.775390625, 66.93359375, 69.091796875, 71.25]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 15.0, 150.0, 313.0, 374.0, 133.0, 27.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.8953399658203, -167.4841766357422, -163.072998046875, -158.66183471679688, -154.2506561279297, -149.83949279785156, -145.42831420898438, -141.01715087890625, -136.60598754882812, -132.19482421875, -127.78364562988281, -123.37247467041016, -118.9613037109375, -114.55014038085938, -110.13896942138672, -105.72779846191406, -101.31661987304688, -96.90544891357422, -92.49427795410156, -88.0831069946289, -83.67193603515625, -79.26077270507812, -74.84960174560547, -70.43843078613281, -66.02725982666016, -61.6160888671875, -57.204917907714844, -52.79375076293945, -48.3825798034668, -43.97140884399414, -39.56024169921875, -35.149070739746094, -30.737884521484375, -26.32671356201172, -21.915544509887695, -17.504375457763672, -13.093204498291016, -8.68203353881836, -4.270864486694336, 0.1403045654296875, 4.551475524902344, 8.962645530700684, 13.373815536499023, 17.784984588623047, 22.196155548095703, 26.60732650756836, 31.018495559692383, 35.429664611816406, 39.84083557128906, 44.25200653076172, 48.663177490234375, 53.074344635009766, 57.48551559448242, 61.89668655395508, 66.30785369873047, 70.71902465820312, 75.13019561767578, 79.54136657714844, 83.9525375366211, 88.36370849609375, 92.77487182617188, 97.18605041503906, 101.59721374511719, 106.00838470458984, 110.4195556640625]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 9.0, 3.0, 2.0, 8.0, 7.0, 14.0, 15.0, 14.0, 16.0, 20.0, 21.0, 24.0, 13.0, 21.0, 31.0, 33.0, 24.0, 34.0, 27.0, 25.0, 33.0, 39.0, 50.0, 46.0, 44.0, 37.0, 28.0, 42.0, 37.0, 30.0, 26.0, 27.0, 26.0, 17.0, 17.0, 19.0, 26.0, 17.0, 13.0, 15.0, 8.0, 15.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-32.211605072021484, -31.25213050842285, -30.29265785217285, -29.33318328857422, -28.373708724975586, -27.414234161376953, -26.454761505126953, -25.49528694152832, -24.535812377929688, -23.576337814331055, -22.616865158081055, -21.657390594482422, -20.69791603088379, -19.738441467285156, -18.778968811035156, -17.819494247436523, -16.86001968383789, -15.900546073913574, -14.941071510314941, -13.981597900390625, -13.022123336791992, -12.062649726867676, -11.10317611694336, -10.143701553344727, -9.184228897094727, -8.22475528717041, -7.265280723571777, -6.305807113647461, -5.346332550048828, -4.386858940124512, -3.427384853363037, -2.4679107666015625, -1.5084362030029297, -0.5489621758460999, 0.41051185131073, 1.369985818862915, 2.3294599056243896, 3.288933753967285, 4.24840784072876, 5.207881927490234, 6.167356014251709, 7.126830101013184, 8.0863037109375, 9.045778274536133, 10.00525188446045, 10.964725494384766, 11.924200057983398, 12.883674621582031, 13.843148231506348, 14.802621841430664, 15.762096405029297, 16.72157096862793, 17.68104362487793, 18.640518188476562, 19.599992752075195, 20.559467315673828, 21.518939971923828, 22.47841453552246, 23.43788719177246, 24.397361755371094, 25.356836318969727, 26.31631088256836, 27.27578353881836, 28.235258102416992, 29.194732666015625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 9.0, 5.0, 11.0, 11.0, 7.0, 9.0, 15.0, 20.0, 21.0, 27.0, 26.0, 19.0, 33.0, 35.0, 30.0, 26.0, 37.0, 40.0, 36.0, 45.0, 42.0, 36.0, 39.0, 42.0, 40.0, 38.0, 19.0, 35.0, 30.0, 28.0, 33.0, 22.0, 18.0, 17.0, 15.0, 19.0, 9.0, 10.0, 10.0, 12.0, 5.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.08984375, -4.93060302734375, -4.7713623046875, -4.61212158203125, -4.452880859375, -4.29364013671875, -4.1343994140625, -3.97515869140625, -3.81591796875, -3.65667724609375, -3.4974365234375, -3.33819580078125, -3.178955078125, -3.01971435546875, -2.8604736328125, -2.70123291015625, -2.5419921875, -2.38275146484375, -2.2235107421875, -2.06427001953125, -1.905029296875, -1.74578857421875, -1.5865478515625, -1.42730712890625, -1.26806640625, -1.10882568359375, -0.9495849609375, -0.79034423828125, -0.631103515625, -0.47186279296875, -0.3126220703125, -0.15338134765625, 0.005859375, 0.16510009765625, 0.3243408203125, 0.48358154296875, 0.642822265625, 0.80206298828125, 0.9613037109375, 1.12054443359375, 1.27978515625, 1.43902587890625, 1.5982666015625, 1.75750732421875, 1.916748046875, 2.07598876953125, 2.2352294921875, 2.39447021484375, 2.5537109375, 2.71295166015625, 2.8721923828125, 3.03143310546875, 3.190673828125, 3.34991455078125, 3.5091552734375, 3.66839599609375, 3.82763671875, 3.98687744140625, 4.1461181640625, 4.30535888671875, 4.464599609375, 4.62384033203125, 4.7830810546875, 4.94232177734375, 5.1015625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 7.0, 7.0, 6.0, 10.0, 30.0, 31.0, 66.0, 78.0, 125.0, 168.0, 226.0, 348.0, 507.0, 659.0, 953.0, 1333.0, 1930.0, 2742.0, 4001.0, 5730.0, 8002.0, 11863.0, 18048.0, 27550.0, 43047.0, 67855.0, 109272.0, 166491.0, 188395.0, 140193.0, 88111.0, 55328.0, 34726.0, 22698.0, 15370.0, 9985.0, 6825.0, 4697.0, 3250.0, 2343.0, 1644.0, 1180.0, 825.0, 583.0, 408.0, 294.0, 185.0, 159.0, 82.0, 62.0, 65.0, 24.0, 14.0, 14.0, 10.0, 4.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.6044921875, -0.5857620239257812, -0.5670318603515625, -0.5483016967773438, -0.529571533203125, -0.5108413696289062, -0.4921112060546875, -0.47338104248046875, -0.45465087890625, -0.43592071533203125, -0.4171905517578125, -0.39846038818359375, -0.379730224609375, -0.36100006103515625, -0.3422698974609375, -0.32353973388671875, -0.3048095703125, -0.28607940673828125, -0.2673492431640625, -0.24861907958984375, -0.229888916015625, -0.21115875244140625, -0.1924285888671875, -0.17369842529296875, -0.15496826171875, -0.13623809814453125, -0.1175079345703125, -0.09877777099609375, -0.080047607421875, -0.06131744384765625, -0.0425872802734375, -0.02385711669921875, -0.005126953125, 0.01360321044921875, 0.0323333740234375, 0.05106353759765625, 0.069793701171875, 0.08852386474609375, 0.1072540283203125, 0.12598419189453125, 0.14471435546875, 0.16344451904296875, 0.1821746826171875, 0.20090484619140625, 0.219635009765625, 0.23836517333984375, 0.2570953369140625, 0.27582550048828125, 0.2945556640625, 0.31328582763671875, 0.3320159912109375, 0.35074615478515625, 0.369476318359375, 0.38820648193359375, 0.4069366455078125, 0.42566680908203125, 0.44439697265625, 0.46312713623046875, 0.4818572998046875, 0.5005874633789062, 0.519317626953125, 0.5380477905273438, 0.5567779541015625, 0.5755081176757812, 0.59423828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 5.0, 9.0, 10.0, 9.0, 18.0, 19.0, 23.0, 22.0, 20.0, 26.0, 27.0, 31.0, 41.0, 36.0, 49.0, 41.0, 45.0, 48.0, 1077.0, 32.0, 44.0, 42.0, 30.0, 31.0, 38.0, 27.0, 27.0, 34.0, 21.0, 23.0, 21.0, 12.0, 17.0, 19.0, 7.0, 12.0, 8.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.267578125, -3.155242919921875, -3.04290771484375, -2.930572509765625, -2.8182373046875, -2.705902099609375, -2.59356689453125, -2.481231689453125, -2.368896484375, -2.256561279296875, -2.14422607421875, -2.031890869140625, -1.9195556640625, -1.807220458984375, -1.69488525390625, -1.582550048828125, -1.47021484375, -1.357879638671875, -1.24554443359375, -1.133209228515625, -1.0208740234375, -0.908538818359375, -0.79620361328125, -0.683868408203125, -0.571533203125, -0.459197998046875, -0.34686279296875, -0.234527587890625, -0.1221923828125, -0.009857177734375, 0.10247802734375, 0.214813232421875, 0.3271484375, 0.439483642578125, 0.55181884765625, 0.664154052734375, 0.7764892578125, 0.888824462890625, 1.00115966796875, 1.113494873046875, 1.225830078125, 1.338165283203125, 1.45050048828125, 1.562835693359375, 1.6751708984375, 1.787506103515625, 1.89984130859375, 2.012176513671875, 2.12451171875, 2.236846923828125, 2.34918212890625, 2.461517333984375, 2.5738525390625, 2.686187744140625, 2.79852294921875, 2.910858154296875, 3.023193359375, 3.135528564453125, 3.24786376953125, 3.360198974609375, 3.4725341796875, 3.584869384765625, 3.69720458984375, 3.809539794921875, 3.921875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 8.0, 16.0, 13.0, 23.0, 36.0, 62.0, 98.0, 119.0, 184.0, 320.0, 473.0, 819.0, 1387.0, 2196.0, 3568.0, 5995.0, 10509.0, 17943.0, 31681.0, 56319.0, 102264.0, 182842.0, 1287907.0, 172185.0, 95889.0, 52859.0, 30062.0, 16790.0, 9908.0, 5733.0, 3442.0, 2028.0, 1228.0, 782.0, 520.0, 316.0, 211.0, 127.0, 83.0, 56.0, 31.0, 44.0, 16.0, 12.0, 6.0, 9.0, 0.0, 1.0, 5.0, 0.0, 1.0], "bins": [-0.6884765625, -0.6690521240234375, -0.649627685546875, -0.6302032470703125, -0.61077880859375, -0.5913543701171875, -0.571929931640625, -0.5525054931640625, -0.5330810546875, -0.5136566162109375, -0.494232177734375, -0.4748077392578125, -0.45538330078125, -0.4359588623046875, -0.416534423828125, -0.3971099853515625, -0.377685546875, -0.3582611083984375, -0.338836669921875, -0.3194122314453125, -0.29998779296875, -0.2805633544921875, -0.261138916015625, -0.2417144775390625, -0.2222900390625, -0.2028656005859375, -0.183441162109375, -0.1640167236328125, -0.14459228515625, -0.1251678466796875, -0.105743408203125, -0.0863189697265625, -0.06689453125, -0.0474700927734375, -0.028045654296875, -0.0086212158203125, 0.01080322265625, 0.0302276611328125, 0.049652099609375, 0.0690765380859375, 0.0885009765625, 0.1079254150390625, 0.127349853515625, 0.1467742919921875, 0.16619873046875, 0.1856231689453125, 0.205047607421875, 0.2244720458984375, 0.243896484375, 0.2633209228515625, 0.282745361328125, 0.3021697998046875, 0.32159423828125, 0.3410186767578125, 0.360443115234375, 0.3798675537109375, 0.3992919921875, 0.4187164306640625, 0.438140869140625, 0.4575653076171875, 0.47698974609375, 0.4964141845703125, 0.515838623046875, 0.5352630615234375, 0.5546875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 7.0, 10.0, 9.0, 12.0, 11.0, 12.0, 17.0, 33.0, 33.0, 32.0, 52.0, 32.0, 38.0, 59.0, 60.0, 60.0, 65.0, 71.0, 57.0, 55.0, 36.0, 45.0, 35.0, 29.0, 29.0, 22.0, 12.0, 12.0, 13.0, 10.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00212860107421875, -0.0020547211170196533, -0.0019808411598205566, -0.00190696120262146, -0.0018330812454223633, -0.0017592012882232666, -0.00168532133102417, -0.0016114413738250732, -0.0015375614166259766, -0.0014636814594268799, -0.0013898015022277832, -0.0013159215450286865, -0.0012420415878295898, -0.0011681616306304932, -0.0010942816734313965, -0.0010204017162322998, -0.0009465217590332031, -0.0008726418018341064, -0.0007987618446350098, -0.0007248818874359131, -0.0006510019302368164, -0.0005771219730377197, -0.000503242015838623, -0.00042936205863952637, -0.0003554821014404297, -0.000281602144241333, -0.00020772218704223633, -0.00013384222984313965, -5.996227264404297e-05, 1.3917684555053711e-05, 8.779764175415039e-05, 0.00016167759895324707, 0.00023555755615234375, 0.00030943751335144043, 0.0003833174705505371, 0.0004571974277496338, 0.0005310773849487305, 0.0006049573421478271, 0.0006788372993469238, 0.0007527172565460205, 0.0008265972137451172, 0.0009004771709442139, 0.0009743571281433105, 0.0010482370853424072, 0.001122117042541504, 0.0011959969997406006, 0.0012698769569396973, 0.001343756914138794, 0.0014176368713378906, 0.0014915168285369873, 0.001565396785736084, 0.0016392767429351807, 0.0017131567001342773, 0.001787036657333374, 0.0018609166145324707, 0.0019347965717315674, 0.002008676528930664, 0.0020825564861297607, 0.0021564364433288574, 0.002230316400527954, 0.0023041963577270508, 0.0023780763149261475, 0.002451956272125244, 0.002525836229324341, 0.0025997161865234375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 8.0, 8.0, 13.0, 15.0, 23.0, 21.0, 22.0, 29.0, 46.0, 62.0, 84.0, 102.0, 127.0, 261.0, 478.0, 2157.0, 951446.0, 91648.0, 1013.0, 332.0, 170.0, 108.0, 79.0, 64.0, 65.0, 40.0, 25.0, 23.0, 16.0, 13.0, 17.0, 8.0, 5.0, 1.0, 4.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.05810546875, -0.056527137756347656, -0.05494880676269531, -0.05337047576904297, -0.051792144775390625, -0.05021381378173828, -0.04863548278808594, -0.047057151794433594, -0.04547882080078125, -0.043900489807128906, -0.04232215881347656, -0.04074382781982422, -0.039165496826171875, -0.03758716583251953, -0.03600883483886719, -0.034430503845214844, -0.0328521728515625, -0.031273841857910156, -0.029695510864257812, -0.02811717987060547, -0.026538848876953125, -0.02496051788330078, -0.023382186889648438, -0.021803855895996094, -0.02022552490234375, -0.018647193908691406, -0.017068862915039062, -0.015490531921386719, -0.013912200927734375, -0.012333869934082031, -0.010755538940429688, -0.009177207946777344, -0.007598876953125, -0.006020545959472656, -0.0044422149658203125, -0.0028638839721679688, -0.001285552978515625, 0.00029277801513671875, 0.0018711090087890625, 0.0034494400024414062, 0.00502777099609375, 0.006606101989746094, 0.008184432983398438, 0.009762763977050781, 0.011341094970703125, 0.012919425964355469, 0.014497756958007812, 0.016076087951660156, 0.0176544189453125, 0.019232749938964844, 0.020811080932617188, 0.02238941192626953, 0.023967742919921875, 0.02554607391357422, 0.027124404907226562, 0.028702735900878906, 0.03028106689453125, 0.031859397888183594, 0.03343772888183594, 0.03501605987548828, 0.036594390869140625, 0.03817272186279297, 0.03975105285644531, 0.041329383850097656, 0.04290771484375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 65.0, 936.0, 18.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0337277427315712, -0.033129896968603134, -0.03253204748034477, -0.03193420171737671, -0.031336355954408646, -0.030738508328795433, -0.03014066256582737, -0.029542814940214157, -0.028944969177246094, -0.02834712155163288, -0.027749275788664818, -0.027151428163051605, -0.026553582400083542, -0.02595573477447033, -0.025357889011502266, -0.024760041385889053, -0.02416219376027584, -0.023564346134662628, -0.022966500371694565, -0.022368652746081352, -0.02177080698311329, -0.021172959357500076, -0.020575113594532013, -0.0199772659689188, -0.019379418343305588, -0.018781570717692375, -0.018183724954724312, -0.0175858773291111, -0.016988031566143036, -0.016390183940529823, -0.01579233817756176, -0.015194490551948547, -0.014596642926335335, -0.013998796232044697, -0.013400949537754059, -0.012803102843463421, -0.012205256149172783, -0.01160740852355957, -0.011009561829268932, -0.010411715134978294, -0.009813869372010231, -0.009216022677719593, -0.008618175983428955, -0.008020329289138317, -0.007422482129186392, -0.006824635434895754, -0.006226788274943829, -0.005628941580653191, -0.005031094420701265, -0.004433247726410627, -0.0038354007992893457, -0.003237553872168064, -0.002639707177877426, -0.002041860483586788, -0.0014440135564655066, -0.0008461666293442249, -0.00024831993505358696, 0.00034952687565237284, 0.0009473736863583326, 0.0015452204970642924, 0.0021430673077702522, 0.00274091400206089, 0.003338760929182172, 0.0039366078563034534, 0.004534454550594091]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 6.0, 12.0, 7.0, 14.0, 24.0, 11.0, 23.0, 37.0, 36.0, 38.0, 33.0, 46.0, 52.0, 54.0, 46.0, 43.0, 47.0, 51.0, 46.0, 46.0, 56.0, 42.0, 32.0, 23.0, 32.0, 30.0, 18.0, 20.0, 19.0, 14.0, 10.0, 10.0, 6.0, 5.0, 8.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012114644050598145, -0.001164414919912815, -0.0011173654347658157, -0.0010703159496188164, -0.001023266464471817, -0.0009762169793248177, -0.0009291674941778183, -0.0008821180090308189, -0.0008350685238838196, -0.0007880190387368202, -0.0007409695535898209, -0.0006939200684428215, -0.0006468705832958221, -0.0005998210981488228, -0.0005527716130018234, -0.0005057221278548241, -0.0004586726427078247, -0.00041162315756082535, -0.000364573672413826, -0.00031752418726682663, -0.00027047470211982727, -0.0002234252169728279, -0.00017637573182582855, -0.0001293262466788292, -8.227676153182983e-05, -3.5227276384830475e-05, 1.1822208762168884e-05, 5.8871693909168243e-05, 0.0001059211790561676, 0.00015297066420316696, 0.00020002014935016632, 0.0002470696344971657, 0.00029411911964416504, 0.0003411686047911644, 0.00038821808993816376, 0.0004352675750851631, 0.0004823170602321625, 0.0005293665453791618, 0.0005764160305261612, 0.0006234655156731606, 0.0006705150008201599, 0.0007175644859671593, 0.0007646139711141586, 0.000811663456261158, 0.0008587129414081573, 0.0009057624265551567, 0.0009528119117021561, 0.0009998613968491554, 0.0010469108819961548, 0.0010939603671431541, 0.0011410098522901535, 0.0011880593374371529, 0.0012351088225841522, 0.0012821583077311516, 0.001329207792878151, 0.0013762572780251503, 0.0014233067631721497, 0.001470356248319149, 0.0015174057334661484, 0.0015644552186131477, 0.001611504703760147, 0.0016585541889071465, 0.0017056036740541458, 0.0017526531592011452, 0.0017997026443481445]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 9.0, 5.0, 11.0, 11.0, 7.0, 9.0, 15.0, 20.0, 21.0, 27.0, 26.0, 19.0, 33.0, 35.0, 30.0, 26.0, 37.0, 41.0, 35.0, 45.0, 42.0, 36.0, 39.0, 42.0, 41.0, 37.0, 19.0, 35.0, 30.0, 28.0, 33.0, 22.0, 18.0, 17.0, 15.0, 19.0, 9.0, 10.0, 10.0, 12.0, 5.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.08984375, -4.93060302734375, -4.7713623046875, -4.61212158203125, -4.452880859375, -4.29364013671875, -4.1343994140625, -3.97515869140625, -3.81591796875, -3.65667724609375, -3.4974365234375, -3.33819580078125, -3.178955078125, -3.01971435546875, -2.8604736328125, -2.70123291015625, -2.5419921875, -2.38275146484375, -2.2235107421875, -2.06427001953125, -1.905029296875, -1.74578857421875, -1.5865478515625, -1.42730712890625, -1.26806640625, -1.10882568359375, -0.9495849609375, -0.79034423828125, -0.631103515625, -0.47186279296875, -0.3126220703125, -0.15338134765625, 0.005859375, 0.16510009765625, 0.3243408203125, 0.48358154296875, 0.642822265625, 0.80206298828125, 0.9613037109375, 1.12054443359375, 1.27978515625, 1.43902587890625, 1.5982666015625, 1.75750732421875, 1.916748046875, 2.07598876953125, 2.2352294921875, 2.39447021484375, 2.5537109375, 2.71295166015625, 2.8721923828125, 3.03143310546875, 3.190673828125, 3.34991455078125, 3.5091552734375, 3.66839599609375, 3.82763671875, 3.98687744140625, 4.1461181640625, 4.30535888671875, 4.464599609375, 4.62384033203125, 4.7830810546875, 4.94232177734375, 5.1015625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 9.0, 8.0, 15.0, 19.0, 39.0, 33.0, 39.0, 43.0, 69.0, 90.0, 149.0, 205.0, 293.0, 543.0, 1281.0, 2963.0, 7343.0, 20230.0, 56617.0, 170653.0, 474360.0, 206738.0, 67361.0, 24017.0, 8846.0, 3436.0, 1432.0, 676.0, 327.0, 186.0, 130.0, 80.0, 67.0, 53.0, 39.0, 42.0, 33.0, 17.0, 14.0, 13.0, 9.0, 4.0, 7.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.144287109375, -4.97607421875, -4.807861328125, -4.6396484375, -4.471435546875, -4.30322265625, -4.135009765625, -3.966796875, -3.798583984375, -3.63037109375, -3.462158203125, -3.2939453125, -3.125732421875, -2.95751953125, -2.789306640625, -2.62109375, -2.452880859375, -2.28466796875, -2.116455078125, -1.9482421875, -1.780029296875, -1.61181640625, -1.443603515625, -1.275390625, -1.107177734375, -0.93896484375, -0.770751953125, -0.6025390625, -0.434326171875, -0.26611328125, -0.097900390625, 0.0703125, 0.238525390625, 0.40673828125, 0.574951171875, 0.7431640625, 0.911376953125, 1.07958984375, 1.247802734375, 1.416015625, 1.584228515625, 1.75244140625, 1.920654296875, 2.0888671875, 2.257080078125, 2.42529296875, 2.593505859375, 2.76171875, 2.929931640625, 3.09814453125, 3.266357421875, 3.4345703125, 3.602783203125, 3.77099609375, 3.939208984375, 4.107421875, 4.275634765625, 4.44384765625, 4.612060546875, 4.7802734375, 4.948486328125, 5.11669921875, 5.284912109375, 5.453125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 9.0, 12.0, 13.0, 17.0, 19.0, 24.0, 23.0, 31.0, 28.0, 40.0, 33.0, 44.0, 54.0, 54.0, 69.0, 282.0, 1711.0, 136.0, 59.0, 53.0, 41.0, 41.0, 40.0, 33.0, 32.0, 22.0, 24.0, 16.0, 23.0, 13.0, 12.0, 10.0, 4.0, 5.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.765625, -18.201416015625, -17.63720703125, -17.072998046875, -16.5087890625, -15.944580078125, -15.38037109375, -14.816162109375, -14.251953125, -13.687744140625, -13.12353515625, -12.559326171875, -11.9951171875, -11.430908203125, -10.86669921875, -10.302490234375, -9.73828125, -9.174072265625, -8.60986328125, -8.045654296875, -7.4814453125, -6.917236328125, -6.35302734375, -5.788818359375, -5.224609375, -4.660400390625, -4.09619140625, -3.531982421875, -2.9677734375, -2.403564453125, -1.83935546875, -1.275146484375, -0.7109375, -0.146728515625, 0.41748046875, 0.981689453125, 1.5458984375, 2.110107421875, 2.67431640625, 3.238525390625, 3.802734375, 4.366943359375, 4.93115234375, 5.495361328125, 6.0595703125, 6.623779296875, 7.18798828125, 7.752197265625, 8.31640625, 8.880615234375, 9.44482421875, 10.009033203125, 10.5732421875, 11.137451171875, 11.70166015625, 12.265869140625, 12.830078125, 13.394287109375, 13.95849609375, 14.522705078125, 15.0869140625, 15.651123046875, 16.21533203125, 16.779541015625, 17.34375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 11.0, 13.0, 20.0, 25.0, 35.0, 52.0, 51.0, 74.0, 96.0, 163.0, 233.0, 397.0, 901.0, 6749.0, 3099277.0, 34907.0, 1262.0, 529.0, 279.0, 166.0, 117.0, 87.0, 60.0, 50.0, 36.0, 30.0, 16.0, 21.0, 11.0, 10.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.0625, -40.541015625, -39.01953125, -37.498046875, -35.9765625, -34.455078125, -32.93359375, -31.412109375, -29.890625, -28.369140625, -26.84765625, -25.326171875, -23.8046875, -22.283203125, -20.76171875, -19.240234375, -17.71875, -16.197265625, -14.67578125, -13.154296875, -11.6328125, -10.111328125, -8.58984375, -7.068359375, -5.546875, -4.025390625, -2.50390625, -0.982421875, 0.5390625, 2.060546875, 3.58203125, 5.103515625, 6.625, 8.146484375, 9.66796875, 11.189453125, 12.7109375, 14.232421875, 15.75390625, 17.275390625, 18.796875, 20.318359375, 21.83984375, 23.361328125, 24.8828125, 26.404296875, 27.92578125, 29.447265625, 30.96875, 32.490234375, 34.01171875, 35.533203125, 37.0546875, 38.576171875, 40.09765625, 41.619140625, 43.140625, 44.662109375, 46.18359375, 47.705078125, 49.2265625, 50.748046875, 52.26953125, 53.791015625, 55.3125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 100.0, 843.0, 68.0, 3.0, 1.0, 0.0, 1.0], "bins": [-263.8231506347656, -259.3093566894531, -254.79559326171875, -250.2818145751953, -245.76803588867188, -241.25425720214844, -236.740478515625, -232.2266845703125, -227.71292114257812, -223.1991424560547, -218.68536376953125, -214.1715850830078, -209.65780639648438, -205.14402770996094, -200.6302490234375, -196.116455078125, -191.60267639160156, -187.08889770507812, -182.5751190185547, -178.06134033203125, -173.5475616455078, -169.03378295898438, -164.52000427246094, -160.0062255859375, -155.492431640625, -150.97865295410156, -146.46487426757812, -141.9510955810547, -137.43731689453125, -132.9235382080078, -128.40975952148438, -123.8959732055664, -119.38220977783203, -114.8684310913086, -110.35465240478516, -105.84087371826172, -101.32708740234375, -96.81330871582031, -92.29953002929688, -87.78575134277344, -83.27197265625, -78.75819396972656, -74.24441528320312, -69.73063659667969, -65.21685791015625, -60.70307540893555, -56.189292907714844, -51.675514221191406, -47.16173553466797, -42.64795684814453, -38.134178161621094, -33.62039566040039, -29.106616973876953, -24.592838287353516, -20.079057693481445, -15.565277099609375, -11.051496505737305, -6.537716865539551, -2.023937225341797, 2.489842414855957, 7.003622055053711, 11.517400741577148, 16.03118133544922, 20.54496192932129, 25.058740615844727]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 4.0, 4.0, 7.0, 12.0, 5.0, 19.0, 17.0, 11.0, 17.0, 17.0, 13.0, 42.0, 36.0, 46.0, 35.0, 37.0, 38.0, 29.0, 38.0, 43.0, 34.0, 52.0, 48.0, 37.0, 39.0, 33.0, 39.0, 29.0, 26.0, 21.0, 26.0, 24.0, 15.0, 29.0, 12.0, 9.0, 10.0, 15.0, 7.0, 5.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-47.05217742919922, -45.647544860839844, -44.242916107177734, -42.838287353515625, -41.43365478515625, -40.029022216796875, -38.624393463134766, -37.219764709472656, -35.81513214111328, -34.410499572753906, -33.0058708190918, -31.601240158081055, -30.196609497070312, -28.79197883605957, -27.387348175048828, -25.982717514038086, -24.578086853027344, -23.1734561920166, -21.76882553100586, -20.364194869995117, -18.959564208984375, -17.554933547973633, -16.15030288696289, -14.745672225952148, -13.341041564941406, -11.936410903930664, -10.531780242919922, -9.12714958190918, -7.7225189208984375, -6.317888259887695, -4.913257598876953, -3.508626937866211, -2.1039962768554688, -0.6993656158447266, 0.7052650451660156, 2.109895706176758, 3.5145263671875, 4.919157028198242, 6.323787689208984, 7.728418350219727, 9.133049011230469, 10.537679672241211, 11.942310333251953, 13.346940994262695, 14.751571655273438, 16.15620231628418, 17.560832977294922, 18.965463638305664, 20.370094299316406, 21.77472496032715, 23.17935562133789, 24.583986282348633, 25.988616943359375, 27.393247604370117, 28.79787826538086, 30.2025089263916, 31.607139587402344, 33.01177215576172, 34.41640090942383, 35.82102966308594, 37.22566223144531, 38.63029479980469, 40.0349235534668, 41.439552307128906, 42.84418487548828]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 5.0, 3.0, 7.0, 8.0, 11.0, 11.0, 18.0, 21.0, 19.0, 20.0, 29.0, 29.0, 33.0, 33.0, 25.0, 40.0, 35.0, 35.0, 36.0, 45.0, 41.0, 37.0, 33.0, 36.0, 33.0, 34.0, 40.0, 25.0, 25.0, 34.0, 27.0, 30.0, 15.0, 19.0, 14.0, 23.0, 12.0, 10.0, 11.0, 6.0, 6.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.2265625, -5.06298828125, -4.8994140625, -4.73583984375, -4.572265625, -4.40869140625, -4.2451171875, -4.08154296875, -3.91796875, -3.75439453125, -3.5908203125, -3.42724609375, -3.263671875, -3.10009765625, -2.9365234375, -2.77294921875, -2.609375, -2.44580078125, -2.2822265625, -2.11865234375, -1.955078125, -1.79150390625, -1.6279296875, -1.46435546875, -1.30078125, -1.13720703125, -0.9736328125, -0.81005859375, -0.646484375, -0.48291015625, -0.3193359375, -0.15576171875, 0.0078125, 0.17138671875, 0.3349609375, 0.49853515625, 0.662109375, 0.82568359375, 0.9892578125, 1.15283203125, 1.31640625, 1.47998046875, 1.6435546875, 1.80712890625, 1.970703125, 2.13427734375, 2.2978515625, 2.46142578125, 2.625, 2.78857421875, 2.9521484375, 3.11572265625, 3.279296875, 3.44287109375, 3.6064453125, 3.77001953125, 3.93359375, 4.09716796875, 4.2607421875, 4.42431640625, 4.587890625, 4.75146484375, 4.9150390625, 5.07861328125, 5.2421875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 6.0, 10.0, 9.0, 15.0, 14.0, 21.0, 21.0, 39.0, 48.0, 45.0, 64.0, 103.0, 157.0, 298.0, 559.0, 1736.0, 11092.0, 286637.0, 3385640.0, 487788.0, 16158.0, 2198.0, 659.0, 316.0, 175.0, 131.0, 85.0, 61.0, 41.0, 25.0, 19.0, 24.0, 14.0, 14.0, 10.0, 12.0, 10.0, 12.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.21875, -18.646240234375, -18.07373046875, -17.501220703125, -16.9287109375, -16.356201171875, -15.78369140625, -15.211181640625, -14.638671875, -14.066162109375, -13.49365234375, -12.921142578125, -12.3486328125, -11.776123046875, -11.20361328125, -10.631103515625, -10.05859375, -9.486083984375, -8.91357421875, -8.341064453125, -7.7685546875, -7.196044921875, -6.62353515625, -6.051025390625, -5.478515625, -4.906005859375, -4.33349609375, -3.760986328125, -3.1884765625, -2.615966796875, -2.04345703125, -1.470947265625, -0.8984375, -0.325927734375, 0.24658203125, 0.819091796875, 1.3916015625, 1.964111328125, 2.53662109375, 3.109130859375, 3.681640625, 4.254150390625, 4.82666015625, 5.399169921875, 5.9716796875, 6.544189453125, 7.11669921875, 7.689208984375, 8.26171875, 8.834228515625, 9.40673828125, 9.979248046875, 10.5517578125, 11.124267578125, 11.69677734375, 12.269287109375, 12.841796875, 13.414306640625, 13.98681640625, 14.559326171875, 15.1318359375, 15.704345703125, 16.27685546875, 16.849365234375, 17.421875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 8.0, 17.0, 22.0, 34.0, 43.0, 58.0, 78.0, 129.0, 143.0, 174.0, 253.0, 402.0, 478.0, 550.0, 484.0, 334.0, 277.0, 176.0, 124.0, 72.0, 64.0, 34.0, 36.0, 18.0, 21.0, 10.0, 3.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-15.1484375, -14.79852294921875, -14.4486083984375, -14.09869384765625, -13.748779296875, -13.39886474609375, -13.0489501953125, -12.69903564453125, -12.34912109375, -11.99920654296875, -11.6492919921875, -11.29937744140625, -10.949462890625, -10.59954833984375, -10.2496337890625, -9.89971923828125, -9.5498046875, -9.19989013671875, -8.8499755859375, -8.50006103515625, -8.150146484375, -7.80023193359375, -7.4503173828125, -7.10040283203125, -6.75048828125, -6.40057373046875, -6.0506591796875, -5.70074462890625, -5.350830078125, -5.00091552734375, -4.6510009765625, -4.30108642578125, -3.951171875, -3.60125732421875, -3.2513427734375, -2.90142822265625, -2.551513671875, -2.20159912109375, -1.8516845703125, -1.50177001953125, -1.15185546875, -0.80194091796875, -0.4520263671875, -0.10211181640625, 0.247802734375, 0.59771728515625, 0.9476318359375, 1.29754638671875, 1.6474609375, 1.99737548828125, 2.3472900390625, 2.69720458984375, 3.047119140625, 3.39703369140625, 3.7469482421875, 4.09686279296875, 4.44677734375, 4.79669189453125, 5.1466064453125, 5.49652099609375, 5.846435546875, 6.19635009765625, 6.5462646484375, 6.89617919921875, 7.24609375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 8.0, 16.0, 19.0, 28.0, 25.0, 47.0, 70.0, 88.0, 129.0, 168.0, 252.0, 329.0, 576.0, 2973.0, 2841722.0, 1343952.0, 2163.0, 478.0, 293.0, 226.0, 183.0, 134.0, 100.0, 74.0, 77.0, 58.0, 33.0, 21.0, 12.0, 8.0, 8.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.6875, -38.74609375, -36.8046875, -34.86328125, -32.921875, -30.98046875, -29.0390625, -27.09765625, -25.15625, -23.21484375, -21.2734375, -19.33203125, -17.390625, -15.44921875, -13.5078125, -11.56640625, -9.625, -7.68359375, -5.7421875, -3.80078125, -1.859375, 0.08203125, 2.0234375, 3.96484375, 5.90625, 7.84765625, 9.7890625, 11.73046875, 13.671875, 15.61328125, 17.5546875, 19.49609375, 21.4375, 23.37890625, 25.3203125, 27.26171875, 29.203125, 31.14453125, 33.0859375, 35.02734375, 36.96875, 38.91015625, 40.8515625, 42.79296875, 44.734375, 46.67578125, 48.6171875, 50.55859375, 52.5, 54.44140625, 56.3828125, 58.32421875, 60.265625, 62.20703125, 64.1484375, 66.08984375, 68.03125, 69.97265625, 71.9140625, 73.85546875, 75.796875, 77.73828125, 79.6796875, 81.62109375, 83.5625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 40.0, 206.0, 373.0, 276.0, 86.0, 22.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-197.3533935546875, -193.31011962890625, -189.266845703125, -185.2235870361328, -181.18031311035156, -177.1370391845703, -173.09378051757812, -169.05050659179688, -165.00723266601562, -160.96395874023438, -156.92068481445312, -152.87742614746094, -148.8341522216797, -144.79087829589844, -140.74761962890625, -136.704345703125, -132.66107177734375, -128.6177978515625, -124.57453155517578, -120.53126525878906, -116.48799133300781, -112.44471740722656, -108.40145111083984, -104.35818481445312, -100.31491088867188, -96.27163696289062, -92.2283706665039, -88.18510437011719, -84.14183044433594, -80.09855651855469, -76.05529022216797, -72.01202392578125, -67.96876525878906, -63.92549514770508, -59.882225036621094, -55.83895492553711, -51.795684814453125, -47.75241470336914, -43.709144592285156, -39.66587448120117, -35.62260437011719, -31.579334259033203, -27.53606414794922, -23.492794036865234, -19.44952392578125, -15.406253814697266, -11.362983703613281, -7.319713592529297, -3.2764434814453125, 0.7668266296386719, 4.810096740722656, 8.85336685180664, 12.896636962890625, 16.93990707397461, 20.983177185058594, 25.026447296142578, 29.069717407226562, 33.11298751831055, 37.15625762939453, 41.199527740478516, 45.2427978515625, 49.286067962646484, 53.32933807373047, 57.37260818481445, 61.41587829589844]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 1.0, 3.0, 3.0, 5.0, 8.0, 8.0, 11.0, 8.0, 12.0, 13.0, 17.0, 29.0, 25.0, 25.0, 38.0, 31.0, 24.0, 29.0, 50.0, 41.0, 35.0, 44.0, 42.0, 42.0, 31.0, 45.0, 43.0, 38.0, 33.0, 35.0, 37.0, 25.0, 31.0, 20.0, 24.0, 18.0, 15.0, 12.0, 11.0, 10.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.54911804199219, -32.466426849365234, -31.38373565673828, -30.301042556762695, -29.218351364135742, -28.13566017150879, -27.052967071533203, -25.97027587890625, -24.887584686279297, -23.804893493652344, -22.72220230102539, -21.639509201049805, -20.55681800842285, -19.4741268157959, -18.391433715820312, -17.30874252319336, -16.226051330566406, -15.143360137939453, -14.060667991638184, -12.977975845336914, -11.895284652709961, -10.812593460083008, -9.729901313781738, -8.647209167480469, -7.564517974853516, -6.481826305389404, -5.399134635925293, -4.316442966461182, -3.2337512969970703, -2.151059627532959, -1.0683679580688477, 0.014323711395263672, 1.097015380859375, 2.1797070503234863, 3.2623987197875977, 4.345090389251709, 5.42778205871582, 6.510473728179932, 7.593165397644043, 8.675857543945312, 9.758548736572266, 10.841239929199219, 11.923932075500488, 13.006624221801758, 14.089315414428711, 15.172006607055664, 16.25469970703125, 17.337390899658203, 18.420082092285156, 19.50277328491211, 20.585464477539062, 21.66815757751465, 22.7508487701416, 23.833539962768555, 24.91623306274414, 25.998924255371094, 27.081615447998047, 28.164306640625, 29.246997833251953, 30.32969093322754, 31.412382125854492, 32.49507522583008, 33.57776641845703, 34.660457611083984, 35.74314880371094]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 6.0, 13.0, 13.0, 14.0, 13.0, 23.0, 21.0, 23.0, 20.0, 28.0, 42.0, 33.0, 27.0, 40.0, 25.0, 33.0, 48.0, 40.0, 46.0, 30.0, 38.0, 40.0, 36.0, 31.0, 36.0, 23.0, 28.0, 28.0, 26.0, 14.0, 18.0, 25.0, 13.0, 16.0, 18.0, 15.0, 12.0, 10.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.2578125, -5.0916748046875, -4.925537109375, -4.7593994140625, -4.59326171875, -4.4271240234375, -4.260986328125, -4.0948486328125, -3.9287109375, -3.7625732421875, -3.596435546875, -3.4302978515625, -3.26416015625, -3.0980224609375, -2.931884765625, -2.7657470703125, -2.599609375, -2.4334716796875, -2.267333984375, -2.1011962890625, -1.93505859375, -1.7689208984375, -1.602783203125, -1.4366455078125, -1.2705078125, -1.1043701171875, -0.938232421875, -0.7720947265625, -0.60595703125, -0.4398193359375, -0.273681640625, -0.1075439453125, 0.05859375, 0.2247314453125, 0.390869140625, 0.5570068359375, 0.72314453125, 0.8892822265625, 1.055419921875, 1.2215576171875, 1.3876953125, 1.5538330078125, 1.719970703125, 1.8861083984375, 2.05224609375, 2.2183837890625, 2.384521484375, 2.5506591796875, 2.716796875, 2.8829345703125, 3.049072265625, 3.2152099609375, 3.38134765625, 3.5474853515625, 3.713623046875, 3.8797607421875, 4.0458984375, 4.2120361328125, 4.378173828125, 4.5443115234375, 4.71044921875, 4.8765869140625, 5.042724609375, 5.2088623046875, 5.375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 9.0, 8.0, 19.0, 33.0, 38.0, 52.0, 69.0, 112.0, 148.0, 235.0, 310.0, 489.0, 757.0, 1045.0, 1591.0, 2262.0, 3584.0, 5496.0, 8264.0, 12830.0, 20145.0, 32901.0, 55481.0, 96681.0, 168643.0, 227572.0, 168357.0, 96104.0, 54918.0, 32943.0, 20173.0, 12959.0, 8320.0, 5273.0, 3536.0, 2320.0, 1572.0, 1066.0, 738.0, 457.0, 345.0, 216.0, 151.0, 102.0, 63.0, 61.0, 34.0, 25.0, 18.0, 13.0, 8.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.7509765625, -0.7278671264648438, -0.7047576904296875, -0.6816482543945312, -0.658538818359375, -0.6354293823242188, -0.6123199462890625, -0.5892105102539062, -0.56610107421875, -0.5429916381835938, -0.5198822021484375, -0.49677276611328125, -0.473663330078125, -0.45055389404296875, -0.4274444580078125, -0.40433502197265625, -0.3812255859375, -0.35811614990234375, -0.3350067138671875, -0.31189727783203125, -0.288787841796875, -0.26567840576171875, -0.2425689697265625, -0.21945953369140625, -0.19635009765625, -0.17324066162109375, -0.1501312255859375, -0.12702178955078125, -0.103912353515625, -0.08080291748046875, -0.0576934814453125, -0.03458404541015625, -0.011474609375, 0.01163482666015625, 0.0347442626953125, 0.05785369873046875, 0.080963134765625, 0.10407257080078125, 0.1271820068359375, 0.15029144287109375, 0.17340087890625, 0.19651031494140625, 0.2196197509765625, 0.24272918701171875, 0.265838623046875, 0.28894805908203125, 0.3120574951171875, 0.33516693115234375, 0.3582763671875, 0.38138580322265625, 0.4044952392578125, 0.42760467529296875, 0.450714111328125, 0.47382354736328125, 0.4969329833984375, 0.5200424194335938, 0.54315185546875, 0.5662612915039062, 0.5893707275390625, 0.6124801635742188, 0.635589599609375, 0.6586990356445312, 0.6818084716796875, 0.7049179077148438, 0.72802734375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 7.0, 20.0, 16.0, 13.0, 23.0, 21.0, 20.0, 18.0, 29.0, 30.0, 28.0, 42.0, 43.0, 43.0, 40.0, 41.0, 1073.0, 54.0, 48.0, 37.0, 43.0, 38.0, 26.0, 34.0, 38.0, 28.0, 27.0, 23.0, 23.0, 16.0, 21.0, 13.0, 7.0, 9.0, 4.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.03125, -2.9140625, -2.796875, -2.6796875, -2.5625, -2.4453125, -2.328125, -2.2109375, -2.09375, -1.9765625, -1.859375, -1.7421875, -1.625, -1.5078125, -1.390625, -1.2734375, -1.15625, -1.0390625, -0.921875, -0.8046875, -0.6875, -0.5703125, -0.453125, -0.3359375, -0.21875, -0.1015625, 0.015625, 0.1328125, 0.25, 0.3671875, 0.484375, 0.6015625, 0.71875, 0.8359375, 0.953125, 1.0703125, 1.1875, 1.3046875, 1.421875, 1.5390625, 1.65625, 1.7734375, 1.890625, 2.0078125, 2.125, 2.2421875, 2.359375, 2.4765625, 2.59375, 2.7109375, 2.828125, 2.9453125, 3.0625, 3.1796875, 3.296875, 3.4140625, 3.53125, 3.6484375, 3.765625, 3.8828125, 4.0, 4.1171875, 4.234375, 4.3515625, 4.46875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 2.0, 8.0, 22.0, 18.0, 33.0, 51.0, 77.0, 115.0, 185.0, 322.0, 479.0, 800.0, 1231.0, 2086.0, 3654.0, 6430.0, 11224.0, 20418.0, 38084.0, 72566.0, 139336.0, 1172916.0, 338844.0, 135115.0, 69967.0, 37096.0, 19972.0, 11091.0, 6100.0, 3491.0, 2074.0, 1291.0, 762.0, 479.0, 303.0, 166.0, 102.0, 92.0, 47.0, 20.0, 20.0, 12.0, 14.0, 4.0, 5.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68115234375, -0.6591644287109375, -0.637176513671875, -0.6151885986328125, -0.59320068359375, -0.5712127685546875, -0.549224853515625, -0.5272369384765625, -0.5052490234375, -0.4832611083984375, -0.461273193359375, -0.4392852783203125, -0.41729736328125, -0.3953094482421875, -0.373321533203125, -0.3513336181640625, -0.329345703125, -0.3073577880859375, -0.285369873046875, -0.2633819580078125, -0.24139404296875, -0.2194061279296875, -0.197418212890625, -0.1754302978515625, -0.1534423828125, -0.1314544677734375, -0.109466552734375, -0.0874786376953125, -0.06549072265625, -0.0435028076171875, -0.021514892578125, 0.0004730224609375, 0.0224609375, 0.0444488525390625, 0.066436767578125, 0.0884246826171875, 0.11041259765625, 0.1324005126953125, 0.154388427734375, 0.1763763427734375, 0.1983642578125, 0.2203521728515625, 0.242340087890625, 0.2643280029296875, 0.28631591796875, 0.3083038330078125, 0.330291748046875, 0.3522796630859375, 0.374267578125, 0.3962554931640625, 0.418243408203125, 0.4402313232421875, 0.46221923828125, 0.4842071533203125, 0.506195068359375, 0.5281829833984375, 0.5501708984375, 0.5721588134765625, 0.594146728515625, 0.6161346435546875, 0.63812255859375, 0.6601104736328125, 0.682098388671875, 0.7040863037109375, 0.72607421875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 2.0, 4.0, 6.0, 9.0, 13.0, 16.0, 20.0, 31.0, 45.0, 44.0, 54.0, 53.0, 57.0, 62.0, 67.0, 79.0, 54.0, 61.0, 52.0, 49.0, 39.0, 40.0, 24.0, 35.0, 19.0, 15.0, 15.0, 11.0, 6.0, 6.0, 4.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.002292633056640625, -0.0022272467613220215, -0.002161860466003418, -0.0020964741706848145, -0.002031087875366211, -0.0019657015800476074, -0.001900315284729004, -0.0018349289894104004, -0.0017695426940917969, -0.0017041563987731934, -0.0016387701034545898, -0.0015733838081359863, -0.0015079975128173828, -0.0014426112174987793, -0.0013772249221801758, -0.0013118386268615723, -0.0012464523315429688, -0.0011810660362243652, -0.0011156797409057617, -0.0010502934455871582, -0.0009849071502685547, -0.0009195208549499512, -0.0008541345596313477, -0.0007887482643127441, -0.0007233619689941406, -0.0006579756736755371, -0.0005925893783569336, -0.0005272030830383301, -0.00046181678771972656, -0.00039643049240112305, -0.00033104419708251953, -0.000265657901763916, -0.0002002716064453125, -0.00013488531112670898, -6.949901580810547e-05, -4.112720489501953e-06, 6.127357482910156e-05, 0.00012665987014770508, 0.0001920461654663086, 0.0002574324607849121, 0.0003228187561035156, 0.00038820505142211914, 0.00045359134674072266, 0.0005189776420593262, 0.0005843639373779297, 0.0006497502326965332, 0.0007151365280151367, 0.0007805228233337402, 0.0008459091186523438, 0.0009112954139709473, 0.0009766817092895508, 0.0010420680046081543, 0.0011074542999267578, 0.0011728405952453613, 0.0012382268905639648, 0.0013036131858825684, 0.0013689994812011719, 0.0014343857765197754, 0.001499772071838379, 0.0015651583671569824, 0.001630544662475586, 0.0016959309577941895, 0.001761317253112793, 0.0018267035484313965, 0.00189208984375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 11.0, 17.0, 19.0, 16.0, 30.0, 52.0, 52.0, 82.0, 80.0, 134.0, 243.0, 618.0, 10582.0, 1026347.0, 9007.0, 524.0, 229.0, 145.0, 97.0, 58.0, 55.0, 41.0, 23.0, 22.0, 17.0, 10.0, 7.0, 6.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05224609375, -0.050685882568359375, -0.04912567138671875, -0.047565460205078125, -0.0460052490234375, -0.044445037841796875, -0.04288482666015625, -0.041324615478515625, -0.039764404296875, -0.038204193115234375, -0.03664398193359375, -0.035083770751953125, -0.0335235595703125, -0.031963348388671875, -0.03040313720703125, -0.028842926025390625, -0.02728271484375, -0.025722503662109375, -0.02416229248046875, -0.022602081298828125, -0.0210418701171875, -0.019481658935546875, -0.01792144775390625, -0.016361236572265625, -0.014801025390625, -0.013240814208984375, -0.01168060302734375, -0.010120391845703125, -0.0085601806640625, -0.006999969482421875, -0.00543975830078125, -0.003879547119140625, -0.0023193359375, -0.000759124755859375, 0.00080108642578125, 0.002361297607421875, 0.0039215087890625, 0.005481719970703125, 0.00704193115234375, 0.008602142333984375, 0.010162353515625, 0.011722564697265625, 0.01328277587890625, 0.014842987060546875, 0.0164031982421875, 0.017963409423828125, 0.01952362060546875, 0.021083831787109375, 0.02264404296875, 0.024204254150390625, 0.02576446533203125, 0.027324676513671875, 0.0288848876953125, 0.030445098876953125, 0.03200531005859375, 0.033565521240234375, 0.035125732421875, 0.036685943603515625, 0.03824615478515625, 0.039806365966796875, 0.0413665771484375, 0.042926788330078125, 0.04448699951171875, 0.046047210693359375, 0.047607421875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 18.0, 34.0, 96.0, 187.0, 239.0, 222.0, 125.0, 58.0, 14.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004594548139721155, -0.0045001995749771595, -0.004405851010233164, -0.0043115029111504555, -0.00421715434640646, -0.004122805781662464, -0.0040284572169184685, -0.003934108652174473, -0.003839760320261121, -0.003745411755517125, -0.003651063423603773, -0.0035567148588597775, -0.0034623665269464254, -0.0033680179622024298, -0.0032736696302890778, -0.003179321065545082, -0.0030849725008010864, -0.0029906239360570908, -0.0028962756041437387, -0.002801927039399743, -0.002707578707486391, -0.0026132301427423954, -0.0025188815779983997, -0.0024245332460850477, -0.0023301849141716957, -0.0022358363494277, -0.002141488017514348, -0.0020471394527703524, -0.0019527910044416785, -0.0018584425561130047, -0.0017640941077843308, -0.001669745659455657, -0.0015753972111269832, -0.0014810487627983093, -0.0013867003144696355, -0.0012923518661409616, -0.001198003301396966, -0.0011036548530682921, -0.0010093064047396183, -0.0009149578982032835, -0.0008206094498746097, -0.0007262610015459359, -0.0006319124950096011, -0.0005375640466809273, -0.000443215569248423, -0.0003488670918159187, -0.00025451864348724484, -0.0001601701369509101, -6.582168862223625e-05, 2.852678153431043e-05, 0.0001228752516908571, 0.00021722371457144618, 0.0003115721920039505, 0.0004059206694364548, 0.0005002691177651286, 0.0005946176243014634, 0.0006889660726301372, 0.000783314520958811, 0.0008776630274951458, 0.0009720114758238196, 0.0010663599241524935, 0.0011607084888964891, 0.0012550568208098412, 0.0013494053855538368, 0.0014437538338825107]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 5.0, 9.0, 10.0, 14.0, 16.0, 18.0, 21.0, 23.0, 25.0, 28.0, 25.0, 39.0, 48.0, 38.0, 42.0, 39.0, 40.0, 40.0, 35.0, 40.0, 35.0, 42.0, 39.0, 38.0, 40.0, 31.0, 36.0, 32.0, 22.0, 17.0, 15.0, 23.0, 23.0, 7.0, 9.0, 10.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009667873382568359, -0.0009367233142256737, -0.0009066592901945114, -0.0008765952661633492, -0.0008465312421321869, -0.0008164672181010246, -0.0007864031940698624, -0.0007563391700387001, -0.0007262751460075378, -0.0006962111219763756, -0.0006661470979452133, -0.0006360830739140511, -0.0006060190498828888, -0.0005759550258517265, -0.0005458910018205643, -0.000515826977789402, -0.00048576295375823975, -0.0004556989297270775, -0.0004256349056959152, -0.00039557088166475296, -0.0003655068576335907, -0.00033544283360242844, -0.0003053788095712662, -0.0002753147855401039, -0.00024525076150894165, -0.0002151867374777794, -0.00018512271344661713, -0.00015505868941545486, -0.0001249946653842926, -9.493064135313034e-05, -6.486661732196808e-05, -3.480259329080582e-05, -4.738569259643555e-06, 2.5325454771518707e-05, 5.538947880268097e-05, 8.545350283384323e-05, 0.00011551752686500549, 0.00014558155089616776, 0.00017564557492733002, 0.00020570959895849228, 0.00023577362298965454, 0.0002658376470208168, 0.00029590167105197906, 0.0003259656950831413, 0.0003560297191143036, 0.00038609374314546585, 0.0004161577671766281, 0.0004462217912077904, 0.00047628581523895264, 0.0005063498392701149, 0.0005364138633012772, 0.0005664778873324394, 0.0005965419113636017, 0.000626605935394764, 0.0006566699594259262, 0.0006867339834570885, 0.0007167980074882507, 0.000746862031519413, 0.0007769260555505753, 0.0008069900795817375, 0.0008370541036128998, 0.000867118127644062, 0.0008971821516752243, 0.0009272461757063866, 0.0009573101997375488]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 6.0, 13.0, 13.0, 14.0, 13.0, 23.0, 21.0, 23.0, 20.0, 28.0, 42.0, 33.0, 27.0, 40.0, 25.0, 33.0, 48.0, 40.0, 46.0, 30.0, 38.0, 40.0, 36.0, 31.0, 36.0, 23.0, 28.0, 28.0, 26.0, 14.0, 18.0, 25.0, 13.0, 16.0, 18.0, 15.0, 12.0, 10.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.2578125, -5.0916748046875, -4.925537109375, -4.7593994140625, -4.59326171875, -4.4271240234375, -4.260986328125, -4.0948486328125, -3.9287109375, -3.7625732421875, -3.596435546875, -3.4302978515625, -3.26416015625, -3.0980224609375, -2.931884765625, -2.7657470703125, -2.599609375, -2.4334716796875, -2.267333984375, -2.1011962890625, -1.93505859375, -1.7689208984375, -1.602783203125, -1.4366455078125, -1.2705078125, -1.1043701171875, -0.938232421875, -0.7720947265625, -0.60595703125, -0.4398193359375, -0.273681640625, -0.1075439453125, 0.05859375, 0.2247314453125, 0.390869140625, 0.5570068359375, 0.72314453125, 0.8892822265625, 1.055419921875, 1.2215576171875, 1.3876953125, 1.5538330078125, 1.719970703125, 1.8861083984375, 2.05224609375, 2.2183837890625, 2.384521484375, 2.5506591796875, 2.716796875, 2.8829345703125, 3.049072265625, 3.2152099609375, 3.38134765625, 3.5474853515625, 3.713623046875, 3.8797607421875, 4.0458984375, 4.2120361328125, 4.378173828125, 4.5443115234375, 4.71044921875, 4.8765869140625, 5.042724609375, 5.2088623046875, 5.375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 13.0, 11.0, 17.0, 18.0, 20.0, 25.0, 42.0, 46.0, 75.0, 78.0, 112.0, 168.0, 220.0, 334.0, 583.0, 992.0, 2986.0, 15867.0, 120079.0, 753048.0, 130858.0, 16948.0, 3156.0, 1088.0, 598.0, 318.0, 211.0, 158.0, 101.0, 83.0, 59.0, 51.0, 43.0, 23.0, 28.0, 24.0, 15.0, 16.0, 10.0, 7.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.734375, -9.425537109375, -9.11669921875, -8.807861328125, -8.4990234375, -8.190185546875, -7.88134765625, -7.572509765625, -7.263671875, -6.954833984375, -6.64599609375, -6.337158203125, -6.0283203125, -5.719482421875, -5.41064453125, -5.101806640625, -4.79296875, -4.484130859375, -4.17529296875, -3.866455078125, -3.5576171875, -3.248779296875, -2.93994140625, -2.631103515625, -2.322265625, -2.013427734375, -1.70458984375, -1.395751953125, -1.0869140625, -0.778076171875, -0.46923828125, -0.160400390625, 0.1484375, 0.457275390625, 0.76611328125, 1.074951171875, 1.3837890625, 1.692626953125, 2.00146484375, 2.310302734375, 2.619140625, 2.927978515625, 3.23681640625, 3.545654296875, 3.8544921875, 4.163330078125, 4.47216796875, 4.781005859375, 5.08984375, 5.398681640625, 5.70751953125, 6.016357421875, 6.3251953125, 6.634033203125, 6.94287109375, 7.251708984375, 7.560546875, 7.869384765625, 8.17822265625, 8.487060546875, 8.7958984375, 9.104736328125, 9.41357421875, 9.722412109375, 10.03125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 2.0, 5.0, 4.0, 10.0, 11.0, 9.0, 7.0, 12.0, 8.0, 18.0, 18.0, 25.0, 29.0, 34.0, 27.0, 24.0, 37.0, 46.0, 45.0, 50.0, 67.0, 214.0, 1698.0, 154.0, 76.0, 47.0, 45.0, 41.0, 29.0, 24.0, 34.0, 28.0, 26.0, 21.0, 19.0, 16.0, 12.0, 12.0, 11.0, 10.0, 9.0, 12.0, 9.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.828125, -15.307373046875, -14.78662109375, -14.265869140625, -13.7451171875, -13.224365234375, -12.70361328125, -12.182861328125, -11.662109375, -11.141357421875, -10.62060546875, -10.099853515625, -9.5791015625, -9.058349609375, -8.53759765625, -8.016845703125, -7.49609375, -6.975341796875, -6.45458984375, -5.933837890625, -5.4130859375, -4.892333984375, -4.37158203125, -3.850830078125, -3.330078125, -2.809326171875, -2.28857421875, -1.767822265625, -1.2470703125, -0.726318359375, -0.20556640625, 0.315185546875, 0.8359375, 1.356689453125, 1.87744140625, 2.398193359375, 2.9189453125, 3.439697265625, 3.96044921875, 4.481201171875, 5.001953125, 5.522705078125, 6.04345703125, 6.564208984375, 7.0849609375, 7.605712890625, 8.12646484375, 8.647216796875, 9.16796875, 9.688720703125, 10.20947265625, 10.730224609375, 11.2509765625, 11.771728515625, 12.29248046875, 12.813232421875, 13.333984375, 13.854736328125, 14.37548828125, 14.896240234375, 15.4169921875, 15.937744140625, 16.45849609375, 16.979248046875, 17.5]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 4.0, 14.0, 13.0, 10.0, 17.0, 16.0, 20.0, 19.0, 28.0, 35.0, 43.0, 41.0, 70.0, 87.0, 121.0, 204.0, 388.0, 926.0, 23779.0, 3112229.0, 5998.0, 656.0, 282.0, 187.0, 121.0, 79.0, 49.0, 50.0, 47.0, 30.0, 23.0, 19.0, 14.0, 13.0, 8.0, 10.0, 8.0, 14.0, 4.0, 6.0, 2.0, 3.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-52.5, -50.8779296875, -49.255859375, -47.6337890625, -46.01171875, -44.3896484375, -42.767578125, -41.1455078125, -39.5234375, -37.9013671875, -36.279296875, -34.6572265625, -33.03515625, -31.4130859375, -29.791015625, -28.1689453125, -26.546875, -24.9248046875, -23.302734375, -21.6806640625, -20.05859375, -18.4365234375, -16.814453125, -15.1923828125, -13.5703125, -11.9482421875, -10.326171875, -8.7041015625, -7.08203125, -5.4599609375, -3.837890625, -2.2158203125, -0.59375, 1.0283203125, 2.650390625, 4.2724609375, 5.89453125, 7.5166015625, 9.138671875, 10.7607421875, 12.3828125, 14.0048828125, 15.626953125, 17.2490234375, 18.87109375, 20.4931640625, 22.115234375, 23.7373046875, 25.359375, 26.9814453125, 28.603515625, 30.2255859375, 31.84765625, 33.4697265625, 35.091796875, 36.7138671875, 38.3359375, 39.9580078125, 41.580078125, 43.2021484375, 44.82421875, 46.4462890625, 48.068359375, 49.6904296875, 51.3125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 47.0, 208.0, 376.0, 272.0, 86.0, 15.0, 3.0], "bins": [-83.17974853515625, -81.78570556640625, -80.39166259765625, -78.99762725830078, -77.60358428955078, -76.20954132080078, -74.81549835205078, -73.42146301269531, -72.02742004394531, -70.63337707519531, -69.23933410644531, -67.84529876708984, -66.45125579833984, -65.05721282958984, -63.66317367553711, -62.26913070678711, -60.875091552734375, -59.481048583984375, -58.08700942993164, -56.69296646118164, -55.298927307128906, -53.904884338378906, -52.51084518432617, -51.11680221557617, -49.72275924682617, -48.32871627807617, -46.93467712402344, -45.54063415527344, -44.1465950012207, -42.7525520324707, -41.35851287841797, -39.96446990966797, -38.570430755615234, -37.176387786865234, -35.7823486328125, -34.3883056640625, -32.994266510009766, -31.6002254486084, -30.20618438720703, -28.81214141845703, -27.418100357055664, -26.024059295654297, -24.63001823425293, -23.235977172851562, -21.841936111450195, -20.447895050048828, -19.053852081298828, -17.659812927246094, -16.265769958496094, -14.871728897094727, -13.47768783569336, -12.083646774291992, -10.689605712890625, -9.295564651489258, -7.901522636413574, -6.507481575012207, -5.113441467285156, -3.719400405883789, -2.3253591060638428, -0.9313178062438965, 0.4627232551574707, 1.856764316558838, 3.2508058547973633, 4.6448469161987305, 6.038887977600098]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 4.0, 7.0, 4.0, 7.0, 6.0, 13.0, 14.0, 8.0, 14.0, 12.0, 16.0, 21.0, 21.0, 26.0, 30.0, 25.0, 23.0, 25.0, 24.0, 34.0, 37.0, 32.0, 35.0, 49.0, 50.0, 35.0, 27.0, 38.0, 29.0, 26.0, 22.0, 27.0, 29.0, 31.0, 24.0, 24.0, 18.0, 27.0, 18.0, 18.0, 20.0, 9.0, 9.0, 8.0, 6.0, 11.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-46.25877380371094, -44.89012145996094, -43.52146911621094, -42.15281677246094, -40.78416061401367, -39.41550827026367, -38.04685592651367, -36.67820358276367, -35.309547424316406, -33.940895080566406, -32.572242736816406, -31.203588485717773, -29.83493423461914, -28.46628189086914, -27.09762954711914, -25.72897720336914, -24.36032485961914, -22.99167251586914, -21.623018264770508, -20.254365921020508, -18.885711669921875, -17.517059326171875, -16.148406982421875, -14.779753684997559, -13.411100387573242, -12.042447090148926, -10.67379379272461, -9.30514144897461, -7.936488151550293, -6.567834854125977, -5.199182510375977, -3.83052921295166, -2.461872100830078, -1.0932190418243408, 0.2754340171813965, 1.6440868377685547, 3.012740135192871, 4.3813934326171875, 5.7500457763671875, 7.118699073791504, 8.48735237121582, 9.856005668640137, 11.224658966064453, 12.593311309814453, 13.96196460723877, 15.330617904663086, 16.699270248413086, 18.06792449951172, 19.43657684326172, 20.80522918701172, 22.17388343811035, 23.54253578186035, 24.911190032958984, 26.279842376708984, 27.648494720458984, 29.017147064208984, 30.385801315307617, 31.754453659057617, 33.12310791015625, 34.49176025390625, 35.86041259765625, 37.22906494140625, 38.59771728515625, 39.966373443603516, 41.335025787353516]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 5.0, 6.0, 9.0, 7.0, 15.0, 11.0, 18.0, 18.0, 24.0, 19.0, 27.0, 31.0, 23.0, 32.0, 32.0, 33.0, 35.0, 38.0, 37.0, 37.0, 45.0, 47.0, 49.0, 34.0, 29.0, 37.0, 31.0, 20.0, 33.0, 20.0, 33.0, 24.0, 15.0, 14.0, 19.0, 20.0, 12.0, 13.0, 16.0, 7.0, 10.0, 2.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.05859375, -5.8802490234375, -5.701904296875, -5.5235595703125, -5.34521484375, -5.1668701171875, -4.988525390625, -4.8101806640625, -4.6318359375, -4.4534912109375, -4.275146484375, -4.0968017578125, -3.91845703125, -3.7401123046875, -3.561767578125, -3.3834228515625, -3.205078125, -3.0267333984375, -2.848388671875, -2.6700439453125, -2.49169921875, -2.3133544921875, -2.135009765625, -1.9566650390625, -1.7783203125, -1.5999755859375, -1.421630859375, -1.2432861328125, -1.06494140625, -0.8865966796875, -0.708251953125, -0.5299072265625, -0.3515625, -0.1732177734375, 0.005126953125, 0.1834716796875, 0.36181640625, 0.5401611328125, 0.718505859375, 0.8968505859375, 1.0751953125, 1.2535400390625, 1.431884765625, 1.6102294921875, 1.78857421875, 1.9669189453125, 2.145263671875, 2.3236083984375, 2.501953125, 2.6802978515625, 2.858642578125, 3.0369873046875, 3.21533203125, 3.3936767578125, 3.572021484375, 3.7503662109375, 3.9287109375, 4.1070556640625, 4.285400390625, 4.4637451171875, 4.64208984375, 4.8204345703125, 4.998779296875, 5.1771240234375, 5.35546875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 7.0, 16.0, 23.0, 29.0, 37.0, 53.0, 83.0, 95.0, 178.0, 320.0, 632.0, 1495.0, 4136.0, 12722.0, 50101.0, 276236.0, 1176925.0, 1796704.0, 703808.0, 128885.0, 28331.0, 8126.0, 2880.0, 1162.0, 532.0, 267.0, 171.0, 87.0, 67.0, 53.0, 40.0, 15.0, 22.0, 19.0, 11.0, 7.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-10.6171875, -10.34698486328125, -10.0767822265625, -9.80657958984375, -9.536376953125, -9.26617431640625, -8.9959716796875, -8.72576904296875, -8.45556640625, -8.18536376953125, -7.9151611328125, -7.64495849609375, -7.374755859375, -7.10455322265625, -6.8343505859375, -6.56414794921875, -6.2939453125, -6.02374267578125, -5.7535400390625, -5.48333740234375, -5.213134765625, -4.94293212890625, -4.6727294921875, -4.40252685546875, -4.13232421875, -3.86212158203125, -3.5919189453125, -3.32171630859375, -3.051513671875, -2.78131103515625, -2.5111083984375, -2.24090576171875, -1.970703125, -1.70050048828125, -1.4302978515625, -1.16009521484375, -0.889892578125, -0.61968994140625, -0.3494873046875, -0.07928466796875, 0.19091796875, 0.46112060546875, 0.7313232421875, 1.00152587890625, 1.271728515625, 1.54193115234375, 1.8121337890625, 2.08233642578125, 2.3525390625, 2.62274169921875, 2.8929443359375, 3.16314697265625, 3.433349609375, 3.70355224609375, 3.9737548828125, 4.24395751953125, 4.51416015625, 4.78436279296875, 5.0545654296875, 5.32476806640625, 5.594970703125, 5.86517333984375, 6.1353759765625, 6.40557861328125, 6.67578125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 8.0, 9.0, 13.0, 18.0, 24.0, 40.0, 36.0, 52.0, 87.0, 103.0, 125.0, 189.0, 214.0, 265.0, 363.0, 384.0, 407.0, 392.0, 318.0, 276.0, 179.0, 123.0, 111.0, 76.0, 57.0, 41.0, 39.0, 27.0, 30.0, 16.0, 15.0, 15.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.46875, -12.1422119140625, -11.815673828125, -11.4891357421875, -11.16259765625, -10.8360595703125, -10.509521484375, -10.1829833984375, -9.8564453125, -9.5299072265625, -9.203369140625, -8.8768310546875, -8.55029296875, -8.2237548828125, -7.897216796875, -7.5706787109375, -7.244140625, -6.9176025390625, -6.591064453125, -6.2645263671875, -5.93798828125, -5.6114501953125, -5.284912109375, -4.9583740234375, -4.6318359375, -4.3052978515625, -3.978759765625, -3.6522216796875, -3.32568359375, -2.9991455078125, -2.672607421875, -2.3460693359375, -2.01953125, -1.6929931640625, -1.366455078125, -1.0399169921875, -0.71337890625, -0.3868408203125, -0.060302734375, 0.2662353515625, 0.5927734375, 0.9193115234375, 1.245849609375, 1.5723876953125, 1.89892578125, 2.2254638671875, 2.552001953125, 2.8785400390625, 3.205078125, 3.5316162109375, 3.858154296875, 4.1846923828125, 4.51123046875, 4.8377685546875, 5.164306640625, 5.4908447265625, 5.8173828125, 6.1439208984375, 6.470458984375, 6.7969970703125, 7.12353515625, 7.4500732421875, 7.776611328125, 8.1031494140625, 8.4296875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 7.0, 13.0, 27.0, 16.0, 36.0, 28.0, 66.0, 75.0, 91.0, 127.0, 139.0, 199.0, 266.0, 384.0, 654.0, 1538.0, 15070.0, 3276531.0, 889409.0, 6631.0, 1026.0, 528.0, 325.0, 277.0, 209.0, 135.0, 102.0, 95.0, 66.0, 49.0, 40.0, 33.0, 25.0, 14.0, 15.0, 12.0, 1.0, 7.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.75, -31.43359375, -30.1171875, -28.80078125, -27.484375, -26.16796875, -24.8515625, -23.53515625, -22.21875, -20.90234375, -19.5859375, -18.26953125, -16.953125, -15.63671875, -14.3203125, -13.00390625, -11.6875, -10.37109375, -9.0546875, -7.73828125, -6.421875, -5.10546875, -3.7890625, -2.47265625, -1.15625, 0.16015625, 1.4765625, 2.79296875, 4.109375, 5.42578125, 6.7421875, 8.05859375, 9.375, 10.69140625, 12.0078125, 13.32421875, 14.640625, 15.95703125, 17.2734375, 18.58984375, 19.90625, 21.22265625, 22.5390625, 23.85546875, 25.171875, 26.48828125, 27.8046875, 29.12109375, 30.4375, 31.75390625, 33.0703125, 34.38671875, 35.703125, 37.01953125, 38.3359375, 39.65234375, 40.96875, 42.28515625, 43.6015625, 44.91796875, 46.234375, 47.55078125, 48.8671875, 50.18359375, 51.5]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 436.0, 532.0, 30.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-486.7415466308594, -477.9002685546875, -469.0589904785156, -460.21771240234375, -451.3764343261719, -442.53515625, -433.6938781738281, -424.85260009765625, -416.0113220214844, -407.1700439453125, -398.3287658691406, -389.48748779296875, -380.6462097167969, -371.804931640625, -362.9636535644531, -354.12237548828125, -345.2811279296875, -336.4398498535156, -327.59857177734375, -318.7572937011719, -309.916015625, -301.0747375488281, -292.23345947265625, -283.3921813964844, -274.5509033203125, -265.7096252441406, -256.86834716796875, -248.02706909179688, -239.185791015625, -230.34451293945312, -221.50323486328125, -212.66195678710938, -203.82070922851562, -194.97943115234375, -186.13815307617188, -177.296875, -168.45559692382812, -159.61431884765625, -150.77304077148438, -141.9317626953125, -133.09048461914062, -124.24920654296875, -115.40792846679688, -106.566650390625, -97.72537231445312, -88.88409423828125, -80.0428237915039, -71.20154571533203, -62.360267639160156, -53.51898956298828, -44.677711486816406, -35.8364372253418, -26.995159149169922, -18.153881072998047, -9.312606811523438, -0.4713287353515625, 8.369949340820312, 17.211227416992188, 26.05250358581543, 34.89377975463867, 43.73505783081055, 52.57633590698242, 61.41761016845703, 70.2588882446289, 79.10016632080078]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 4.0, 8.0, 10.0, 16.0, 12.0, 9.0, 25.0, 17.0, 21.0, 22.0, 21.0, 28.0, 27.0, 47.0, 49.0, 34.0, 56.0, 31.0, 39.0, 32.0, 44.0, 39.0, 43.0, 27.0, 33.0, 33.0, 25.0, 32.0, 21.0, 28.0, 28.0, 14.0, 25.0, 26.0, 11.0, 11.0, 11.0, 6.0, 3.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-36.28489685058594, -35.20779037475586, -34.13068389892578, -33.0535774230957, -31.976472854614258, -30.89936637878418, -29.822261810302734, -28.745155334472656, -27.668048858642578, -26.5909423828125, -25.513835906982422, -24.436731338500977, -23.3596248626709, -22.28251838684082, -21.205413818359375, -20.128307342529297, -19.05120086669922, -17.97409439086914, -16.896987915039062, -15.819883346557617, -14.742776870727539, -13.665670394897461, -12.5885648727417, -11.511459350585938, -10.43435287475586, -9.357246398925781, -8.28014087677002, -7.2030348777771, -6.12592887878418, -5.04882287979126, -3.97171688079834, -2.89461088180542, -1.8175048828125, -0.7403988838195801, 0.33670711517333984, 1.4138131141662598, 2.4909191131591797, 3.5680251121520996, 4.6451311111450195, 5.7222371101379395, 6.799343109130859, 7.876449108123779, 8.9535551071167, 10.030660629272461, 11.107767105102539, 12.184873580932617, 13.261979103088379, 14.33908462524414, 15.416191101074219, 16.493297576904297, 17.570404052734375, 18.64750862121582, 19.7246150970459, 20.801721572875977, 21.878826141357422, 22.9559326171875, 24.033039093017578, 25.110145568847656, 26.187252044677734, 27.26435661315918, 28.341463088989258, 29.418569564819336, 30.49567413330078, 31.57278060913086, 32.64988708496094]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 7.0, 9.0, 8.0, 8.0, 13.0, 14.0, 12.0, 13.0, 13.0, 18.0, 13.0, 24.0, 26.0, 39.0, 17.0, 31.0, 24.0, 28.0, 33.0, 48.0, 36.0, 34.0, 43.0, 37.0, 32.0, 34.0, 27.0, 31.0, 32.0, 28.0, 36.0, 23.0, 23.0, 19.0, 21.0, 18.0, 18.0, 15.0, 19.0, 15.0, 13.0, 13.0, 9.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-5.20703125, -5.04876708984375, -4.8905029296875, -4.73223876953125, -4.573974609375, -4.41571044921875, -4.2574462890625, -4.09918212890625, -3.94091796875, -3.78265380859375, -3.6243896484375, -3.46612548828125, -3.307861328125, -3.14959716796875, -2.9913330078125, -2.83306884765625, -2.6748046875, -2.51654052734375, -2.3582763671875, -2.20001220703125, -2.041748046875, -1.88348388671875, -1.7252197265625, -1.56695556640625, -1.40869140625, -1.25042724609375, -1.0921630859375, -0.93389892578125, -0.775634765625, -0.61737060546875, -0.4591064453125, -0.30084228515625, -0.142578125, 0.01568603515625, 0.1739501953125, 0.33221435546875, 0.490478515625, 0.64874267578125, 0.8070068359375, 0.96527099609375, 1.12353515625, 1.28179931640625, 1.4400634765625, 1.59832763671875, 1.756591796875, 1.91485595703125, 2.0731201171875, 2.23138427734375, 2.3896484375, 2.54791259765625, 2.7061767578125, 2.86444091796875, 3.022705078125, 3.18096923828125, 3.3392333984375, 3.49749755859375, 3.65576171875, 3.81402587890625, 3.9722900390625, 4.13055419921875, 4.288818359375, 4.44708251953125, 4.6053466796875, 4.76361083984375, 4.921875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 7.0, 10.0, 29.0, 37.0, 41.0, 45.0, 89.0, 112.0, 187.0, 258.0, 423.0, 654.0, 866.0, 1303.0, 1878.0, 2717.0, 4190.0, 6313.0, 9689.0, 15092.0, 23952.0, 39169.0, 66442.0, 116878.0, 198392.0, 218805.0, 139022.0, 78785.0, 45588.0, 27660.0, 17194.0, 11044.0, 7196.0, 4774.0, 3161.0, 2106.0, 1414.0, 978.0, 672.0, 445.0, 296.0, 197.0, 143.0, 93.0, 79.0, 37.0, 27.0, 25.0, 20.0, 7.0, 4.0, 2.0, 7.0, 2.0, 3.0, 1.0], "bins": [-0.767578125, -0.7444229125976562, -0.7212677001953125, -0.6981124877929688, -0.674957275390625, -0.6518020629882812, -0.6286468505859375, -0.6054916381835938, -0.58233642578125, -0.5591812133789062, -0.5360260009765625, -0.5128707885742188, -0.489715576171875, -0.46656036376953125, -0.4434051513671875, -0.42024993896484375, -0.3970947265625, -0.37393951416015625, -0.3507843017578125, -0.32762908935546875, -0.304473876953125, -0.28131866455078125, -0.2581634521484375, -0.23500823974609375, -0.21185302734375, -0.18869781494140625, -0.1655426025390625, -0.14238739013671875, -0.119232177734375, -0.09607696533203125, -0.0729217529296875, -0.04976654052734375, -0.026611328125, -0.00345611572265625, 0.0196990966796875, 0.04285430908203125, 0.066009521484375, 0.08916473388671875, 0.1123199462890625, 0.13547515869140625, 0.15863037109375, 0.18178558349609375, 0.2049407958984375, 0.22809600830078125, 0.251251220703125, 0.27440643310546875, 0.2975616455078125, 0.32071685791015625, 0.3438720703125, 0.36702728271484375, 0.3901824951171875, 0.41333770751953125, 0.436492919921875, 0.45964813232421875, 0.4828033447265625, 0.5059585571289062, 0.52911376953125, 0.5522689819335938, 0.5754241943359375, 0.5985794067382812, 0.621734619140625, 0.6448898315429688, 0.6680450439453125, 0.6912002563476562, 0.71435546875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 9.0, 8.0, 17.0, 10.0, 24.0, 14.0, 21.0, 29.0, 17.0, 20.0, 31.0, 39.0, 30.0, 45.0, 46.0, 42.0, 49.0, 37.0, 1068.0, 42.0, 36.0, 31.0, 46.0, 30.0, 36.0, 35.0, 32.0, 29.0, 22.0, 12.0, 18.0, 13.0, 12.0, 19.0, 13.0, 7.0, 6.0, 11.0, 1.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.486328125, -3.363861083984375, -3.24139404296875, -3.118927001953125, -2.9964599609375, -2.873992919921875, -2.75152587890625, -2.629058837890625, -2.506591796875, -2.384124755859375, -2.26165771484375, -2.139190673828125, -2.0167236328125, -1.894256591796875, -1.77178955078125, -1.649322509765625, -1.52685546875, -1.404388427734375, -1.28192138671875, -1.159454345703125, -1.0369873046875, -0.914520263671875, -0.79205322265625, -0.669586181640625, -0.547119140625, -0.424652099609375, -0.30218505859375, -0.179718017578125, -0.0572509765625, 0.065216064453125, 0.18768310546875, 0.310150146484375, 0.4326171875, 0.555084228515625, 0.67755126953125, 0.800018310546875, 0.9224853515625, 1.044952392578125, 1.16741943359375, 1.289886474609375, 1.412353515625, 1.534820556640625, 1.65728759765625, 1.779754638671875, 1.9022216796875, 2.024688720703125, 2.14715576171875, 2.269622802734375, 2.39208984375, 2.514556884765625, 2.63702392578125, 2.759490966796875, 2.8819580078125, 3.004425048828125, 3.12689208984375, 3.249359130859375, 3.371826171875, 3.494293212890625, 3.61676025390625, 3.739227294921875, 3.8616943359375, 3.984161376953125, 4.10662841796875, 4.229095458984375, 4.3515625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 10.0, 18.0, 27.0, 51.0, 87.0, 129.0, 194.0, 329.0, 579.0, 996.0, 1629.0, 2829.0, 4889.0, 8850.0, 15937.0, 29633.0, 55331.0, 107766.0, 200992.0, 1304456.0, 172160.0, 88494.0, 46477.0, 24829.0, 13304.0, 7356.0, 4132.0, 2327.0, 1300.0, 762.0, 462.0, 279.0, 173.0, 111.0, 71.0, 46.0, 37.0, 18.0, 15.0, 18.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.84716796875, -0.8238677978515625, -0.800567626953125, -0.7772674560546875, -0.75396728515625, -0.7306671142578125, -0.707366943359375, -0.6840667724609375, -0.6607666015625, -0.6374664306640625, -0.614166259765625, -0.5908660888671875, -0.56756591796875, -0.5442657470703125, -0.520965576171875, -0.4976654052734375, -0.474365234375, -0.4510650634765625, -0.427764892578125, -0.4044647216796875, -0.38116455078125, -0.3578643798828125, -0.334564208984375, -0.3112640380859375, -0.2879638671875, -0.2646636962890625, -0.241363525390625, -0.2180633544921875, -0.19476318359375, -0.1714630126953125, -0.148162841796875, -0.1248626708984375, -0.1015625, -0.0782623291015625, -0.054962158203125, -0.0316619873046875, -0.00836181640625, 0.0149383544921875, 0.038238525390625, 0.0615386962890625, 0.0848388671875, 0.1081390380859375, 0.131439208984375, 0.1547393798828125, 0.17803955078125, 0.2013397216796875, 0.224639892578125, 0.2479400634765625, 0.271240234375, 0.2945404052734375, 0.317840576171875, 0.3411407470703125, 0.36444091796875, 0.3877410888671875, 0.411041259765625, 0.4343414306640625, 0.4576416015625, 0.4809417724609375, 0.504241943359375, 0.5275421142578125, 0.55084228515625, 0.5741424560546875, 0.597442626953125, 0.6207427978515625, 0.64404296875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 17.0, 17.0, 20.0, 18.0, 29.0, 21.0, 34.0, 43.0, 50.0, 58.0, 74.0, 74.0, 53.0, 67.0, 69.0, 48.0, 49.0, 37.0, 48.0, 26.0, 20.0, 27.0, 21.0, 15.0, 8.0, 11.0, 8.0, 3.0, 3.0, 3.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.002773284912109375, -0.002696692943572998, -0.002620100975036621, -0.002543509006500244, -0.002466917037963867, -0.0023903250694274902, -0.0023137331008911133, -0.0022371411323547363, -0.0021605491638183594, -0.0020839571952819824, -0.0020073652267456055, -0.0019307732582092285, -0.0018541812896728516, -0.0017775893211364746, -0.0017009973526000977, -0.0016244053840637207, -0.0015478134155273438, -0.0014712214469909668, -0.0013946294784545898, -0.0013180375099182129, -0.001241445541381836, -0.001164853572845459, -0.001088261604309082, -0.001011669635772705, -0.0009350776672363281, -0.0008584856986999512, -0.0007818937301635742, -0.0007053017616271973, -0.0006287097930908203, -0.0005521178245544434, -0.0004755258560180664, -0.00039893388748168945, -0.0003223419189453125, -0.00024574995040893555, -0.0001691579818725586, -9.256601333618164e-05, -1.5974044799804688e-05, 6.0617923736572266e-05, 0.00013720989227294922, 0.00021380186080932617, 0.0002903938293457031, 0.0003669857978820801, 0.00044357776641845703, 0.000520169734954834, 0.0005967617034912109, 0.0006733536720275879, 0.0007499456405639648, 0.0008265376091003418, 0.0009031295776367188, 0.0009797215461730957, 0.0010563135147094727, 0.0011329054832458496, 0.0012094974517822266, 0.0012860894203186035, 0.0013626813888549805, 0.0014392733573913574, 0.0015158653259277344, 0.0015924572944641113, 0.0016690492630004883, 0.0017456412315368652, 0.0018222332000732422, 0.0018988251686096191, 0.001975417137145996, 0.002052009105682373, 0.00212860107421875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 2.0, 1.0, 3.0, 8.0, 7.0, 11.0, 13.0, 17.0, 19.0, 24.0, 47.0, 56.0, 81.0, 77.0, 124.0, 194.0, 511.0, 2013.0, 1008521.0, 35279.0, 748.0, 278.0, 153.0, 89.0, 59.0, 52.0, 36.0, 36.0, 28.0, 18.0, 16.0, 4.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05291748046875, -0.05107593536376953, -0.04923439025878906, -0.047392845153808594, -0.045551300048828125, -0.043709754943847656, -0.04186820983886719, -0.04002666473388672, -0.03818511962890625, -0.03634357452392578, -0.03450202941894531, -0.032660484313964844, -0.030818939208984375, -0.028977394104003906, -0.027135848999023438, -0.02529430389404297, -0.0234527587890625, -0.02161121368408203, -0.019769668579101562, -0.017928123474121094, -0.016086578369140625, -0.014245033264160156, -0.012403488159179688, -0.010561943054199219, -0.00872039794921875, -0.006878852844238281, -0.0050373077392578125, -0.0031957626342773438, -0.001354217529296875, 0.00048732757568359375, 0.0023288726806640625, 0.004170417785644531, 0.006011962890625, 0.007853507995605469, 0.009695053100585938, 0.011536598205566406, 0.013378143310546875, 0.015219688415527344, 0.017061233520507812, 0.01890277862548828, 0.02074432373046875, 0.02258586883544922, 0.024427413940429688, 0.026268959045410156, 0.028110504150390625, 0.029952049255371094, 0.03179359436035156, 0.03363513946533203, 0.0354766845703125, 0.03731822967529297, 0.03915977478027344, 0.041001319885253906, 0.042842864990234375, 0.044684410095214844, 0.04652595520019531, 0.04836750030517578, 0.05020904541015625, 0.05205059051513672, 0.05389213562011719, 0.055733680725097656, 0.057575225830078125, 0.059416770935058594, 0.06125831604003906, 0.06309986114501953, 0.06494140625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 24.0, 98.0, 347.0, 360.0, 142.0, 34.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027707030531018972, -0.0026084640994668007, -0.0024462249130010605, -0.0022839857265353203, -0.0021217467729002237, -0.001959507819265127, -0.001797268632799387, -0.0016350295627489686, -0.0014727904926985502, -0.0013105514226481318, -0.0011483123525977135, -0.000986073282547295, -0.0008238342124968767, -0.0006615951424464583, -0.00049935607239604, -0.0003371170023456216, -0.0001748779322952032, -1.2638862244784832e-05, 0.00014960020780563354, 0.0003118392778560519, 0.0004740783479064703, 0.0006363174179568887, 0.000798556488007307, 0.0009607955580577254, 0.0011230346281081438, 0.0012852736981585622, 0.0014475127682089806, 0.001609751838259399, 0.0017719909083098173, 0.0019342299783602357, 0.002096469048410654, 0.0022587082348763943, 0.0024209474213421345, 0.0025831866078078747, 0.0027454255614429712, 0.0029076645150780678, 0.003069903701543808, 0.003232142888009548, 0.0033943818416446447, 0.0035566207952797413, 0.0037188599817454815, 0.0038810991682112217, 0.004043337889015675, 0.004205577075481415, 0.004367816261947155, 0.004530055448412895, 0.004692294634878635, 0.004854533355683088, 0.0050167725421488285, 0.005179011728614569, 0.005341250449419022, 0.005503489635884762, 0.005665728822350502, 0.005827968008816242, 0.005990207195281982, 0.006152445916086435, 0.0063146851025521755, 0.006476924289017916, 0.006639163009822369, 0.006801402196288109, 0.006963641382753849, 0.007125880569219589, 0.0072881197556853294, 0.007450358476489782, 0.0076125976629555225]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 10.0, 16.0, 6.0, 14.0, 15.0, 14.0, 17.0, 25.0, 30.0, 27.0, 31.0, 31.0, 32.0, 38.0, 38.0, 31.0, 39.0, 28.0, 25.0, 45.0, 37.0, 37.0, 43.0, 31.0, 37.0, 24.0, 43.0, 36.0, 25.0, 29.0, 24.0, 15.0, 16.0, 20.0, 10.0, 13.0, 7.0, 7.0, 9.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.001285254955291748, -0.0012497790157794952, -0.0012143030762672424, -0.0011788271367549896, -0.0011433511972427368, -0.001107875257730484, -0.0010723993182182312, -0.0010369233787059784, -0.0010014474391937256, -0.0009659714996814728, -0.00093049556016922, -0.0008950196206569672, -0.0008595436811447144, -0.0008240677416324615, -0.0007885918021202087, -0.0007531158626079559, -0.0007176399230957031, -0.0006821639835834503, -0.0006466880440711975, -0.0006112121045589447, -0.0005757361650466919, -0.0005402602255344391, -0.0005047842860221863, -0.00046930834650993347, -0.00043383240699768066, -0.00039835646748542786, -0.00036288052797317505, -0.00032740458846092224, -0.00029192864894866943, -0.0002564527094364166, -0.00022097676992416382, -0.000185500830411911, -0.0001500248908996582, -0.0001145489513874054, -7.907301187515259e-05, -4.359707236289978e-05, -8.121132850646973e-06, 2.7354806661605835e-05, 6.283074617385864e-05, 9.830668568611145e-05, 0.00013378262519836426, 0.00016925856471061707, 0.00020473450422286987, 0.00024021044373512268, 0.0002756863832473755, 0.0003111623227596283, 0.0003466382622718811, 0.0003821142017841339, 0.0004175901412963867, 0.0004530660808086395, 0.0004885420203208923, 0.0005240179598331451, 0.000559493899345398, 0.0005949698388576508, 0.0006304457783699036, 0.0006659217178821564, 0.0007013976573944092, 0.000736873596906662, 0.0007723495364189148, 0.0008078254759311676, 0.0008433014154434204, 0.0008787773549556732, 0.000914253294467926, 0.0009497292339801788, 0.0009852051734924316]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 7.0, 9.0, 8.0, 8.0, 13.0, 14.0, 12.0, 13.0, 13.0, 18.0, 13.0, 24.0, 26.0, 39.0, 17.0, 31.0, 24.0, 28.0, 33.0, 48.0, 36.0, 34.0, 43.0, 37.0, 32.0, 34.0, 27.0, 31.0, 32.0, 28.0, 36.0, 23.0, 23.0, 19.0, 21.0, 18.0, 18.0, 15.0, 19.0, 15.0, 13.0, 13.0, 9.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-5.20703125, -5.04876708984375, -4.8905029296875, -4.73223876953125, -4.573974609375, -4.41571044921875, -4.2574462890625, -4.09918212890625, -3.94091796875, -3.78265380859375, -3.6243896484375, -3.46612548828125, -3.307861328125, -3.14959716796875, -2.9913330078125, -2.83306884765625, -2.6748046875, -2.51654052734375, -2.3582763671875, -2.20001220703125, -2.041748046875, -1.88348388671875, -1.7252197265625, -1.56695556640625, -1.40869140625, -1.25042724609375, -1.0921630859375, -0.93389892578125, -0.775634765625, -0.61737060546875, -0.4591064453125, -0.30084228515625, -0.142578125, 0.01568603515625, 0.1739501953125, 0.33221435546875, 0.490478515625, 0.64874267578125, 0.8070068359375, 0.96527099609375, 1.12353515625, 1.28179931640625, 1.4400634765625, 1.59832763671875, 1.756591796875, 1.91485595703125, 2.0731201171875, 2.23138427734375, 2.3896484375, 2.54791259765625, 2.7061767578125, 2.86444091796875, 3.022705078125, 3.18096923828125, 3.3392333984375, 3.49749755859375, 3.65576171875, 3.81402587890625, 3.9722900390625, 4.13055419921875, 4.288818359375, 4.44708251953125, 4.6053466796875, 4.76361083984375, 4.921875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 2.0, 9.0, 7.0, 6.0, 16.0, 19.0, 20.0, 26.0, 26.0, 30.0, 45.0, 73.0, 104.0, 196.0, 358.0, 712.0, 1455.0, 3194.0, 7179.0, 16085.0, 35281.0, 81149.0, 217841.0, 391580.0, 171807.0, 66966.0, 29733.0, 13318.0, 5899.0, 2730.0, 1238.0, 586.0, 303.0, 165.0, 113.0, 71.0, 40.0, 30.0, 39.0, 10.0, 24.0, 12.0, 11.0, 16.0, 4.0, 8.0, 6.0, 4.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.890625, -4.7396240234375, -4.588623046875, -4.4376220703125, -4.28662109375, -4.1356201171875, -3.984619140625, -3.8336181640625, -3.6826171875, -3.5316162109375, -3.380615234375, -3.2296142578125, -3.07861328125, -2.9276123046875, -2.776611328125, -2.6256103515625, -2.474609375, -2.3236083984375, -2.172607421875, -2.0216064453125, -1.87060546875, -1.7196044921875, -1.568603515625, -1.4176025390625, -1.2666015625, -1.1156005859375, -0.964599609375, -0.8135986328125, -0.66259765625, -0.5115966796875, -0.360595703125, -0.2095947265625, -0.05859375, 0.0924072265625, 0.243408203125, 0.3944091796875, 0.54541015625, 0.6964111328125, 0.847412109375, 0.9984130859375, 1.1494140625, 1.3004150390625, 1.451416015625, 1.6024169921875, 1.75341796875, 1.9044189453125, 2.055419921875, 2.2064208984375, 2.357421875, 2.5084228515625, 2.659423828125, 2.8104248046875, 2.96142578125, 3.1124267578125, 3.263427734375, 3.4144287109375, 3.5654296875, 3.7164306640625, 3.867431640625, 4.0184326171875, 4.16943359375, 4.3204345703125, 4.471435546875, 4.6224365234375, 4.7734375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 8.0, 3.0, 5.0, 12.0, 10.0, 16.0, 15.0, 22.0, 14.0, 23.0, 29.0, 19.0, 33.0, 30.0, 37.0, 48.0, 56.0, 64.0, 134.0, 1480.0, 392.0, 112.0, 65.0, 51.0, 46.0, 32.0, 34.0, 31.0, 21.0, 22.0, 31.0, 29.0, 15.0, 19.0, 15.0, 19.0, 8.0, 5.0, 9.0, 11.0, 7.0, 5.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.734375, -18.165283203125, -17.59619140625, -17.027099609375, -16.4580078125, -15.888916015625, -15.31982421875, -14.750732421875, -14.181640625, -13.612548828125, -13.04345703125, -12.474365234375, -11.9052734375, -11.336181640625, -10.76708984375, -10.197998046875, -9.62890625, -9.059814453125, -8.49072265625, -7.921630859375, -7.3525390625, -6.783447265625, -6.21435546875, -5.645263671875, -5.076171875, -4.507080078125, -3.93798828125, -3.368896484375, -2.7998046875, -2.230712890625, -1.66162109375, -1.092529296875, -0.5234375, 0.045654296875, 0.61474609375, 1.183837890625, 1.7529296875, 2.322021484375, 2.89111328125, 3.460205078125, 4.029296875, 4.598388671875, 5.16748046875, 5.736572265625, 6.3056640625, 6.874755859375, 7.44384765625, 8.012939453125, 8.58203125, 9.151123046875, 9.72021484375, 10.289306640625, 10.8583984375, 11.427490234375, 11.99658203125, 12.565673828125, 13.134765625, 13.703857421875, 14.27294921875, 14.842041015625, 15.4111328125, 15.980224609375, 16.54931640625, 17.118408203125, 17.6875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 2.0, 5.0, 6.0, 13.0, 11.0, 14.0, 11.0, 24.0, 25.0, 31.0, 50.0, 55.0, 72.0, 76.0, 104.0, 134.0, 180.0, 260.0, 421.0, 911.0, 8723.0, 2652769.0, 475527.0, 4230.0, 795.0, 395.0, 215.0, 156.0, 106.0, 82.0, 65.0, 54.0, 34.0, 32.0, 29.0, 21.0, 13.0, 8.0, 8.0, 11.0, 11.0, 3.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.984375, -30.948974609375, -29.91357421875, -28.878173828125, -27.8427734375, -26.807373046875, -25.77197265625, -24.736572265625, -23.701171875, -22.665771484375, -21.63037109375, -20.594970703125, -19.5595703125, -18.524169921875, -17.48876953125, -16.453369140625, -15.41796875, -14.382568359375, -13.34716796875, -12.311767578125, -11.2763671875, -10.240966796875, -9.20556640625, -8.170166015625, -7.134765625, -6.099365234375, -5.06396484375, -4.028564453125, -2.9931640625, -1.957763671875, -0.92236328125, 0.113037109375, 1.1484375, 2.183837890625, 3.21923828125, 4.254638671875, 5.2900390625, 6.325439453125, 7.36083984375, 8.396240234375, 9.431640625, 10.467041015625, 11.50244140625, 12.537841796875, 13.5732421875, 14.608642578125, 15.64404296875, 16.679443359375, 17.71484375, 18.750244140625, 19.78564453125, 20.821044921875, 21.8564453125, 22.891845703125, 23.92724609375, 24.962646484375, 25.998046875, 27.033447265625, 28.06884765625, 29.104248046875, 30.1396484375, 31.175048828125, 32.21044921875, 33.245849609375, 34.28125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 9.0, 164.0, 597.0, 227.0, 19.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.780529022216797, -10.007795333862305, -7.235060691833496, -4.4623260498046875, -1.6895923614501953, 1.0831413269042969, 3.855876922607422, 6.628610610961914, 9.401344299316406, 12.174077987670898, 14.946812629699707, 17.719547271728516, 20.492280960083008, 23.2650146484375, 26.037750244140625, 28.810483932495117, 31.58321762084961, 34.355953216552734, 37.128684997558594, 39.90142059326172, 42.674156188964844, 45.4468879699707, 48.21962356567383, 50.99235534667969, 53.76509094238281, 56.53782653808594, 59.3105583190918, 62.08329391479492, 64.85602569580078, 67.6287612915039, 70.40149688720703, 73.17423248291016, 75.94696044921875, 78.71969604492188, 81.492431640625, 84.26516723632812, 87.03789520263672, 89.81063079833984, 92.58336639404297, 95.3561019897461, 98.12882995605469, 100.90156555175781, 103.67430114746094, 106.44703674316406, 109.21976470947266, 111.99250030517578, 114.7652359008789, 117.53797149658203, 120.31070709228516, 123.08344268798828, 125.8561782836914, 128.62890625, 131.40164184570312, 134.17437744140625, 136.94711303710938, 139.7198486328125, 142.49258422851562, 145.26531982421875, 148.03805541992188, 150.810791015625, 153.58352661132812, 156.35626220703125, 159.12899780273438, 161.90171813964844, 164.67445373535156]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 5.0, 3.0, 4.0, 6.0, 8.0, 7.0, 13.0, 8.0, 11.0, 12.0, 12.0, 19.0, 19.0, 27.0, 29.0, 31.0, 42.0, 38.0, 39.0, 37.0, 36.0, 39.0, 54.0, 45.0, 42.0, 42.0, 34.0, 30.0, 44.0, 42.0, 32.0, 24.0, 27.0, 21.0, 22.0, 18.0, 14.0, 9.0, 15.0, 12.0, 7.0, 5.0, 6.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-53.05552291870117, -51.49504089355469, -49.93455505371094, -48.37407302856445, -46.81359100341797, -45.253108978271484, -43.692623138427734, -42.13214111328125, -40.571659088134766, -39.01117706298828, -37.45069122314453, -35.89020919799805, -34.32972717285156, -32.76924514770508, -31.208759307861328, -29.648277282714844, -28.087793350219727, -26.52730941772461, -24.966827392578125, -23.406343460083008, -21.845861434936523, -20.285377502441406, -18.724895477294922, -17.164411544799805, -15.603928565979004, -14.043445587158203, -12.482962608337402, -10.922479629516602, -9.361995697021484, -7.801513195037842, -6.241029739379883, -4.680546760559082, -3.1200637817382812, -1.559580683708191, 0.0009024143218994141, 1.5613856315612793, 3.12186861038208, 4.682351589202881, 6.24283504486084, 7.803318023681641, 9.363801002502441, 10.924283981323242, 12.484766960144043, 14.045249938964844, 15.605733871459961, 17.166215896606445, 18.726699829101562, 20.287181854248047, 21.847665786743164, 23.40814971923828, 24.968631744384766, 26.529115676879883, 28.089597702026367, 29.650081634521484, 31.21056365966797, 32.77104949951172, 34.3315315246582, 35.89201354980469, 37.45249938964844, 39.01298141479492, 40.573463439941406, 42.13394546508789, 43.69443130493164, 45.254913330078125, 46.81539535522461]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 3.0, 5.0, 7.0, 7.0, 11.0, 13.0, 14.0, 16.0, 9.0, 16.0, 17.0, 18.0, 32.0, 24.0, 23.0, 27.0, 27.0, 43.0, 36.0, 40.0, 33.0, 38.0, 41.0, 30.0, 31.0, 34.0, 41.0, 34.0, 26.0, 36.0, 25.0, 25.0, 32.0, 21.0, 16.0, 24.0, 10.0, 18.0, 22.0, 8.0, 9.0, 9.0, 12.0, 9.0, 6.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.10546875, -4.94158935546875, -4.7777099609375, -4.61383056640625, -4.449951171875, -4.28607177734375, -4.1221923828125, -3.95831298828125, -3.79443359375, -3.63055419921875, -3.4666748046875, -3.30279541015625, -3.138916015625, -2.97503662109375, -2.8111572265625, -2.64727783203125, -2.4833984375, -2.31951904296875, -2.1556396484375, -1.99176025390625, -1.827880859375, -1.66400146484375, -1.5001220703125, -1.33624267578125, -1.17236328125, -1.00848388671875, -0.8446044921875, -0.68072509765625, -0.516845703125, -0.35296630859375, -0.1890869140625, -0.02520751953125, 0.138671875, 0.30255126953125, 0.4664306640625, 0.63031005859375, 0.794189453125, 0.95806884765625, 1.1219482421875, 1.28582763671875, 1.44970703125, 1.61358642578125, 1.7774658203125, 1.94134521484375, 2.105224609375, 2.26910400390625, 2.4329833984375, 2.59686279296875, 2.7607421875, 2.92462158203125, 3.0885009765625, 3.25238037109375, 3.416259765625, 3.58013916015625, 3.7440185546875, 3.90789794921875, 4.07177734375, 4.23565673828125, 4.3995361328125, 4.56341552734375, 4.727294921875, 4.89117431640625, 5.0550537109375, 5.21893310546875, 5.3828125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 12.0, 13.0, 11.0, 12.0, 14.0, 25.0, 25.0, 31.0, 24.0, 38.0, 51.0, 66.0, 84.0, 147.0, 234.0, 738.0, 4486.0, 47685.0, 1295290.0, 2696876.0, 136426.0, 9594.0, 1432.0, 342.0, 145.0, 99.0, 84.0, 42.0, 37.0, 40.0, 32.0, 24.0, 20.0, 21.0, 16.0, 12.0, 7.0, 14.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-17.578125, -17.03173828125, -16.4853515625, -15.93896484375, -15.392578125, -14.84619140625, -14.2998046875, -13.75341796875, -13.20703125, -12.66064453125, -12.1142578125, -11.56787109375, -11.021484375, -10.47509765625, -9.9287109375, -9.38232421875, -8.8359375, -8.28955078125, -7.7431640625, -7.19677734375, -6.650390625, -6.10400390625, -5.5576171875, -5.01123046875, -4.46484375, -3.91845703125, -3.3720703125, -2.82568359375, -2.279296875, -1.73291015625, -1.1865234375, -0.64013671875, -0.09375, 0.45263671875, 0.9990234375, 1.54541015625, 2.091796875, 2.63818359375, 3.1845703125, 3.73095703125, 4.27734375, 4.82373046875, 5.3701171875, 5.91650390625, 6.462890625, 7.00927734375, 7.5556640625, 8.10205078125, 8.6484375, 9.19482421875, 9.7412109375, 10.28759765625, 10.833984375, 11.38037109375, 11.9267578125, 12.47314453125, 13.01953125, 13.56591796875, 14.1123046875, 14.65869140625, 15.205078125, 15.75146484375, 16.2978515625, 16.84423828125, 17.390625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 5.0, 7.0, 13.0, 15.0, 23.0, 36.0, 47.0, 67.0, 99.0, 134.0, 189.0, 237.0, 304.0, 406.0, 473.0, 523.0, 392.0, 300.0, 208.0, 140.0, 113.0, 87.0, 68.0, 37.0, 43.0, 28.0, 24.0, 16.0, 11.0, 8.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.796875, -10.46728515625, -10.1376953125, -9.80810546875, -9.478515625, -9.14892578125, -8.8193359375, -8.48974609375, -8.16015625, -7.83056640625, -7.5009765625, -7.17138671875, -6.841796875, -6.51220703125, -6.1826171875, -5.85302734375, -5.5234375, -5.19384765625, -4.8642578125, -4.53466796875, -4.205078125, -3.87548828125, -3.5458984375, -3.21630859375, -2.88671875, -2.55712890625, -2.2275390625, -1.89794921875, -1.568359375, -1.23876953125, -0.9091796875, -0.57958984375, -0.25, 0.07958984375, 0.4091796875, 0.73876953125, 1.068359375, 1.39794921875, 1.7275390625, 2.05712890625, 2.38671875, 2.71630859375, 3.0458984375, 3.37548828125, 3.705078125, 4.03466796875, 4.3642578125, 4.69384765625, 5.0234375, 5.35302734375, 5.6826171875, 6.01220703125, 6.341796875, 6.67138671875, 7.0009765625, 7.33056640625, 7.66015625, 7.98974609375, 8.3193359375, 8.64892578125, 8.978515625, 9.30810546875, 9.6376953125, 9.96728515625, 10.296875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 4.0, 12.0, 14.0, 13.0, 28.0, 24.0, 34.0, 49.0, 63.0, 71.0, 97.0, 113.0, 172.0, 210.0, 278.0, 437.0, 1140.0, 17167.0, 3690034.0, 477878.0, 4369.0, 712.0, 357.0, 243.0, 169.0, 130.0, 110.0, 76.0, 69.0, 37.0, 40.0, 32.0, 29.0, 18.0, 15.0, 9.0, 8.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.96875, -45.537109375, -44.10546875, -42.673828125, -41.2421875, -39.810546875, -38.37890625, -36.947265625, -35.515625, -34.083984375, -32.65234375, -31.220703125, -29.7890625, -28.357421875, -26.92578125, -25.494140625, -24.0625, -22.630859375, -21.19921875, -19.767578125, -18.3359375, -16.904296875, -15.47265625, -14.041015625, -12.609375, -11.177734375, -9.74609375, -8.314453125, -6.8828125, -5.451171875, -4.01953125, -2.587890625, -1.15625, 0.275390625, 1.70703125, 3.138671875, 4.5703125, 6.001953125, 7.43359375, 8.865234375, 10.296875, 11.728515625, 13.16015625, 14.591796875, 16.0234375, 17.455078125, 18.88671875, 20.318359375, 21.75, 23.181640625, 24.61328125, 26.044921875, 27.4765625, 28.908203125, 30.33984375, 31.771484375, 33.203125, 34.634765625, 36.06640625, 37.498046875, 38.9296875, 40.361328125, 41.79296875, 43.224609375, 44.65625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 25.0, 143.0, 448.0, 324.0, 67.0, 10.0, 0.0, 2.0], "bins": [-276.5811767578125, -271.86993408203125, -267.1587219238281, -262.447509765625, -257.73626708984375, -253.02503967285156, -248.31381225585938, -243.6025848388672, -238.891357421875, -234.1801300048828, -229.46890258789062, -224.75767517089844, -220.04644775390625, -215.33522033691406, -210.62399291992188, -205.9127655029297, -201.2015380859375, -196.4903106689453, -191.77908325195312, -187.06785583496094, -182.35662841796875, -177.64540100097656, -172.93417358398438, -168.2229461669922, -163.51171875, -158.8004913330078, -154.08926391601562, -149.37803649902344, -144.66680908203125, -139.95558166503906, -135.24435424804688, -130.5331268310547, -125.82190704345703, -121.11067962646484, -116.39945220947266, -111.68822479248047, -106.97699737548828, -102.2657699584961, -97.5545425415039, -92.84331512451172, -88.13208770751953, -83.42086029052734, -78.70963287353516, -73.99840545654297, -69.28717803955078, -64.5759506225586, -59.864723205566406, -55.15349578857422, -50.44226837158203, -45.731040954589844, -41.019813537597656, -36.30858612060547, -31.59735870361328, -26.886131286621094, -22.174903869628906, -17.46367645263672, -12.752447128295898, -8.041219711303711, -3.3299922943115234, 1.381235122680664, 6.092462539672852, 10.803689956665039, 15.514917373657227, 20.226144790649414, 24.9373722076416]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 5.0, 7.0, 5.0, 6.0, 9.0, 9.0, 9.0, 16.0, 16.0, 23.0, 25.0, 30.0, 27.0, 34.0, 37.0, 41.0, 34.0, 40.0, 47.0, 39.0, 35.0, 51.0, 45.0, 41.0, 49.0, 24.0, 35.0, 31.0, 37.0, 31.0, 27.0, 25.0, 22.0, 23.0, 15.0, 12.0, 13.0, 5.0, 7.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.204925537109375, -32.067684173583984, -30.930438995361328, -29.793197631835938, -28.655954360961914, -27.51871109008789, -26.3814697265625, -25.244226455688477, -24.106983184814453, -22.96973991394043, -21.832496643066406, -20.695255279541016, -19.558012008666992, -18.42076873779297, -17.283527374267578, -16.146284103393555, -15.009040832519531, -13.871797561645508, -12.7345552444458, -11.597312927246094, -10.46006965637207, -9.322826385498047, -8.18558406829834, -7.048341274261475, -5.911098480224609, -4.773855686187744, -3.636612892150879, -2.4993700981140137, -1.3621273040771484, -0.2248845100402832, 0.912358283996582, 2.0496010780334473, 3.1868438720703125, 4.324086666107178, 5.461329460144043, 6.598572254180908, 7.735815048217773, 8.873058319091797, 10.010300636291504, 11.147542953491211, 12.284786224365234, 13.422029495239258, 14.559271812438965, 15.696514129638672, 16.833757400512695, 17.97100067138672, 19.10824203491211, 20.245485305786133, 21.382728576660156, 22.51997184753418, 23.657215118408203, 24.794456481933594, 25.931699752807617, 27.06894302368164, 28.20618438720703, 29.343427658081055, 30.480670928955078, 31.6179141998291, 32.755157470703125, 33.892398834228516, 35.029640197753906, 36.16688537597656, 37.30412673950195, 38.44137191772461, 39.57861328125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 5.0, 9.0, 12.0, 14.0, 8.0, 12.0, 23.0, 20.0, 14.0, 21.0, 25.0, 39.0, 26.0, 47.0, 32.0, 36.0, 30.0, 30.0, 42.0, 34.0, 37.0, 42.0, 36.0, 47.0, 30.0, 32.0, 38.0, 28.0, 33.0, 23.0, 21.0, 23.0, 13.0, 16.0, 19.0, 15.0, 11.0, 11.0, 5.0, 11.0, 6.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.6796875, -5.50750732421875, -5.3353271484375, -5.16314697265625, -4.990966796875, -4.81878662109375, -4.6466064453125, -4.47442626953125, -4.30224609375, -4.13006591796875, -3.9578857421875, -3.78570556640625, -3.613525390625, -3.44134521484375, -3.2691650390625, -3.09698486328125, -2.9248046875, -2.75262451171875, -2.5804443359375, -2.40826416015625, -2.236083984375, -2.06390380859375, -1.8917236328125, -1.71954345703125, -1.54736328125, -1.37518310546875, -1.2030029296875, -1.03082275390625, -0.858642578125, -0.68646240234375, -0.5142822265625, -0.34210205078125, -0.169921875, 0.00225830078125, 0.1744384765625, 0.34661865234375, 0.518798828125, 0.69097900390625, 0.8631591796875, 1.03533935546875, 1.20751953125, 1.37969970703125, 1.5518798828125, 1.72406005859375, 1.896240234375, 2.06842041015625, 2.2406005859375, 2.41278076171875, 2.5849609375, 2.75714111328125, 2.9293212890625, 3.10150146484375, 3.273681640625, 3.44586181640625, 3.6180419921875, 3.79022216796875, 3.96240234375, 4.13458251953125, 4.3067626953125, 4.47894287109375, 4.651123046875, 4.82330322265625, 4.9954833984375, 5.16766357421875, 5.33984375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 13.0, 17.0, 39.0, 41.0, 49.0, 89.0, 97.0, 194.0, 285.0, 390.0, 578.0, 879.0, 1193.0, 1874.0, 2462.0, 3613.0, 5122.0, 7358.0, 10337.0, 15077.0, 21832.0, 33213.0, 50357.0, 78240.0, 125765.0, 181695.0, 173662.0, 115995.0, 73240.0, 46882.0, 30613.0, 20553.0, 14029.0, 9908.0, 6824.0, 4770.0, 3564.0, 2363.0, 1698.0, 1162.0, 813.0, 523.0, 366.0, 253.0, 178.0, 111.0, 67.0, 57.0, 40.0, 29.0, 21.0, 7.0, 9.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.65478515625, -0.6342697143554688, -0.6137542724609375, -0.5932388305664062, -0.572723388671875, -0.5522079467773438, -0.5316925048828125, -0.5111770629882812, -0.49066162109375, -0.47014617919921875, -0.4496307373046875, -0.42911529541015625, -0.408599853515625, -0.38808441162109375, -0.3675689697265625, -0.34705352783203125, -0.3265380859375, -0.30602264404296875, -0.2855072021484375, -0.26499176025390625, -0.244476318359375, -0.22396087646484375, -0.2034454345703125, -0.18292999267578125, -0.16241455078125, -0.14189910888671875, -0.1213836669921875, -0.10086822509765625, -0.080352783203125, -0.05983734130859375, -0.0393218994140625, -0.01880645751953125, 0.001708984375, 0.02222442626953125, 0.0427398681640625, 0.06325531005859375, 0.083770751953125, 0.10428619384765625, 0.1248016357421875, 0.14531707763671875, 0.16583251953125, 0.18634796142578125, 0.2068634033203125, 0.22737884521484375, 0.247894287109375, 0.26840972900390625, 0.2889251708984375, 0.30944061279296875, 0.3299560546875, 0.35047149658203125, 0.3709869384765625, 0.39150238037109375, 0.412017822265625, 0.43253326416015625, 0.4530487060546875, 0.47356414794921875, 0.49407958984375, 0.5145950317382812, 0.5351104736328125, 0.5556259155273438, 0.576141357421875, 0.5966567993164062, 0.6171722412109375, 0.6376876831054688, 0.658203125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 11.0, 5.0, 13.0, 12.0, 12.0, 11.0, 23.0, 15.0, 22.0, 27.0, 19.0, 29.0, 43.0, 46.0, 40.0, 36.0, 35.0, 46.0, 41.0, 1061.0, 42.0, 40.0, 33.0, 44.0, 37.0, 38.0, 33.0, 36.0, 23.0, 20.0, 26.0, 18.0, 12.0, 15.0, 12.0, 9.0, 10.0, 5.0, 8.0, 6.0, 2.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.09375, -3.970977783203125, -3.84820556640625, -3.725433349609375, -3.6026611328125, -3.479888916015625, -3.35711669921875, -3.234344482421875, -3.111572265625, -2.988800048828125, -2.86602783203125, -2.743255615234375, -2.6204833984375, -2.497711181640625, -2.37493896484375, -2.252166748046875, -2.12939453125, -2.006622314453125, -1.88385009765625, -1.761077880859375, -1.6383056640625, -1.515533447265625, -1.39276123046875, -1.269989013671875, -1.147216796875, -1.024444580078125, -0.90167236328125, -0.778900146484375, -0.6561279296875, -0.533355712890625, -0.41058349609375, -0.287811279296875, -0.1650390625, -0.042266845703125, 0.08050537109375, 0.203277587890625, 0.3260498046875, 0.448822021484375, 0.57159423828125, 0.694366455078125, 0.817138671875, 0.939910888671875, 1.06268310546875, 1.185455322265625, 1.3082275390625, 1.430999755859375, 1.55377197265625, 1.676544189453125, 1.79931640625, 1.922088623046875, 2.04486083984375, 2.167633056640625, 2.2904052734375, 2.413177490234375, 2.53594970703125, 2.658721923828125, 2.781494140625, 2.904266357421875, 3.02703857421875, 3.149810791015625, 3.2725830078125, 3.395355224609375, 3.51812744140625, 3.640899658203125, 3.763671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 12.0, 3.0, 13.0, 14.0, 25.0, 35.0, 50.0, 90.0, 139.0, 243.0, 393.0, 673.0, 1019.0, 1683.0, 2877.0, 4872.0, 8283.0, 14103.0, 24256.0, 43485.0, 78151.0, 146047.0, 1281594.0, 212865.0, 122995.0, 65772.0, 36871.0, 20979.0, 12051.0, 7149.0, 4118.0, 2398.0, 1483.0, 871.0, 563.0, 337.0, 229.0, 131.0, 81.0, 51.0, 54.0, 24.0, 16.0, 8.0, 8.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7685546875, -0.7458572387695312, -0.7231597900390625, -0.7004623413085938, -0.677764892578125, -0.6550674438476562, -0.6323699951171875, -0.6096725463867188, -0.58697509765625, -0.5642776489257812, -0.5415802001953125, -0.5188827514648438, -0.496185302734375, -0.47348785400390625, -0.4507904052734375, -0.42809295654296875, -0.4053955078125, -0.38269805908203125, -0.3600006103515625, -0.33730316162109375, -0.314605712890625, -0.29190826416015625, -0.2692108154296875, -0.24651336669921875, -0.22381591796875, -0.20111846923828125, -0.1784210205078125, -0.15572357177734375, -0.133026123046875, -0.11032867431640625, -0.0876312255859375, -0.06493377685546875, -0.042236328125, -0.01953887939453125, 0.0031585693359375, 0.02585601806640625, 0.048553466796875, 0.07125091552734375, 0.0939483642578125, 0.11664581298828125, 0.13934326171875, 0.16204071044921875, 0.1847381591796875, 0.20743560791015625, 0.230133056640625, 0.25283050537109375, 0.2755279541015625, 0.29822540283203125, 0.3209228515625, 0.34362030029296875, 0.3663177490234375, 0.38901519775390625, 0.411712646484375, 0.43441009521484375, 0.4571075439453125, 0.47980499267578125, 0.50250244140625, 0.5251998901367188, 0.5478973388671875, 0.5705947875976562, 0.593292236328125, 0.6159896850585938, 0.6386871337890625, 0.6613845825195312, 0.68408203125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 0.0, 4.0, 1.0, 4.0, 1.0, 8.0, 4.0, 14.0, 8.0, 14.0, 10.0, 16.0, 23.0, 25.0, 32.0, 37.0, 42.0, 37.0, 48.0, 55.0, 52.0, 59.0, 39.0, 69.0, 59.0, 46.0, 37.0, 31.0, 41.0, 37.0, 34.0, 20.0, 15.0, 12.0, 11.0, 8.0, 9.0, 8.0, 8.0, 7.0, 2.0, 4.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019006729125976562, -0.0018430203199386597, -0.001785367727279663, -0.0017277151346206665, -0.00167006254196167, -0.0016124099493026733, -0.0015547573566436768, -0.0014971047639846802, -0.0014394521713256836, -0.001381799578666687, -0.0013241469860076904, -0.0012664943933486938, -0.0012088418006896973, -0.0011511892080307007, -0.001093536615371704, -0.0010358840227127075, -0.000978231430053711, -0.0009205788373947144, -0.0008629262447357178, -0.0008052736520767212, -0.0007476210594177246, -0.000689968466758728, -0.0006323158740997314, -0.0005746632814407349, -0.0005170106887817383, -0.0004593580961227417, -0.0004017055034637451, -0.00034405291080474854, -0.00028640031814575195, -0.00022874772548675537, -0.0001710951328277588, -0.00011344254016876221, -5.5789947509765625e-05, 1.862645149230957e-06, 5.951523780822754e-05, 0.00011716783046722412, 0.0001748204231262207, 0.00023247301578521729, 0.00029012560844421387, 0.00034777820110321045, 0.00040543079376220703, 0.0004630833864212036, 0.0005207359790802002, 0.0005783885717391968, 0.0006360411643981934, 0.0006936937570571899, 0.0007513463497161865, 0.0008089989423751831, 0.0008666515350341797, 0.0009243041276931763, 0.0009819567203521729, 0.0010396093130111694, 0.001097261905670166, 0.0011549144983291626, 0.0012125670909881592, 0.0012702196836471558, 0.0013278722763061523, 0.001385524868965149, 0.0014431774616241455, 0.001500830054283142, 0.0015584826469421387, 0.0016161352396011353, 0.0016737878322601318, 0.0017314404249191284, 0.001789093017578125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 9.0, 8.0, 8.0, 14.0, 13.0, 18.0, 26.0, 31.0, 33.0, 43.0, 56.0, 69.0, 98.0, 131.0, 213.0, 368.0, 980.0, 49957.0, 990377.0, 4551.0, 605.0, 279.0, 156.0, 135.0, 77.0, 53.0, 43.0, 35.0, 30.0, 40.0, 15.0, 19.0, 12.0, 11.0, 7.0, 6.0, 8.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.04083251953125, -0.03952789306640625, -0.0382232666015625, -0.03691864013671875, -0.035614013671875, -0.03430938720703125, -0.0330047607421875, -0.03170013427734375, -0.0303955078125, -0.02909088134765625, -0.0277862548828125, -0.02648162841796875, -0.025177001953125, -0.02387237548828125, -0.0225677490234375, -0.02126312255859375, -0.01995849609375, -0.01865386962890625, -0.0173492431640625, -0.01604461669921875, -0.014739990234375, -0.01343536376953125, -0.0121307373046875, -0.01082611083984375, -0.009521484375, -0.00821685791015625, -0.0069122314453125, -0.00560760498046875, -0.004302978515625, -0.00299835205078125, -0.0016937255859375, -0.00038909912109375, 0.00091552734375, 0.00222015380859375, 0.0035247802734375, 0.00482940673828125, 0.006134033203125, 0.00743865966796875, 0.0087432861328125, 0.01004791259765625, 0.0113525390625, 0.01265716552734375, 0.0139617919921875, 0.01526641845703125, 0.016571044921875, 0.01787567138671875, 0.0191802978515625, 0.02048492431640625, 0.02178955078125, 0.02309417724609375, 0.0243988037109375, 0.02570343017578125, 0.027008056640625, 0.02831268310546875, 0.0296173095703125, 0.03092193603515625, 0.0322265625, 0.03353118896484375, 0.0348358154296875, 0.03614044189453125, 0.037445068359375, 0.03874969482421875, 0.0400543212890625, 0.04135894775390625, 0.04266357421875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 24.0, 943.0, 48.0, 1.0, 0.0, 1.0], "bins": [-0.036522723734378815, -0.035909418016672134, -0.035296108573675156, -0.034682802855968475, -0.0340694934129715, -0.033456187695264816, -0.032842881977558136, -0.03222957253456116, -0.03161626681685448, -0.031002959236502647, -0.030389651656150818, -0.029776345938444138, -0.029163038358092308, -0.02854973077774048, -0.027936425060033798, -0.02732311747968197, -0.02670980989933014, -0.02609650231897831, -0.02548319473862648, -0.0248698890209198, -0.02425658144056797, -0.02364327386021614, -0.02302996814250946, -0.02241666056215763, -0.0218033529818058, -0.021190045401453972, -0.020576737821102142, -0.019963432103395462, -0.019350124523043633, -0.018736816942691803, -0.018123511224985123, -0.017510203644633293, -0.016896894201636314, -0.016283586621284485, -0.015670280903577805, -0.015056973323225975, -0.014443665742874146, -0.013830358162522316, -0.013217051513493061, -0.012603744864463806, -0.011990437284111977, -0.011377129703760147, -0.010763823054730892, -0.010150516405701637, -0.009537208825349808, -0.008923901244997978, -0.008310594595968723, -0.007697287481278181, -0.007083980366587639, -0.006470673251897097, -0.005857366137206554, -0.005244059022516012, -0.00463075190782547, -0.004017444793134928, -0.0034041376784443855, -0.0027908305637538433, -0.002177523449063301, -0.0015642163343727589, -0.0009509092196822166, -0.0003376021049916744, 0.0002757050096988678, 0.00088901212438941, 0.0015023192390799522, 0.0021156263537704945, 0.0027289334684610367]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 12.0, 15.0, 26.0, 29.0, 32.0, 43.0, 53.0, 65.0, 54.0, 64.0, 70.0, 62.0, 70.0, 69.0, 54.0, 49.0, 55.0, 37.0, 25.0, 25.0, 30.0, 24.0, 8.0, 7.0, 11.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011633038520812988, -0.0011096522212028503, -0.0010560005903244019, -0.0010023489594459534, -0.0009486973285675049, -0.0008950456976890564, -0.0008413940668106079, -0.0007877424359321594, -0.0007340908050537109, -0.0006804391741752625, -0.000626787543296814, -0.0005731359124183655, -0.000519484281539917, -0.0004658326506614685, -0.00041218101978302, -0.00035852938890457153, -0.00030487775802612305, -0.00025122612714767456, -0.00019757449626922607, -0.0001439228653907776, -9.02712345123291e-05, -3.6619603633880615e-05, 1.703202724456787e-05, 7.068365812301636e-05, 0.00012433528900146484, 0.00017798691987991333, 0.00023163855075836182, 0.0002852901816368103, 0.0003389418125152588, 0.0003925934433937073, 0.00044624507427215576, 0.0004998967051506042, 0.0005535483360290527, 0.0006071999669075012, 0.0006608515977859497, 0.0007145032286643982, 0.0007681548595428467, 0.0008218064904212952, 0.0008754581212997437, 0.0009291097521781921, 0.0009827613830566406, 0.0010364130139350891, 0.0010900646448135376, 0.001143716275691986, 0.0011973679065704346, 0.001251019537448883, 0.0013046711683273315, 0.00135832279920578, 0.0014119744300842285, 0.001465626060962677, 0.0015192776918411255, 0.001572929322719574, 0.0016265809535980225, 0.001680232584476471, 0.0017338842153549194, 0.001787535846233368, 0.0018411874771118164, 0.001894839107990265, 0.0019484907388687134, 0.002002142369747162, 0.0020557940006256104, 0.002109445631504059, 0.0021630972623825073, 0.002216748893260956, 0.0022704005241394043]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 5.0, 9.0, 12.0, 14.0, 8.0, 12.0, 23.0, 20.0, 14.0, 21.0, 25.0, 39.0, 26.0, 47.0, 32.0, 36.0, 30.0, 30.0, 42.0, 34.0, 37.0, 42.0, 36.0, 47.0, 30.0, 32.0, 38.0, 28.0, 33.0, 24.0, 20.0, 23.0, 13.0, 16.0, 19.0, 15.0, 11.0, 11.0, 5.0, 11.0, 6.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.6796875, -5.50750732421875, -5.3353271484375, -5.16314697265625, -4.990966796875, -4.81878662109375, -4.6466064453125, -4.47442626953125, -4.30224609375, -4.13006591796875, -3.9578857421875, -3.78570556640625, -3.613525390625, -3.44134521484375, -3.2691650390625, -3.09698486328125, -2.9248046875, -2.75262451171875, -2.5804443359375, -2.40826416015625, -2.236083984375, -2.06390380859375, -1.8917236328125, -1.71954345703125, -1.54736328125, -1.37518310546875, -1.2030029296875, -1.03082275390625, -0.858642578125, -0.68646240234375, -0.5142822265625, -0.34210205078125, -0.169921875, 0.00225830078125, 0.1744384765625, 0.34661865234375, 0.518798828125, 0.69097900390625, 0.8631591796875, 1.03533935546875, 1.20751953125, 1.37969970703125, 1.5518798828125, 1.72406005859375, 1.896240234375, 2.06842041015625, 2.2406005859375, 2.41278076171875, 2.5849609375, 2.75714111328125, 2.9293212890625, 3.10150146484375, 3.273681640625, 3.44586181640625, 3.6180419921875, 3.79022216796875, 3.96240234375, 4.13458251953125, 4.3067626953125, 4.47894287109375, 4.651123046875, 4.82330322265625, 4.9954833984375, 5.16766357421875, 5.33984375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 8.0, 4.0, 4.0, 10.0, 16.0, 17.0, 18.0, 18.0, 21.0, 40.0, 39.0, 54.0, 81.0, 115.0, 140.0, 201.0, 311.0, 513.0, 1314.0, 5655.0, 30810.0, 254706.0, 667732.0, 70710.0, 11662.0, 2338.0, 727.0, 382.0, 239.0, 157.0, 131.0, 89.0, 53.0, 46.0, 43.0, 28.0, 26.0, 23.0, 18.0, 12.0, 9.0, 8.0, 7.0, 4.0, 3.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.2890625, -10.94921875, -10.609375, -10.26953125, -9.9296875, -9.58984375, -9.25, -8.91015625, -8.5703125, -8.23046875, -7.890625, -7.55078125, -7.2109375, -6.87109375, -6.53125, -6.19140625, -5.8515625, -5.51171875, -5.171875, -4.83203125, -4.4921875, -4.15234375, -3.8125, -3.47265625, -3.1328125, -2.79296875, -2.453125, -2.11328125, -1.7734375, -1.43359375, -1.09375, -0.75390625, -0.4140625, -0.07421875, 0.265625, 0.60546875, 0.9453125, 1.28515625, 1.625, 1.96484375, 2.3046875, 2.64453125, 2.984375, 3.32421875, 3.6640625, 4.00390625, 4.34375, 4.68359375, 5.0234375, 5.36328125, 5.703125, 6.04296875, 6.3828125, 6.72265625, 7.0625, 7.40234375, 7.7421875, 8.08203125, 8.421875, 8.76171875, 9.1015625, 9.44140625, 9.78125, 10.12109375, 10.4609375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 6.0, 8.0, 7.0, 8.0, 7.0, 8.0, 14.0, 11.0, 16.0, 19.0, 23.0, 20.0, 14.0, 43.0, 28.0, 47.0, 43.0, 43.0, 56.0, 53.0, 198.0, 1722.0, 206.0, 62.0, 48.0, 49.0, 29.0, 41.0, 24.0, 33.0, 29.0, 22.0, 19.0, 23.0, 16.0, 20.0, 10.0, 6.0, 4.0, 4.0, 9.0, 2.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.890625, -19.278564453125, -18.66650390625, -18.054443359375, -17.4423828125, -16.830322265625, -16.21826171875, -15.606201171875, -14.994140625, -14.382080078125, -13.77001953125, -13.157958984375, -12.5458984375, -11.933837890625, -11.32177734375, -10.709716796875, -10.09765625, -9.485595703125, -8.87353515625, -8.261474609375, -7.6494140625, -7.037353515625, -6.42529296875, -5.813232421875, -5.201171875, -4.589111328125, -3.97705078125, -3.364990234375, -2.7529296875, -2.140869140625, -1.52880859375, -0.916748046875, -0.3046875, 0.307373046875, 0.91943359375, 1.531494140625, 2.1435546875, 2.755615234375, 3.36767578125, 3.979736328125, 4.591796875, 5.203857421875, 5.81591796875, 6.427978515625, 7.0400390625, 7.652099609375, 8.26416015625, 8.876220703125, 9.48828125, 10.100341796875, 10.71240234375, 11.324462890625, 11.9365234375, 12.548583984375, 13.16064453125, 13.772705078125, 14.384765625, 14.996826171875, 15.60888671875, 16.220947265625, 16.8330078125, 17.445068359375, 18.05712890625, 18.669189453125, 19.28125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 5.0, 5.0, 5.0, 11.0, 17.0, 22.0, 25.0, 29.0, 25.0, 43.0, 52.0, 50.0, 60.0, 121.0, 205.0, 406.0, 1088.0, 28455.0, 3104010.0, 9225.0, 816.0, 351.0, 176.0, 113.0, 91.0, 55.0, 42.0, 33.0, 29.0, 33.0, 18.0, 16.0, 14.0, 11.0, 8.0, 10.0, 5.0, 6.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.5, -43.08251953125, -41.6650390625, -40.24755859375, -38.830078125, -37.41259765625, -35.9951171875, -34.57763671875, -33.16015625, -31.74267578125, -30.3251953125, -28.90771484375, -27.490234375, -26.07275390625, -24.6552734375, -23.23779296875, -21.8203125, -20.40283203125, -18.9853515625, -17.56787109375, -16.150390625, -14.73291015625, -13.3154296875, -11.89794921875, -10.48046875, -9.06298828125, -7.6455078125, -6.22802734375, -4.810546875, -3.39306640625, -1.9755859375, -0.55810546875, 0.859375, 2.27685546875, 3.6943359375, 5.11181640625, 6.529296875, 7.94677734375, 9.3642578125, 10.78173828125, 12.19921875, 13.61669921875, 15.0341796875, 16.45166015625, 17.869140625, 19.28662109375, 20.7041015625, 22.12158203125, 23.5390625, 24.95654296875, 26.3740234375, 27.79150390625, 29.208984375, 30.62646484375, 32.0439453125, 33.46142578125, 34.87890625, 36.29638671875, 37.7138671875, 39.13134765625, 40.548828125, 41.96630859375, 43.3837890625, 44.80126953125, 46.21875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 164.0, 781.0, 69.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.91584014892578, -17.040651321411133, -13.1654634475708, -9.290275573730469, -5.41508674621582, -1.5398979187011719, 2.3352890014648438, 6.210477828979492, 10.08566665649414, 13.960855484008789, 17.836044311523438, 21.711231231689453, 25.5864200592041, 29.46160888671875, 33.336795806884766, 37.21198272705078, 41.08717346191406, 44.96236038208008, 48.83755111694336, 52.712738037109375, 56.587928771972656, 60.46311569213867, 64.33830261230469, 68.21349334716797, 72.08868408203125, 75.96387481689453, 79.83905792236328, 83.71424865722656, 87.58943939208984, 91.46463012695312, 95.33981323242188, 99.21500396728516, 103.09017944335938, 106.96537017822266, 110.8405532836914, 114.71574401855469, 118.59093475341797, 122.46612548828125, 126.34130859375, 130.21649169921875, 134.09169006347656, 137.9668731689453, 141.84207153320312, 145.71725463867188, 149.59243774414062, 153.46763610839844, 157.3428192138672, 161.21800231933594, 165.09320068359375, 168.9683837890625, 172.8435821533203, 176.71876525878906, 180.5939483642578, 184.46914672851562, 188.34432983398438, 192.21951293945312, 196.09469604492188, 199.96987915039062, 203.84507751464844, 207.7202606201172, 211.59544372558594, 215.47064208984375, 219.3458251953125, 223.22100830078125, 227.09620666503906]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 6.0, 7.0, 9.0, 13.0, 9.0, 12.0, 11.0, 12.0, 18.0, 22.0, 33.0, 40.0, 35.0, 45.0, 37.0, 38.0, 48.0, 46.0, 38.0, 50.0, 39.0, 48.0, 32.0, 34.0, 37.0, 32.0, 38.0, 36.0, 32.0, 24.0, 21.0, 16.0, 13.0, 17.0, 14.0, 7.0, 5.0, 4.0, 4.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-55.597747802734375, -54.0280876159668, -52.45842742919922, -50.88876724243164, -49.31910705566406, -47.749446868896484, -46.179786682128906, -44.61012649536133, -43.04046630859375, -41.47080612182617, -39.901145935058594, -38.331485748291016, -36.76182556152344, -35.19216537475586, -33.62250518798828, -32.0528450012207, -30.483186721801758, -28.91352653503418, -27.3438663482666, -25.774206161499023, -24.204545974731445, -22.634885787963867, -21.065227508544922, -19.495567321777344, -17.925907135009766, -16.356246948242188, -14.78658676147461, -13.216926574707031, -11.647266387939453, -10.077606201171875, -8.507946968078613, -6.938286781311035, -5.368625640869141, -3.7989654541015625, -2.2293055057525635, -0.6596455574035645, 0.9100146293640137, 2.479674816131592, 4.049334526062012, 5.61899471282959, 7.188654899597168, 8.758315086364746, 10.327975273132324, 11.897634506225586, 13.467294692993164, 15.036954879760742, 16.60661506652832, 18.1762752532959, 19.745935440063477, 21.315595626831055, 22.885255813598633, 24.45491600036621, 26.02457618713379, 27.594236373901367, 29.163894653320312, 30.73355484008789, 32.30321502685547, 33.87287521362305, 35.442535400390625, 37.0121955871582, 38.58185577392578, 40.15151596069336, 41.72117614746094, 43.290836334228516, 44.860496520996094]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 8.0, 14.0, 6.0, 9.0, 9.0, 14.0, 15.0, 18.0, 18.0, 18.0, 24.0, 34.0, 34.0, 29.0, 37.0, 36.0, 40.0, 41.0, 31.0, 42.0, 27.0, 39.0, 42.0, 44.0, 37.0, 29.0, 31.0, 31.0, 33.0, 36.0, 31.0, 19.0, 17.0, 9.0, 20.0, 16.0, 6.0, 10.0, 8.0, 10.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.62109375, -5.44287109375, -5.2646484375, -5.08642578125, -4.908203125, -4.72998046875, -4.5517578125, -4.37353515625, -4.1953125, -4.01708984375, -3.8388671875, -3.66064453125, -3.482421875, -3.30419921875, -3.1259765625, -2.94775390625, -2.76953125, -2.59130859375, -2.4130859375, -2.23486328125, -2.056640625, -1.87841796875, -1.7001953125, -1.52197265625, -1.34375, -1.16552734375, -0.9873046875, -0.80908203125, -0.630859375, -0.45263671875, -0.2744140625, -0.09619140625, 0.08203125, 0.26025390625, 0.4384765625, 0.61669921875, 0.794921875, 0.97314453125, 1.1513671875, 1.32958984375, 1.5078125, 1.68603515625, 1.8642578125, 2.04248046875, 2.220703125, 2.39892578125, 2.5771484375, 2.75537109375, 2.93359375, 3.11181640625, 3.2900390625, 3.46826171875, 3.646484375, 3.82470703125, 4.0029296875, 4.18115234375, 4.359375, 4.53759765625, 4.7158203125, 4.89404296875, 5.072265625, 5.25048828125, 5.4287109375, 5.60693359375, 5.78515625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 11.0, 9.0, 9.0, 7.0, 16.0, 13.0, 18.0, 29.0, 32.0, 42.0, 54.0, 97.0, 170.0, 331.0, 748.0, 2147.0, 8288.0, 54691.0, 830426.0, 2865569.0, 392151.0, 30708.0, 5633.0, 1689.0, 607.0, 278.0, 153.0, 92.0, 47.0, 56.0, 25.0, 24.0, 23.0, 16.0, 12.0, 7.0, 10.0, 9.0, 4.0, 3.0, 2.0, 7.0, 8.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-15.0859375, -14.619873046875, -14.15380859375, -13.687744140625, -13.2216796875, -12.755615234375, -12.28955078125, -11.823486328125, -11.357421875, -10.891357421875, -10.42529296875, -9.959228515625, -9.4931640625, -9.027099609375, -8.56103515625, -8.094970703125, -7.62890625, -7.162841796875, -6.69677734375, -6.230712890625, -5.7646484375, -5.298583984375, -4.83251953125, -4.366455078125, -3.900390625, -3.434326171875, -2.96826171875, -2.502197265625, -2.0361328125, -1.570068359375, -1.10400390625, -0.637939453125, -0.171875, 0.294189453125, 0.76025390625, 1.226318359375, 1.6923828125, 2.158447265625, 2.62451171875, 3.090576171875, 3.556640625, 4.022705078125, 4.48876953125, 4.954833984375, 5.4208984375, 5.886962890625, 6.35302734375, 6.819091796875, 7.28515625, 7.751220703125, 8.21728515625, 8.683349609375, 9.1494140625, 9.615478515625, 10.08154296875, 10.547607421875, 11.013671875, 11.479736328125, 11.94580078125, 12.411865234375, 12.8779296875, 13.343994140625, 13.81005859375, 14.276123046875, 14.7421875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 6.0, 6.0, 11.0, 14.0, 14.0, 30.0, 23.0, 36.0, 44.0, 60.0, 81.0, 119.0, 138.0, 207.0, 263.0, 304.0, 421.0, 434.0, 408.0, 343.0, 292.0, 199.0, 146.0, 101.0, 92.0, 77.0, 51.0, 41.0, 27.0, 15.0, 13.0, 13.0, 11.0, 8.0, 5.0, 6.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.84375, -9.551025390625, -9.25830078125, -8.965576171875, -8.6728515625, -8.380126953125, -8.08740234375, -7.794677734375, -7.501953125, -7.209228515625, -6.91650390625, -6.623779296875, -6.3310546875, -6.038330078125, -5.74560546875, -5.452880859375, -5.16015625, -4.867431640625, -4.57470703125, -4.281982421875, -3.9892578125, -3.696533203125, -3.40380859375, -3.111083984375, -2.818359375, -2.525634765625, -2.23291015625, -1.940185546875, -1.6474609375, -1.354736328125, -1.06201171875, -0.769287109375, -0.4765625, -0.183837890625, 0.10888671875, 0.401611328125, 0.6943359375, 0.987060546875, 1.27978515625, 1.572509765625, 1.865234375, 2.157958984375, 2.45068359375, 2.743408203125, 3.0361328125, 3.328857421875, 3.62158203125, 3.914306640625, 4.20703125, 4.499755859375, 4.79248046875, 5.085205078125, 5.3779296875, 5.670654296875, 5.96337890625, 6.256103515625, 6.548828125, 6.841552734375, 7.13427734375, 7.427001953125, 7.7197265625, 8.012451171875, 8.30517578125, 8.597900390625, 8.890625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 9.0, 3.0, 3.0, 8.0, 11.0, 15.0, 21.0, 26.0, 48.0, 63.0, 88.0, 98.0, 144.0, 206.0, 352.0, 732.0, 4715.0, 432507.0, 3735104.0, 17516.0, 1290.0, 471.0, 261.0, 170.0, 106.0, 89.0, 60.0, 57.0, 31.0, 29.0, 15.0, 13.0, 4.0, 6.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.28125, -41.798828125, -40.31640625, -38.833984375, -37.3515625, -35.869140625, -34.38671875, -32.904296875, -31.421875, -29.939453125, -28.45703125, -26.974609375, -25.4921875, -24.009765625, -22.52734375, -21.044921875, -19.5625, -18.080078125, -16.59765625, -15.115234375, -13.6328125, -12.150390625, -10.66796875, -9.185546875, -7.703125, -6.220703125, -4.73828125, -3.255859375, -1.7734375, -0.291015625, 1.19140625, 2.673828125, 4.15625, 5.638671875, 7.12109375, 8.603515625, 10.0859375, 11.568359375, 13.05078125, 14.533203125, 16.015625, 17.498046875, 18.98046875, 20.462890625, 21.9453125, 23.427734375, 24.91015625, 26.392578125, 27.875, 29.357421875, 30.83984375, 32.322265625, 33.8046875, 35.287109375, 36.76953125, 38.251953125, 39.734375, 41.216796875, 42.69921875, 44.181640625, 45.6640625, 47.146484375, 48.62890625, 50.111328125, 51.59375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 13.0, 39.0, 76.0, 136.0, 173.0, 203.0, 139.0, 110.0, 59.0, 36.0, 12.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.45834350585938, -71.72279357910156, -69.98724365234375, -68.2516860961914, -66.5161361694336, -64.78058624267578, -63.0450325012207, -61.30948257446289, -59.57392883300781, -57.83837890625, -56.10282516479492, -54.36727523803711, -52.63172149658203, -50.89617156982422, -49.16061782836914, -47.42506790161133, -45.68951416015625, -43.95396423339844, -42.21841049194336, -40.48286056518555, -38.74730682373047, -37.011756896972656, -35.27620315551758, -33.540653228759766, -31.805103302001953, -30.069551467895508, -28.333999633789062, -26.598447799682617, -24.862895965576172, -23.12734603881836, -21.39179229736328, -19.65624237060547, -17.92068862915039, -16.185136795043945, -14.4495849609375, -12.714033126831055, -10.97848129272461, -9.24293041229248, -7.507378578186035, -5.77182674407959, -4.0362749099731445, -2.300723075866699, -0.565171480178833, 1.1703801155090332, 2.9059319496154785, 4.641483306884766, 6.377035140991211, 8.112586975097656, 9.848138809204102, 11.583690643310547, 13.319242477416992, 15.054794311523438, 16.790346145629883, 18.525897979736328, 20.26144790649414, 21.99700164794922, 23.73255157470703, 25.468103408813477, 27.203655242919922, 28.939207077026367, 30.674758911132812, 32.410308837890625, 34.1458625793457, 35.881412506103516, 37.616966247558594]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 2.0, 7.0, 12.0, 11.0, 11.0, 15.0, 14.0, 20.0, 20.0, 20.0, 27.0, 36.0, 29.0, 34.0, 35.0, 35.0, 40.0, 44.0, 49.0, 49.0, 43.0, 44.0, 42.0, 44.0, 39.0, 37.0, 34.0, 11.0, 27.0, 27.0, 25.0, 22.0, 14.0, 22.0, 19.0, 11.0, 7.0, 1.0, 5.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.78478240966797, -26.771011352539062, -25.75724220275879, -24.743471145629883, -23.72970199584961, -22.715930938720703, -21.702159881591797, -20.688390731811523, -19.67462158203125, -18.660850524902344, -17.64708137512207, -16.633310317993164, -15.61954116821289, -14.605770111083984, -13.592000007629395, -12.578229904174805, -11.564458847045898, -10.550688743591309, -9.536918640136719, -8.523147583007812, -7.509377956390381, -6.495607852935791, -5.481837272644043, -4.468067169189453, -3.4542970657348633, -2.4405269622802734, -1.4267566204071045, -0.41298627853393555, 0.6007838249206543, 1.6145539283752441, 2.628324508666992, 3.642094612121582, 4.655864715576172, 5.669634819030762, 6.683404922485352, 7.6971755027771, 8.710945129394531, 9.724716186523438, 10.738486289978027, 11.752256393432617, 12.766026496887207, 13.779796600341797, 14.793566703796387, 15.807336807250977, 16.821107864379883, 17.834877014160156, 18.848648071289062, 19.86241912841797, 20.876188278198242, 21.88995933532715, 22.903728485107422, 23.917499542236328, 24.9312686920166, 25.945039749145508, 26.95880889892578, 27.972579956054688, 28.986351013183594, 30.0001220703125, 31.013891220092773, 32.02766036987305, 33.04143142700195, 34.05520248413086, 35.068973541259766, 36.082740783691406, 37.09651184082031]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 7.0, 5.0, 4.0, 9.0, 11.0, 13.0, 11.0, 23.0, 15.0, 20.0, 20.0, 22.0, 21.0, 40.0, 40.0, 40.0, 35.0, 42.0, 39.0, 43.0, 32.0, 32.0, 43.0, 36.0, 32.0, 52.0, 34.0, 35.0, 43.0, 26.0, 29.0, 20.0, 15.0, 19.0, 14.0, 16.0, 11.0, 11.0, 11.0, 10.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.1328125, -5.9410400390625, -5.749267578125, -5.5574951171875, -5.36572265625, -5.1739501953125, -4.982177734375, -4.7904052734375, -4.5986328125, -4.4068603515625, -4.215087890625, -4.0233154296875, -3.83154296875, -3.6397705078125, -3.447998046875, -3.2562255859375, -3.064453125, -2.8726806640625, -2.680908203125, -2.4891357421875, -2.29736328125, -2.1055908203125, -1.913818359375, -1.7220458984375, -1.5302734375, -1.3385009765625, -1.146728515625, -0.9549560546875, -0.76318359375, -0.5714111328125, -0.379638671875, -0.1878662109375, 0.00390625, 0.1956787109375, 0.387451171875, 0.5792236328125, 0.77099609375, 0.9627685546875, 1.154541015625, 1.3463134765625, 1.5380859375, 1.7298583984375, 1.921630859375, 2.1134033203125, 2.30517578125, 2.4969482421875, 2.688720703125, 2.8804931640625, 3.072265625, 3.2640380859375, 3.455810546875, 3.6475830078125, 3.83935546875, 4.0311279296875, 4.222900390625, 4.4146728515625, 4.6064453125, 4.7982177734375, 4.989990234375, 5.1817626953125, 5.37353515625, 5.5653076171875, 5.757080078125, 5.9488525390625, 6.140625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 5.0, 11.0, 6.0, 21.0, 23.0, 34.0, 56.0, 89.0, 99.0, 148.0, 196.0, 316.0, 455.0, 622.0, 946.0, 1322.0, 1878.0, 2712.0, 4100.0, 5902.0, 9062.0, 13616.0, 21094.0, 33239.0, 53658.0, 88902.0, 143349.0, 196758.0, 172948.0, 111615.0, 67700.0, 41399.0, 25999.0, 16603.0, 10907.0, 7288.0, 4797.0, 3336.0, 2238.0, 1559.0, 1046.0, 789.0, 506.0, 356.0, 275.0, 189.0, 113.0, 100.0, 53.0, 43.0, 36.0, 19.0, 14.0, 6.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.72509765625, -0.7022476196289062, -0.6793975830078125, -0.6565475463867188, -0.633697509765625, -0.6108474731445312, -0.5879974365234375, -0.5651473999023438, -0.54229736328125, -0.5194473266601562, -0.4965972900390625, -0.47374725341796875, -0.450897216796875, -0.42804718017578125, -0.4051971435546875, -0.38234710693359375, -0.3594970703125, -0.33664703369140625, -0.3137969970703125, -0.29094696044921875, -0.268096923828125, -0.24524688720703125, -0.2223968505859375, -0.19954681396484375, -0.17669677734375, -0.15384674072265625, -0.1309967041015625, -0.10814666748046875, -0.085296630859375, -0.06244659423828125, -0.0395965576171875, -0.01674652099609375, 0.006103515625, 0.02895355224609375, 0.0518035888671875, 0.07465362548828125, 0.097503662109375, 0.12035369873046875, 0.1432037353515625, 0.16605377197265625, 0.18890380859375, 0.21175384521484375, 0.2346038818359375, 0.25745391845703125, 0.280303955078125, 0.30315399169921875, 0.3260040283203125, 0.34885406494140625, 0.3717041015625, 0.39455413818359375, 0.4174041748046875, 0.44025421142578125, 0.463104248046875, 0.48595428466796875, 0.5088043212890625, 0.5316543579101562, 0.55450439453125, 0.5773544311523438, 0.6002044677734375, 0.6230545043945312, 0.645904541015625, 0.6687545776367188, 0.6916046142578125, 0.7144546508789062, 0.7373046875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 9.0, 5.0, 8.0, 11.0, 9.0, 13.0, 12.0, 15.0, 16.0, 19.0, 22.0, 29.0, 41.0, 40.0, 37.0, 44.0, 40.0, 50.0, 35.0, 45.0, 1075.0, 36.0, 41.0, 37.0, 31.0, 44.0, 29.0, 31.0, 32.0, 28.0, 18.0, 23.0, 20.0, 14.0, 5.0, 8.0, 8.0, 12.0, 10.0, 4.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44140625, -3.3153076171875, -3.189208984375, -3.0631103515625, -2.93701171875, -2.8109130859375, -2.684814453125, -2.5587158203125, -2.4326171875, -2.3065185546875, -2.180419921875, -2.0543212890625, -1.92822265625, -1.8021240234375, -1.676025390625, -1.5499267578125, -1.423828125, -1.2977294921875, -1.171630859375, -1.0455322265625, -0.91943359375, -0.7933349609375, -0.667236328125, -0.5411376953125, -0.4150390625, -0.2889404296875, -0.162841796875, -0.0367431640625, 0.08935546875, 0.2154541015625, 0.341552734375, 0.4676513671875, 0.59375, 0.7198486328125, 0.845947265625, 0.9720458984375, 1.09814453125, 1.2242431640625, 1.350341796875, 1.4764404296875, 1.6025390625, 1.7286376953125, 1.854736328125, 1.9808349609375, 2.10693359375, 2.2330322265625, 2.359130859375, 2.4852294921875, 2.611328125, 2.7374267578125, 2.863525390625, 2.9896240234375, 3.11572265625, 3.2418212890625, 3.367919921875, 3.4940185546875, 3.6201171875, 3.7462158203125, 3.872314453125, 3.9984130859375, 4.12451171875, 4.2506103515625, 4.376708984375, 4.5028076171875, 4.62890625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 9.0, 9.0, 12.0, 25.0, 24.0, 31.0, 54.0, 85.0, 139.0, 200.0, 297.0, 485.0, 823.0, 1252.0, 1875.0, 2963.0, 4738.0, 7548.0, 12423.0, 20174.0, 33448.0, 56621.0, 98612.0, 169206.0, 1268386.0, 171093.0, 100774.0, 57353.0, 34441.0, 20428.0, 12262.0, 7731.0, 4920.0, 3098.0, 2037.0, 1283.0, 772.0, 548.0, 325.0, 207.0, 135.0, 114.0, 64.0, 39.0, 21.0, 16.0, 11.0, 10.0, 5.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.7119140625, -0.690673828125, -0.66943359375, -0.648193359375, -0.626953125, -0.605712890625, -0.58447265625, -0.563232421875, -0.5419921875, -0.520751953125, -0.49951171875, -0.478271484375, -0.45703125, -0.435791015625, -0.41455078125, -0.393310546875, -0.3720703125, -0.350830078125, -0.32958984375, -0.308349609375, -0.287109375, -0.265869140625, -0.24462890625, -0.223388671875, -0.2021484375, -0.180908203125, -0.15966796875, -0.138427734375, -0.1171875, -0.095947265625, -0.07470703125, -0.053466796875, -0.0322265625, -0.010986328125, 0.01025390625, 0.031494140625, 0.052734375, 0.073974609375, 0.09521484375, 0.116455078125, 0.1376953125, 0.158935546875, 0.18017578125, 0.201416015625, 0.22265625, 0.243896484375, 0.26513671875, 0.286376953125, 0.3076171875, 0.328857421875, 0.35009765625, 0.371337890625, 0.392578125, 0.413818359375, 0.43505859375, 0.456298828125, 0.4775390625, 0.498779296875, 0.52001953125, 0.541259765625, 0.5625, 0.583740234375, 0.60498046875, 0.626220703125, 0.6474609375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 4.0, 5.0, 4.0, 8.0, 3.0, 8.0, 16.0, 26.0, 21.0, 29.0, 37.0, 67.0, 60.0, 85.0, 82.0, 82.0, 73.0, 74.0, 73.0, 51.0, 47.0, 31.0, 24.0, 20.0, 20.0, 5.0, 7.0, 12.0, 4.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026187896728515625, -0.002526789903640747, -0.0024347901344299316, -0.002342790365219116, -0.0022507905960083008, -0.0021587908267974854, -0.00206679105758667, -0.0019747912883758545, -0.001882791519165039, -0.0017907917499542236, -0.0016987919807434082, -0.0016067922115325928, -0.0015147924423217773, -0.001422792673110962, -0.0013307929039001465, -0.001238793134689331, -0.0011467933654785156, -0.0010547935962677002, -0.0009627938270568848, -0.0008707940578460693, -0.0007787942886352539, -0.0006867945194244385, -0.000594794750213623, -0.0005027949810028076, -0.0004107952117919922, -0.00031879544258117676, -0.00022679567337036133, -0.0001347959041595459, -4.279613494873047e-05, 4.920363426208496e-05, 0.0001412034034729004, 0.00023320317268371582, 0.00032520294189453125, 0.0004172027111053467, 0.0005092024803161621, 0.0006012022495269775, 0.000693202018737793, 0.0007852017879486084, 0.0008772015571594238, 0.0009692013263702393, 0.0010612010955810547, 0.0011532008647918701, 0.0012452006340026855, 0.001337200403213501, 0.0014292001724243164, 0.0015211999416351318, 0.0016131997108459473, 0.0017051994800567627, 0.0017971992492675781, 0.0018891990184783936, 0.001981198787689209, 0.0020731985569000244, 0.00216519832611084, 0.0022571980953216553, 0.0023491978645324707, 0.002441197633743286, 0.0025331974029541016, 0.002625197172164917, 0.0027171969413757324, 0.002809196710586548, 0.0029011964797973633, 0.0029931962490081787, 0.003085196018218994, 0.0031771957874298096, 0.003269195556640625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 8.0, 5.0, 14.0, 11.0, 14.0, 15.0, 35.0, 38.0, 71.0, 82.0, 122.0, 180.0, 349.0, 940.0, 182603.0, 861744.0, 1258.0, 422.0, 213.0, 128.0, 82.0, 52.0, 37.0, 36.0, 19.0, 14.0, 17.0, 8.0, 7.0, 5.0, 2.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0687255859375, -0.06676721572875977, -0.06480884552001953, -0.0628504753112793, -0.06089210510253906, -0.05893373489379883, -0.056975364685058594, -0.05501699447631836, -0.053058624267578125, -0.05110025405883789, -0.049141883850097656, -0.04718351364135742, -0.04522514343261719, -0.04326677322387695, -0.04130840301513672, -0.039350032806396484, -0.03739166259765625, -0.035433292388916016, -0.03347492218017578, -0.03151655197143555, -0.029558181762695312, -0.027599811553955078, -0.025641441345214844, -0.02368307113647461, -0.021724700927734375, -0.01976633071899414, -0.017807960510253906, -0.015849590301513672, -0.013891220092773438, -0.011932849884033203, -0.009974479675292969, -0.008016109466552734, -0.0060577392578125, -0.004099369049072266, -0.0021409988403320312, -0.00018262863159179688, 0.0017757415771484375, 0.003734111785888672, 0.005692481994628906, 0.007650852203369141, 0.009609222412109375, 0.01156759262084961, 0.013525962829589844, 0.015484333038330078, 0.017442703247070312, 0.019401073455810547, 0.02135944366455078, 0.023317813873291016, 0.02527618408203125, 0.027234554290771484, 0.02919292449951172, 0.031151294708251953, 0.03310966491699219, 0.03506803512573242, 0.037026405334472656, 0.03898477554321289, 0.040943145751953125, 0.04290151596069336, 0.044859886169433594, 0.04681825637817383, 0.04877662658691406, 0.0507349967956543, 0.05269336700439453, 0.054651737213134766, 0.056610107421875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 366.0, 651.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054013825953006744, -0.052995696663856506, -0.05197757109999657, -0.05095944181084633, -0.04994131252169609, -0.04892318695783615, -0.04790505766868591, -0.046886928379535675, -0.045868802815675735, -0.0448506735265255, -0.04383254796266556, -0.04281441867351532, -0.04179628938436508, -0.04077816382050514, -0.039760034531354904, -0.038741905242204666, -0.03772377967834473, -0.03670565038919449, -0.03568752482533455, -0.03466939553618431, -0.03365126624703407, -0.03263314068317413, -0.031615011394023895, -0.030596883967518806, -0.02957875281572342, -0.02856062538921833, -0.027542496100068092, -0.026524368673563004, -0.025506241247057915, -0.024488113820552826, -0.023469984531402588, -0.0224518571048975, -0.02143372967839241, -0.02041560225188732, -0.019397472962737083, -0.018379345536231995, -0.017361218109726906, -0.016343090683221817, -0.015324961394071579, -0.01430683396756649, -0.013288704678416252, -0.012270576320588589, -0.0112524488940835, -0.010234320536255836, -0.009216193109750748, -0.008198064751923084, -0.007179936394095421, -0.006161808501929045, -0.005143680609762669, -0.0041255527175962925, -0.0031074245925992727, -0.002089296467602253, -0.0010711685754358768, -5.304068326950073e-05, 0.0009650876745581627, 0.001983215566724539, 0.003001343458890915, 0.004019471351057291, 0.005037599243223667, 0.006055727601051331, 0.007073855493217707, 0.008091983385384083, 0.009110111743211746, 0.010128239169716835, 0.011146367527544498]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 5.0, 5.0, 9.0, 11.0, 11.0, 11.0, 20.0, 25.0, 25.0, 40.0, 38.0, 44.0, 44.0, 51.0, 45.0, 64.0, 65.0, 64.0, 67.0, 59.0, 53.0, 54.0, 41.0, 41.0, 28.0, 24.0, 19.0, 15.0, 13.0, 8.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001131296157836914, -0.0010736426338553429, -0.0010159891098737717, -0.0009583355858922005, -0.0009006820619106293, -0.0008430285379290581, -0.0007853750139474869, -0.0007277214899659157, -0.0006700679659843445, -0.0006124144420027733, -0.0005547609180212021, -0.0004971073940396309, -0.0004394538700580597, -0.0003818003460764885, -0.0003241468220949173, -0.0002664932981133461, -0.0002088397741317749, -0.0001511862501502037, -9.353272616863251e-05, -3.587920218706131e-05, 2.1774321794509888e-05, 7.942784577608109e-05, 0.00013708136975765228, 0.00019473489373922348, 0.0002523884177207947, 0.0003100419417023659, 0.00036769546568393707, 0.00042534898966550827, 0.00048300251364707947, 0.0005406560376286507, 0.0005983095616102219, 0.0006559630855917931, 0.0007136166095733643, 0.0007712701335549355, 0.0008289236575365067, 0.0008865771815180779, 0.000944230705499649, 0.0010018842294812202, 0.0010595377534627914, 0.0011171912774443626, 0.0011748448014259338, 0.001232498325407505, 0.0012901518493890762, 0.0013478053733706474, 0.0014054588973522186, 0.0014631124213337898, 0.001520765945315361, 0.0015784194692969322, 0.0016360729932785034, 0.0016937265172600746, 0.0017513800412416458, 0.001809033565223217, 0.0018666870892047882, 0.0019243406131863594, 0.0019819941371679306, 0.002039647661149502, 0.002097301185131073, 0.002154954709112644, 0.0022126082330942154, 0.0022702617570757866, 0.002327915281057358, 0.002385568805038929, 0.0024432223290205, 0.0025008758530020714, 0.0025585293769836426]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 7.0, 5.0, 4.0, 9.0, 11.0, 13.0, 11.0, 23.0, 15.0, 20.0, 20.0, 22.0, 21.0, 40.0, 40.0, 40.0, 35.0, 42.0, 39.0, 43.0, 32.0, 32.0, 43.0, 36.0, 32.0, 52.0, 34.0, 35.0, 43.0, 26.0, 29.0, 20.0, 15.0, 19.0, 14.0, 16.0, 11.0, 11.0, 11.0, 10.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.1328125, -5.9410400390625, -5.749267578125, -5.5574951171875, -5.36572265625, -5.1739501953125, -4.982177734375, -4.7904052734375, -4.5986328125, -4.4068603515625, -4.215087890625, -4.0233154296875, -3.83154296875, -3.6397705078125, -3.447998046875, -3.2562255859375, -3.064453125, -2.8726806640625, -2.680908203125, -2.4891357421875, -2.29736328125, -2.1055908203125, -1.913818359375, -1.7220458984375, -1.5302734375, -1.3385009765625, -1.146728515625, -0.9549560546875, -0.76318359375, -0.5714111328125, -0.379638671875, -0.1878662109375, 0.00390625, 0.1956787109375, 0.387451171875, 0.5792236328125, 0.77099609375, 0.9627685546875, 1.154541015625, 1.3463134765625, 1.5380859375, 1.7298583984375, 1.921630859375, 2.1134033203125, 2.30517578125, 2.4969482421875, 2.688720703125, 2.8804931640625, 3.072265625, 3.2640380859375, 3.455810546875, 3.6475830078125, 3.83935546875, 4.0311279296875, 4.222900390625, 4.4146728515625, 4.6064453125, 4.7982177734375, 4.989990234375, 5.1817626953125, 5.37353515625, 5.5653076171875, 5.757080078125, 5.9488525390625, 6.140625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 7.0, 12.0, 14.0, 9.0, 15.0, 15.0, 36.0, 31.0, 47.0, 64.0, 68.0, 119.0, 146.0, 201.0, 297.0, 368.0, 495.0, 736.0, 1585.0, 5292.0, 28112.0, 505408.0, 468650.0, 27465.0, 5066.0, 1565.0, 770.0, 484.0, 389.0, 279.0, 209.0, 137.0, 121.0, 74.0, 54.0, 39.0, 37.0, 37.0, 24.0, 23.0, 17.0, 6.0, 12.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-15.46875, -14.9852294921875, -14.501708984375, -14.0181884765625, -13.53466796875, -13.0511474609375, -12.567626953125, -12.0841064453125, -11.6005859375, -11.1170654296875, -10.633544921875, -10.1500244140625, -9.66650390625, -9.1829833984375, -8.699462890625, -8.2159423828125, -7.732421875, -7.2489013671875, -6.765380859375, -6.2818603515625, -5.79833984375, -5.3148193359375, -4.831298828125, -4.3477783203125, -3.8642578125, -3.3807373046875, -2.897216796875, -2.4136962890625, -1.93017578125, -1.4466552734375, -0.963134765625, -0.4796142578125, 0.00390625, 0.4874267578125, 0.970947265625, 1.4544677734375, 1.93798828125, 2.4215087890625, 2.905029296875, 3.3885498046875, 3.8720703125, 4.3555908203125, 4.839111328125, 5.3226318359375, 5.80615234375, 6.2896728515625, 6.773193359375, 7.2567138671875, 7.740234375, 8.2237548828125, 8.707275390625, 9.1907958984375, 9.67431640625, 10.1578369140625, 10.641357421875, 11.1248779296875, 11.6083984375, 12.0919189453125, 12.575439453125, 13.0589599609375, 13.54248046875, 14.0260009765625, 14.509521484375, 14.9930419921875, 15.4765625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 1.0, 7.0, 5.0, 5.0, 3.0, 6.0, 7.0, 11.0, 8.0, 11.0, 15.0, 23.0, 15.0, 31.0, 25.0, 27.0, 32.0, 37.0, 34.0, 29.0, 52.0, 39.0, 84.0, 444.0, 1526.0, 101.0, 54.0, 45.0, 41.0, 41.0, 34.0, 32.0, 33.0, 36.0, 16.0, 22.0, 24.0, 16.0, 7.0, 16.0, 14.0, 10.0, 8.0, 5.0, 4.0, 4.0, 4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.734375, -16.195068359375, -15.65576171875, -15.116455078125, -14.5771484375, -14.037841796875, -13.49853515625, -12.959228515625, -12.419921875, -11.880615234375, -11.34130859375, -10.802001953125, -10.2626953125, -9.723388671875, -9.18408203125, -8.644775390625, -8.10546875, -7.566162109375, -7.02685546875, -6.487548828125, -5.9482421875, -5.408935546875, -4.86962890625, -4.330322265625, -3.791015625, -3.251708984375, -2.71240234375, -2.173095703125, -1.6337890625, -1.094482421875, -0.55517578125, -0.015869140625, 0.5234375, 1.062744140625, 1.60205078125, 2.141357421875, 2.6806640625, 3.219970703125, 3.75927734375, 4.298583984375, 4.837890625, 5.377197265625, 5.91650390625, 6.455810546875, 6.9951171875, 7.534423828125, 8.07373046875, 8.613037109375, 9.15234375, 9.691650390625, 10.23095703125, 10.770263671875, 11.3095703125, 11.848876953125, 12.38818359375, 12.927490234375, 13.466796875, 14.006103515625, 14.54541015625, 15.084716796875, 15.6240234375, 16.163330078125, 16.70263671875, 17.241943359375, 17.78125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 4.0, 4.0, 2.0, 4.0, 8.0, 11.0, 12.0, 14.0, 14.0, 19.0, 24.0, 24.0, 24.0, 37.0, 40.0, 39.0, 58.0, 78.0, 117.0, 206.0, 443.0, 1490.0, 84206.0, 3052228.0, 5100.0, 647.0, 285.0, 133.0, 78.0, 61.0, 49.0, 37.0, 32.0, 39.0, 19.0, 22.0, 20.0, 11.0, 11.0, 10.0, 11.0, 7.0, 6.0, 4.0, 3.0, 7.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-50.09375, -48.58544921875, -47.0771484375, -45.56884765625, -44.060546875, -42.55224609375, -41.0439453125, -39.53564453125, -38.02734375, -36.51904296875, -35.0107421875, -33.50244140625, -31.994140625, -30.48583984375, -28.9775390625, -27.46923828125, -25.9609375, -24.45263671875, -22.9443359375, -21.43603515625, -19.927734375, -18.41943359375, -16.9111328125, -15.40283203125, -13.89453125, -12.38623046875, -10.8779296875, -9.36962890625, -7.861328125, -6.35302734375, -4.8447265625, -3.33642578125, -1.828125, -0.31982421875, 1.1884765625, 2.69677734375, 4.205078125, 5.71337890625, 7.2216796875, 8.72998046875, 10.23828125, 11.74658203125, 13.2548828125, 14.76318359375, 16.271484375, 17.77978515625, 19.2880859375, 20.79638671875, 22.3046875, 23.81298828125, 25.3212890625, 26.82958984375, 28.337890625, 29.84619140625, 31.3544921875, 32.86279296875, 34.37109375, 35.87939453125, 37.3876953125, 38.89599609375, 40.404296875, 41.91259765625, 43.4208984375, 44.92919921875, 46.4375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 89.0, 619.0, 290.0, 15.0], "bins": [-155.8143768310547, -153.29119873046875, -150.7680206298828, -148.2448272705078, -145.72164916992188, -143.19847106933594, -140.67529296875, -138.15211486816406, -135.62893676757812, -133.1057586669922, -130.58258056640625, -128.05938720703125, -125.53620910644531, -123.01303100585938, -120.48985290527344, -117.9666748046875, -115.4434814453125, -112.92030334472656, -110.3971176147461, -107.87393951416016, -105.35075378417969, -102.82757568359375, -100.30439758300781, -97.78121948242188, -95.2580337524414, -92.73485565185547, -90.211669921875, -87.68849182128906, -85.16531372070312, -82.64212799072266, -80.11894989013672, -77.59576416015625, -75.07258605957031, -72.54940795898438, -70.0262222290039, -67.50304412841797, -64.9798583984375, -62.45668029785156, -59.933502197265625, -57.41032028198242, -54.887142181396484, -52.36396026611328, -49.840782165527344, -47.31760025024414, -44.79441833496094, -42.271236419677734, -39.74805450439453, -37.224876403808594, -34.70169448852539, -32.17851257324219, -29.655332565307617, -27.132152557373047, -24.608970642089844, -22.08578872680664, -19.56260871887207, -17.0394287109375, -14.516246795654297, -11.99306583404541, -9.469884872436523, -6.946703910827637, -4.42352294921875, -1.9003419876098633, 0.6228389739990234, 3.1460189819335938, 5.669201374053955]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 9.0, 8.0, 8.0, 11.0, 15.0, 13.0, 17.0, 27.0, 24.0, 31.0, 39.0, 34.0, 43.0, 51.0, 55.0, 50.0, 51.0, 50.0, 51.0, 28.0, 46.0, 41.0, 47.0, 39.0, 27.0, 37.0, 29.0, 24.0, 15.0, 17.0, 14.0, 14.0, 10.0, 4.0, 5.0, 6.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.079185485839844, -51.39681625366211, -49.71445083618164, -48.032081604003906, -46.34971237182617, -44.66734313964844, -42.98497772216797, -41.302608489990234, -39.6202392578125, -37.937870025634766, -36.2555046081543, -34.57313537597656, -32.89076614379883, -31.208398818969727, -29.526031494140625, -27.84366226196289, -26.16129493713379, -24.478927612304688, -22.796558380126953, -21.11419105529785, -19.431821823120117, -17.749454498291016, -16.06708526611328, -14.38471794128418, -12.702349662780762, -11.019981384277344, -9.337613105773926, -7.655245304107666, -5.972877025604248, -4.290509223937988, -2.6081409454345703, -0.9257726669311523, 0.7565956115722656, 2.4389638900756836, 4.121332168579102, 5.803699970245361, 7.486068248748779, 9.168436050415039, 10.850804328918457, 12.533172607421875, 14.215540885925293, 15.897909164428711, 17.580276489257812, 19.262645721435547, 20.94501304626465, 22.62738037109375, 24.309749603271484, 25.99211883544922, 27.67448616027832, 29.356853485107422, 31.039222717285156, 32.72159194946289, 34.40395736694336, 36.086326599121094, 37.76869583129883, 39.45106506347656, 41.13343048095703, 42.815799713134766, 44.498165130615234, 46.18053436279297, 47.8629035949707, 49.54527282714844, 51.227638244628906, 52.91000747680664, 54.592376708984375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 12.0, 6.0, 7.0, 10.0, 12.0, 8.0, 18.0, 21.0, 13.0, 30.0, 18.0, 28.0, 31.0, 33.0, 29.0, 34.0, 34.0, 36.0, 43.0, 43.0, 34.0, 38.0, 39.0, 33.0, 40.0, 33.0, 41.0, 42.0, 25.0, 27.0, 30.0, 22.0, 17.0, 10.0, 22.0, 13.0, 10.0, 9.0, 14.0, 8.0, 5.0, 3.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.73828125, -5.55059814453125, -5.3629150390625, -5.17523193359375, -4.987548828125, -4.79986572265625, -4.6121826171875, -4.42449951171875, -4.23681640625, -4.04913330078125, -3.8614501953125, -3.67376708984375, -3.486083984375, -3.29840087890625, -3.1107177734375, -2.92303466796875, -2.7353515625, -2.54766845703125, -2.3599853515625, -2.17230224609375, -1.984619140625, -1.79693603515625, -1.6092529296875, -1.42156982421875, -1.23388671875, -1.04620361328125, -0.8585205078125, -0.67083740234375, -0.483154296875, -0.29547119140625, -0.1077880859375, 0.07989501953125, 0.267578125, 0.45526123046875, 0.6429443359375, 0.83062744140625, 1.018310546875, 1.20599365234375, 1.3936767578125, 1.58135986328125, 1.76904296875, 1.95672607421875, 2.1444091796875, 2.33209228515625, 2.519775390625, 2.70745849609375, 2.8951416015625, 3.08282470703125, 3.2705078125, 3.45819091796875, 3.6458740234375, 3.83355712890625, 4.021240234375, 4.20892333984375, 4.3966064453125, 4.58428955078125, 4.77197265625, 4.95965576171875, 5.1473388671875, 5.33502197265625, 5.522705078125, 5.71038818359375, 5.8980712890625, 6.08575439453125, 6.2734375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 5.0, 8.0, 10.0, 8.0, 12.0, 14.0, 24.0, 34.0, 40.0, 55.0, 68.0, 83.0, 109.0, 169.0, 247.0, 363.0, 575.0, 988.0, 1994.0, 4455.0, 12646.0, 55269.0, 477440.0, 2410576.0, 1078947.0, 117347.0, 20490.0, 6321.0, 2597.0, 1285.0, 641.0, 446.0, 291.0, 159.0, 134.0, 101.0, 74.0, 50.0, 42.0, 37.0, 29.0, 26.0, 17.0, 12.0, 15.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.515625, -11.140380859375, -10.76513671875, -10.389892578125, -10.0146484375, -9.639404296875, -9.26416015625, -8.888916015625, -8.513671875, -8.138427734375, -7.76318359375, -7.387939453125, -7.0126953125, -6.637451171875, -6.26220703125, -5.886962890625, -5.51171875, -5.136474609375, -4.76123046875, -4.385986328125, -4.0107421875, -3.635498046875, -3.26025390625, -2.885009765625, -2.509765625, -2.134521484375, -1.75927734375, -1.384033203125, -1.0087890625, -0.633544921875, -0.25830078125, 0.116943359375, 0.4921875, 0.867431640625, 1.24267578125, 1.617919921875, 1.9931640625, 2.368408203125, 2.74365234375, 3.118896484375, 3.494140625, 3.869384765625, 4.24462890625, 4.619873046875, 4.9951171875, 5.370361328125, 5.74560546875, 6.120849609375, 6.49609375, 6.871337890625, 7.24658203125, 7.621826171875, 7.9970703125, 8.372314453125, 8.74755859375, 9.122802734375, 9.498046875, 9.873291015625, 10.24853515625, 10.623779296875, 10.9990234375, 11.374267578125, 11.74951171875, 12.124755859375, 12.5]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 12.0, 9.0, 15.0, 37.0, 51.0, 85.0, 127.0, 204.0, 330.0, 524.0, 770.0, 698.0, 473.0, 283.0, 166.0, 124.0, 58.0, 45.0, 23.0, 16.0, 10.0, 6.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8125, -12.317138671875, -11.82177734375, -11.326416015625, -10.8310546875, -10.335693359375, -9.84033203125, -9.344970703125, -8.849609375, -8.354248046875, -7.85888671875, -7.363525390625, -6.8681640625, -6.372802734375, -5.87744140625, -5.382080078125, -4.88671875, -4.391357421875, -3.89599609375, -3.400634765625, -2.9052734375, -2.409912109375, -1.91455078125, -1.419189453125, -0.923828125, -0.428466796875, 0.06689453125, 0.562255859375, 1.0576171875, 1.552978515625, 2.04833984375, 2.543701171875, 3.0390625, 3.534423828125, 4.02978515625, 4.525146484375, 5.0205078125, 5.515869140625, 6.01123046875, 6.506591796875, 7.001953125, 7.497314453125, 7.99267578125, 8.488037109375, 8.9833984375, 9.478759765625, 9.97412109375, 10.469482421875, 10.96484375, 11.460205078125, 11.95556640625, 12.450927734375, 12.9462890625, 13.441650390625, 13.93701171875, 14.432373046875, 14.927734375, 15.423095703125, 15.91845703125, 16.413818359375, 16.9091796875, 17.404541015625, 17.89990234375, 18.395263671875, 18.890625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 5.0, 8.0, 7.0, 12.0, 15.0, 28.0, 33.0, 38.0, 85.0, 101.0, 138.0, 211.0, 357.0, 1047.0, 5324.0, 153336.0, 3960594.0, 67407.0, 3640.0, 856.0, 355.0, 200.0, 147.0, 91.0, 74.0, 42.0, 44.0, 30.0, 22.0, 12.0, 9.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-50.65625, -49.33740234375, -48.0185546875, -46.69970703125, -45.380859375, -44.06201171875, -42.7431640625, -41.42431640625, -40.10546875, -38.78662109375, -37.4677734375, -36.14892578125, -34.830078125, -33.51123046875, -32.1923828125, -30.87353515625, -29.5546875, -28.23583984375, -26.9169921875, -25.59814453125, -24.279296875, -22.96044921875, -21.6416015625, -20.32275390625, -19.00390625, -17.68505859375, -16.3662109375, -15.04736328125, -13.728515625, -12.40966796875, -11.0908203125, -9.77197265625, -8.453125, -7.13427734375, -5.8154296875, -4.49658203125, -3.177734375, -1.85888671875, -0.5400390625, 0.77880859375, 2.09765625, 3.41650390625, 4.7353515625, 6.05419921875, 7.373046875, 8.69189453125, 10.0107421875, 11.32958984375, 12.6484375, 13.96728515625, 15.2861328125, 16.60498046875, 17.923828125, 19.24267578125, 20.5615234375, 21.88037109375, 23.19921875, 24.51806640625, 25.8369140625, 27.15576171875, 28.474609375, 29.79345703125, 31.1123046875, 32.43115234375, 33.75]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 22.0, 116.0, 324.0, 368.0, 138.0, 37.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.95913696289062, -206.14895629882812, -202.33877563476562, -198.52859497070312, -194.7184295654297, -190.9082489013672, -187.0980682373047, -183.2878875732422, -179.4777069091797, -175.6675262451172, -171.8573455810547, -168.04718017578125, -164.23699951171875, -160.42681884765625, -156.61663818359375, -152.80645751953125, -148.99627685546875, -145.18609619140625, -141.37591552734375, -137.56573486328125, -133.7555694580078, -129.9453887939453, -126.13520812988281, -122.32502746582031, -118.51486206054688, -114.70468139648438, -110.8945083618164, -107.0843276977539, -103.2741470336914, -99.46397399902344, -95.65379333496094, -91.84361267089844, -88.0334243774414, -84.2232437133789, -80.41307067871094, -76.60289001464844, -72.79270935058594, -68.98252868652344, -65.17235565185547, -61.36217498779297, -57.551998138427734, -53.7418212890625, -49.931640625, -46.121463775634766, -42.31128692626953, -38.50110626220703, -34.6909294128418, -30.88075065612793, -27.070571899414062, -23.260393142700195, -19.450214385986328, -15.640037536621094, -11.829858779907227, -8.01968002319336, -4.209503173828125, -0.3993244171142578, 3.4108543395996094, 7.221032619476318, 11.031210899353027, 14.841388702392578, 18.651567459106445, 22.461746215820312, 26.271923065185547, 30.082101821899414, 33.89228057861328]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 3.0, 9.0, 11.0, 19.0, 16.0, 18.0, 32.0, 21.0, 20.0, 28.0, 29.0, 40.0, 28.0, 38.0, 41.0, 44.0, 40.0, 31.0, 40.0, 29.0, 43.0, 35.0, 36.0, 43.0, 40.0, 35.0, 32.0, 31.0, 29.0, 19.0, 16.0, 23.0, 7.0, 14.0, 9.0, 10.0, 9.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-31.353004455566406, -30.33247184753418, -29.311941146850586, -28.29140853881836, -27.270875930786133, -26.250343322753906, -25.229812622070312, -24.209280014038086, -23.18874740600586, -22.168214797973633, -21.14768409729004, -20.127151489257812, -19.106618881225586, -18.08608627319336, -17.065555572509766, -16.04502296447754, -15.024492263793945, -14.003960609436035, -12.983428001403809, -11.962896347045898, -10.942363739013672, -9.921832084655762, -8.901300430297852, -7.880768299102783, -6.860236167907715, -5.8397040367126465, -4.819171905517578, -3.798640251159668, -2.7781081199645996, -1.7575759887695312, -0.7370443344116211, 0.28348779678344727, 1.3040199279785156, 2.324552059173584, 3.3450839519500732, 4.3656158447265625, 5.386147975921631, 6.406680107116699, 7.427211761474609, 8.447744369506836, 9.468276023864746, 10.488807678222656, 11.509340286254883, 12.529871940612793, 13.550403594970703, 14.57093620300293, 15.59146785736084, 16.61199951171875, 17.632532119750977, 18.653064727783203, 19.673595428466797, 20.694128036499023, 21.71466064453125, 22.735191345214844, 23.75572395324707, 24.776256561279297, 25.79678726196289, 26.817319869995117, 27.83785057067871, 28.858383178710938, 29.878915786743164, 30.89944839477539, 31.919979095458984, 32.94050979614258, 33.96104431152344]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 1.0, 7.0, 8.0, 9.0, 6.0, 8.0, 8.0, 7.0, 17.0, 13.0, 13.0, 16.0, 20.0, 24.0, 25.0, 26.0, 40.0, 37.0, 26.0, 31.0, 32.0, 34.0, 48.0, 52.0, 34.0, 34.0, 33.0, 33.0, 38.0, 35.0, 21.0, 30.0, 30.0, 28.0, 20.0, 24.0, 26.0, 12.0, 12.0, 16.0, 20.0, 9.0, 6.0, 5.0, 6.0, 9.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.45703125, -5.27044677734375, -5.0838623046875, -4.89727783203125, -4.710693359375, -4.52410888671875, -4.3375244140625, -4.15093994140625, -3.96435546875, -3.77777099609375, -3.5911865234375, -3.40460205078125, -3.218017578125, -3.03143310546875, -2.8448486328125, -2.65826416015625, -2.4716796875, -2.28509521484375, -2.0985107421875, -1.91192626953125, -1.725341796875, -1.53875732421875, -1.3521728515625, -1.16558837890625, -0.97900390625, -0.79241943359375, -0.6058349609375, -0.41925048828125, -0.232666015625, -0.04608154296875, 0.1405029296875, 0.32708740234375, 0.513671875, 0.70025634765625, 0.8868408203125, 1.07342529296875, 1.260009765625, 1.44659423828125, 1.6331787109375, 1.81976318359375, 2.00634765625, 2.19293212890625, 2.3795166015625, 2.56610107421875, 2.752685546875, 2.93927001953125, 3.1258544921875, 3.31243896484375, 3.4990234375, 3.68560791015625, 3.8721923828125, 4.05877685546875, 4.245361328125, 4.43194580078125, 4.6185302734375, 4.80511474609375, 4.99169921875, 5.17828369140625, 5.3648681640625, 5.55145263671875, 5.738037109375, 5.92462158203125, 6.1112060546875, 6.29779052734375, 6.484375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [6.0, 7.0, 7.0, 20.0, 22.0, 25.0, 43.0, 56.0, 80.0, 108.0, 171.0, 234.0, 318.0, 407.0, 634.0, 806.0, 1071.0, 1497.0, 2147.0, 2800.0, 3999.0, 5301.0, 7361.0, 10102.0, 14267.0, 19917.0, 28532.0, 41355.0, 61103.0, 91951.0, 133345.0, 163429.0, 141535.0, 99005.0, 66043.0, 43882.0, 30687.0, 21282.0, 15326.0, 10950.0, 7771.0, 5585.0, 4157.0, 3108.0, 2230.0, 1577.0, 1187.0, 876.0, 642.0, 484.0, 335.0, 227.0, 171.0, 111.0, 94.0, 57.0, 54.0, 26.0, 20.0, 12.0, 8.0, 7.0, 3.0, 3.0], "bins": [-0.60888671875, -0.5896148681640625, -0.570343017578125, -0.5510711669921875, -0.53179931640625, -0.5125274658203125, -0.493255615234375, -0.4739837646484375, -0.4547119140625, -0.4354400634765625, -0.416168212890625, -0.3968963623046875, -0.37762451171875, -0.3583526611328125, -0.339080810546875, -0.3198089599609375, -0.300537109375, -0.2812652587890625, -0.261993408203125, -0.2427215576171875, -0.22344970703125, -0.2041778564453125, -0.184906005859375, -0.1656341552734375, -0.1463623046875, -0.1270904541015625, -0.107818603515625, -0.0885467529296875, -0.06927490234375, -0.0500030517578125, -0.030731201171875, -0.0114593505859375, 0.0078125, 0.0270843505859375, 0.046356201171875, 0.0656280517578125, 0.08489990234375, 0.1041717529296875, 0.123443603515625, 0.1427154541015625, 0.1619873046875, 0.1812591552734375, 0.200531005859375, 0.2198028564453125, 0.23907470703125, 0.2583465576171875, 0.277618408203125, 0.2968902587890625, 0.316162109375, 0.3354339599609375, 0.354705810546875, 0.3739776611328125, 0.39324951171875, 0.4125213623046875, 0.431793212890625, 0.4510650634765625, 0.4703369140625, 0.4896087646484375, 0.508880615234375, 0.5281524658203125, 0.54742431640625, 0.5666961669921875, 0.585968017578125, 0.6052398681640625, 0.62451171875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 12.0, 13.0, 12.0, 14.0, 16.0, 11.0, 22.0, 35.0, 25.0, 28.0, 38.0, 31.0, 32.0, 30.0, 30.0, 38.0, 28.0, 43.0, 1067.0, 38.0, 25.0, 40.0, 35.0, 27.0, 42.0, 33.0, 31.0, 28.0, 19.0, 19.0, 19.0, 13.0, 15.0, 15.0, 12.0, 13.0, 13.0, 8.0, 8.0, 7.0, 9.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-4.26171875, -4.13787841796875, -4.0140380859375, -3.89019775390625, -3.766357421875, -3.64251708984375, -3.5186767578125, -3.39483642578125, -3.27099609375, -3.14715576171875, -3.0233154296875, -2.89947509765625, -2.775634765625, -2.65179443359375, -2.5279541015625, -2.40411376953125, -2.2802734375, -2.15643310546875, -2.0325927734375, -1.90875244140625, -1.784912109375, -1.66107177734375, -1.5372314453125, -1.41339111328125, -1.28955078125, -1.16571044921875, -1.0418701171875, -0.91802978515625, -0.794189453125, -0.67034912109375, -0.5465087890625, -0.42266845703125, -0.298828125, -0.17498779296875, -0.0511474609375, 0.07269287109375, 0.196533203125, 0.32037353515625, 0.4442138671875, 0.56805419921875, 0.69189453125, 0.81573486328125, 0.9395751953125, 1.06341552734375, 1.187255859375, 1.31109619140625, 1.4349365234375, 1.55877685546875, 1.6826171875, 1.80645751953125, 1.9302978515625, 2.05413818359375, 2.177978515625, 2.30181884765625, 2.4256591796875, 2.54949951171875, 2.67333984375, 2.79718017578125, 2.9210205078125, 3.04486083984375, 3.168701171875, 3.29254150390625, 3.4163818359375, 3.54022216796875, 3.6640625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 14.0, 17.0, 21.0, 37.0, 61.0, 89.0, 124.0, 183.0, 264.0, 431.0, 647.0, 934.0, 1583.0, 2535.0, 4115.0, 6734.0, 11350.0, 19119.0, 32732.0, 57040.0, 102086.0, 179617.0, 1283590.0, 169082.0, 95050.0, 53464.0, 30684.0, 17941.0, 10523.0, 6415.0, 3942.0, 2518.0, 1529.0, 980.0, 584.0, 376.0, 243.0, 174.0, 109.0, 62.0, 31.0, 34.0, 18.0, 16.0, 5.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.7041015625, -0.6801834106445312, -0.6562652587890625, -0.6323471069335938, -0.608428955078125, -0.5845108032226562, -0.5605926513671875, -0.5366744995117188, -0.51275634765625, -0.48883819580078125, -0.4649200439453125, -0.44100189208984375, -0.417083740234375, -0.39316558837890625, -0.3692474365234375, -0.34532928466796875, -0.3214111328125, -0.29749298095703125, -0.2735748291015625, -0.24965667724609375, -0.225738525390625, -0.20182037353515625, -0.1779022216796875, -0.15398406982421875, -0.13006591796875, -0.10614776611328125, -0.0822296142578125, -0.05831146240234375, -0.034393310546875, -0.01047515869140625, 0.0134429931640625, 0.03736114501953125, 0.061279296875, 0.08519744873046875, 0.1091156005859375, 0.13303375244140625, 0.156951904296875, 0.18087005615234375, 0.2047882080078125, 0.22870635986328125, 0.25262451171875, 0.27654266357421875, 0.3004608154296875, 0.32437896728515625, 0.348297119140625, 0.37221527099609375, 0.3961334228515625, 0.42005157470703125, 0.4439697265625, 0.46788787841796875, 0.4918060302734375, 0.5157241821289062, 0.539642333984375, 0.5635604858398438, 0.5874786376953125, 0.6113967895507812, 0.63531494140625, 0.6592330932617188, 0.6831512451171875, 0.7070693969726562, 0.730987548828125, 0.7549057006835938, 0.7788238525390625, 0.8027420043945312, 0.82666015625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 11.0, 5.0, 4.0, 7.0, 15.0, 18.0, 29.0, 26.0, 32.0, 21.0, 32.0, 60.0, 41.0, 66.0, 58.0, 56.0, 64.0, 53.0, 52.0, 59.0, 36.0, 42.0, 31.0, 29.0, 41.0, 26.0, 22.0, 14.0, 9.0, 8.0, 4.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0027141571044921875, -0.002634882926940918, -0.0025556087493896484, -0.002476334571838379, -0.0023970603942871094, -0.00231778621673584, -0.0022385120391845703, -0.0021592378616333008, -0.0020799636840820312, -0.0020006895065307617, -0.0019214153289794922, -0.0018421411514282227, -0.0017628669738769531, -0.0016835927963256836, -0.001604318618774414, -0.0015250444412231445, -0.001445770263671875, -0.0013664960861206055, -0.001287221908569336, -0.0012079477310180664, -0.0011286735534667969, -0.0010493993759155273, -0.0009701251983642578, -0.0008908510208129883, -0.0008115768432617188, -0.0007323026657104492, -0.0006530284881591797, -0.0005737543106079102, -0.0004944801330566406, -0.0004152059555053711, -0.00033593177795410156, -0.00025665760040283203, -0.0001773834228515625, -9.810924530029297e-05, -1.8835067749023438e-05, 6.0439109802246094e-05, 0.00013971328735351562, 0.00021898746490478516, 0.0002982616424560547, 0.0003775358200073242, 0.00045680999755859375, 0.0005360841751098633, 0.0006153583526611328, 0.0006946325302124023, 0.0007739067077636719, 0.0008531808853149414, 0.0009324550628662109, 0.0010117292404174805, 0.00109100341796875, 0.0011702775955200195, 0.001249551773071289, 0.0013288259506225586, 0.0014081001281738281, 0.0014873743057250977, 0.0015666484832763672, 0.0016459226608276367, 0.0017251968383789062, 0.0018044710159301758, 0.0018837451934814453, 0.001963019371032715, 0.0020422935485839844, 0.002121567726135254, 0.0022008419036865234, 0.002280116081237793, 0.0023593902587890625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 10.0, 6.0, 15.0, 27.0, 27.0, 34.0, 46.0, 76.0, 82.0, 77.0, 126.0, 174.0, 318.0, 609.0, 2237.0, 859854.0, 182102.0, 1234.0, 498.0, 280.0, 176.0, 118.0, 98.0, 69.0, 50.0, 39.0, 24.0, 37.0, 21.0, 14.0, 13.0, 12.0, 8.0, 6.0, 7.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04827880859375, -0.04671478271484375, -0.0451507568359375, -0.04358673095703125, -0.042022705078125, -0.04045867919921875, -0.0388946533203125, -0.03733062744140625, -0.0357666015625, -0.03420257568359375, -0.0326385498046875, -0.03107452392578125, -0.029510498046875, -0.02794647216796875, -0.0263824462890625, -0.02481842041015625, -0.02325439453125, -0.02169036865234375, -0.0201263427734375, -0.01856231689453125, -0.016998291015625, -0.01543426513671875, -0.0138702392578125, -0.01230621337890625, -0.0107421875, -0.00917816162109375, -0.0076141357421875, -0.00605010986328125, -0.004486083984375, -0.00292205810546875, -0.0013580322265625, 0.00020599365234375, 0.00177001953125, 0.00333404541015625, 0.0048980712890625, 0.00646209716796875, 0.008026123046875, 0.00959014892578125, 0.0111541748046875, 0.01271820068359375, 0.0142822265625, 0.01584625244140625, 0.0174102783203125, 0.01897430419921875, 0.020538330078125, 0.02210235595703125, 0.0236663818359375, 0.02523040771484375, 0.02679443359375, 0.02835845947265625, 0.0299224853515625, 0.03148651123046875, 0.033050537109375, 0.03461456298828125, 0.0361785888671875, 0.03774261474609375, 0.039306640625, 0.04087066650390625, 0.0424346923828125, 0.04399871826171875, 0.045562744140625, 0.04712677001953125, 0.0486907958984375, 0.05025482177734375, 0.05181884765625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 981.0, 32.0], "bins": [-0.057560306042432785, -0.056641124188899994, -0.0557219460606575, -0.05480276420712471, -0.05388358607888222, -0.052964404225349426, -0.052045226097106934, -0.05112604424357414, -0.05020686611533165, -0.04928768426179886, -0.048368506133556366, -0.047449324280023575, -0.04653014615178108, -0.04561096429824829, -0.0446917861700058, -0.04377260431647301, -0.042853426188230515, -0.04193424433469772, -0.04101506620645523, -0.04009588435292244, -0.03917670622467995, -0.038257524371147156, -0.03733834624290466, -0.03641916438937187, -0.03549998626112938, -0.03458080440759659, -0.033661626279354095, -0.032742444425821304, -0.03182326629757881, -0.03090408630669117, -0.029984906315803528, -0.029065726324915886, -0.028146542608737946, -0.027227362617850304, -0.026308182626962662, -0.02538900263607502, -0.024469822645187378, -0.023550642654299736, -0.022631462663412094, -0.021712282672524452, -0.02079310268163681, -0.01987392269074917, -0.018954742699861526, -0.018035562708973885, -0.017116382718086243, -0.0161972027271986, -0.015278022736310959, -0.014358842745423317, -0.0134396618232131, -0.012520481832325459, -0.011601301841437817, -0.010682121850550175, -0.009762941859662533, -0.008843760937452316, -0.007924580946564674, -0.00700540142133832, -0.006086221896111965, -0.005167041905224323, -0.004247861914336681, -0.003328681690618396, -0.002409501699730754, -0.0014903214760124683, -0.0005711414851248264, 0.0003480385057628155, 0.0012672186130657792]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 9.0, 17.0, 29.0, 31.0, 29.0, 45.0, 41.0, 61.0, 76.0, 59.0, 79.0, 89.0, 67.0, 80.0, 72.0, 67.0, 34.0, 32.0, 23.0, 26.0, 18.0, 8.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014080405235290527, -0.0013303542509675026, -0.0012526679784059525, -0.0011749817058444023, -0.0010972954332828522, -0.001019609160721302, -0.0009419228881597519, -0.0008642366155982018, -0.0007865503430366516, -0.0007088640704751015, -0.0006311777979135513, -0.0005534915253520012, -0.00047580525279045105, -0.0003981189802289009, -0.00032043270766735077, -0.00024274643510580063, -0.0001650601625442505, -8.737388998270035e-05, -9.687617421150208e-06, 6.799865514039993e-05, 0.00014568492770195007, 0.00022337120026350021, 0.00030105747282505035, 0.0003787437453866005, 0.00045643001794815063, 0.0005341162905097008, 0.0006118025630712509, 0.0006894888356328011, 0.0007671751081943512, 0.0008448613807559013, 0.0009225476533174515, 0.0010002339258790016, 0.0010779201984405518, 0.001155606471002102, 0.001233292743563652, 0.0013109790161252022, 0.0013886652886867523, 0.0014663515612483025, 0.0015440378338098526, 0.0016217241063714027, 0.0016994103789329529, 0.001777096651494503, 0.0018547829240560532, 0.0019324691966176033, 0.0020101554691791534, 0.0020878417417407036, 0.0021655280143022537, 0.002243214286863804, 0.002320900559425354, 0.002398586831986904, 0.0024762731045484543, 0.0025539593771100044, 0.0026316456496715546, 0.0027093319222331047, 0.002787018194794655, 0.002864704467356205, 0.002942390739917755, 0.0030200770124793053, 0.0030977632850408554, 0.0031754495576024055, 0.0032531358301639557, 0.003330822102725506, 0.003408508375287056, 0.003486194647848606, 0.0035638809204101562]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 1.0, 7.0, 8.0, 9.0, 6.0, 8.0, 7.0, 8.0, 17.0, 13.0, 13.0, 16.0, 20.0, 24.0, 25.0, 26.0, 40.0, 37.0, 26.0, 31.0, 32.0, 34.0, 47.0, 53.0, 34.0, 34.0, 33.0, 33.0, 38.0, 35.0, 21.0, 30.0, 30.0, 28.0, 20.0, 24.0, 26.0, 12.0, 12.0, 16.0, 20.0, 9.0, 6.0, 5.0, 6.0, 9.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.45703125, -5.27044677734375, -5.0838623046875, -4.89727783203125, -4.710693359375, -4.52410888671875, -4.3375244140625, -4.15093994140625, -3.96435546875, -3.77777099609375, -3.5911865234375, -3.40460205078125, -3.218017578125, -3.03143310546875, -2.8448486328125, -2.65826416015625, -2.4716796875, -2.28509521484375, -2.0985107421875, -1.91192626953125, -1.725341796875, -1.53875732421875, -1.3521728515625, -1.16558837890625, -0.97900390625, -0.79241943359375, -0.6058349609375, -0.41925048828125, -0.232666015625, -0.04608154296875, 0.1405029296875, 0.32708740234375, 0.513671875, 0.70025634765625, 0.8868408203125, 1.07342529296875, 1.260009765625, 1.44659423828125, 1.6331787109375, 1.81976318359375, 2.00634765625, 2.19293212890625, 2.3795166015625, 2.56610107421875, 2.752685546875, 2.93927001953125, 3.1258544921875, 3.31243896484375, 3.4990234375, 3.68560791015625, 3.8721923828125, 4.05877685546875, 4.245361328125, 4.43194580078125, 4.6185302734375, 4.80511474609375, 4.99169921875, 5.17828369140625, 5.3648681640625, 5.55145263671875, 5.738037109375, 5.92462158203125, 6.1112060546875, 6.29779052734375, 6.484375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 10.0, 12.0, 16.0, 17.0, 24.0, 26.0, 32.0, 48.0, 41.0, 69.0, 83.0, 113.0, 157.0, 275.0, 392.0, 700.0, 1315.0, 2563.0, 5607.0, 12830.0, 31776.0, 88536.0, 303733.0, 410432.0, 118732.0, 41176.0, 16071.0, 6819.0, 3154.0, 1491.0, 794.0, 494.0, 275.0, 178.0, 144.0, 107.0, 66.0, 55.0, 33.0, 41.0, 27.0, 14.0, 17.0, 12.0, 12.0, 5.0, 10.0, 6.0, 2.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.95703125, -6.71820068359375, -6.4793701171875, -6.24053955078125, -6.001708984375, -5.76287841796875, -5.5240478515625, -5.28521728515625, -5.04638671875, -4.80755615234375, -4.5687255859375, -4.32989501953125, -4.091064453125, -3.85223388671875, -3.6134033203125, -3.37457275390625, -3.1357421875, -2.89691162109375, -2.6580810546875, -2.41925048828125, -2.180419921875, -1.94158935546875, -1.7027587890625, -1.46392822265625, -1.22509765625, -0.98626708984375, -0.7474365234375, -0.50860595703125, -0.269775390625, -0.03094482421875, 0.2078857421875, 0.44671630859375, 0.685546875, 0.92437744140625, 1.1632080078125, 1.40203857421875, 1.640869140625, 1.87969970703125, 2.1185302734375, 2.35736083984375, 2.59619140625, 2.83502197265625, 3.0738525390625, 3.31268310546875, 3.551513671875, 3.79034423828125, 4.0291748046875, 4.26800537109375, 4.5068359375, 4.74566650390625, 4.9844970703125, 5.22332763671875, 5.462158203125, 5.70098876953125, 5.9398193359375, 6.17864990234375, 6.41748046875, 6.65631103515625, 6.8951416015625, 7.13397216796875, 7.372802734375, 7.61163330078125, 7.8504638671875, 8.08929443359375, 8.328125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 1.0, 5.0, 7.0, 16.0, 14.0, 7.0, 20.0, 19.0, 20.0, 14.0, 32.0, 35.0, 29.0, 42.0, 41.0, 44.0, 51.0, 75.0, 111.0, 313.0, 1510.0, 147.0, 86.0, 76.0, 49.0, 37.0, 42.0, 26.0, 20.0, 24.0, 17.0, 23.0, 18.0, 7.0, 16.0, 8.0, 7.0, 8.0, 6.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.8125, -16.23583984375, -15.6591796875, -15.08251953125, -14.505859375, -13.92919921875, -13.3525390625, -12.77587890625, -12.19921875, -11.62255859375, -11.0458984375, -10.46923828125, -9.892578125, -9.31591796875, -8.7392578125, -8.16259765625, -7.5859375, -7.00927734375, -6.4326171875, -5.85595703125, -5.279296875, -4.70263671875, -4.1259765625, -3.54931640625, -2.97265625, -2.39599609375, -1.8193359375, -1.24267578125, -0.666015625, -0.08935546875, 0.4873046875, 1.06396484375, 1.640625, 2.21728515625, 2.7939453125, 3.37060546875, 3.947265625, 4.52392578125, 5.1005859375, 5.67724609375, 6.25390625, 6.83056640625, 7.4072265625, 7.98388671875, 8.560546875, 9.13720703125, 9.7138671875, 10.29052734375, 10.8671875, 11.44384765625, 12.0205078125, 12.59716796875, 13.173828125, 13.75048828125, 14.3271484375, 14.90380859375, 15.48046875, 16.05712890625, 16.6337890625, 17.21044921875, 17.787109375, 18.36376953125, 18.9404296875, 19.51708984375, 20.09375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 4.0, 9.0, 7.0, 10.0, 16.0, 23.0, 39.0, 29.0, 52.0, 95.0, 131.0, 198.0, 364.0, 793.0, 6256.0, 583838.0, 2540141.0, 11527.0, 1013.0, 421.0, 258.0, 155.0, 89.0, 63.0, 59.0, 28.0, 25.0, 17.0, 20.0, 8.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.4375, -29.27099609375, -28.1044921875, -26.93798828125, -25.771484375, -24.60498046875, -23.4384765625, -22.27197265625, -21.10546875, -19.93896484375, -18.7724609375, -17.60595703125, -16.439453125, -15.27294921875, -14.1064453125, -12.93994140625, -11.7734375, -10.60693359375, -9.4404296875, -8.27392578125, -7.107421875, -5.94091796875, -4.7744140625, -3.60791015625, -2.44140625, -1.27490234375, -0.1083984375, 1.05810546875, 2.224609375, 3.39111328125, 4.5576171875, 5.72412109375, 6.890625, 8.05712890625, 9.2236328125, 10.39013671875, 11.556640625, 12.72314453125, 13.8896484375, 15.05615234375, 16.22265625, 17.38916015625, 18.5556640625, 19.72216796875, 20.888671875, 22.05517578125, 23.2216796875, 24.38818359375, 25.5546875, 26.72119140625, 27.8876953125, 29.05419921875, 30.220703125, 31.38720703125, 32.5537109375, 33.72021484375, 34.88671875, 36.05322265625, 37.2197265625, 38.38623046875, 39.552734375, 40.71923828125, 41.8857421875, 43.05224609375, 44.21875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 514.0, 474.0, 18.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.32444763183594, -55.664268493652344, -51.004093170166016, -46.34391784667969, -41.683738708496094, -37.0235595703125, -32.36338424682617, -27.703208923339844, -23.04302978515625, -18.38285255432129, -13.722675323486328, -9.062498092651367, -4.402320861816406, 0.2578563690185547, 4.918033599853516, 9.578208923339844, 14.238388061523438, 18.8985652923584, 23.55874252319336, 28.21891975402832, 32.87909698486328, 37.539276123046875, 42.1994514465332, 46.85962677001953, 51.519805908203125, 56.17998504638672, 60.84016036987305, 65.50033569335938, 70.16051483154297, 74.82069396972656, 79.48086547851562, 84.14104461669922, 88.80122375488281, 93.4614028930664, 98.12158203125, 102.78175354003906, 107.44193267822266, 112.10211181640625, 116.76228332519531, 121.4224624633789, 126.0826416015625, 130.74281311035156, 135.4029998779297, 140.06317138671875, 144.72335815429688, 149.38352966308594, 154.043701171875, 158.70388793945312, 163.3640594482422, 168.02423095703125, 172.68441772460938, 177.34458923339844, 182.0047607421875, 186.66494750976562, 191.3251190185547, 195.98529052734375, 200.64547729492188, 205.30564880371094, 209.96583557128906, 214.62600708007812, 219.28619384765625, 223.9463653564453, 228.60653686523438, 233.2667236328125, 237.92689514160156]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 4.0, 9.0, 3.0, 9.0, 9.0, 8.0, 12.0, 15.0, 19.0, 20.0, 25.0, 24.0, 24.0, 16.0, 20.0, 26.0, 25.0, 36.0, 36.0, 39.0, 34.0, 35.0, 38.0, 46.0, 38.0, 33.0, 33.0, 32.0, 31.0, 35.0, 20.0, 36.0, 23.0, 24.0, 23.0, 24.0, 13.0, 14.0, 12.0, 6.0, 7.0, 9.0, 7.0, 7.0, 9.0, 4.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0], "bins": [-34.837284088134766, -33.746849060058594, -32.65641784667969, -31.56598472595215, -30.47555160522461, -29.38511848449707, -28.29468536376953, -27.20425033569336, -26.113819122314453, -25.023386001586914, -23.932952880859375, -22.842519760131836, -21.752086639404297, -20.661653518676758, -19.57122039794922, -18.480785369873047, -17.390352249145508, -16.29991912841797, -15.20948600769043, -14.11905288696289, -13.028619766235352, -11.938186645507812, -10.847752571105957, -9.757319450378418, -8.666886329650879, -7.57645320892334, -6.486020088195801, -5.3955864906311035, -4.3051533699035645, -3.2147202491760254, -2.124286651611328, -1.033853530883789, 0.05657958984375, 1.1470128297805786, 2.2374460697174072, 3.3278794288635254, 4.4183125495910645, 5.5087456703186035, 6.599179267883301, 7.68961238861084, 8.780045509338379, 9.870478630065918, 10.960911750793457, 12.051345825195312, 13.141778945922852, 14.23221206665039, 15.32264518737793, 16.41307830810547, 17.503511428833008, 18.593944549560547, 19.684377670288086, 20.774810791015625, 21.865243911743164, 22.955677032470703, 24.046112060546875, 25.13654327392578, 26.226978302001953, 27.317411422729492, 28.40784454345703, 29.49827766418457, 30.58871078491211, 31.67914390563965, 32.76957702636719, 33.86001205444336, 34.950443267822266]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 5.0, 6.0, 7.0, 14.0, 8.0, 7.0, 15.0, 11.0, 17.0, 21.0, 14.0, 23.0, 27.0, 31.0, 37.0, 32.0, 36.0, 40.0, 26.0, 40.0, 46.0, 42.0, 33.0, 35.0, 34.0, 31.0, 38.0, 33.0, 29.0, 28.0, 31.0, 24.0, 27.0, 18.0, 18.0, 14.0, 14.0, 17.0, 16.0, 6.0, 8.0, 9.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78125, -5.5869140625, -5.392578125, -5.1982421875, -5.00390625, -4.8095703125, -4.615234375, -4.4208984375, -4.2265625, -4.0322265625, -3.837890625, -3.6435546875, -3.44921875, -3.2548828125, -3.060546875, -2.8662109375, -2.671875, -2.4775390625, -2.283203125, -2.0888671875, -1.89453125, -1.7001953125, -1.505859375, -1.3115234375, -1.1171875, -0.9228515625, -0.728515625, -0.5341796875, -0.33984375, -0.1455078125, 0.048828125, 0.2431640625, 0.4375, 0.6318359375, 0.826171875, 1.0205078125, 1.21484375, 1.4091796875, 1.603515625, 1.7978515625, 1.9921875, 2.1865234375, 2.380859375, 2.5751953125, 2.76953125, 2.9638671875, 3.158203125, 3.3525390625, 3.546875, 3.7412109375, 3.935546875, 4.1298828125, 4.32421875, 4.5185546875, 4.712890625, 4.9072265625, 5.1015625, 5.2958984375, 5.490234375, 5.6845703125, 5.87890625, 6.0732421875, 6.267578125, 6.4619140625, 6.65625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 7.0, 8.0, 17.0, 10.0, 12.0, 25.0, 27.0, 36.0, 45.0, 88.0, 124.0, 272.0, 562.0, 1310.0, 3861.0, 14236.0, 111318.0, 2352079.0, 1626123.0, 68044.0, 10808.0, 3115.0, 1116.0, 457.0, 196.0, 126.0, 66.0, 36.0, 27.0, 23.0, 19.0, 17.0, 17.0, 10.0, 11.0, 6.0, 5.0, 7.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.484375, -16.879638671875, -16.27490234375, -15.670166015625, -15.0654296875, -14.460693359375, -13.85595703125, -13.251220703125, -12.646484375, -12.041748046875, -11.43701171875, -10.832275390625, -10.2275390625, -9.622802734375, -9.01806640625, -8.413330078125, -7.80859375, -7.203857421875, -6.59912109375, -5.994384765625, -5.3896484375, -4.784912109375, -4.18017578125, -3.575439453125, -2.970703125, -2.365966796875, -1.76123046875, -1.156494140625, -0.5517578125, 0.052978515625, 0.65771484375, 1.262451171875, 1.8671875, 2.471923828125, 3.07666015625, 3.681396484375, 4.2861328125, 4.890869140625, 5.49560546875, 6.100341796875, 6.705078125, 7.309814453125, 7.91455078125, 8.519287109375, 9.1240234375, 9.728759765625, 10.33349609375, 10.938232421875, 11.54296875, 12.147705078125, 12.75244140625, 13.357177734375, 13.9619140625, 14.566650390625, 15.17138671875, 15.776123046875, 16.380859375, 16.985595703125, 17.59033203125, 18.195068359375, 18.7998046875, 19.404541015625, 20.00927734375, 20.614013671875, 21.21875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 9.0, 3.0, 8.0, 8.0, 11.0, 13.0, 12.0, 28.0, 25.0, 29.0, 41.0, 59.0, 88.0, 127.0, 172.0, 243.0, 333.0, 471.0, 533.0, 502.0, 408.0, 267.0, 179.0, 131.0, 96.0, 73.0, 49.0, 35.0, 34.0, 18.0, 16.0, 17.0, 8.0, 11.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.696044921875, -8.39208984375, -8.088134765625, -7.7841796875, -7.480224609375, -7.17626953125, -6.872314453125, -6.568359375, -6.264404296875, -5.96044921875, -5.656494140625, -5.3525390625, -5.048583984375, -4.74462890625, -4.440673828125, -4.13671875, -3.832763671875, -3.52880859375, -3.224853515625, -2.9208984375, -2.616943359375, -2.31298828125, -2.009033203125, -1.705078125, -1.401123046875, -1.09716796875, -0.793212890625, -0.4892578125, -0.185302734375, 0.11865234375, 0.422607421875, 0.7265625, 1.030517578125, 1.33447265625, 1.638427734375, 1.9423828125, 2.246337890625, 2.55029296875, 2.854248046875, 3.158203125, 3.462158203125, 3.76611328125, 4.070068359375, 4.3740234375, 4.677978515625, 4.98193359375, 5.285888671875, 5.58984375, 5.893798828125, 6.19775390625, 6.501708984375, 6.8056640625, 7.109619140625, 7.41357421875, 7.717529296875, 8.021484375, 8.325439453125, 8.62939453125, 8.933349609375, 9.2373046875, 9.541259765625, 9.84521484375, 10.149169921875, 10.453125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 12.0, 10.0, 9.0, 18.0, 22.0, 27.0, 47.0, 68.0, 122.0, 199.0, 462.0, 951.0, 2524.0, 9882.0, 64205.0, 1255360.0, 2729127.0, 111346.0, 14171.0, 3314.0, 1189.0, 543.0, 268.0, 128.0, 87.0, 61.0, 37.0, 19.0, 25.0, 16.0, 11.0, 6.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.734375, -21.0576171875, -20.380859375, -19.7041015625, -19.02734375, -18.3505859375, -17.673828125, -16.9970703125, -16.3203125, -15.6435546875, -14.966796875, -14.2900390625, -13.61328125, -12.9365234375, -12.259765625, -11.5830078125, -10.90625, -10.2294921875, -9.552734375, -8.8759765625, -8.19921875, -7.5224609375, -6.845703125, -6.1689453125, -5.4921875, -4.8154296875, -4.138671875, -3.4619140625, -2.78515625, -2.1083984375, -1.431640625, -0.7548828125, -0.078125, 0.5986328125, 1.275390625, 1.9521484375, 2.62890625, 3.3056640625, 3.982421875, 4.6591796875, 5.3359375, 6.0126953125, 6.689453125, 7.3662109375, 8.04296875, 8.7197265625, 9.396484375, 10.0732421875, 10.75, 11.4267578125, 12.103515625, 12.7802734375, 13.45703125, 14.1337890625, 14.810546875, 15.4873046875, 16.1640625, 16.8408203125, 17.517578125, 18.1943359375, 18.87109375, 19.5478515625, 20.224609375, 20.9013671875, 21.578125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 8.0, 14.0, 63.0, 195.0, 365.0, 249.0, 94.0, 23.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.16478729248047, -119.70677185058594, -116.2487564086914, -112.79074096679688, -109.33272552490234, -105.87471008300781, -102.41669464111328, -98.95867919921875, -95.50066375732422, -92.04264831542969, -88.58463287353516, -85.12661743164062, -81.6686019897461, -78.21058654785156, -74.75257110595703, -71.2945556640625, -67.83654022216797, -64.37852478027344, -60.920509338378906, -57.462493896484375, -54.004478454589844, -50.54646301269531, -47.08844757080078, -43.63043212890625, -40.17241668701172, -36.71440124511719, -33.256385803222656, -29.798370361328125, -26.340354919433594, -22.882339477539062, -19.42432403564453, -15.96630859375, -12.508293151855469, -9.050277709960938, -5.592262268066406, -2.134246826171875, 1.3237686157226562, 4.7817840576171875, 8.239799499511719, 11.69781494140625, 15.155830383300781, 18.613845825195312, 22.071861267089844, 25.529876708984375, 28.987892150878906, 32.44590759277344, 35.90392303466797, 39.3619384765625, 42.81995391845703, 46.27796936035156, 49.735984802246094, 53.194000244140625, 56.652015686035156, 60.11003112792969, 63.56804656982422, 67.02606201171875, 70.48407745361328, 73.94209289550781, 77.40010833740234, 80.85812377929688, 84.3161392211914, 87.77415466308594, 91.23217010498047, 94.690185546875, 98.14820098876953]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 11.0, 10.0, 9.0, 8.0, 9.0, 17.0, 18.0, 23.0, 21.0, 24.0, 23.0, 26.0, 32.0, 21.0, 29.0, 29.0, 36.0, 24.0, 30.0, 48.0, 32.0, 40.0, 40.0, 38.0, 37.0, 30.0, 36.0, 29.0, 22.0, 23.0, 32.0, 33.0, 23.0, 17.0, 23.0, 18.0, 14.0, 13.0, 3.0, 11.0, 9.0, 9.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-26.51313018798828, -25.61332893371582, -24.713525772094727, -23.813724517822266, -22.913921356201172, -22.01412010192871, -21.11431884765625, -20.214515686035156, -19.314714431762695, -18.414913177490234, -17.51511001586914, -16.61530876159668, -15.715506553649902, -14.815704345703125, -13.915903091430664, -13.016100883483887, -12.11629867553711, -11.216496467590332, -10.316694259643555, -9.416893005371094, -8.517090797424316, -7.617288589477539, -6.71748685836792, -5.817685127258301, -4.917882919311523, -4.018080711364746, -3.118278980255127, -2.2184770107269287, -1.3186750411987305, -0.4188728332519531, 0.480928897857666, 1.3807306289672852, 2.2805328369140625, 3.1803348064422607, 4.080136775970459, 4.979938507080078, 5.8797407150268555, 6.779542922973633, 7.679344654083252, 8.579146385192871, 9.478948593139648, 10.378750801086426, 11.278553009033203, 12.178354263305664, 13.078156471252441, 13.977958679199219, 14.87775993347168, 15.777562141418457, 16.677364349365234, 17.577165603637695, 18.47696876525879, 19.37677001953125, 20.276573181152344, 21.176374435424805, 22.076175689697266, 22.97597885131836, 23.87578010559082, 24.77558135986328, 25.675384521484375, 26.575185775756836, 27.474987030029297, 28.37479019165039, 29.27459144592285, 30.174392700195312, 31.074195861816406]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 9.0, 15.0, 17.0, 9.0, 11.0, 14.0, 21.0, 17.0, 32.0, 21.0, 32.0, 28.0, 18.0, 40.0, 40.0, 38.0, 36.0, 39.0, 32.0, 32.0, 41.0, 33.0, 38.0, 41.0, 37.0, 32.0, 27.0, 32.0, 26.0, 28.0, 21.0, 17.0, 17.0, 13.0, 17.0, 12.0, 9.0, 7.0, 8.0, 11.0, 4.0, 8.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.234375, -6.03515625, -5.8359375, -5.63671875, -5.4375, -5.23828125, -5.0390625, -4.83984375, -4.640625, -4.44140625, -4.2421875, -4.04296875, -3.84375, -3.64453125, -3.4453125, -3.24609375, -3.046875, -2.84765625, -2.6484375, -2.44921875, -2.25, -2.05078125, -1.8515625, -1.65234375, -1.453125, -1.25390625, -1.0546875, -0.85546875, -0.65625, -0.45703125, -0.2578125, -0.05859375, 0.140625, 0.33984375, 0.5390625, 0.73828125, 0.9375, 1.13671875, 1.3359375, 1.53515625, 1.734375, 1.93359375, 2.1328125, 2.33203125, 2.53125, 2.73046875, 2.9296875, 3.12890625, 3.328125, 3.52734375, 3.7265625, 3.92578125, 4.125, 4.32421875, 4.5234375, 4.72265625, 4.921875, 5.12109375, 5.3203125, 5.51953125, 5.71875, 5.91796875, 6.1171875, 6.31640625, 6.515625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 9.0, 15.0, 25.0, 29.0, 33.0, 70.0, 97.0, 161.0, 222.0, 325.0, 479.0, 764.0, 1124.0, 1699.0, 2473.0, 3792.0, 5855.0, 8868.0, 13828.0, 21026.0, 33838.0, 55115.0, 91566.0, 150865.0, 209461.0, 170818.0, 105179.0, 63770.0, 38976.0, 23965.0, 15091.0, 9728.0, 6466.0, 4293.0, 2856.0, 1822.0, 1255.0, 837.0, 574.0, 400.0, 256.0, 180.0, 131.0, 78.0, 45.0, 34.0, 26.0, 14.0, 5.0, 9.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8173828125, -0.7907028198242188, -0.7640228271484375, -0.7373428344726562, -0.710662841796875, -0.6839828491210938, -0.6573028564453125, -0.6306228637695312, -0.60394287109375, -0.5772628784179688, -0.5505828857421875, -0.5239028930664062, -0.497222900390625, -0.47054290771484375, -0.4438629150390625, -0.41718292236328125, -0.3905029296875, -0.36382293701171875, -0.3371429443359375, -0.31046295166015625, -0.283782958984375, -0.25710296630859375, -0.2304229736328125, -0.20374298095703125, -0.17706298828125, -0.15038299560546875, -0.1237030029296875, -0.09702301025390625, -0.070343017578125, -0.04366302490234375, -0.0169830322265625, 0.00969696044921875, 0.036376953125, 0.06305694580078125, 0.0897369384765625, 0.11641693115234375, 0.143096923828125, 0.16977691650390625, 0.1964569091796875, 0.22313690185546875, 0.24981689453125, 0.27649688720703125, 0.3031768798828125, 0.32985687255859375, 0.356536865234375, 0.38321685791015625, 0.4098968505859375, 0.43657684326171875, 0.4632568359375, 0.48993682861328125, 0.5166168212890625, 0.5432968139648438, 0.569976806640625, 0.5966567993164062, 0.6233367919921875, 0.6500167846679688, 0.67669677734375, 0.7033767700195312, 0.7300567626953125, 0.7567367553710938, 0.783416748046875, 0.8100967407226562, 0.8367767333984375, 0.8634567260742188, 0.89013671875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 6.0, 6.0, 6.0, 6.0, 4.0, 5.0, 11.0, 15.0, 11.0, 11.0, 23.0, 16.0, 26.0, 14.0, 28.0, 32.0, 23.0, 28.0, 37.0, 24.0, 34.0, 38.0, 41.0, 35.0, 1056.0, 37.0, 44.0, 46.0, 36.0, 26.0, 32.0, 20.0, 23.0, 30.0, 17.0, 30.0, 25.0, 17.0, 18.0, 14.0, 15.0, 12.0, 9.0, 3.0, 7.0, 7.0, 5.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-3.947265625, -3.82916259765625, -3.7110595703125, -3.59295654296875, -3.474853515625, -3.35675048828125, -3.2386474609375, -3.12054443359375, -3.00244140625, -2.88433837890625, -2.7662353515625, -2.64813232421875, -2.530029296875, -2.41192626953125, -2.2938232421875, -2.17572021484375, -2.0576171875, -1.93951416015625, -1.8214111328125, -1.70330810546875, -1.585205078125, -1.46710205078125, -1.3489990234375, -1.23089599609375, -1.11279296875, -0.99468994140625, -0.8765869140625, -0.75848388671875, -0.640380859375, -0.52227783203125, -0.4041748046875, -0.28607177734375, -0.16796875, -0.04986572265625, 0.0682373046875, 0.18634033203125, 0.304443359375, 0.42254638671875, 0.5406494140625, 0.65875244140625, 0.77685546875, 0.89495849609375, 1.0130615234375, 1.13116455078125, 1.249267578125, 1.36737060546875, 1.4854736328125, 1.60357666015625, 1.7216796875, 1.83978271484375, 1.9578857421875, 2.07598876953125, 2.194091796875, 2.31219482421875, 2.4302978515625, 2.54840087890625, 2.66650390625, 2.78460693359375, 2.9027099609375, 3.02081298828125, 3.138916015625, 3.25701904296875, 3.3751220703125, 3.49322509765625, 3.611328125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 9.0, 6.0, 9.0, 13.0, 23.0, 30.0, 51.0, 66.0, 124.0, 198.0, 330.0, 490.0, 734.0, 1227.0, 1997.0, 3299.0, 5399.0, 8884.0, 14799.0, 25152.0, 42918.0, 74204.0, 129930.0, 240808.0, 1223232.0, 134986.0, 77447.0, 45035.0, 26078.0, 15774.0, 9265.0, 5676.0, 3469.0, 2022.0, 1263.0, 800.0, 528.0, 295.0, 184.0, 141.0, 86.0, 51.0, 45.0, 18.0, 13.0, 9.0, 3.0, 7.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.810546875, -0.7867355346679688, -0.7629241943359375, -0.7391128540039062, -0.715301513671875, -0.6914901733398438, -0.6676788330078125, -0.6438674926757812, -0.62005615234375, -0.5962448120117188, -0.5724334716796875, -0.5486221313476562, -0.524810791015625, -0.5009994506835938, -0.4771881103515625, -0.45337677001953125, -0.4295654296875, -0.40575408935546875, -0.3819427490234375, -0.35813140869140625, -0.334320068359375, -0.31050872802734375, -0.2866973876953125, -0.26288604736328125, -0.23907470703125, -0.21526336669921875, -0.1914520263671875, -0.16764068603515625, -0.143829345703125, -0.12001800537109375, -0.0962066650390625, -0.07239532470703125, -0.048583984375, -0.02477264404296875, -0.0009613037109375, 0.02285003662109375, 0.046661376953125, 0.07047271728515625, 0.0942840576171875, 0.11809539794921875, 0.14190673828125, 0.16571807861328125, 0.1895294189453125, 0.21334075927734375, 0.237152099609375, 0.26096343994140625, 0.2847747802734375, 0.30858612060546875, 0.3323974609375, 0.35620880126953125, 0.3800201416015625, 0.40383148193359375, 0.427642822265625, 0.45145416259765625, 0.4752655029296875, 0.49907684326171875, 0.52288818359375, 0.5466995239257812, 0.5705108642578125, 0.5943222045898438, 0.618133544921875, 0.6419448852539062, 0.6657562255859375, 0.6895675659179688, 0.71337890625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 10.0, 12.0, 19.0, 18.0, 23.0, 42.0, 55.0, 56.0, 53.0, 67.0, 72.0, 85.0, 68.0, 74.0, 53.0, 62.0, 45.0, 33.0, 37.0, 20.0, 17.0, 14.0, 20.0, 7.0, 2.0, 6.0, 7.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028076171875, -0.002715975046157837, -0.002624332904815674, -0.0025326907634735107, -0.0024410486221313477, -0.0023494064807891846, -0.0022577643394470215, -0.0021661221981048584, -0.0020744800567626953, -0.0019828379154205322, -0.0018911957740783691, -0.001799553632736206, -0.001707911491394043, -0.0016162693500518799, -0.0015246272087097168, -0.0014329850673675537, -0.0013413429260253906, -0.0012497007846832275, -0.0011580586433410645, -0.0010664165019989014, -0.0009747743606567383, -0.0008831322193145752, -0.0007914900779724121, -0.000699847936630249, -0.0006082057952880859, -0.0005165636539459229, -0.00042492151260375977, -0.0003332793712615967, -0.0002416372299194336, -0.0001499950885772705, -5.835294723510742e-05, 3.3289194107055664e-05, 0.00012493133544921875, 0.00021657347679138184, 0.0003082156181335449, 0.000399857759475708, 0.0004914999008178711, 0.0005831420421600342, 0.0006747841835021973, 0.0007664263248443604, 0.0008580684661865234, 0.0009497106075286865, 0.0010413527488708496, 0.0011329948902130127, 0.0012246370315551758, 0.0013162791728973389, 0.001407921314239502, 0.001499563455581665, 0.0015912055969238281, 0.0016828477382659912, 0.0017744898796081543, 0.0018661320209503174, 0.0019577741622924805, 0.0020494163036346436, 0.0021410584449768066, 0.0022327005863189697, 0.002324342727661133, 0.002415984869003296, 0.002507627010345459, 0.002599269151687622, 0.002690911293029785, 0.0027825534343719482, 0.0028741955757141113, 0.0029658377170562744, 0.0030574798583984375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 6.0, 8.0, 9.0, 11.0, 20.0, 24.0, 27.0, 54.0, 52.0, 66.0, 92.0, 141.0, 222.0, 425.0, 1038.0, 203211.0, 840326.0, 1555.0, 460.0, 262.0, 165.0, 83.0, 86.0, 65.0, 38.0, 17.0, 24.0, 10.0, 13.0, 8.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06024169921875, -0.05842161178588867, -0.056601524353027344, -0.054781436920166016, -0.05296134948730469, -0.05114126205444336, -0.04932117462158203, -0.0475010871887207, -0.045680999755859375, -0.04386091232299805, -0.04204082489013672, -0.04022073745727539, -0.03840065002441406, -0.036580562591552734, -0.034760475158691406, -0.03294038772583008, -0.03112030029296875, -0.029300212860107422, -0.027480125427246094, -0.025660037994384766, -0.023839950561523438, -0.02201986312866211, -0.02019977569580078, -0.018379688262939453, -0.016559600830078125, -0.014739513397216797, -0.012919425964355469, -0.01109933853149414, -0.009279251098632812, -0.007459163665771484, -0.005639076232910156, -0.003818988800048828, -0.0019989013671875, -0.00017881393432617188, 0.0016412734985351562, 0.0034613609313964844, 0.0052814483642578125, 0.007101535797119141, 0.008921623229980469, 0.010741710662841797, 0.012561798095703125, 0.014381885528564453, 0.01620197296142578, 0.01802206039428711, 0.019842147827148438, 0.021662235260009766, 0.023482322692871094, 0.025302410125732422, 0.02712249755859375, 0.028942584991455078, 0.030762672424316406, 0.032582759857177734, 0.03440284729003906, 0.03622293472290039, 0.03804302215576172, 0.03986310958862305, 0.041683197021484375, 0.0435032844543457, 0.04532337188720703, 0.04714345932006836, 0.04896354675292969, 0.050783634185791016, 0.052603721618652344, 0.05442380905151367, 0.056243896484375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 11.0, 36.0, 120.0, 277.0, 344.0, 165.0, 44.0, 10.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007026367820799351, -0.0005662731127813458, -0.00042990950169041753, -0.00029354586149565876, -0.00015718222130089998, -2.0818552002310753e-05, 0.00011554505908861756, 0.0002519086701795459, 0.0003882723394781351, 0.0005246360087767243, 0.0006609996198676527, 0.000797363230958581, 0.0009337269002571702, 0.0010700905695557594, 0.0012064541224390268, 0.001342817791737616, 0.0014791814610362053, 0.0016155451303347945, 0.0017519087996333838, 0.0018882723525166512, 0.002024636138230562, 0.0021609996911138296, 0.002297363243997097, 0.002433727029711008, 0.0025700905825942755, 0.002706454135477543, 0.002842817921191454, 0.0029791814740747213, 0.0031155450269579887, 0.0032519088126719, 0.003388272365555167, 0.0035246359184384346, 0.0036609992384910583, 0.0037973627913743258, 0.003933726344257593, 0.004070090129971504, 0.004206453915685415, 0.004342817701399326, 0.00447918102145195, 0.004615544807165861, 0.004751908592879772, 0.004888272378593683, 0.005024635698646307, 0.005160999484360218, 0.005297363270074129, 0.00543372705578804, 0.005570090375840664, 0.005706454161554575, 0.005842817481607199, 0.00597918126732111, 0.0061155445873737335, 0.006251908373087645, 0.006388272158801556, 0.006524635478854179, 0.0066609992645680904, 0.0067973630502820015, 0.006933726370334625, 0.007070090156048536, 0.00720645347610116, 0.007342817261815071, 0.007479181047528982, 0.007615544833242893, 0.007751908153295517, 0.00788827147334814, 0.008024635724723339]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 3.0, 8.0, 11.0, 9.0, 19.0, 14.0, 12.0, 10.0, 18.0, 14.0, 25.0, 15.0, 29.0, 27.0, 43.0, 29.0, 30.0, 38.0, 39.0, 43.0, 44.0, 40.0, 43.0, 47.0, 32.0, 33.0, 37.0, 40.0, 27.0, 22.0, 33.0, 23.0, 22.0, 15.0, 26.0, 15.0, 14.0, 11.0, 7.0, 9.0, 8.0, 4.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013598799705505371, -0.0013212459161877632, -0.0012826118618249893, -0.0012439778074622154, -0.0012053437530994415, -0.0011667096987366676, -0.0011280756443738937, -0.0010894415900111198, -0.001050807535648346, -0.001012173481285572, -0.0009735394269227982, -0.0009349053725600243, -0.0008962713181972504, -0.0008576372638344765, -0.0008190032094717026, -0.0007803691551089287, -0.0007417351007461548, -0.0007031010463833809, -0.000664466992020607, -0.0006258329376578331, -0.0005871988832950592, -0.0005485648289322853, -0.0005099307745695114, -0.0004712967202067375, -0.0004326626658439636, -0.00039402861148118973, -0.00035539455711841583, -0.00031676050275564194, -0.00027812644839286804, -0.00023949239403009415, -0.00020085833966732025, -0.00016222428530454636, -0.00012359023094177246, -8.495617657899857e-05, -4.632212221622467e-05, -7.688067853450775e-06, 3.094598650932312e-05, 6.958004087209702e-05, 0.00010821409523487091, 0.0001468481495976448, 0.0001854822039604187, 0.0002241162583231926, 0.0002627503126859665, 0.0003013843670487404, 0.0003400184214115143, 0.0003786524757742882, 0.00041728653013706207, 0.00045592058449983597, 0.0004945546388626099, 0.0005331886932253838, 0.0005718227475881577, 0.0006104568019509315, 0.0006490908563137054, 0.0006877249106764793, 0.0007263589650392532, 0.0007649930194020271, 0.000803627073764801, 0.0008422611281275749, 0.0008808951824903488, 0.0009195292368531227, 0.0009581632912158966, 0.0009967973455786705, 0.0010354313999414444, 0.0010740654543042183, 0.0011126995086669922]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 9.0, 15.0, 17.0, 9.0, 11.0, 14.0, 21.0, 17.0, 32.0, 21.0, 32.0, 28.0, 18.0, 40.0, 40.0, 38.0, 36.0, 39.0, 32.0, 32.0, 41.0, 33.0, 38.0, 41.0, 37.0, 32.0, 27.0, 32.0, 26.0, 28.0, 21.0, 17.0, 17.0, 13.0, 17.0, 12.0, 9.0, 7.0, 8.0, 11.0, 4.0, 8.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.234375, -6.03515625, -5.8359375, -5.63671875, -5.4375, -5.23828125, -5.0390625, -4.83984375, -4.640625, -4.44140625, -4.2421875, -4.04296875, -3.84375, -3.64453125, -3.4453125, -3.24609375, -3.046875, -2.84765625, -2.6484375, -2.44921875, -2.25, -2.05078125, -1.8515625, -1.65234375, -1.453125, -1.25390625, -1.0546875, -0.85546875, -0.65625, -0.45703125, -0.2578125, -0.05859375, 0.140625, 0.33984375, 0.5390625, 0.73828125, 0.9375, 1.13671875, 1.3359375, 1.53515625, 1.734375, 1.93359375, 2.1328125, 2.33203125, 2.53125, 2.73046875, 2.9296875, 3.12890625, 3.328125, 3.52734375, 3.7265625, 3.92578125, 4.125, 4.32421875, 4.5234375, 4.72265625, 4.921875, 5.12109375, 5.3203125, 5.51953125, 5.71875, 5.91796875, 6.1171875, 6.31640625, 6.515625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 13.0, 14.0, 13.0, 34.0, 34.0, 49.0, 70.0, 102.0, 101.0, 172.0, 240.0, 344.0, 457.0, 665.0, 1062.0, 1912.0, 3571.0, 7290.0, 17513.0, 46002.0, 136100.0, 388499.0, 290937.0, 94208.0, 33127.0, 12872.0, 5707.0, 2863.0, 1537.0, 946.0, 615.0, 413.0, 288.0, 232.0, 144.0, 112.0, 99.0, 55.0, 41.0, 31.0, 19.0, 20.0, 11.0, 7.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.9921875, -7.748779296875, -7.50537109375, -7.261962890625, -7.0185546875, -6.775146484375, -6.53173828125, -6.288330078125, -6.044921875, -5.801513671875, -5.55810546875, -5.314697265625, -5.0712890625, -4.827880859375, -4.58447265625, -4.341064453125, -4.09765625, -3.854248046875, -3.61083984375, -3.367431640625, -3.1240234375, -2.880615234375, -2.63720703125, -2.393798828125, -2.150390625, -1.906982421875, -1.66357421875, -1.420166015625, -1.1767578125, -0.933349609375, -0.68994140625, -0.446533203125, -0.203125, 0.040283203125, 0.28369140625, 0.527099609375, 0.7705078125, 1.013916015625, 1.25732421875, 1.500732421875, 1.744140625, 1.987548828125, 2.23095703125, 2.474365234375, 2.7177734375, 2.961181640625, 3.20458984375, 3.447998046875, 3.69140625, 3.934814453125, 4.17822265625, 4.421630859375, 4.6650390625, 4.908447265625, 5.15185546875, 5.395263671875, 5.638671875, 5.882080078125, 6.12548828125, 6.368896484375, 6.6123046875, 6.855712890625, 7.09912109375, 7.342529296875, 7.5859375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 3.0, 6.0, 1.0, 3.0, 7.0, 12.0, 11.0, 16.0, 12.0, 18.0, 13.0, 23.0, 18.0, 27.0, 34.0, 30.0, 36.0, 58.0, 71.0, 77.0, 152.0, 1402.0, 370.0, 155.0, 91.0, 62.0, 41.0, 61.0, 28.0, 34.0, 31.0, 32.0, 22.0, 15.0, 18.0, 8.0, 9.0, 9.0, 9.0, 4.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-18.421875, -17.879638671875, -17.33740234375, -16.795166015625, -16.2529296875, -15.710693359375, -15.16845703125, -14.626220703125, -14.083984375, -13.541748046875, -12.99951171875, -12.457275390625, -11.9150390625, -11.372802734375, -10.83056640625, -10.288330078125, -9.74609375, -9.203857421875, -8.66162109375, -8.119384765625, -7.5771484375, -7.034912109375, -6.49267578125, -5.950439453125, -5.408203125, -4.865966796875, -4.32373046875, -3.781494140625, -3.2392578125, -2.697021484375, -2.15478515625, -1.612548828125, -1.0703125, -0.528076171875, 0.01416015625, 0.556396484375, 1.0986328125, 1.640869140625, 2.18310546875, 2.725341796875, 3.267578125, 3.809814453125, 4.35205078125, 4.894287109375, 5.4365234375, 5.978759765625, 6.52099609375, 7.063232421875, 7.60546875, 8.147705078125, 8.68994140625, 9.232177734375, 9.7744140625, 10.316650390625, 10.85888671875, 11.401123046875, 11.943359375, 12.485595703125, 13.02783203125, 13.570068359375, 14.1123046875, 14.654541015625, 15.19677734375, 15.739013671875, 16.28125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 4.0, 9.0, 6.0, 16.0, 17.0, 16.0, 23.0, 27.0, 32.0, 40.0, 41.0, 78.0, 118.0, 164.0, 222.0, 372.0, 667.0, 2887.0, 50415.0, 2964031.0, 119874.0, 4577.0, 837.0, 373.0, 234.0, 149.0, 118.0, 82.0, 64.0, 56.0, 33.0, 24.0, 31.0, 16.0, 9.0, 6.0, 9.0, 7.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-27.125, -26.1767578125, -25.228515625, -24.2802734375, -23.33203125, -22.3837890625, -21.435546875, -20.4873046875, -19.5390625, -18.5908203125, -17.642578125, -16.6943359375, -15.74609375, -14.7978515625, -13.849609375, -12.9013671875, -11.953125, -11.0048828125, -10.056640625, -9.1083984375, -8.16015625, -7.2119140625, -6.263671875, -5.3154296875, -4.3671875, -3.4189453125, -2.470703125, -1.5224609375, -0.57421875, 0.3740234375, 1.322265625, 2.2705078125, 3.21875, 4.1669921875, 5.115234375, 6.0634765625, 7.01171875, 7.9599609375, 8.908203125, 9.8564453125, 10.8046875, 11.7529296875, 12.701171875, 13.6494140625, 14.59765625, 15.5458984375, 16.494140625, 17.4423828125, 18.390625, 19.3388671875, 20.287109375, 21.2353515625, 22.18359375, 23.1318359375, 24.080078125, 25.0283203125, 25.9765625, 26.9248046875, 27.873046875, 28.8212890625, 29.76953125, 30.7177734375, 31.666015625, 32.6142578125, 33.5625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.0, 832.0, 128.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.935203552246094, -56.08351135253906, -50.23181915283203, -44.380123138427734, -38.5284309387207, -32.67673873901367, -26.825042724609375, -20.973350524902344, -15.121658325195312, -9.269965171813965, -3.418272018432617, 2.433422088623047, 8.285114288330078, 14.13680648803711, 19.988502502441406, 25.840194702148438, 31.69188690185547, 37.5435791015625, 43.39527130126953, 49.24696731567383, 55.09865951538086, 60.95035171508789, 66.80204772949219, 72.65373992919922, 78.50543212890625, 84.35712432861328, 90.20881652832031, 96.06051635742188, 101.91220092773438, 107.76390075683594, 113.61559295654297, 119.46728515625, 125.3189697265625, 131.17066955566406, 137.02235412597656, 142.87405395507812, 148.72573852539062, 154.5774383544922, 160.42913818359375, 166.28082275390625, 172.13250732421875, 177.9842071533203, 183.8358917236328, 189.68759155273438, 195.53927612304688, 201.39097595214844, 207.24267578125, 213.0943603515625, 218.94606018066406, 224.79776000976562, 230.64944458007812, 236.5011444091797, 242.3528289794922, 248.20452880859375, 254.05621337890625, 259.90789794921875, 265.7596130371094, 271.6112976074219, 277.4630126953125, 283.314697265625, 289.1663818359375, 295.01806640625, 300.8697814941406, 306.7214660644531, 312.5731506347656]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 3.0, 9.0, 10.0, 15.0, 12.0, 7.0, 16.0, 20.0, 25.0, 22.0, 36.0, 33.0, 23.0, 35.0, 41.0, 49.0, 32.0, 47.0, 36.0, 46.0, 54.0, 33.0, 34.0, 36.0, 30.0, 30.0, 36.0, 32.0, 26.0, 25.0, 29.0, 26.0, 27.0, 12.0, 12.0, 7.0, 7.0, 3.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.90922546386719, -37.681705474853516, -36.45418930053711, -35.22666931152344, -33.99915313720703, -32.77163314819336, -31.544113159179688, -30.31659507751465, -29.08907699584961, -27.86155891418457, -26.63404083251953, -25.40652084350586, -24.17900276184082, -22.95148468017578, -21.72396469116211, -20.49644660949707, -19.26892852783203, -18.041410446166992, -16.813892364501953, -15.586372375488281, -14.358854293823242, -13.131336212158203, -11.903817176818848, -10.676298141479492, -9.448780059814453, -8.221261978149414, -6.993742942810059, -5.766224384307861, -4.538705825805664, -3.311187267303467, -2.0836687088012695, -0.8561496734619141, 0.3713645935058594, 1.5988831520080566, 2.826401710510254, 4.053920269012451, 5.281438827514648, 6.508957386016846, 7.736475944519043, 8.963994979858398, 10.191513061523438, 11.419031143188477, 12.646550178527832, 13.874069213867188, 15.101587295532227, 16.329105377197266, 17.556625366210938, 18.784143447875977, 20.011661529541016, 21.239179611206055, 22.466697692871094, 23.694217681884766, 24.921735763549805, 26.149253845214844, 27.376773834228516, 28.604291915893555, 29.831809997558594, 31.059328079223633, 32.28684616088867, 33.514366149902344, 34.74188232421875, 35.96940231323242, 37.196922302246094, 38.4244384765625, 39.65195846557617]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 6.0, 3.0, 12.0, 15.0, 12.0, 9.0, 13.0, 25.0, 23.0, 26.0, 36.0, 22.0, 33.0, 37.0, 33.0, 46.0, 46.0, 42.0, 40.0, 37.0, 40.0, 39.0, 35.0, 47.0, 49.0, 29.0, 35.0, 30.0, 29.0, 16.0, 26.0, 16.0, 17.0, 17.0, 11.0, 15.0, 11.0, 10.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.64453125, -6.42071533203125, -6.1968994140625, -5.97308349609375, -5.749267578125, -5.52545166015625, -5.3016357421875, -5.07781982421875, -4.85400390625, -4.63018798828125, -4.4063720703125, -4.18255615234375, -3.958740234375, -3.73492431640625, -3.5111083984375, -3.28729248046875, -3.0634765625, -2.83966064453125, -2.6158447265625, -2.39202880859375, -2.168212890625, -1.94439697265625, -1.7205810546875, -1.49676513671875, -1.27294921875, -1.04913330078125, -0.8253173828125, -0.60150146484375, -0.377685546875, -0.15386962890625, 0.0699462890625, 0.29376220703125, 0.517578125, 0.74139404296875, 0.9652099609375, 1.18902587890625, 1.412841796875, 1.63665771484375, 1.8604736328125, 2.08428955078125, 2.30810546875, 2.53192138671875, 2.7557373046875, 2.97955322265625, 3.203369140625, 3.42718505859375, 3.6510009765625, 3.87481689453125, 4.0986328125, 4.32244873046875, 4.5462646484375, 4.77008056640625, 4.993896484375, 5.21771240234375, 5.4415283203125, 5.66534423828125, 5.88916015625, 6.11297607421875, 6.3367919921875, 6.56060791015625, 6.784423828125, 7.00823974609375, 7.2320556640625, 7.45587158203125, 7.6796875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 11.0, 4.0, 11.0, 14.0, 19.0, 11.0, 28.0, 39.0, 44.0, 59.0, 67.0, 105.0, 131.0, 219.0, 278.0, 395.0, 477.0, 3671.0, 4185128.0, 1776.0, 468.0, 335.0, 261.0, 192.0, 135.0, 93.0, 77.0, 47.0, 34.0, 31.0, 27.0, 26.0, 22.0, 10.0, 7.0, 9.0, 4.0, 9.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.375, -146.23046875, -141.0859375, -135.94140625, -130.796875, -125.65234375, -120.5078125, -115.36328125, -110.21875, -105.07421875, -99.9296875, -94.78515625, -89.640625, -84.49609375, -79.3515625, -74.20703125, -69.0625, -63.91796875, -58.7734375, -53.62890625, -48.484375, -43.33984375, -38.1953125, -33.05078125, -27.90625, -22.76171875, -17.6171875, -12.47265625, -7.328125, -2.18359375, 2.9609375, 8.10546875, 13.25, 18.39453125, 23.5390625, 28.68359375, 33.828125, 38.97265625, 44.1171875, 49.26171875, 54.40625, 59.55078125, 64.6953125, 69.83984375, 74.984375, 80.12890625, 85.2734375, 90.41796875, 95.5625, 100.70703125, 105.8515625, 110.99609375, 116.140625, 121.28515625, 126.4296875, 131.57421875, 136.71875, 141.86328125, 147.0078125, 152.15234375, 157.296875, 162.44140625, 167.5859375, 172.73046875, 177.875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 17.0, 14.0, 25.0, 49.0, 83.0, 121.0, 270.0, 508.0, 1006.0, 1008.0, 459.0, 226.0, 110.0, 61.0, 37.0, 33.0, 11.0, 10.0, 6.0, 3.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.046875, -14.418212890625, -13.78955078125, -13.160888671875, -12.5322265625, -11.903564453125, -11.27490234375, -10.646240234375, -10.017578125, -9.388916015625, -8.76025390625, -8.131591796875, -7.5029296875, -6.874267578125, -6.24560546875, -5.616943359375, -4.98828125, -4.359619140625, -3.73095703125, -3.102294921875, -2.4736328125, -1.844970703125, -1.21630859375, -0.587646484375, 0.041015625, 0.669677734375, 1.29833984375, 1.927001953125, 2.5556640625, 3.184326171875, 3.81298828125, 4.441650390625, 5.0703125, 5.698974609375, 6.32763671875, 6.956298828125, 7.5849609375, 8.213623046875, 8.84228515625, 9.470947265625, 10.099609375, 10.728271484375, 11.35693359375, 11.985595703125, 12.6142578125, 13.242919921875, 13.87158203125, 14.500244140625, 15.12890625, 15.757568359375, 16.38623046875, 17.014892578125, 17.6435546875, 18.272216796875, 18.90087890625, 19.529541015625, 20.158203125, 20.786865234375, 21.41552734375, 22.044189453125, 22.6728515625, 23.301513671875, 23.93017578125, 24.558837890625, 25.1875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 17.0, 19.0, 21.0, 14.0, 31.0, 37.0, 65.0, 83.0, 117.0, 479.0, 99437.0, 4092251.0, 1212.0, 172.0, 92.0, 52.0, 48.0, 36.0, 25.0, 17.0, 19.0, 16.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.0, -140.32421875, -136.6484375, -132.97265625, -129.296875, -125.62109375, -121.9453125, -118.26953125, -114.59375, -110.91796875, -107.2421875, -103.56640625, -99.890625, -96.21484375, -92.5390625, -88.86328125, -85.1875, -81.51171875, -77.8359375, -74.16015625, -70.484375, -66.80859375, -63.1328125, -59.45703125, -55.78125, -52.10546875, -48.4296875, -44.75390625, -41.078125, -37.40234375, -33.7265625, -30.05078125, -26.375, -22.69921875, -19.0234375, -15.34765625, -11.671875, -7.99609375, -4.3203125, -0.64453125, 3.03125, 6.70703125, 10.3828125, 14.05859375, 17.734375, 21.41015625, 25.0859375, 28.76171875, 32.4375, 36.11328125, 39.7890625, 43.46484375, 47.140625, 50.81640625, 54.4921875, 58.16796875, 61.84375, 65.51953125, 69.1953125, 72.87109375, 76.546875, 80.22265625, 83.8984375, 87.57421875, 91.25]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 44.0, 430.0, 460.0, 75.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.61212158203125, -81.81055450439453, -76.00898742675781, -70.20741271972656, -64.40585327148438, -58.60428237915039, -52.802711486816406, -47.00114440917969, -41.19957733154297, -35.39801025390625, -29.5964412689209, -23.794872283935547, -17.993305206298828, -12.19173812866211, -6.390167236328125, -0.5886001586914062, 5.2129669189453125, 11.014534950256348, 16.816102981567383, 22.617671966552734, 28.419239044189453, 34.22080612182617, 40.022377014160156, 45.823944091796875, 51.625511169433594, 57.42707824707031, 63.22864532470703, 69.03021240234375, 74.831787109375, 80.63334655761719, 86.43492126464844, 92.23648834228516, 98.03805541992188, 103.8396224975586, 109.64118957519531, 115.44276428222656, 121.24432373046875, 127.0458984375, 132.84747314453125, 138.64903259277344, 144.45059204101562, 150.25216674804688, 156.05372619628906, 161.8553009033203, 167.6568603515625, 173.45843505859375, 179.260009765625, 185.0615692138672, 190.86314392089844, 196.6647186279297, 202.46627807617188, 208.26785278320312, 214.0694122314453, 219.87098693847656, 225.67254638671875, 231.47412109375, 237.27569580078125, 243.0772705078125, 248.8788299560547, 254.68040466308594, 260.4819641113281, 266.2835388183594, 272.0851135253906, 277.88665771484375, 283.688232421875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 10.0, 14.0, 15.0, 18.0, 18.0, 21.0, 27.0, 24.0, 21.0, 33.0, 32.0, 46.0, 49.0, 36.0, 44.0, 51.0, 34.0, 49.0, 55.0, 44.0, 43.0, 29.0, 29.0, 32.0, 32.0, 30.0, 21.0, 24.0, 15.0, 19.0, 14.0, 19.0, 6.0, 6.0, 8.0, 6.0, 6.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-42.53916931152344, -41.313228607177734, -40.08728790283203, -38.861351013183594, -37.63541030883789, -36.40946960449219, -35.183528900146484, -33.95758819580078, -32.731651306152344, -31.50571060180664, -30.27977180480957, -29.053831100463867, -27.827892303466797, -26.601951599121094, -25.37601089477539, -24.15007209777832, -22.924131393432617, -21.698190689086914, -20.472251892089844, -19.24631118774414, -18.02037239074707, -16.794431686401367, -15.56849193572998, -14.342552185058594, -13.116612434387207, -11.89067268371582, -10.664732933044434, -9.438793182373047, -8.212852478027344, -6.986913204193115, -5.76097297668457, -4.535033226013184, -3.309093475341797, -2.08315372467041, -0.8572137355804443, 0.3687262535095215, 1.5946660041809082, 2.820605754852295, 4.04654598236084, 5.272485733032227, 6.498425483703613, 7.724365234375, 8.950304985046387, 10.176244735717773, 11.402185440063477, 12.628124237060547, 13.85406494140625, 15.080004692077637, 16.305944442749023, 17.531885147094727, 18.757823944091797, 19.9837646484375, 21.20970344543457, 22.435644149780273, 23.661582946777344, 24.887523651123047, 26.11346435546875, 27.339405059814453, 28.565343856811523, 29.791284561157227, 31.017223358154297, 32.2431640625, 33.4691047668457, 34.695045471191406, 35.920982360839844]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 7.0, 7.0, 8.0, 9.0, 14.0, 20.0, 26.0, 22.0, 23.0, 32.0, 33.0, 30.0, 28.0, 34.0, 37.0, 36.0, 48.0, 55.0, 43.0, 45.0, 41.0, 24.0, 32.0, 41.0, 38.0, 30.0, 22.0, 33.0, 27.0, 29.0, 24.0, 22.0, 17.0, 19.0, 9.0, 3.0, 2.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.51171875, -6.2928466796875, -6.073974609375, -5.8551025390625, -5.63623046875, -5.4173583984375, -5.198486328125, -4.9796142578125, -4.7607421875, -4.5418701171875, -4.322998046875, -4.1041259765625, -3.88525390625, -3.6663818359375, -3.447509765625, -3.2286376953125, -3.009765625, -2.7908935546875, -2.572021484375, -2.3531494140625, -2.13427734375, -1.9154052734375, -1.696533203125, -1.4776611328125, -1.2587890625, -1.0399169921875, -0.821044921875, -0.6021728515625, -0.38330078125, -0.1644287109375, 0.054443359375, 0.2733154296875, 0.4921875, 0.7110595703125, 0.929931640625, 1.1488037109375, 1.36767578125, 1.5865478515625, 1.805419921875, 2.0242919921875, 2.2431640625, 2.4620361328125, 2.680908203125, 2.8997802734375, 3.11865234375, 3.3375244140625, 3.556396484375, 3.7752685546875, 3.994140625, 4.2130126953125, 4.431884765625, 4.6507568359375, 4.86962890625, 5.0885009765625, 5.307373046875, 5.5262451171875, 5.7451171875, 5.9639892578125, 6.182861328125, 6.4017333984375, 6.62060546875, 6.8394775390625, 7.058349609375, 7.2772216796875, 7.49609375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 16.0, 9.0, 12.0, 20.0, 50.0, 58.0, 91.0, 170.0, 246.0, 338.0, 492.0, 718.0, 1007.0, 1479.0, 2085.0, 2942.0, 4389.0, 6360.0, 9391.0, 13893.0, 20580.0, 31233.0, 48640.0, 80304.0, 138135.0, 213606.0, 182488.0, 107490.0, 63208.0, 39778.0, 25661.0, 17148.0, 11458.0, 7689.0, 5388.0, 3657.0, 2525.0, 1803.0, 1278.0, 859.0, 628.0, 435.0, 295.0, 176.0, 126.0, 65.0, 49.0, 27.0, 15.0, 13.0, 8.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.84326171875, -0.8167190551757812, -0.7901763916015625, -0.7636337280273438, -0.737091064453125, -0.7105484008789062, -0.6840057373046875, -0.6574630737304688, -0.63092041015625, -0.6043777465820312, -0.5778350830078125, -0.5512924194335938, -0.524749755859375, -0.49820709228515625, -0.4716644287109375, -0.44512176513671875, -0.4185791015625, -0.39203643798828125, -0.3654937744140625, -0.33895111083984375, -0.312408447265625, -0.28586578369140625, -0.2593231201171875, -0.23278045654296875, -0.20623779296875, -0.17969512939453125, -0.1531524658203125, -0.12660980224609375, -0.100067138671875, -0.07352447509765625, -0.0469818115234375, -0.02043914794921875, 0.006103515625, 0.03264617919921875, 0.0591888427734375, 0.08573150634765625, 0.112274169921875, 0.13881683349609375, 0.1653594970703125, 0.19190216064453125, 0.21844482421875, 0.24498748779296875, 0.2715301513671875, 0.29807281494140625, 0.324615478515625, 0.35115814208984375, 0.3777008056640625, 0.40424346923828125, 0.4307861328125, 0.45732879638671875, 0.4838714599609375, 0.5104141235351562, 0.536956787109375, 0.5634994506835938, 0.5900421142578125, 0.6165847778320312, 0.64312744140625, 0.6696701049804688, 0.6962127685546875, 0.7227554321289062, 0.749298095703125, 0.7758407592773438, 0.8023834228515625, 0.8289260864257812, 0.85546875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 10.0, 5.0, 14.0, 11.0, 10.0, 13.0, 14.0, 18.0, 24.0, 19.0, 27.0, 26.0, 35.0, 39.0, 33.0, 40.0, 43.0, 48.0, 38.0, 1062.0, 39.0, 39.0, 38.0, 40.0, 22.0, 34.0, 29.0, 31.0, 27.0, 30.0, 31.0, 25.0, 21.0, 16.0, 10.0, 14.0, 11.0, 14.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.9454345703125, -3.816650390625, -3.6878662109375, -3.55908203125, -3.4302978515625, -3.301513671875, -3.1727294921875, -3.0439453125, -2.9151611328125, -2.786376953125, -2.6575927734375, -2.52880859375, -2.4000244140625, -2.271240234375, -2.1424560546875, -2.013671875, -1.8848876953125, -1.756103515625, -1.6273193359375, -1.49853515625, -1.3697509765625, -1.240966796875, -1.1121826171875, -0.9833984375, -0.8546142578125, -0.725830078125, -0.5970458984375, -0.46826171875, -0.3394775390625, -0.210693359375, -0.0819091796875, 0.046875, 0.1756591796875, 0.304443359375, 0.4332275390625, 0.56201171875, 0.6907958984375, 0.819580078125, 0.9483642578125, 1.0771484375, 1.2059326171875, 1.334716796875, 1.4635009765625, 1.59228515625, 1.7210693359375, 1.849853515625, 1.9786376953125, 2.107421875, 2.2362060546875, 2.364990234375, 2.4937744140625, 2.62255859375, 2.7513427734375, 2.880126953125, 3.0089111328125, 3.1376953125, 3.2664794921875, 3.395263671875, 3.5240478515625, 3.65283203125, 3.7816162109375, 3.910400390625, 4.0391845703125, 4.16796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 13.0, 25.0, 26.0, 54.0, 57.0, 100.0, 167.0, 264.0, 440.0, 700.0, 1215.0, 2009.0, 3298.0, 5706.0, 10047.0, 17603.0, 31345.0, 57347.0, 107622.0, 197239.0, 1295831.0, 166805.0, 89077.0, 48082.0, 26513.0, 14989.0, 8668.0, 4935.0, 2780.0, 1663.0, 992.0, 585.0, 361.0, 193.0, 141.0, 86.0, 49.0, 33.0, 24.0, 13.0, 9.0, 7.0, 6.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73193359375, -0.70611572265625, -0.6802978515625, -0.65447998046875, -0.628662109375, -0.60284423828125, -0.5770263671875, -0.55120849609375, -0.525390625, -0.49957275390625, -0.4737548828125, -0.44793701171875, -0.422119140625, -0.39630126953125, -0.3704833984375, -0.34466552734375, -0.31884765625, -0.29302978515625, -0.2672119140625, -0.24139404296875, -0.215576171875, -0.18975830078125, -0.1639404296875, -0.13812255859375, -0.1123046875, -0.08648681640625, -0.0606689453125, -0.03485107421875, -0.009033203125, 0.01678466796875, 0.0426025390625, 0.06842041015625, 0.09423828125, 0.12005615234375, 0.1458740234375, 0.17169189453125, 0.197509765625, 0.22332763671875, 0.2491455078125, 0.27496337890625, 0.30078125, 0.32659912109375, 0.3524169921875, 0.37823486328125, 0.404052734375, 0.42987060546875, 0.4556884765625, 0.48150634765625, 0.50732421875, 0.53314208984375, 0.5589599609375, 0.58477783203125, 0.610595703125, 0.63641357421875, 0.6622314453125, 0.68804931640625, 0.7138671875, 0.73968505859375, 0.7655029296875, 0.79132080078125, 0.817138671875, 0.84295654296875, 0.8687744140625, 0.89459228515625, 0.92041015625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 3.0, 6.0, 7.0, 12.0, 8.0, 18.0, 17.0, 29.0, 20.0, 41.0, 44.0, 44.0, 48.0, 61.0, 63.0, 64.0, 63.0, 59.0, 49.0, 53.0, 54.0, 32.0, 44.0, 24.0, 30.0, 18.0, 19.0, 13.0, 14.0, 9.0, 5.0, 8.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00217437744140625, -0.002096414566040039, -0.002018451690673828, -0.0019404888153076172, -0.0018625259399414062, -0.0017845630645751953, -0.0017066001892089844, -0.0016286373138427734, -0.0015506744384765625, -0.0014727115631103516, -0.0013947486877441406, -0.0013167858123779297, -0.0012388229370117188, -0.0011608600616455078, -0.0010828971862792969, -0.001004934310913086, -0.000926971435546875, -0.0008490085601806641, -0.0007710456848144531, -0.0006930828094482422, -0.0006151199340820312, -0.0005371570587158203, -0.0004591941833496094, -0.00038123130798339844, -0.0003032684326171875, -0.00022530555725097656, -0.00014734268188476562, -6.937980651855469e-05, 8.58306884765625e-06, 8.654594421386719e-05, 0.00016450881958007812, 0.00024247169494628906, 0.0003204345703125, 0.00039839744567871094, 0.0004763603210449219, 0.0005543231964111328, 0.0006322860717773438, 0.0007102489471435547, 0.0007882118225097656, 0.0008661746978759766, 0.0009441375732421875, 0.0010221004486083984, 0.0011000633239746094, 0.0011780261993408203, 0.0012559890747070312, 0.0013339519500732422, 0.0014119148254394531, 0.001489877700805664, 0.001567840576171875, 0.001645803451538086, 0.0017237663269042969, 0.0018017292022705078, 0.0018796920776367188, 0.0019576549530029297, 0.0020356178283691406, 0.0021135807037353516, 0.0021915435791015625, 0.0022695064544677734, 0.0023474693298339844, 0.0024254322052001953, 0.0025033950805664062, 0.002581357955932617, 0.002659320831298828, 0.002737283706665039, 0.00281524658203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 10.0, 8.0, 27.0, 21.0, 26.0, 32.0, 46.0, 51.0, 57.0, 94.0, 141.0, 168.0, 249.0, 365.0, 684.0, 2128.0, 859295.0, 182208.0, 1280.0, 562.0, 317.0, 217.0, 134.0, 105.0, 73.0, 57.0, 42.0, 33.0, 20.0, 21.0, 21.0, 10.0, 5.0, 10.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.047515869140625, -0.04615306854248047, -0.04479026794433594, -0.043427467346191406, -0.042064666748046875, -0.040701866149902344, -0.03933906555175781, -0.03797626495361328, -0.03661346435546875, -0.03525066375732422, -0.03388786315917969, -0.032525062561035156, -0.031162261962890625, -0.029799461364746094, -0.028436660766601562, -0.02707386016845703, -0.0257110595703125, -0.02434825897216797, -0.022985458374023438, -0.021622657775878906, -0.020259857177734375, -0.018897056579589844, -0.017534255981445312, -0.01617145538330078, -0.01480865478515625, -0.013445854187011719, -0.012083053588867188, -0.010720252990722656, -0.009357452392578125, -0.007994651794433594, -0.0066318511962890625, -0.005269050598144531, -0.00390625, -0.0025434494018554688, -0.0011806488037109375, 0.00018215179443359375, 0.001544952392578125, 0.0029077529907226562, 0.0042705535888671875, 0.005633354187011719, 0.00699615478515625, 0.008358955383300781, 0.009721755981445312, 0.011084556579589844, 0.012447357177734375, 0.013810157775878906, 0.015172958374023438, 0.01653575897216797, 0.0178985595703125, 0.01926136016845703, 0.020624160766601562, 0.021986961364746094, 0.023349761962890625, 0.024712562561035156, 0.026075363159179688, 0.02743816375732422, 0.02880096435546875, 0.03016376495361328, 0.03152656555175781, 0.032889366149902344, 0.034252166748046875, 0.035614967346191406, 0.03697776794433594, 0.03834056854248047, 0.039703369140625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [56.0, 955.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010350876254960895, -0.0002198097645305097, 0.00059546809643507, 0.0014107458991929889, 0.0022260239347815514, 0.0030413013882935047, 0.0038565793074667454, 0.004671857226639986, 0.005487135145813227, 0.006302413064986467, 0.007117690984159708, 0.007932968437671661, 0.008748246356844902, 0.009563524276018143, 0.010378802195191383, 0.011194080114364624, 0.012009358033537865, 0.012824635952711105, 0.013639913871884346, 0.014455191791057587, 0.015270469710230827, 0.016085747629404068, 0.01690102554857731, 0.01771630346775055, 0.01853158138692379, 0.01934685930609703, 0.02016213722527027, 0.020977415144443512, 0.021792693063616753, 0.022607970982789993, 0.023423248901963234, 0.024238526821136475, 0.025053804740309715, 0.025869082659482956, 0.026684360578656197, 0.027499638497829437, 0.028314916417002678, 0.02913019433617592, 0.02994547225534916, 0.0307607501745224, 0.03157602623105049, 0.03239130228757858, 0.03320658206939697, 0.034021858125925064, 0.034837137907743454, 0.035652413964271545, 0.036467693746089935, 0.03728296980261803, 0.03809824958443642, 0.03891352564096451, 0.0397288054227829, 0.04054408147931099, 0.04135936126112938, 0.04217463731765747, 0.04298991709947586, 0.04380519315600395, 0.04462047293782234, 0.04543574899435043, 0.04625102877616882, 0.047066304832696915, 0.047881584614515305, 0.048696860671043396, 0.049512140452861786, 0.05032741650938988, 0.05114269629120827]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 5.0, 8.0, 10.0, 17.0, 26.0, 24.0, 30.0, 29.0, 42.0, 53.0, 62.0, 46.0, 58.0, 73.0, 70.0, 65.0, 44.0, 66.0, 65.0, 50.0, 38.0, 39.0, 23.0, 28.0, 15.0, 10.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.002855837345123291, -0.0027908040210604668, -0.0027257706969976425, -0.0026607373729348183, -0.002595704048871994, -0.0025306707248091698, -0.0024656374007463455, -0.0024006040766835213, -0.002335570752620697, -0.0022705374285578728, -0.0022055041044950485, -0.0021404707804322243, -0.0020754374563694, -0.0020104041323065758, -0.0019453708082437515, -0.0018803374841809273, -0.001815304160118103, -0.0017502708360552788, -0.0016852375119924545, -0.0016202041879296303, -0.001555170863866806, -0.0014901375398039818, -0.0014251042157411575, -0.0013600708916783333, -0.001295037567615509, -0.0012300042435526848, -0.0011649709194898605, -0.0010999375954270363, -0.001034904271364212, -0.0009698709473013878, -0.0009048376232385635, -0.0008398042991757393, -0.000774770975112915, -0.0007097376510500908, -0.0006447043269872665, -0.0005796710029244423, -0.000514637678861618, -0.0004496043547987938, -0.00038457103073596954, -0.0003195377066731453, -0.00025450438261032104, -0.0001894710585474968, -0.00012443773448467255, -5.94044104218483e-05, 5.628913640975952e-06, 7.06622377038002e-05, 0.00013569556176662445, 0.0002007288858294487, 0.00026576220989227295, 0.0003307955339550972, 0.00039582885801792145, 0.0004608621820807457, 0.00052589550614357, 0.0005909288302063942, 0.0006559621542692184, 0.0007209954783320427, 0.0007860288023948669, 0.0008510621264576912, 0.0009160954505205154, 0.0009811287745833397, 0.001046162098646164, 0.0011111954227089882, 0.0011762287467718124, 0.0012412620708346367, 0.001306295394897461]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 7.0, 7.0, 8.0, 9.0, 14.0, 20.0, 26.0, 22.0, 23.0, 32.0, 33.0, 30.0, 28.0, 34.0, 37.0, 36.0, 48.0, 55.0, 43.0, 45.0, 41.0, 24.0, 32.0, 41.0, 38.0, 30.0, 22.0, 33.0, 27.0, 29.0, 24.0, 22.0, 17.0, 19.0, 9.0, 3.0, 2.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.51171875, -6.2928466796875, -6.073974609375, -5.8551025390625, -5.63623046875, -5.4173583984375, -5.198486328125, -4.9796142578125, -4.7607421875, -4.5418701171875, -4.322998046875, -4.1041259765625, -3.88525390625, -3.6663818359375, -3.447509765625, -3.2286376953125, -3.009765625, -2.7908935546875, -2.572021484375, -2.3531494140625, -2.13427734375, -1.9154052734375, -1.696533203125, -1.4776611328125, -1.2587890625, -1.0399169921875, -0.821044921875, -0.6021728515625, -0.38330078125, -0.1644287109375, 0.054443359375, 0.2733154296875, 0.4921875, 0.7110595703125, 0.929931640625, 1.1488037109375, 1.36767578125, 1.5865478515625, 1.805419921875, 2.0242919921875, 2.2431640625, 2.4620361328125, 2.680908203125, 2.8997802734375, 3.11865234375, 3.3375244140625, 3.556396484375, 3.7752685546875, 3.994140625, 4.2130126953125, 4.431884765625, 4.6507568359375, 4.86962890625, 5.0885009765625, 5.307373046875, 5.5262451171875, 5.7451171875, 5.9639892578125, 6.182861328125, 6.4017333984375, 6.62060546875, 6.8394775390625, 7.058349609375, 7.2772216796875, 7.49609375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 9.0, 6.0, 15.0, 13.0, 24.0, 30.0, 35.0, 52.0, 56.0, 89.0, 143.0, 190.0, 248.0, 380.0, 492.0, 688.0, 1013.0, 1492.0, 2581.0, 5677.0, 18922.0, 90323.0, 480420.0, 356058.0, 63536.0, 14478.0, 4762.0, 2265.0, 1287.0, 964.0, 647.0, 450.0, 357.0, 258.0, 162.0, 121.0, 87.0, 61.0, 54.0, 38.0, 18.0, 13.0, 13.0, 12.0, 7.0, 8.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9765625, -11.60107421875, -11.2255859375, -10.85009765625, -10.474609375, -10.09912109375, -9.7236328125, -9.34814453125, -8.97265625, -8.59716796875, -8.2216796875, -7.84619140625, -7.470703125, -7.09521484375, -6.7197265625, -6.34423828125, -5.96875, -5.59326171875, -5.2177734375, -4.84228515625, -4.466796875, -4.09130859375, -3.7158203125, -3.34033203125, -2.96484375, -2.58935546875, -2.2138671875, -1.83837890625, -1.462890625, -1.08740234375, -0.7119140625, -0.33642578125, 0.0390625, 0.41455078125, 0.7900390625, 1.16552734375, 1.541015625, 1.91650390625, 2.2919921875, 2.66748046875, 3.04296875, 3.41845703125, 3.7939453125, 4.16943359375, 4.544921875, 4.92041015625, 5.2958984375, 5.67138671875, 6.046875, 6.42236328125, 6.7978515625, 7.17333984375, 7.548828125, 7.92431640625, 8.2998046875, 8.67529296875, 9.05078125, 9.42626953125, 9.8017578125, 10.17724609375, 10.552734375, 10.92822265625, 11.3037109375, 11.67919921875, 12.0546875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 10.0, 7.0, 9.0, 13.0, 20.0, 15.0, 20.0, 24.0, 22.0, 31.0, 35.0, 31.0, 56.0, 56.0, 74.0, 97.0, 283.0, 1545.0, 174.0, 87.0, 48.0, 52.0, 42.0, 54.0, 38.0, 33.0, 24.0, 19.0, 20.0, 21.0, 11.0, 9.0, 9.0, 5.0, 10.0, 7.0, 2.0, 7.0, 7.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.0546875, -14.5211181640625, -13.987548828125, -13.4539794921875, -12.92041015625, -12.3868408203125, -11.853271484375, -11.3197021484375, -10.7861328125, -10.2525634765625, -9.718994140625, -9.1854248046875, -8.65185546875, -8.1182861328125, -7.584716796875, -7.0511474609375, -6.517578125, -5.9840087890625, -5.450439453125, -4.9168701171875, -4.38330078125, -3.8497314453125, -3.316162109375, -2.7825927734375, -2.2490234375, -1.7154541015625, -1.181884765625, -0.6483154296875, -0.11474609375, 0.4188232421875, 0.952392578125, 1.4859619140625, 2.01953125, 2.5531005859375, 3.086669921875, 3.6202392578125, 4.15380859375, 4.6873779296875, 5.220947265625, 5.7545166015625, 6.2880859375, 6.8216552734375, 7.355224609375, 7.8887939453125, 8.42236328125, 8.9559326171875, 9.489501953125, 10.0230712890625, 10.556640625, 11.0902099609375, 11.623779296875, 12.1573486328125, 12.69091796875, 13.2244873046875, 13.758056640625, 14.2916259765625, 14.8251953125, 15.3587646484375, 15.892333984375, 16.4259033203125, 16.95947265625, 17.4930419921875, 18.026611328125, 18.5601806640625, 19.09375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 6.0, 14.0, 9.0, 24.0, 18.0, 23.0, 43.0, 50.0, 59.0, 91.0, 151.0, 216.0, 407.0, 813.0, 3367.0, 3101719.0, 36195.0, 1228.0, 491.0, 254.0, 145.0, 108.0, 71.0, 55.0, 29.0, 19.0, 17.0, 13.0, 13.0, 6.0, 13.0, 5.0, 3.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.75, -64.8271484375, -62.904296875, -60.9814453125, -59.05859375, -57.1357421875, -55.212890625, -53.2900390625, -51.3671875, -49.4443359375, -47.521484375, -45.5986328125, -43.67578125, -41.7529296875, -39.830078125, -37.9072265625, -35.984375, -34.0615234375, -32.138671875, -30.2158203125, -28.29296875, -26.3701171875, -24.447265625, -22.5244140625, -20.6015625, -18.6787109375, -16.755859375, -14.8330078125, -12.91015625, -10.9873046875, -9.064453125, -7.1416015625, -5.21875, -3.2958984375, -1.373046875, 0.5498046875, 2.47265625, 4.3955078125, 6.318359375, 8.2412109375, 10.1640625, 12.0869140625, 14.009765625, 15.9326171875, 17.85546875, 19.7783203125, 21.701171875, 23.6240234375, 25.546875, 27.4697265625, 29.392578125, 31.3154296875, 33.23828125, 35.1611328125, 37.083984375, 39.0068359375, 40.9296875, 42.8525390625, 44.775390625, 46.6982421875, 48.62109375, 50.5439453125, 52.466796875, 54.3896484375, 56.3125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 48.0, 734.0, 228.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-208.92311096191406, -202.90771484375, -196.89231872558594, -190.8769073486328, -184.86151123046875, -178.8461151123047, -172.83071899414062, -166.8153076171875, -160.79991149902344, -154.78451538085938, -148.7691192626953, -142.7537078857422, -136.73831176757812, -130.72291564941406, -124.70751953125, -118.6921157836914, -112.67671966552734, -106.66132354736328, -100.64591979980469, -94.63052368164062, -88.61511993408203, -82.59972381591797, -76.58432006835938, -70.56892395019531, -64.55352783203125, -58.53812789916992, -52.522727966308594, -46.50733184814453, -40.49192810058594, -34.476531982421875, -28.461132049560547, -22.44573211669922, -16.430328369140625, -10.414928436279297, -4.399529457092285, 1.6158695220947266, 7.631269454956055, 13.646669387817383, 19.662067413330078, 25.677467346191406, 31.692867279052734, 37.70826721191406, 43.72366714477539, 49.73906707763672, 55.75446319580078, 61.769866943359375, 67.78526306152344, 73.8006591796875, 79.8160629272461, 85.83145904541016, 91.84686279296875, 97.86225891113281, 103.8776626586914, 109.89305877685547, 115.90846252441406, 121.92385864257812, 127.93925476074219, 133.95465087890625, 139.9700469970703, 145.98545837402344, 152.0008544921875, 158.01625061035156, 164.03164672851562, 170.04705810546875, 176.0624542236328]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 6.0, 7.0, 10.0, 12.0, 12.0, 10.0, 18.0, 23.0, 28.0, 23.0, 25.0, 31.0, 27.0, 32.0, 39.0, 37.0, 44.0, 37.0, 58.0, 48.0, 36.0, 33.0, 37.0, 44.0, 30.0, 30.0, 33.0, 18.0, 35.0, 28.0, 26.0, 25.0, 17.0, 13.0, 13.0, 18.0, 6.0, 6.0, 6.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.710960388183594, -48.23847198486328, -46.765987396240234, -45.29350280761719, -43.821014404296875, -42.34852600097656, -40.876041412353516, -39.40355682373047, -37.931068420410156, -36.458580017089844, -34.9860954284668, -33.51361083984375, -32.04112243652344, -30.568635940551758, -29.096149444580078, -27.6236629486084, -26.15117645263672, -24.67868995666504, -23.20620346069336, -21.73371696472168, -20.26123046875, -18.78874397277832, -17.31625747680664, -15.843770980834961, -14.371284484863281, -12.898797988891602, -11.426311492919922, -9.953824996948242, -8.481338500976562, -7.008852005004883, -5.536365509033203, -4.063879013061523, -2.5913925170898438, -1.118906021118164, 0.3535804748535156, 1.8260669708251953, 3.298553466796875, 4.771039962768555, 6.243526458740234, 7.716012954711914, 9.188499450683594, 10.660985946655273, 12.133472442626953, 13.605958938598633, 15.078445434570312, 16.550931930541992, 18.023418426513672, 19.49590492248535, 20.96839141845703, 22.44087791442871, 23.91336441040039, 25.38585090637207, 26.85833740234375, 28.33082389831543, 29.80331039428711, 31.27579689025879, 32.74828338623047, 34.22077178955078, 35.69325637817383, 37.165740966796875, 38.63822937011719, 40.1107177734375, 41.58320236206055, 43.055686950683594, 44.528175354003906]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 1.0, 3.0, 8.0, 11.0, 10.0, 16.0, 13.0, 18.0, 23.0, 18.0, 31.0, 33.0, 39.0, 41.0, 44.0, 51.0, 50.0, 43.0, 46.0, 36.0, 36.0, 58.0, 41.0, 42.0, 33.0, 44.0, 38.0, 27.0, 20.0, 31.0, 15.0, 23.0, 12.0, 15.0, 11.0, 6.0, 5.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.36328125, -7.11932373046875, -6.8753662109375, -6.63140869140625, -6.387451171875, -6.14349365234375, -5.8995361328125, -5.65557861328125, -5.41162109375, -5.16766357421875, -4.9237060546875, -4.67974853515625, -4.435791015625, -4.19183349609375, -3.9478759765625, -3.70391845703125, -3.4599609375, -3.21600341796875, -2.9720458984375, -2.72808837890625, -2.484130859375, -2.24017333984375, -1.9962158203125, -1.75225830078125, -1.50830078125, -1.26434326171875, -1.0203857421875, -0.77642822265625, -0.532470703125, -0.28851318359375, -0.0445556640625, 0.19940185546875, 0.443359375, 0.68731689453125, 0.9312744140625, 1.17523193359375, 1.419189453125, 1.66314697265625, 1.9071044921875, 2.15106201171875, 2.39501953125, 2.63897705078125, 2.8829345703125, 3.12689208984375, 3.370849609375, 3.61480712890625, 3.8587646484375, 4.10272216796875, 4.3466796875, 4.59063720703125, 4.8345947265625, 5.07855224609375, 5.322509765625, 5.56646728515625, 5.8104248046875, 6.05438232421875, 6.29833984375, 6.54229736328125, 6.7862548828125, 7.03021240234375, 7.274169921875, 7.51812744140625, 7.7620849609375, 8.00604248046875, 8.25]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 7.0, 11.0, 8.0, 18.0, 21.0, 30.0, 32.0, 62.0, 56.0, 86.0, 145.0, 188.0, 264.0, 463.0, 852.0, 2251.0, 7867.0, 59855.0, 1161659.0, 2705491.0, 230804.0, 17412.0, 3745.0, 1320.0, 580.0, 297.0, 210.0, 124.0, 96.0, 83.0, 67.0, 39.0, 36.0, 26.0, 16.0, 19.0, 19.0, 4.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.90625, -15.362060546875, -14.81787109375, -14.273681640625, -13.7294921875, -13.185302734375, -12.64111328125, -12.096923828125, -11.552734375, -11.008544921875, -10.46435546875, -9.920166015625, -9.3759765625, -8.831787109375, -8.28759765625, -7.743408203125, -7.19921875, -6.655029296875, -6.11083984375, -5.566650390625, -5.0224609375, -4.478271484375, -3.93408203125, -3.389892578125, -2.845703125, -2.301513671875, -1.75732421875, -1.213134765625, -0.6689453125, -0.124755859375, 0.41943359375, 0.963623046875, 1.5078125, 2.052001953125, 2.59619140625, 3.140380859375, 3.6845703125, 4.228759765625, 4.77294921875, 5.317138671875, 5.861328125, 6.405517578125, 6.94970703125, 7.493896484375, 8.0380859375, 8.582275390625, 9.12646484375, 9.670654296875, 10.21484375, 10.759033203125, 11.30322265625, 11.847412109375, 12.3916015625, 12.935791015625, 13.47998046875, 14.024169921875, 14.568359375, 15.112548828125, 15.65673828125, 16.200927734375, 16.7451171875, 17.289306640625, 17.83349609375, 18.377685546875, 18.921875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 18.0, 13.0, 17.0, 17.0, 28.0, 42.0, 68.0, 76.0, 123.0, 155.0, 228.0, 322.0, 481.0, 637.0, 553.0, 360.0, 218.0, 199.0, 130.0, 84.0, 63.0, 70.0, 48.0, 35.0, 26.0, 15.0, 11.0, 6.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.7265625, -14.33544921875, -13.9443359375, -13.55322265625, -13.162109375, -12.77099609375, -12.3798828125, -11.98876953125, -11.59765625, -11.20654296875, -10.8154296875, -10.42431640625, -10.033203125, -9.64208984375, -9.2509765625, -8.85986328125, -8.46875, -8.07763671875, -7.6865234375, -7.29541015625, -6.904296875, -6.51318359375, -6.1220703125, -5.73095703125, -5.33984375, -4.94873046875, -4.5576171875, -4.16650390625, -3.775390625, -3.38427734375, -2.9931640625, -2.60205078125, -2.2109375, -1.81982421875, -1.4287109375, -1.03759765625, -0.646484375, -0.25537109375, 0.1357421875, 0.52685546875, 0.91796875, 1.30908203125, 1.7001953125, 2.09130859375, 2.482421875, 2.87353515625, 3.2646484375, 3.65576171875, 4.046875, 4.43798828125, 4.8291015625, 5.22021484375, 5.611328125, 6.00244140625, 6.3935546875, 6.78466796875, 7.17578125, 7.56689453125, 7.9580078125, 8.34912109375, 8.740234375, 9.13134765625, 9.5224609375, 9.91357421875, 10.3046875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 4.0, 4.0, 13.0, 18.0, 45.0, 51.0, 107.0, 208.0, 473.0, 1244.0, 5797.0, 468210.0, 3691047.0, 23814.0, 2018.0, 649.0, 249.0, 139.0, 75.0, 42.0, 28.0, 18.0, 11.0, 7.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.96875, -37.72021484375, -36.4716796875, -35.22314453125, -33.974609375, -32.72607421875, -31.4775390625, -30.22900390625, -28.98046875, -27.73193359375, -26.4833984375, -25.23486328125, -23.986328125, -22.73779296875, -21.4892578125, -20.24072265625, -18.9921875, -17.74365234375, -16.4951171875, -15.24658203125, -13.998046875, -12.74951171875, -11.5009765625, -10.25244140625, -9.00390625, -7.75537109375, -6.5068359375, -5.25830078125, -4.009765625, -2.76123046875, -1.5126953125, -0.26416015625, 0.984375, 2.23291015625, 3.4814453125, 4.72998046875, 5.978515625, 7.22705078125, 8.4755859375, 9.72412109375, 10.97265625, 12.22119140625, 13.4697265625, 14.71826171875, 15.966796875, 17.21533203125, 18.4638671875, 19.71240234375, 20.9609375, 22.20947265625, 23.4580078125, 24.70654296875, 25.955078125, 27.20361328125, 28.4521484375, 29.70068359375, 30.94921875, 32.19775390625, 33.4462890625, 34.69482421875, 35.943359375, 37.19189453125, 38.4404296875, 39.68896484375, 40.9375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 65.0, 925.0, 26.0, 4.0, 0.0, 0.0, 1.0], "bins": [-877.8282470703125, -862.8021240234375, -847.7760620117188, -832.75, -817.723876953125, -802.69775390625, -787.6716918945312, -772.6456298828125, -757.6195068359375, -742.5933837890625, -727.5673217773438, -712.541259765625, -697.51513671875, -682.489013671875, -667.4629516601562, -652.4368896484375, -637.4107666015625, -622.3846435546875, -607.3585815429688, -592.33251953125, -577.306396484375, -562.2802734375, -547.2542114257812, -532.2281494140625, -517.2020263671875, -502.1759338378906, -487.14984130859375, -472.1237487792969, -457.09765625, -442.0715637207031, -427.04547119140625, -412.0193786621094, -396.9932861328125, -381.9671936035156, -366.94110107421875, -351.9150085449219, -336.888916015625, -321.8628234863281, -306.83673095703125, -291.8106384277344, -276.7845458984375, -261.7584533691406, -246.73236083984375, -231.70626831054688, -216.68017578125, -201.65408325195312, -186.62799072265625, -171.60189819335938, -156.5758056640625, -141.54971313476562, -126.52362060546875, -111.49752807617188, -96.471435546875, -81.44534301757812, -66.41925048828125, -51.393157958984375, -36.36707305908203, -21.340980529785156, -6.314888000488281, 8.711204528808594, 23.73729705810547, 38.763389587402344, 53.78948211669922, 68.8155746459961, 83.84166717529297]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 7.0, 4.0, 15.0, 13.0, 12.0, 22.0, 22.0, 23.0, 22.0, 27.0, 31.0, 32.0, 45.0, 46.0, 53.0, 54.0, 38.0, 39.0, 44.0, 46.0, 40.0, 45.0, 48.0, 32.0, 35.0, 27.0, 18.0, 16.0, 13.0, 24.0, 14.0, 13.0, 13.0, 14.0, 12.0, 10.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.21849822998047, -39.870723724365234, -38.52294921875, -37.17517852783203, -35.8274040222168, -34.47962951660156, -33.13185501098633, -31.784080505371094, -30.43630599975586, -29.088531494140625, -27.740758895874023, -26.39298439025879, -25.045209884643555, -23.697437286376953, -22.34966278076172, -21.001888275146484, -19.654115676879883, -18.30634117126465, -16.958568572998047, -15.610794067382812, -14.263019561767578, -12.91524600982666, -11.567472457885742, -10.219697952270508, -8.87192440032959, -7.524150371551514, -6.1763763427734375, -4.8286027908325195, -3.4808287620544434, -2.133054733276367, -0.7852811813354492, 0.5624933242797852, 1.9102668762207031, 3.2580409049987793, 4.6058149337768555, 5.953588485717773, 7.30136251449585, 8.649136543273926, 9.996910095214844, 11.344684600830078, 12.692458152770996, 14.040231704711914, 15.388006210327148, 16.73577880859375, 18.083553314208984, 19.43132781982422, 20.779102325439453, 22.126876831054688, 23.47464942932129, 24.822423934936523, 26.170196533203125, 27.51797103881836, 28.865745544433594, 30.213520050048828, 31.56129264831543, 32.90906524658203, 34.256839752197266, 35.6046142578125, 36.952388763427734, 38.30016326904297, 39.64793395996094, 40.99570846557617, 42.343482971191406, 43.69125747680664, 45.039031982421875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 7.0, 11.0, 10.0, 8.0, 21.0, 24.0, 23.0, 23.0, 23.0, 35.0, 33.0, 35.0, 46.0, 54.0, 46.0, 46.0, 52.0, 49.0, 54.0, 49.0, 44.0, 39.0, 33.0, 37.0, 29.0, 28.0, 26.0, 27.0, 13.0, 10.0, 18.0, 7.0, 12.0, 8.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.56494140625, -6.3759765625, -6.18701171875, -5.998046875, -5.80908203125, -5.6201171875, -5.43115234375, -5.2421875, -5.05322265625, -4.8642578125, -4.67529296875, -4.486328125, -4.29736328125, -4.1083984375, -3.91943359375, -3.73046875, -3.54150390625, -3.3525390625, -3.16357421875, -2.974609375, -2.78564453125, -2.5966796875, -2.40771484375, -2.21875, -2.02978515625, -1.8408203125, -1.65185546875, -1.462890625, -1.27392578125, -1.0849609375, -0.89599609375, -0.70703125, -0.51806640625, -0.3291015625, -0.14013671875, 0.048828125, 0.23779296875, 0.4267578125, 0.61572265625, 0.8046875, 0.99365234375, 1.1826171875, 1.37158203125, 1.560546875, 1.74951171875, 1.9384765625, 2.12744140625, 2.31640625, 2.50537109375, 2.6943359375, 2.88330078125, 3.072265625, 3.26123046875, 3.4501953125, 3.63916015625, 3.828125, 4.01708984375, 4.2060546875, 4.39501953125, 4.583984375, 4.77294921875, 4.9619140625, 5.15087890625, 5.33984375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 7.0, 7.0, 9.0, 19.0, 22.0, 40.0, 42.0, 66.0, 97.0, 118.0, 189.0, 230.0, 357.0, 487.0, 640.0, 934.0, 1296.0, 1769.0, 2559.0, 3505.0, 5139.0, 7519.0, 11091.0, 17117.0, 26390.0, 42101.0, 69008.0, 118177.0, 191284.0, 203960.0, 133178.0, 77372.0, 46738.0, 29159.0, 18610.0, 12237.0, 8098.0, 5521.0, 3904.0, 2762.0, 1921.0, 1390.0, 944.0, 705.0, 525.0, 375.0, 297.0, 204.0, 131.0, 87.0, 80.0, 44.0, 35.0, 25.0, 15.0, 12.0, 10.0, 7.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.6220703125, -0.6020736694335938, -0.5820770263671875, -0.5620803833007812, -0.542083740234375, -0.5220870971679688, -0.5020904541015625, -0.48209381103515625, -0.46209716796875, -0.44210052490234375, -0.4221038818359375, -0.40210723876953125, -0.382110595703125, -0.36211395263671875, -0.3421173095703125, -0.32212066650390625, -0.3021240234375, -0.28212738037109375, -0.2621307373046875, -0.24213409423828125, -0.222137451171875, -0.20214080810546875, -0.1821441650390625, -0.16214752197265625, -0.14215087890625, -0.12215423583984375, -0.1021575927734375, -0.08216094970703125, -0.062164306640625, -0.04216766357421875, -0.0221710205078125, -0.00217437744140625, 0.017822265625, 0.03781890869140625, 0.0578155517578125, 0.07781219482421875, 0.097808837890625, 0.11780548095703125, 0.1378021240234375, 0.15779876708984375, 0.17779541015625, 0.19779205322265625, 0.2177886962890625, 0.23778533935546875, 0.257781982421875, 0.27777862548828125, 0.2977752685546875, 0.31777191162109375, 0.3377685546875, 0.35776519775390625, 0.3777618408203125, 0.39775848388671875, 0.417755126953125, 0.43775177001953125, 0.4577484130859375, 0.47774505615234375, 0.49774169921875, 0.5177383422851562, 0.5377349853515625, 0.5577316284179688, 0.577728271484375, 0.5977249145507812, 0.6177215576171875, 0.6377182006835938, 0.65771484375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 3.0, 1.0, 5.0, 8.0, 8.0, 6.0, 16.0, 18.0, 17.0, 21.0, 27.0, 27.0, 26.0, 27.0, 29.0, 32.0, 26.0, 38.0, 51.0, 56.0, 46.0, 1070.0, 54.0, 35.0, 38.0, 36.0, 26.0, 38.0, 33.0, 34.0, 33.0, 22.0, 22.0, 18.0, 14.0, 13.0, 12.0, 14.0, 5.0, 12.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.478515625, -3.371337890625, -3.26416015625, -3.156982421875, -3.0498046875, -2.942626953125, -2.83544921875, -2.728271484375, -2.62109375, -2.513916015625, -2.40673828125, -2.299560546875, -2.1923828125, -2.085205078125, -1.97802734375, -1.870849609375, -1.763671875, -1.656494140625, -1.54931640625, -1.442138671875, -1.3349609375, -1.227783203125, -1.12060546875, -1.013427734375, -0.90625, -0.799072265625, -0.69189453125, -0.584716796875, -0.4775390625, -0.370361328125, -0.26318359375, -0.156005859375, -0.048828125, 0.058349609375, 0.16552734375, 0.272705078125, 0.3798828125, 0.487060546875, 0.59423828125, 0.701416015625, 0.80859375, 0.915771484375, 1.02294921875, 1.130126953125, 1.2373046875, 1.344482421875, 1.45166015625, 1.558837890625, 1.666015625, 1.773193359375, 1.88037109375, 1.987548828125, 2.0947265625, 2.201904296875, 2.30908203125, 2.416259765625, 2.5234375, 2.630615234375, 2.73779296875, 2.844970703125, 2.9521484375, 3.059326171875, 3.16650390625, 3.273681640625, 3.380859375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 8.0, 5.0, 13.0, 22.0, 23.0, 41.0, 48.0, 97.0, 131.0, 217.0, 311.0, 473.0, 762.0, 1193.0, 1857.0, 3028.0, 4942.0, 7999.0, 13899.0, 23807.0, 40539.0, 71963.0, 126860.0, 217354.0, 1253651.0, 139914.0, 79021.0, 44535.0, 25740.0, 15314.0, 8946.0, 5442.0, 3285.0, 2077.0, 1323.0, 769.0, 559.0, 324.0, 210.0, 152.0, 97.0, 50.0, 45.0, 32.0, 17.0, 13.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.595703125, -0.57769775390625, -0.5596923828125, -0.54168701171875, -0.523681640625, -0.50567626953125, -0.4876708984375, -0.46966552734375, -0.45166015625, -0.43365478515625, -0.4156494140625, -0.39764404296875, -0.379638671875, -0.36163330078125, -0.3436279296875, -0.32562255859375, -0.3076171875, -0.28961181640625, -0.2716064453125, -0.25360107421875, -0.235595703125, -0.21759033203125, -0.1995849609375, -0.18157958984375, -0.16357421875, -0.14556884765625, -0.1275634765625, -0.10955810546875, -0.091552734375, -0.07354736328125, -0.0555419921875, -0.03753662109375, -0.01953125, -0.00152587890625, 0.0164794921875, 0.03448486328125, 0.052490234375, 0.07049560546875, 0.0885009765625, 0.10650634765625, 0.12451171875, 0.14251708984375, 0.1605224609375, 0.17852783203125, 0.196533203125, 0.21453857421875, 0.2325439453125, 0.25054931640625, 0.2685546875, 0.28656005859375, 0.3045654296875, 0.32257080078125, 0.340576171875, 0.35858154296875, 0.3765869140625, 0.39459228515625, 0.41259765625, 0.43060302734375, 0.4486083984375, 0.46661376953125, 0.484619140625, 0.50262451171875, 0.5206298828125, 0.53863525390625, 0.556640625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 8.0, 13.0, 14.0, 25.0, 22.0, 20.0, 39.0, 40.0, 50.0, 58.0, 53.0, 69.0, 70.0, 60.0, 73.0, 58.0, 58.0, 42.0, 46.0, 43.0, 24.0, 14.0, 17.0, 12.0, 14.0, 7.0, 6.0, 11.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0023441314697265625, -0.0022708475589752197, -0.002197563648223877, -0.002124279737472534, -0.0020509958267211914, -0.0019777119159698486, -0.0019044280052185059, -0.001831144094467163, -0.0017578601837158203, -0.0016845762729644775, -0.0016112923622131348, -0.001538008451461792, -0.0014647245407104492, -0.0013914406299591064, -0.0013181567192077637, -0.001244872808456421, -0.0011715888977050781, -0.0010983049869537354, -0.0010250210762023926, -0.0009517371654510498, -0.000878453254699707, -0.0008051693439483643, -0.0007318854331970215, -0.0006586015224456787, -0.0005853176116943359, -0.0005120337009429932, -0.0004387497901916504, -0.0003654658794403076, -0.00029218196868896484, -0.00021889805793762207, -0.0001456141471862793, -7.233023643493652e-05, 9.5367431640625e-07, 7.423758506774902e-05, 0.0001475214958190918, 0.00022080540657043457, 0.00029408931732177734, 0.0003673732280731201, 0.0004406571388244629, 0.0005139410495758057, 0.0005872249603271484, 0.0006605088710784912, 0.000733792781829834, 0.0008070766925811768, 0.0008803606033325195, 0.0009536445140838623, 0.001026928424835205, 0.0011002123355865479, 0.0011734962463378906, 0.0012467801570892334, 0.0013200640678405762, 0.001393347978591919, 0.0014666318893432617, 0.0015399158000946045, 0.0016131997108459473, 0.00168648362159729, 0.0017597675323486328, 0.0018330514430999756, 0.0019063353538513184, 0.001979619264602661, 0.002052903175354004, 0.0021261870861053467, 0.0021994709968566895, 0.0022727549076080322, 0.002346038818359375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 5.0, 11.0, 18.0, 23.0, 28.0, 30.0, 42.0, 49.0, 79.0, 132.0, 176.0, 300.0, 453.0, 928.0, 21364.0, 1020948.0, 2171.0, 636.0, 362.0, 213.0, 158.0, 97.0, 81.0, 66.0, 47.0, 32.0, 25.0, 13.0, 15.0, 10.0, 3.0, 6.0, 2.0, 0.0, 7.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04681396484375, -0.045317649841308594, -0.04382133483886719, -0.04232501983642578, -0.040828704833984375, -0.03933238983154297, -0.03783607482910156, -0.036339759826660156, -0.03484344482421875, -0.033347129821777344, -0.03185081481933594, -0.03035449981689453, -0.028858184814453125, -0.02736186981201172, -0.025865554809570312, -0.024369239807128906, -0.0228729248046875, -0.021376609802246094, -0.019880294799804688, -0.01838397979736328, -0.016887664794921875, -0.015391349792480469, -0.013895034790039062, -0.012398719787597656, -0.01090240478515625, -0.009406089782714844, -0.007909774780273438, -0.006413459777832031, -0.004917144775390625, -0.0034208297729492188, -0.0019245147705078125, -0.00042819976806640625, 0.001068115234375, 0.0025644302368164062, 0.0040607452392578125, 0.005557060241699219, 0.007053375244140625, 0.008549690246582031, 0.010046005249023438, 0.011542320251464844, 0.01303863525390625, 0.014534950256347656, 0.016031265258789062, 0.01752758026123047, 0.019023895263671875, 0.02052021026611328, 0.022016525268554688, 0.023512840270996094, 0.0250091552734375, 0.026505470275878906, 0.028001785278320312, 0.02949810028076172, 0.030994415283203125, 0.03249073028564453, 0.03398704528808594, 0.035483360290527344, 0.03697967529296875, 0.038475990295410156, 0.03997230529785156, 0.04146862030029297, 0.042964935302734375, 0.04446125030517578, 0.04595756530761719, 0.047453880310058594, 0.0489501953125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 752.0, 263.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011446215212345123, -0.00053387664956972, 7.686822209507227e-05, 0.0006876131519675255, 0.0012983579654246569, 0.0019091027788817883, 0.0025198478251695633, 0.003130592405796051, 0.003741337452083826, 0.004352082498371601, 0.004962827078998089, 0.005573572125285864, 0.006184317171573639, 0.006795061752200127, 0.007405806798487902, 0.008016550913453102, 0.008627296425402164, 0.009238041006028652, 0.009848786517977715, 0.010459531098604202, 0.01107027567923069, 0.011681020259857178, 0.01229176577180624, 0.012902510352432728, 0.01351325586438179, 0.014124000445008278, 0.01473474595695734, 0.015345490537583828, 0.01595623604953289, 0.016566980630159378, 0.017177725210785866, 0.017788469791412354, 0.01839921437203884, 0.01900995895266533, 0.019620703533291817, 0.020231448113918304, 0.02084219455718994, 0.02145293913781643, 0.022063683718442917, 0.022674428299069405, 0.023285172879695892, 0.02389591746032238, 0.024506662040948868, 0.025117408484220505, 0.025728153064846992, 0.02633889764547348, 0.026949642226099968, 0.027560386806726456, 0.028171133249998093, 0.02878187783062458, 0.029392622411251068, 0.030003368854522705, 0.030614113435149193, 0.03122485801577568, 0.03183560073375702, 0.032446347177028656, 0.033057089895009995, 0.03366783633828163, 0.03427857905626297, 0.03488932549953461, 0.035500068217515945, 0.03611081466078758, 0.03672155737876892, 0.03733230382204056, 0.037943050265312195]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 13.0, 15.0, 17.0, 29.0, 29.0, 35.0, 40.0, 44.0, 43.0, 52.0, 59.0, 50.0, 57.0, 62.0, 51.0, 49.0, 43.0, 50.0, 40.0, 30.0, 35.0, 27.0, 27.0, 24.0, 14.0, 19.0, 11.0, 7.0, 7.0, 1.0, 8.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.0020979642868041992, -0.002047979272902012, -0.0019979942589998245, -0.0019480092450976372, -0.0018980242311954498, -0.0018480392172932625, -0.0017980542033910751, -0.0017480691894888878, -0.0016980841755867004, -0.001648099161684513, -0.0015981141477823257, -0.0015481291338801384, -0.001498144119977951, -0.0014481591060757637, -0.0013981740921735764, -0.001348189078271389, -0.0012982040643692017, -0.0012482190504670143, -0.001198234036564827, -0.0011482490226626396, -0.0010982640087604523, -0.001048278994858265, -0.0009982939809560776, -0.0009483089670538902, -0.0008983239531517029, -0.0008483389392495155, -0.0007983539253473282, -0.0007483689114451408, -0.0006983838975429535, -0.0006483988836407661, -0.0005984138697385788, -0.0005484288558363914, -0.0004984438419342041, -0.00044845882803201675, -0.0003984738141298294, -0.00034848880022764206, -0.0002985037863254547, -0.00024851877242326736, -0.00019853375852108002, -0.00014854874461889267, -9.856373071670532e-05, -4.8578716814517975e-05, 1.4062970876693726e-06, 5.139131098985672e-05, 0.00010137632489204407, 0.00015136133879423141, 0.00020134635269641876, 0.0002513313665986061, 0.00030131638050079346, 0.0003513013944029808, 0.00040128640830516815, 0.0004512714222073555, 0.0005012564361095428, 0.0005512414500117302, 0.0006012264639139175, 0.0006512114778161049, 0.0007011964917182922, 0.0007511815056204796, 0.0008011665195226669, 0.0008511515334248543, 0.0009011365473270416, 0.000951121561229229, 0.0010011065751314163, 0.0010510915890336037, 0.001101076602935791]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 7.0, 11.0, 10.0, 8.0, 21.0, 24.0, 23.0, 23.0, 23.0, 35.0, 33.0, 35.0, 46.0, 54.0, 46.0, 46.0, 52.0, 49.0, 54.0, 49.0, 44.0, 39.0, 33.0, 37.0, 29.0, 28.0, 26.0, 27.0, 13.0, 10.0, 18.0, 7.0, 12.0, 8.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.56494140625, -6.3759765625, -6.18701171875, -5.998046875, -5.80908203125, -5.6201171875, -5.43115234375, -5.2421875, -5.05322265625, -4.8642578125, -4.67529296875, -4.486328125, -4.29736328125, -4.1083984375, -3.91943359375, -3.73046875, -3.54150390625, -3.3525390625, -3.16357421875, -2.974609375, -2.78564453125, -2.5966796875, -2.40771484375, -2.21875, -2.02978515625, -1.8408203125, -1.65185546875, -1.462890625, -1.27392578125, -1.0849609375, -0.89599609375, -0.70703125, -0.51806640625, -0.3291015625, -0.14013671875, 0.048828125, 0.23779296875, 0.4267578125, 0.61572265625, 0.8046875, 0.99365234375, 1.1826171875, 1.37158203125, 1.560546875, 1.74951171875, 1.9384765625, 2.12744140625, 2.31640625, 2.50537109375, 2.6943359375, 2.88330078125, 3.072265625, 3.26123046875, 3.4501953125, 3.63916015625, 3.828125, 4.01708984375, 4.2060546875, 4.39501953125, 4.583984375, 4.77294921875, 4.9619140625, 5.15087890625, 5.33984375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 0.0, 3.0, 5.0, 5.0, 10.0, 11.0, 23.0, 28.0, 27.0, 61.0, 82.0, 119.0, 169.0, 253.0, 374.0, 566.0, 819.0, 1424.0, 2236.0, 4419.0, 11927.0, 76621.0, 718412.0, 197393.0, 20207.0, 5856.0, 2928.0, 1537.0, 1019.0, 685.0, 449.0, 248.0, 199.0, 139.0, 103.0, 63.0, 35.0, 34.0, 13.0, 19.0, 15.0, 11.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.765625, -13.28564453125, -12.8056640625, -12.32568359375, -11.845703125, -11.36572265625, -10.8857421875, -10.40576171875, -9.92578125, -9.44580078125, -8.9658203125, -8.48583984375, -8.005859375, -7.52587890625, -7.0458984375, -6.56591796875, -6.0859375, -5.60595703125, -5.1259765625, -4.64599609375, -4.166015625, -3.68603515625, -3.2060546875, -2.72607421875, -2.24609375, -1.76611328125, -1.2861328125, -0.80615234375, -0.326171875, 0.15380859375, 0.6337890625, 1.11376953125, 1.59375, 2.07373046875, 2.5537109375, 3.03369140625, 3.513671875, 3.99365234375, 4.4736328125, 4.95361328125, 5.43359375, 5.91357421875, 6.3935546875, 6.87353515625, 7.353515625, 7.83349609375, 8.3134765625, 8.79345703125, 9.2734375, 9.75341796875, 10.2333984375, 10.71337890625, 11.193359375, 11.67333984375, 12.1533203125, 12.63330078125, 13.11328125, 13.59326171875, 14.0732421875, 14.55322265625, 15.033203125, 15.51318359375, 15.9931640625, 16.47314453125, 16.953125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 7.0, 3.0, 7.0, 10.0, 12.0, 13.0, 19.0, 21.0, 25.0, 23.0, 42.0, 41.0, 30.0, 52.0, 57.0, 83.0, 215.0, 1654.0, 246.0, 89.0, 63.0, 51.0, 48.0, 37.0, 39.0, 20.0, 26.0, 25.0, 12.0, 12.0, 13.0, 9.0, 8.0, 4.0, 11.0, 5.0, 8.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.03125, -13.556640625, -13.08203125, -12.607421875, -12.1328125, -11.658203125, -11.18359375, -10.708984375, -10.234375, -9.759765625, -9.28515625, -8.810546875, -8.3359375, -7.861328125, -7.38671875, -6.912109375, -6.4375, -5.962890625, -5.48828125, -5.013671875, -4.5390625, -4.064453125, -3.58984375, -3.115234375, -2.640625, -2.166015625, -1.69140625, -1.216796875, -0.7421875, -0.267578125, 0.20703125, 0.681640625, 1.15625, 1.630859375, 2.10546875, 2.580078125, 3.0546875, 3.529296875, 4.00390625, 4.478515625, 4.953125, 5.427734375, 5.90234375, 6.376953125, 6.8515625, 7.326171875, 7.80078125, 8.275390625, 8.75, 9.224609375, 9.69921875, 10.173828125, 10.6484375, 11.123046875, 11.59765625, 12.072265625, 12.546875, 13.021484375, 13.49609375, 13.970703125, 14.4453125, 14.919921875, 15.39453125, 15.869140625, 16.34375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 6.0, 10.0, 13.0, 11.0, 20.0, 32.0, 26.0, 38.0, 45.0, 73.0, 70.0, 119.0, 167.0, 257.0, 492.0, 1067.0, 9359.0, 3118035.0, 13236.0, 1197.0, 496.0, 252.0, 183.0, 115.0, 92.0, 71.0, 56.0, 30.0, 28.0, 30.0, 25.0, 14.0, 6.0, 3.0, 2.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.8125, -42.4658203125, -41.119140625, -39.7724609375, -38.42578125, -37.0791015625, -35.732421875, -34.3857421875, -33.0390625, -31.6923828125, -30.345703125, -28.9990234375, -27.65234375, -26.3056640625, -24.958984375, -23.6123046875, -22.265625, -20.9189453125, -19.572265625, -18.2255859375, -16.87890625, -15.5322265625, -14.185546875, -12.8388671875, -11.4921875, -10.1455078125, -8.798828125, -7.4521484375, -6.10546875, -4.7587890625, -3.412109375, -2.0654296875, -0.71875, 0.6279296875, 1.974609375, 3.3212890625, 4.66796875, 6.0146484375, 7.361328125, 8.7080078125, 10.0546875, 11.4013671875, 12.748046875, 14.0947265625, 15.44140625, 16.7880859375, 18.134765625, 19.4814453125, 20.828125, 22.1748046875, 23.521484375, 24.8681640625, 26.21484375, 27.5615234375, 28.908203125, 30.2548828125, 31.6015625, 32.9482421875, 34.294921875, 35.6416015625, 36.98828125, 38.3349609375, 39.681640625, 41.0283203125, 42.375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 20.0, 77.0, 179.0, 333.0, 257.0, 88.0, 39.0, 10.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.76789093017578, -79.79903411865234, -77.8301773071289, -75.86132049560547, -73.89246368408203, -71.9236068725586, -69.95475006103516, -67.98589324951172, -66.01703643798828, -64.04817962646484, -62.079322814941406, -60.11046600341797, -58.14160919189453, -56.172752380371094, -54.203895568847656, -52.23503875732422, -50.26618194580078, -48.297325134277344, -46.328468322753906, -44.35961151123047, -42.39075469970703, -40.421897888183594, -38.453041076660156, -36.48418426513672, -34.51533126831055, -32.54647445678711, -30.577617645263672, -28.608760833740234, -26.639904022216797, -24.67104721069336, -22.702190399169922, -20.733333587646484, -18.764476776123047, -16.79561996459961, -14.826763153076172, -12.857906341552734, -10.889049530029297, -8.920193672180176, -6.951336860656738, -4.982480049133301, -3.0136232376098633, -1.0447665452957153, 0.9240901470184326, 2.892946720123291, 4.8618035316467285, 6.830659866333008, 8.799516677856445, 10.768373489379883, 12.73723030090332, 14.706087112426758, 16.674943923950195, 18.643800735473633, 20.61265754699707, 22.581512451171875, 24.550369262695312, 26.51922607421875, 28.488082885742188, 30.456939697265625, 32.42579650878906, 34.3946533203125, 36.36351013183594, 38.332366943359375, 40.30122375488281, 42.27008056640625, 44.23893737792969]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 6.0, 7.0, 6.0, 10.0, 12.0, 14.0, 12.0, 22.0, 21.0, 37.0, 30.0, 35.0, 36.0, 36.0, 34.0, 58.0, 54.0, 48.0, 46.0, 46.0, 46.0, 37.0, 41.0, 45.0, 36.0, 34.0, 36.0, 23.0, 15.0, 18.0, 18.0, 18.0, 19.0, 13.0, 9.0, 2.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.32217788696289, -34.93650817871094, -33.55084228515625, -32.1651725769043, -30.779502868652344, -29.393835067749023, -28.008167266845703, -26.62249755859375, -25.23682975769043, -23.85116195678711, -22.465492248535156, -21.079824447631836, -19.694156646728516, -18.308486938476562, -16.922819137573242, -15.537150382995605, -14.151481628417969, -12.765812873840332, -11.380144119262695, -9.994476318359375, -8.608807563781738, -7.223138809204102, -5.837471008300781, -4.4518022537231445, -3.066133499145508, -1.6804649829864502, -0.2947964668273926, 1.090871810913086, 2.4765405654907227, 3.8622093200683594, 5.24787712097168, 6.633545875549316, 8.019218444824219, 9.404887199401855, 10.790555953979492, 12.176223754882812, 13.56189250946045, 14.947561264038086, 16.333229064941406, 17.71889877319336, 19.10456657409668, 20.490234375, 21.875904083251953, 23.261571884155273, 24.647239685058594, 26.032909393310547, 27.418577194213867, 28.804244995117188, 30.18991470336914, 31.57558250427246, 32.96125030517578, 34.346920013427734, 35.73258972167969, 37.118255615234375, 38.50392532348633, 39.88959503173828, 41.27526092529297, 42.66093063354492, 44.04659652709961, 45.43226623535156, 46.817935943603516, 48.20360565185547, 49.589271545410156, 50.97494125366211, 52.36061096191406]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 8.0, 6.0, 7.0, 13.0, 20.0, 21.0, 14.0, 25.0, 37.0, 27.0, 39.0, 46.0, 52.0, 52.0, 56.0, 55.0, 50.0, 48.0, 52.0, 52.0, 37.0, 40.0, 43.0, 33.0, 23.0, 33.0, 25.0, 18.0, 15.0, 9.0, 7.0, 10.0, 6.0, 7.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-8.4453125, -8.23016357421875, -8.0150146484375, -7.79986572265625, -7.584716796875, -7.36956787109375, -7.1544189453125, -6.93927001953125, -6.72412109375, -6.50897216796875, -6.2938232421875, -6.07867431640625, -5.863525390625, -5.64837646484375, -5.4332275390625, -5.21807861328125, -5.0029296875, -4.78778076171875, -4.5726318359375, -4.35748291015625, -4.142333984375, -3.92718505859375, -3.7120361328125, -3.49688720703125, -3.28173828125, -3.06658935546875, -2.8514404296875, -2.63629150390625, -2.421142578125, -2.20599365234375, -1.9908447265625, -1.77569580078125, -1.560546875, -1.34539794921875, -1.1302490234375, -0.91510009765625, -0.699951171875, -0.48480224609375, -0.2696533203125, -0.05450439453125, 0.16064453125, 0.37579345703125, 0.5909423828125, 0.80609130859375, 1.021240234375, 1.23638916015625, 1.4515380859375, 1.66668701171875, 1.8818359375, 2.09698486328125, 2.3121337890625, 2.52728271484375, 2.742431640625, 2.95758056640625, 3.1727294921875, 3.38787841796875, 3.60302734375, 3.81817626953125, 4.0333251953125, 4.24847412109375, 4.463623046875, 4.67877197265625, 4.8939208984375, 5.10906982421875, 5.32421875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 2.0, 5.0, 10.0, 11.0, 14.0, 18.0, 25.0, 36.0, 40.0, 60.0, 61.0, 107.0, 166.0, 196.0, 319.0, 512.0, 774.0, 1377.0, 2452.0, 4824.0, 10949.0, 38124.0, 260956.0, 1456664.0, 1921304.0, 407484.0, 60104.0, 14695.0, 6000.0, 2836.0, 1574.0, 913.0, 556.0, 351.0, 231.0, 152.0, 105.0, 81.0, 45.0, 41.0, 21.0, 14.0, 32.0, 14.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-9.5, -9.2215576171875, -8.943115234375, -8.6646728515625, -8.38623046875, -8.1077880859375, -7.829345703125, -7.5509033203125, -7.2724609375, -6.9940185546875, -6.715576171875, -6.4371337890625, -6.15869140625, -5.8802490234375, -5.601806640625, -5.3233642578125, -5.044921875, -4.7664794921875, -4.488037109375, -4.2095947265625, -3.93115234375, -3.6527099609375, -3.374267578125, -3.0958251953125, -2.8173828125, -2.5389404296875, -2.260498046875, -1.9820556640625, -1.70361328125, -1.4251708984375, -1.146728515625, -0.8682861328125, -0.58984375, -0.3114013671875, -0.032958984375, 0.2454833984375, 0.52392578125, 0.8023681640625, 1.080810546875, 1.3592529296875, 1.6376953125, 1.9161376953125, 2.194580078125, 2.4730224609375, 2.75146484375, 3.0299072265625, 3.308349609375, 3.5867919921875, 3.865234375, 4.1436767578125, 4.422119140625, 4.7005615234375, 4.97900390625, 5.2574462890625, 5.535888671875, 5.8143310546875, 6.0927734375, 6.3712158203125, 6.649658203125, 6.9281005859375, 7.20654296875, 7.4849853515625, 7.763427734375, 8.0418701171875, 8.3203125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 9.0, 19.0, 86.0, 247.0, 625.0, 1685.0, 956.0, 328.0, 94.0, 19.0, 13.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.34619140625, -31.2548828125, -30.16357421875, -29.072265625, -27.98095703125, -26.8896484375, -25.79833984375, -24.70703125, -23.61572265625, -22.5244140625, -21.43310546875, -20.341796875, -19.25048828125, -18.1591796875, -17.06787109375, -15.9765625, -14.88525390625, -13.7939453125, -12.70263671875, -11.611328125, -10.52001953125, -9.4287109375, -8.33740234375, -7.24609375, -6.15478515625, -5.0634765625, -3.97216796875, -2.880859375, -1.78955078125, -0.6982421875, 0.39306640625, 1.484375, 2.57568359375, 3.6669921875, 4.75830078125, 5.849609375, 6.94091796875, 8.0322265625, 9.12353515625, 10.21484375, 11.30615234375, 12.3974609375, 13.48876953125, 14.580078125, 15.67138671875, 16.7626953125, 17.85400390625, 18.9453125, 20.03662109375, 21.1279296875, 22.21923828125, 23.310546875, 24.40185546875, 25.4931640625, 26.58447265625, 27.67578125, 28.76708984375, 29.8583984375, 30.94970703125, 32.041015625, 33.13232421875, 34.2236328125, 35.31494140625, 36.40625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 12.0, 28.0, 56.0, 175.0, 565.0, 1972.0, 73297.0, 4111303.0, 5234.0, 1072.0, 318.0, 126.0, 50.0, 21.0, 12.0, 5.0, 7.0, 5.0, 1.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.0625, -53.30078125, -51.5390625, -49.77734375, -48.015625, -46.25390625, -44.4921875, -42.73046875, -40.96875, -39.20703125, -37.4453125, -35.68359375, -33.921875, -32.16015625, -30.3984375, -28.63671875, -26.875, -25.11328125, -23.3515625, -21.58984375, -19.828125, -18.06640625, -16.3046875, -14.54296875, -12.78125, -11.01953125, -9.2578125, -7.49609375, -5.734375, -3.97265625, -2.2109375, -0.44921875, 1.3125, 3.07421875, 4.8359375, 6.59765625, 8.359375, 10.12109375, 11.8828125, 13.64453125, 15.40625, 17.16796875, 18.9296875, 20.69140625, 22.453125, 24.21484375, 25.9765625, 27.73828125, 29.5, 31.26171875, 33.0234375, 34.78515625, 36.546875, 38.30859375, 40.0703125, 41.83203125, 43.59375, 45.35546875, 47.1171875, 48.87890625, 50.640625, 52.40234375, 54.1640625, 55.92578125, 57.6875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 37.0, 278.0, 505.0, 174.0, 14.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.3079833984375, -119.59233093261719, -114.8766860961914, -110.16104125976562, -105.44538879394531, -100.729736328125, -96.01409149169922, -91.29844665527344, -86.58279418945312, -81.86714172363281, -77.15149688720703, -72.43585205078125, -67.72019958496094, -63.00455093383789, -58.288902282714844, -53.5732536315918, -48.85760498046875, -44.1419563293457, -39.426307678222656, -34.71065902709961, -29.995010375976562, -25.279361724853516, -20.56371307373047, -15.848064422607422, -11.132415771484375, -6.416767120361328, -1.7011184692382812, 3.0145301818847656, 7.7301788330078125, 12.44582748413086, 17.161476135253906, 21.877124786376953, 26.592758178710938, 31.308406829833984, 36.02405548095703, 40.73970413208008, 45.455352783203125, 50.17100143432617, 54.88665008544922, 59.602298736572266, 64.31794738769531, 69.03359985351562, 73.7492446899414, 78.46488952636719, 83.1805419921875, 87.89619445800781, 92.6118392944336, 97.32748413085938, 102.04313659667969, 106.7587890625, 111.47443389892578, 116.19007873535156, 120.90573120117188, 125.62138366699219, 130.3370361328125, 135.05267333984375, 139.76832580566406, 144.48397827148438, 149.19961547851562, 153.91526794433594, 158.63092041015625, 163.34657287597656, 168.06222534179688, 172.77786254882812, 177.49351501464844]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 4.0, 6.0, 5.0, 6.0, 7.0, 19.0, 19.0, 13.0, 24.0, 26.0, 26.0, 28.0, 29.0, 47.0, 41.0, 51.0, 37.0, 42.0, 39.0, 57.0, 42.0, 42.0, 44.0, 46.0, 41.0, 24.0, 39.0, 29.0, 28.0, 20.0, 18.0, 9.0, 16.0, 12.0, 8.0, 16.0, 8.0, 10.0, 3.0, 5.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.028053283691406, -37.715789794921875, -36.403526306152344, -35.09126281738281, -33.77899932861328, -32.46673583984375, -31.154470443725586, -29.842205047607422, -28.52994155883789, -27.21767807006836, -25.905414581298828, -24.593151092529297, -23.280885696411133, -21.9686222076416, -20.65635871887207, -19.344093322753906, -18.031831741333008, -16.719568252563477, -15.407303810119629, -14.095040321350098, -12.78277587890625, -11.470512390136719, -10.158248901367188, -8.84598445892334, -7.533720970153809, -6.221457004547119, -4.90919303894043, -3.5969295501708984, -2.284665584564209, -0.9724016189575195, 0.3398618698120117, 1.6521263122558594, 2.9643898010253906, 4.27665376663208, 5.5889177322387695, 6.901181221008301, 8.213445663452148, 9.52570915222168, 10.837972640991211, 12.150237083435059, 13.46250057220459, 14.774764060974121, 16.08702850341797, 17.3992919921875, 18.71155548095703, 20.023818969726562, 21.336082458496094, 22.648347854614258, 23.96061134338379, 25.27287483215332, 26.58513832092285, 27.897403717041016, 29.209667205810547, 30.521930694580078, 31.83419418334961, 33.14645767211914, 34.45872116088867, 35.7709846496582, 37.083248138427734, 38.395511627197266, 39.7077751159668, 41.020042419433594, 42.332305908203125, 43.644569396972656, 44.95683288574219]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 0.0, 4.0, 6.0, 2.0, 3.0, 10.0, 4.0, 8.0, 9.0, 11.0, 8.0, 13.0, 17.0, 14.0, 15.0, 30.0, 29.0, 27.0, 33.0, 24.0, 43.0, 29.0, 30.0, 41.0, 33.0, 40.0, 48.0, 47.0, 43.0, 48.0, 39.0, 36.0, 34.0, 32.0, 35.0, 23.0, 24.0, 25.0, 10.0, 14.0, 10.0, 9.0, 6.0, 6.0, 4.0, 8.0, 2.0, 4.0, 3.0, 7.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-3.8359375, -3.70758056640625, -3.5792236328125, -3.45086669921875, -3.322509765625, -3.19415283203125, -3.0657958984375, -2.93743896484375, -2.80908203125, -2.68072509765625, -2.5523681640625, -2.42401123046875, -2.295654296875, -2.16729736328125, -2.0389404296875, -1.91058349609375, -1.7822265625, -1.65386962890625, -1.5255126953125, -1.39715576171875, -1.268798828125, -1.14044189453125, -1.0120849609375, -0.88372802734375, -0.75537109375, -0.62701416015625, -0.4986572265625, -0.37030029296875, -0.241943359375, -0.11358642578125, 0.0147705078125, 0.14312744140625, 0.271484375, 0.39984130859375, 0.5281982421875, 0.65655517578125, 0.784912109375, 0.91326904296875, 1.0416259765625, 1.16998291015625, 1.29833984375, 1.42669677734375, 1.5550537109375, 1.68341064453125, 1.811767578125, 1.94012451171875, 2.0684814453125, 2.19683837890625, 2.3251953125, 2.45355224609375, 2.5819091796875, 2.71026611328125, 2.838623046875, 2.96697998046875, 3.0953369140625, 3.22369384765625, 3.35205078125, 3.48040771484375, 3.6087646484375, 3.73712158203125, 3.865478515625, 3.99383544921875, 4.1221923828125, 4.25054931640625, 4.37890625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 17.0, 18.0, 12.0, 34.0, 47.0, 88.0, 114.0, 157.0, 199.0, 313.0, 403.0, 595.0, 883.0, 1269.0, 1951.0, 2957.0, 4450.0, 6854.0, 10989.0, 17409.0, 29387.0, 52234.0, 97966.0, 185731.0, 255804.0, 169070.0, 89091.0, 47916.0, 26940.0, 16506.0, 10110.0, 6404.0, 4039.0, 2824.0, 1875.0, 1231.0, 834.0, 591.0, 349.0, 259.0, 174.0, 136.0, 115.0, 73.0, 49.0, 30.0, 24.0, 15.0, 12.0, 11.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.58935546875, -0.5699844360351562, -0.5506134033203125, -0.5312423706054688, -0.511871337890625, -0.49250030517578125, -0.4731292724609375, -0.45375823974609375, -0.43438720703125, -0.41501617431640625, -0.3956451416015625, -0.37627410888671875, -0.356903076171875, -0.33753204345703125, -0.3181610107421875, -0.29878997802734375, -0.2794189453125, -0.26004791259765625, -0.2406768798828125, -0.22130584716796875, -0.201934814453125, -0.18256378173828125, -0.1631927490234375, -0.14382171630859375, -0.12445068359375, -0.10507965087890625, -0.0857086181640625, -0.06633758544921875, -0.046966552734375, -0.02759552001953125, -0.0082244873046875, 0.01114654541015625, 0.030517578125, 0.04988861083984375, 0.0692596435546875, 0.08863067626953125, 0.108001708984375, 0.12737274169921875, 0.1467437744140625, 0.16611480712890625, 0.18548583984375, 0.20485687255859375, 0.2242279052734375, 0.24359893798828125, 0.262969970703125, 0.28234100341796875, 0.3017120361328125, 0.32108306884765625, 0.3404541015625, 0.35982513427734375, 0.3791961669921875, 0.39856719970703125, 0.417938232421875, 0.43730926513671875, 0.4566802978515625, 0.47605133056640625, 0.49542236328125, 0.5147933959960938, 0.5341644287109375, 0.5535354614257812, 0.572906494140625, 0.5922775268554688, 0.6116485595703125, 0.6310195922851562, 0.650390625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 6.0, 10.0, 11.0, 14.0, 22.0, 18.0, 23.0, 29.0, 28.0, 35.0, 29.0, 33.0, 31.0, 31.0, 40.0, 35.0, 41.0, 40.0, 1072.0, 41.0, 34.0, 39.0, 31.0, 35.0, 31.0, 22.0, 26.0, 22.0, 27.0, 21.0, 16.0, 16.0, 13.0, 15.0, 10.0, 15.0, 11.0, 9.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.859375, -2.778076171875, -2.69677734375, -2.615478515625, -2.5341796875, -2.452880859375, -2.37158203125, -2.290283203125, -2.208984375, -2.127685546875, -2.04638671875, -1.965087890625, -1.8837890625, -1.802490234375, -1.72119140625, -1.639892578125, -1.55859375, -1.477294921875, -1.39599609375, -1.314697265625, -1.2333984375, -1.152099609375, -1.07080078125, -0.989501953125, -0.908203125, -0.826904296875, -0.74560546875, -0.664306640625, -0.5830078125, -0.501708984375, -0.42041015625, -0.339111328125, -0.2578125, -0.176513671875, -0.09521484375, -0.013916015625, 0.0673828125, 0.148681640625, 0.22998046875, 0.311279296875, 0.392578125, 0.473876953125, 0.55517578125, 0.636474609375, 0.7177734375, 0.799072265625, 0.88037109375, 0.961669921875, 1.04296875, 1.124267578125, 1.20556640625, 1.286865234375, 1.3681640625, 1.449462890625, 1.53076171875, 1.612060546875, 1.693359375, 1.774658203125, 1.85595703125, 1.937255859375, 2.0185546875, 2.099853515625, 2.18115234375, 2.262451171875, 2.34375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 6.0, 10.0, 21.0, 20.0, 37.0, 62.0, 90.0, 128.0, 225.0, 348.0, 599.0, 958.0, 1519.0, 2646.0, 4361.0, 7299.0, 12503.0, 21733.0, 37855.0, 69330.0, 127592.0, 230837.0, 1267561.0, 139119.0, 74551.0, 41511.0, 23384.0, 13296.0, 7764.0, 4641.0, 2717.0, 1701.0, 1027.0, 642.0, 345.0, 251.0, 162.0, 85.0, 73.0, 43.0, 28.0, 18.0, 9.0, 9.0, 11.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5283203125, -0.5113143920898438, -0.4943084716796875, -0.47730255126953125, -0.460296630859375, -0.44329071044921875, -0.4262847900390625, -0.40927886962890625, -0.39227294921875, -0.37526702880859375, -0.3582611083984375, -0.34125518798828125, -0.324249267578125, -0.30724334716796875, -0.2902374267578125, -0.27323150634765625, -0.2562255859375, -0.23921966552734375, -0.2222137451171875, -0.20520782470703125, -0.188201904296875, -0.17119598388671875, -0.1541900634765625, -0.13718414306640625, -0.12017822265625, -0.10317230224609375, -0.0861663818359375, -0.06916046142578125, -0.052154541015625, -0.03514862060546875, -0.0181427001953125, -0.00113677978515625, 0.015869140625, 0.03287506103515625, 0.0498809814453125, 0.06688690185546875, 0.083892822265625, 0.10089874267578125, 0.1179046630859375, 0.13491058349609375, 0.15191650390625, 0.16892242431640625, 0.1859283447265625, 0.20293426513671875, 0.219940185546875, 0.23694610595703125, 0.2539520263671875, 0.27095794677734375, 0.2879638671875, 0.30496978759765625, 0.3219757080078125, 0.33898162841796875, 0.355987548828125, 0.37299346923828125, 0.3899993896484375, 0.40700531005859375, 0.42401123046875, 0.44101715087890625, 0.4580230712890625, 0.47502899169921875, 0.492034912109375, 0.5090408325195312, 0.5260467529296875, 0.5430526733398438, 0.56005859375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 9.0, 4.0, 8.0, 12.0, 15.0, 24.0, 20.0, 43.0, 37.0, 63.0, 54.0, 68.0, 66.0, 85.0, 77.0, 85.0, 67.0, 51.0, 40.0, 41.0, 36.0, 28.0, 10.0, 10.0, 12.0, 5.0, 6.0, 6.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015535354614257812, -0.00149555504322052, -0.0014375746250152588, -0.0013795942068099976, -0.0013216137886047363, -0.001263633370399475, -0.0012056529521942139, -0.0011476725339889526, -0.0010896921157836914, -0.0010317116975784302, -0.0009737312793731689, -0.0009157508611679077, -0.0008577704429626465, -0.0007997900247573853, -0.000741809606552124, -0.0006838291883468628, -0.0006258487701416016, -0.0005678683519363403, -0.0005098879337310791, -0.00045190751552581787, -0.00039392709732055664, -0.0003359466791152954, -0.0002779662609100342, -0.00021998584270477295, -0.00016200542449951172, -0.00010402500629425049, -4.604458808898926e-05, 1.1935830116271973e-05, 6.99162483215332e-05, 0.00012789666652679443, 0.00018587708473205566, 0.0002438575029373169, 0.0003018379211425781, 0.00035981833934783936, 0.0004177987575531006, 0.0004757791757583618, 0.000533759593963623, 0.0005917400121688843, 0.0006497204303741455, 0.0007077008485794067, 0.000765681266784668, 0.0008236616849899292, 0.0008816421031951904, 0.0009396225214004517, 0.0009976029396057129, 0.0010555833578109741, 0.0011135637760162354, 0.0011715441942214966, 0.0012295246124267578, 0.001287505030632019, 0.0013454854488372803, 0.0014034658670425415, 0.0014614462852478027, 0.001519426703453064, 0.0015774071216583252, 0.0016353875398635864, 0.0016933679580688477, 0.0017513483762741089, 0.0018093287944793701, 0.0018673092126846313, 0.0019252896308898926, 0.001983270049095154, 0.002041250467300415, 0.0020992308855056763, 0.0021572113037109375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 9.0, 8.0, 6.0, 18.0, 18.0, 25.0, 36.0, 39.0, 45.0, 76.0, 88.0, 129.0, 190.0, 321.0, 483.0, 950.0, 8580.0, 1032903.0, 2423.0, 791.0, 427.0, 288.0, 175.0, 132.0, 90.0, 67.0, 65.0, 35.0, 26.0, 26.0, 15.0, 18.0, 6.0, 6.0, 8.0, 6.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03228759765625, -0.031258583068847656, -0.030229568481445312, -0.02920055389404297, -0.028171539306640625, -0.02714252471923828, -0.026113510131835938, -0.025084495544433594, -0.02405548095703125, -0.023026466369628906, -0.021997451782226562, -0.02096843719482422, -0.019939422607421875, -0.01891040802001953, -0.017881393432617188, -0.016852378845214844, -0.0158233642578125, -0.014794349670410156, -0.013765335083007812, -0.012736320495605469, -0.011707305908203125, -0.010678291320800781, -0.009649276733398438, -0.008620262145996094, -0.00759124755859375, -0.006562232971191406, -0.0055332183837890625, -0.004504203796386719, -0.003475189208984375, -0.0024461746215820312, -0.0014171600341796875, -0.00038814544677734375, 0.000640869140625, 0.0016698837280273438, 0.0026988983154296875, 0.0037279129028320312, 0.004756927490234375, 0.005785942077636719, 0.0068149566650390625, 0.007843971252441406, 0.00887298583984375, 0.009902000427246094, 0.010931015014648438, 0.011960029602050781, 0.012989044189453125, 0.014018058776855469, 0.015047073364257812, 0.016076087951660156, 0.0171051025390625, 0.018134117126464844, 0.019163131713867188, 0.02019214630126953, 0.021221160888671875, 0.02225017547607422, 0.023279190063476562, 0.024308204650878906, 0.02533721923828125, 0.026366233825683594, 0.027395248413085938, 0.02842426300048828, 0.029453277587890625, 0.03048229217529297, 0.03151130676269531, 0.032540321350097656, 0.0335693359375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 861.0, 139.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003612068947404623, -0.0033659166656434536, -0.003119764616712928, -0.002873612567782402, -0.0026274602860212326, -0.002381308004260063, -0.0021351559553295374, -0.0018890037899836898, -0.0016428516246378422, -0.0013966994592919946, -0.001150547293946147, -0.0009043951286002994, -0.0006582429632544518, -0.00041209079790860415, -0.00016593863256275654, 8.021353278309107e-05, 0.0003263656981289387, 0.0005725178634747863, 0.0008186700288206339, 0.0010648221941664815, 0.001310974359512329, 0.0015571265248581767, 0.0018032786902040243, 0.00204943073913455, 0.0022955830208957195, 0.002541735302656889, 0.0027878873515874147, 0.0030340394005179405, 0.00328019168227911, 0.0035263439640402794, 0.003772496012970805, 0.004018648061901331, 0.004264800809323788, 0.004510953091084957, 0.0047571053728461266, 0.005003257188946009, 0.005249409470707178, 0.0054955617524683475, 0.00574171356856823, 0.005987865850329399, 0.0062340181320905685, 0.006480170413851738, 0.006726322695612907, 0.0069724745117127895, 0.007218626793473959, 0.007464779075235128, 0.0077109308913350105, 0.00795708317309618, 0.00820323545485735, 0.008449387736618519, 0.008695540018379688, 0.008941692300140858, 0.009187843650579453, 0.009433995932340622, 0.009680148214101791, 0.00992630049586296, 0.01017245277762413, 0.0104186050593853, 0.010664757341146469, 0.010910909622907639, 0.011157061904668808, 0.011403213255107403, 0.011649365536868572, 0.011895517818629742, 0.012141670100390911]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 9.0, 4.0, 8.0, 2.0, 7.0, 10.0, 6.0, 14.0, 24.0, 21.0, 21.0, 27.0, 23.0, 37.0, 32.0, 42.0, 39.0, 40.0, 44.0, 42.0, 45.0, 39.0, 41.0, 43.0, 40.0, 36.0, 27.0, 36.0, 36.0, 30.0, 25.0, 26.0, 27.0, 21.0, 15.0, 14.0, 10.0, 8.0, 6.0, 11.0, 2.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008364319801330566, -0.0008103298023343086, -0.0007842276245355606, -0.0007581254467368126, -0.0007320232689380646, -0.0007059210911393166, -0.0006798189133405685, -0.0006537167355418205, -0.0006276145577430725, -0.0006015123799443245, -0.0005754102021455765, -0.0005493080243468285, -0.0005232058465480804, -0.0004971036687493324, -0.0004710014909505844, -0.0004448993131518364, -0.0004187971353530884, -0.00039269495755434036, -0.00036659277975559235, -0.00034049060195684433, -0.0003143884241580963, -0.0002882862463593483, -0.0002621840685606003, -0.00023608189076185226, -0.00020997971296310425, -0.00018387753516435623, -0.00015777535736560822, -0.0001316731795668602, -0.00010557100176811218, -7.946882396936417e-05, -5.336664617061615e-05, -2.7264468371868134e-05, -1.1622905731201172e-06, 2.49398872256279e-05, 5.1042065024375916e-05, 7.714424282312393e-05, 0.00010324642062187195, 0.00012934859842061996, 0.00015545077621936798, 0.000181552954018116, 0.00020765513181686401, 0.00023375730961561203, 0.00025985948741436005, 0.00028596166521310806, 0.0003120638430118561, 0.0003381660208106041, 0.0003642681986093521, 0.00039037037640810013, 0.00041647255420684814, 0.00044257473200559616, 0.0004686769098043442, 0.0004947790876030922, 0.0005208812654018402, 0.0005469834432005882, 0.0005730856209993362, 0.0005991877987980843, 0.0006252899765968323, 0.0006513921543955803, 0.0006774943321943283, 0.0007035965099930763, 0.0007296986877918243, 0.0007558008655905724, 0.0007819030433893204, 0.0008080052211880684, 0.0008341073989868164]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 0.0, 4.0, 6.0, 2.0, 3.0, 10.0, 4.0, 8.0, 9.0, 11.0, 8.0, 13.0, 17.0, 14.0, 15.0, 30.0, 29.0, 27.0, 33.0, 24.0, 43.0, 29.0, 31.0, 40.0, 33.0, 40.0, 48.0, 47.0, 43.0, 48.0, 40.0, 35.0, 34.0, 33.0, 34.0, 23.0, 24.0, 25.0, 10.0, 14.0, 10.0, 9.0, 6.0, 6.0, 4.0, 8.0, 2.0, 4.0, 3.0, 7.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-3.8359375, -3.70758056640625, -3.5792236328125, -3.45086669921875, -3.322509765625, -3.19415283203125, -3.0657958984375, -2.93743896484375, -2.80908203125, -2.68072509765625, -2.5523681640625, -2.42401123046875, -2.295654296875, -2.16729736328125, -2.0389404296875, -1.91058349609375, -1.7822265625, -1.65386962890625, -1.5255126953125, -1.39715576171875, -1.268798828125, -1.14044189453125, -1.0120849609375, -0.88372802734375, -0.75537109375, -0.62701416015625, -0.4986572265625, -0.37030029296875, -0.241943359375, -0.11358642578125, 0.0147705078125, 0.14312744140625, 0.271484375, 0.39984130859375, 0.5281982421875, 0.65655517578125, 0.784912109375, 0.91326904296875, 1.0416259765625, 1.16998291015625, 1.29833984375, 1.42669677734375, 1.5550537109375, 1.68341064453125, 1.811767578125, 1.94012451171875, 2.0684814453125, 2.19683837890625, 2.3251953125, 2.45355224609375, 2.5819091796875, 2.71026611328125, 2.838623046875, 2.96697998046875, 3.0953369140625, 3.22369384765625, 3.35205078125, 3.48040771484375, 3.6087646484375, 3.73712158203125, 3.865478515625, 3.99383544921875, 4.1221923828125, 4.25054931640625, 4.37890625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 9.0, 15.0, 11.0, 12.0, 21.0, 25.0, 25.0, 42.0, 44.0, 58.0, 101.0, 102.0, 179.0, 222.0, 306.0, 427.0, 703.0, 1200.0, 2338.0, 5273.0, 14022.0, 53856.0, 323901.0, 524177.0, 87237.0, 20479.0, 6793.0, 2878.0, 1470.0, 836.0, 494.0, 361.0, 246.0, 181.0, 123.0, 101.0, 67.0, 47.0, 34.0, 28.0, 21.0, 15.0, 11.0, 9.0, 8.0, 7.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-6.90625, -6.67718505859375, -6.4481201171875, -6.21905517578125, -5.989990234375, -5.76092529296875, -5.5318603515625, -5.30279541015625, -5.07373046875, -4.84466552734375, -4.6156005859375, -4.38653564453125, -4.157470703125, -3.92840576171875, -3.6993408203125, -3.47027587890625, -3.2412109375, -3.01214599609375, -2.7830810546875, -2.55401611328125, -2.324951171875, -2.09588623046875, -1.8668212890625, -1.63775634765625, -1.40869140625, -1.17962646484375, -0.9505615234375, -0.72149658203125, -0.492431640625, -0.26336669921875, -0.0343017578125, 0.19476318359375, 0.423828125, 0.65289306640625, 0.8819580078125, 1.11102294921875, 1.340087890625, 1.56915283203125, 1.7982177734375, 2.02728271484375, 2.25634765625, 2.48541259765625, 2.7144775390625, 2.94354248046875, 3.172607421875, 3.40167236328125, 3.6307373046875, 3.85980224609375, 4.0888671875, 4.31793212890625, 4.5469970703125, 4.77606201171875, 5.005126953125, 5.23419189453125, 5.4632568359375, 5.69232177734375, 5.92138671875, 6.15045166015625, 6.3795166015625, 6.60858154296875, 6.837646484375, 7.06671142578125, 7.2957763671875, 7.52484130859375, 7.75390625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 11.0, 8.0, 9.0, 15.0, 19.0, 16.0, 17.0, 26.0, 27.0, 44.0, 51.0, 49.0, 85.0, 116.0, 448.0, 1597.0, 111.0, 73.0, 48.0, 47.0, 38.0, 45.0, 23.0, 23.0, 29.0, 14.0, 10.0, 4.0, 9.0, 5.0, 9.0, 6.0, 2.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.40625, -9.991455078125, -9.57666015625, -9.161865234375, -8.7470703125, -8.332275390625, -7.91748046875, -7.502685546875, -7.087890625, -6.673095703125, -6.25830078125, -5.843505859375, -5.4287109375, -5.013916015625, -4.59912109375, -4.184326171875, -3.76953125, -3.354736328125, -2.93994140625, -2.525146484375, -2.1103515625, -1.695556640625, -1.28076171875, -0.865966796875, -0.451171875, -0.036376953125, 0.37841796875, 0.793212890625, 1.2080078125, 1.622802734375, 2.03759765625, 2.452392578125, 2.8671875, 3.281982421875, 3.69677734375, 4.111572265625, 4.5263671875, 4.941162109375, 5.35595703125, 5.770751953125, 6.185546875, 6.600341796875, 7.01513671875, 7.429931640625, 7.8447265625, 8.259521484375, 8.67431640625, 9.089111328125, 9.50390625, 9.918701171875, 10.33349609375, 10.748291015625, 11.1630859375, 11.577880859375, 11.99267578125, 12.407470703125, 12.822265625, 13.237060546875, 13.65185546875, 14.066650390625, 14.4814453125, 14.896240234375, 15.31103515625, 15.725830078125, 16.140625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 8.0, 9.0, 3.0, 9.0, 11.0, 7.0, 20.0, 21.0, 31.0, 56.0, 87.0, 129.0, 226.0, 455.0, 1288.0, 416160.0, 2724655.0, 1413.0, 469.0, 274.0, 119.0, 85.0, 55.0, 25.0, 24.0, 18.0, 14.0, 8.0, 4.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-47.71875, -46.46435546875, -45.2099609375, -43.95556640625, -42.701171875, -41.44677734375, -40.1923828125, -38.93798828125, -37.68359375, -36.42919921875, -35.1748046875, -33.92041015625, -32.666015625, -31.41162109375, -30.1572265625, -28.90283203125, -27.6484375, -26.39404296875, -25.1396484375, -23.88525390625, -22.630859375, -21.37646484375, -20.1220703125, -18.86767578125, -17.61328125, -16.35888671875, -15.1044921875, -13.85009765625, -12.595703125, -11.34130859375, -10.0869140625, -8.83251953125, -7.578125, -6.32373046875, -5.0693359375, -3.81494140625, -2.560546875, -1.30615234375, -0.0517578125, 1.20263671875, 2.45703125, 3.71142578125, 4.9658203125, 6.22021484375, 7.474609375, 8.72900390625, 9.9833984375, 11.23779296875, 12.4921875, 13.74658203125, 15.0009765625, 16.25537109375, 17.509765625, 18.76416015625, 20.0185546875, 21.27294921875, 22.52734375, 23.78173828125, 25.0361328125, 26.29052734375, 27.544921875, 28.79931640625, 30.0537109375, 31.30810546875, 32.5625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [4.0, 9.0, 19.0, 78.0, 153.0, 246.0, 259.0, 139.0, 70.0, 23.0, 8.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.243184566497803, -3.504897117614746, -2.7666096687316895, -2.028322458267212, -1.2900350093841553, -0.5517475605010986, 0.1865396499633789, 0.9248270988464355, 1.6631145477294922, 2.401401996612549, 3.1396894454956055, 3.877976655960083, 4.616264343261719, 5.354551315307617, 6.092838764190674, 6.8311262130737305, 7.569413661956787, 8.307701110839844, 9.045988082885742, 9.784276008605957, 10.522562980651855, 11.26085090637207, 11.999137878417969, 12.737424850463867, 13.475712776184082, 14.21399974822998, 14.952287673950195, 15.690574645996094, 16.428861618041992, 17.167150497436523, 17.905437469482422, 18.64372444152832, 19.38201332092285, 20.12030029296875, 20.85858726501465, 21.59687614440918, 22.335163116455078, 23.073450088500977, 23.811737060546875, 24.550025939941406, 25.288312911987305, 26.026599884033203, 26.7648868560791, 27.503175735473633, 28.24146270751953, 28.97974967956543, 29.718036651611328, 30.45632553100586, 31.194610595703125, 31.932897567749023, 32.67118453979492, 33.40947341918945, 34.14775848388672, 34.88604736328125, 35.62433624267578, 36.36262130737305, 37.10091018676758, 37.83919906616211, 38.577484130859375, 39.315773010253906, 40.05405807495117, 40.7923469543457, 41.530635833740234, 42.2689208984375, 43.00720977783203]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 2.0, 4.0, 2.0, 6.0, 6.0, 9.0, 6.0, 3.0, 13.0, 11.0, 8.0, 14.0, 21.0, 15.0, 22.0, 23.0, 26.0, 33.0, 30.0, 30.0, 40.0, 43.0, 46.0, 40.0, 33.0, 43.0, 31.0, 40.0, 30.0, 35.0, 30.0, 46.0, 27.0, 25.0, 21.0, 28.0, 20.0, 16.0, 26.0, 22.0, 13.0, 14.0, 11.0, 11.0, 8.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-23.05164337158203, -22.2810001373291, -21.510358810424805, -20.739715576171875, -19.969074249267578, -19.19843101501465, -18.42778778076172, -17.657146453857422, -16.886503219604492, -16.115859985351562, -15.345218658447266, -14.574575424194336, -13.803933143615723, -13.03329086303711, -12.26264762878418, -11.492005348205566, -10.721363067626953, -9.95072078704834, -9.180078506469727, -8.409435272216797, -7.638792991638184, -6.86815071105957, -6.097507953643799, -5.326865196228027, -4.556222915649414, -3.7855803966522217, -3.0149378776550293, -2.244295358657837, -1.4736528396606445, -0.7030103206634521, 0.06763219833374023, 0.8382749557495117, 1.608917236328125, 2.3795597553253174, 3.1502022743225098, 3.920844793319702, 4.6914873123168945, 5.462129592895508, 6.232772350311279, 7.003415107727051, 7.774057388305664, 8.544699668884277, 9.31534194946289, 10.08598518371582, 10.856627464294434, 11.627269744873047, 12.397912979125977, 13.16855525970459, 13.939197540283203, 14.709839820861816, 15.48048210144043, 16.25112533569336, 17.021766662597656, 17.792409896850586, 18.563053131103516, 19.333694458007812, 20.104337692260742, 20.874980926513672, 21.64562225341797, 22.4162654876709, 23.186908721923828, 23.957550048828125, 24.728193283081055, 25.498836517333984, 26.26947784423828]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 7.0, 5.0, 10.0, 7.0, 10.0, 8.0, 17.0, 27.0, 19.0, 22.0, 27.0, 32.0, 33.0, 37.0, 33.0, 34.0, 60.0, 37.0, 38.0, 61.0, 49.0, 51.0, 45.0, 42.0, 35.0, 36.0, 42.0, 28.0, 21.0, 26.0, 16.0, 13.0, 10.0, 14.0, 13.0, 4.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.30859375, -5.1435546875, -4.978515625, -4.8134765625, -4.6484375, -4.4833984375, -4.318359375, -4.1533203125, -3.98828125, -3.8232421875, -3.658203125, -3.4931640625, -3.328125, -3.1630859375, -2.998046875, -2.8330078125, -2.66796875, -2.5029296875, -2.337890625, -2.1728515625, -2.0078125, -1.8427734375, -1.677734375, -1.5126953125, -1.34765625, -1.1826171875, -1.017578125, -0.8525390625, -0.6875, -0.5224609375, -0.357421875, -0.1923828125, -0.02734375, 0.1376953125, 0.302734375, 0.4677734375, 0.6328125, 0.7978515625, 0.962890625, 1.1279296875, 1.29296875, 1.4580078125, 1.623046875, 1.7880859375, 1.953125, 2.1181640625, 2.283203125, 2.4482421875, 2.61328125, 2.7783203125, 2.943359375, 3.1083984375, 3.2734375, 3.4384765625, 3.603515625, 3.7685546875, 3.93359375, 4.0986328125, 4.263671875, 4.4287109375, 4.59375, 4.7587890625, 4.923828125, 5.0888671875, 5.25390625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 6.0, 9.0, 8.0, 17.0, 20.0, 26.0, 44.0, 32.0, 53.0, 76.0, 90.0, 107.0, 135.0, 210.0, 256.0, 385.0, 618.0, 1189.0, 3628.0, 46896.0, 3683444.0, 445041.0, 7740.0, 1744.0, 771.0, 491.0, 302.0, 207.0, 147.0, 145.0, 95.0, 79.0, 55.0, 35.0, 39.0, 30.0, 16.0, 23.0, 21.0, 9.0, 10.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.40625, -30.446044921875, -29.48583984375, -28.525634765625, -27.5654296875, -26.605224609375, -25.64501953125, -24.684814453125, -23.724609375, -22.764404296875, -21.80419921875, -20.843994140625, -19.8837890625, -18.923583984375, -17.96337890625, -17.003173828125, -16.04296875, -15.082763671875, -14.12255859375, -13.162353515625, -12.2021484375, -11.241943359375, -10.28173828125, -9.321533203125, -8.361328125, -7.401123046875, -6.44091796875, -5.480712890625, -4.5205078125, -3.560302734375, -2.60009765625, -1.639892578125, -0.6796875, 0.280517578125, 1.24072265625, 2.200927734375, 3.1611328125, 4.121337890625, 5.08154296875, 6.041748046875, 7.001953125, 7.962158203125, 8.92236328125, 9.882568359375, 10.8427734375, 11.802978515625, 12.76318359375, 13.723388671875, 14.68359375, 15.643798828125, 16.60400390625, 17.564208984375, 18.5244140625, 19.484619140625, 20.44482421875, 21.405029296875, 22.365234375, 23.325439453125, 24.28564453125, 25.245849609375, 26.2060546875, 27.166259765625, 28.12646484375, 29.086669921875, 30.046875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 10.0, 7.0, 14.0, 13.0, 27.0, 35.0, 43.0, 58.0, 112.0, 170.0, 245.0, 378.0, 514.0, 592.0, 523.0, 431.0, 279.0, 195.0, 144.0, 77.0, 57.0, 40.0, 31.0, 17.0, 15.0, 9.0, 8.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.3671875, -9.0804443359375, -8.793701171875, -8.5069580078125, -8.22021484375, -7.9334716796875, -7.646728515625, -7.3599853515625, -7.0732421875, -6.7864990234375, -6.499755859375, -6.2130126953125, -5.92626953125, -5.6395263671875, -5.352783203125, -5.0660400390625, -4.779296875, -4.4925537109375, -4.205810546875, -3.9190673828125, -3.63232421875, -3.3455810546875, -3.058837890625, -2.7720947265625, -2.4853515625, -2.1986083984375, -1.911865234375, -1.6251220703125, -1.33837890625, -1.0516357421875, -0.764892578125, -0.4781494140625, -0.19140625, 0.0953369140625, 0.382080078125, 0.6688232421875, 0.95556640625, 1.2423095703125, 1.529052734375, 1.8157958984375, 2.1025390625, 2.3892822265625, 2.676025390625, 2.9627685546875, 3.24951171875, 3.5362548828125, 3.822998046875, 4.1097412109375, 4.396484375, 4.6832275390625, 4.969970703125, 5.2567138671875, 5.54345703125, 5.8302001953125, 6.116943359375, 6.4036865234375, 6.6904296875, 6.9771728515625, 7.263916015625, 7.5506591796875, 7.83740234375, 8.1241455078125, 8.410888671875, 8.6976318359375, 8.984375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 23.0, 12.0, 36.0, 52.0, 106.0, 274.0, 777.0, 2414.0, 11196.0, 105131.0, 2777698.0, 1233180.0, 53430.0, 7227.0, 1681.0, 582.0, 212.0, 103.0, 56.0, 24.0, 17.0, 10.0, 10.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0625, -10.61767578125, -10.1728515625, -9.72802734375, -9.283203125, -8.83837890625, -8.3935546875, -7.94873046875, -7.50390625, -7.05908203125, -6.6142578125, -6.16943359375, -5.724609375, -5.27978515625, -4.8349609375, -4.39013671875, -3.9453125, -3.50048828125, -3.0556640625, -2.61083984375, -2.166015625, -1.72119140625, -1.2763671875, -0.83154296875, -0.38671875, 0.05810546875, 0.5029296875, 0.94775390625, 1.392578125, 1.83740234375, 2.2822265625, 2.72705078125, 3.171875, 3.61669921875, 4.0615234375, 4.50634765625, 4.951171875, 5.39599609375, 5.8408203125, 6.28564453125, 6.73046875, 7.17529296875, 7.6201171875, 8.06494140625, 8.509765625, 8.95458984375, 9.3994140625, 9.84423828125, 10.2890625, 10.73388671875, 11.1787109375, 11.62353515625, 12.068359375, 12.51318359375, 12.9580078125, 13.40283203125, 13.84765625, 14.29248046875, 14.7373046875, 15.18212890625, 15.626953125, 16.07177734375, 16.5166015625, 16.96142578125, 17.40625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 9.0, 11.0, 20.0, 38.0, 80.0, 93.0, 148.0, 170.0, 134.0, 132.0, 74.0, 45.0, 19.0, 10.0, 8.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.44524383544922, -54.77109909057617, -52.096954345703125, -49.422813415527344, -46.7486686706543, -44.07452392578125, -41.4003791809082, -38.726234436035156, -36.052093505859375, -33.37794876098633, -30.703805923461914, -28.029661178588867, -25.355518341064453, -22.681373596191406, -20.00722885131836, -17.333086013793945, -14.658939361572266, -11.984795570373535, -9.310651779174805, -6.636507034301758, -3.9623632431030273, -1.2882194519042969, 1.38592529296875, 4.060068130493164, 6.734212875366211, 9.408356666564941, 12.082500457763672, 14.756645202636719, 17.430789947509766, 20.10493278503418, 22.779077529907227, 25.45322036743164, 28.127365112304688, 30.801509857177734, 33.47565460205078, 36.14979553222656, 38.82394027709961, 41.498085021972656, 44.1722297668457, 46.84637451171875, 49.52051544189453, 52.19466018676758, 54.868804931640625, 57.542945861816406, 60.21709060668945, 62.8912353515625, 65.56538391113281, 68.2395248413086, 70.91366577148438, 73.58780670166016, 76.26195526123047, 78.93609619140625, 81.61024475097656, 84.28438568115234, 86.95852661132812, 89.63267517089844, 92.30682373046875, 94.98096466064453, 97.65511322021484, 100.32925415039062, 103.00340270996094, 105.67754364013672, 108.3516845703125, 111.02583312988281, 113.6999740600586]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 6.0, 8.0, 8.0, 9.0, 15.0, 11.0, 17.0, 23.0, 24.0, 27.0, 28.0, 25.0, 29.0, 24.0, 42.0, 36.0, 38.0, 52.0, 37.0, 26.0, 48.0, 47.0, 30.0, 29.0, 41.0, 38.0, 32.0, 36.0, 35.0, 20.0, 19.0, 21.0, 18.0, 11.0, 18.0, 13.0, 7.0, 13.0, 8.0, 9.0, 4.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.084197998046875, -26.1844482421875, -25.284700393676758, -24.384950637817383, -23.48520278930664, -22.585453033447266, -21.68570327758789, -20.785953521728516, -19.886205673217773, -18.9864559173584, -18.086708068847656, -17.18695831298828, -16.287208557128906, -15.387460708618164, -14.487710952758789, -13.58796215057373, -12.688213348388672, -11.788464546203613, -10.888715744018555, -9.98896598815918, -9.089217185974121, -8.189468383789062, -7.289719104766846, -6.389969825744629, -5.49022102355957, -4.590472221374512, -3.690722942352295, -2.7909739017486572, -1.8912248611450195, -0.9914760589599609, -0.09172677993774414, 0.8080224990844727, 1.7077693939208984, 2.607518434524536, 3.507267475128174, 4.407016754150391, 5.306765556335449, 6.206514358520508, 7.106263637542725, 8.006012916564941, 8.90576171875, 9.805510520935059, 10.705259323120117, 11.605009078979492, 12.50475788116455, 13.40450668334961, 14.304256439208984, 15.204005241394043, 16.1037540435791, 17.003503799438477, 17.90325164794922, 18.803001403808594, 19.70275115966797, 20.60249900817871, 21.502248764038086, 22.401996612548828, 23.301746368408203, 24.201496124267578, 25.10124397277832, 26.000993728637695, 26.900741577148438, 27.800491333007812, 28.700241088867188, 29.599990844726562, 30.499738693237305]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 10.0, 9.0, 15.0, 11.0, 20.0, 18.0, 16.0, 22.0, 32.0, 20.0, 24.0, 29.0, 30.0, 31.0, 34.0, 43.0, 42.0, 35.0, 47.0, 33.0, 37.0, 31.0, 39.0, 40.0, 33.0, 30.0, 25.0, 31.0, 25.0, 26.0, 17.0, 15.0, 24.0, 14.0, 10.0, 8.0, 12.0, 6.0, 11.0, 10.0, 4.0, 4.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-42.59375, -41.2333984375, -39.873046875, -38.5126953125, -37.15234375, -35.7919921875, -34.431640625, -33.0712890625, -31.7109375, -30.3505859375, -28.990234375, -27.6298828125, -26.26953125, -24.9091796875, -23.548828125, -22.1884765625, -20.828125, -19.4677734375, -18.107421875, -16.7470703125, -15.38671875, -14.0263671875, -12.666015625, -11.3056640625, -9.9453125, -8.5849609375, -7.224609375, -5.8642578125, -4.50390625, -3.1435546875, -1.783203125, -0.4228515625, 0.9375, 2.2978515625, 3.658203125, 5.0185546875, 6.37890625, 7.7392578125, 9.099609375, 10.4599609375, 11.8203125, 13.1806640625, 14.541015625, 15.9013671875, 17.26171875, 18.6220703125, 19.982421875, 21.3427734375, 22.703125, 24.0634765625, 25.423828125, 26.7841796875, 28.14453125, 29.5048828125, 30.865234375, 32.2255859375, 33.5859375, 34.9462890625, 36.306640625, 37.6669921875, 39.02734375, 40.3876953125, 41.748046875, 43.1083984375, 44.46875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 12.0, 3.0, 15.0, 14.0, 21.0, 36.0, 46.0, 66.0, 92.0, 137.0, 163.0, 270.0, 365.0, 564.0, 745.0, 1106.0, 1590.0, 2315.0, 3508.0, 5365.0, 8277.0, 12489.0, 20248.0, 31952.0, 51580.0, 81918.0, 126912.0, 174760.0, 174876.0, 126072.0, 82268.0, 51296.0, 32045.0, 19996.0, 12728.0, 8158.0, 5377.0, 3475.0, 2378.0, 1586.0, 1075.0, 785.0, 574.0, 367.0, 270.0, 197.0, 136.0, 100.0, 61.0, 59.0, 30.0, 24.0, 19.0, 18.0, 3.0, 9.0, 4.0, 4.0, 4.0, 2.0], "bins": [-4.2265625, -4.094482421875, -3.96240234375, -3.830322265625, -3.6982421875, -3.566162109375, -3.43408203125, -3.302001953125, -3.169921875, -3.037841796875, -2.90576171875, -2.773681640625, -2.6416015625, -2.509521484375, -2.37744140625, -2.245361328125, -2.11328125, -1.981201171875, -1.84912109375, -1.717041015625, -1.5849609375, -1.452880859375, -1.32080078125, -1.188720703125, -1.056640625, -0.924560546875, -0.79248046875, -0.660400390625, -0.5283203125, -0.396240234375, -0.26416015625, -0.132080078125, 0.0, 0.132080078125, 0.26416015625, 0.396240234375, 0.5283203125, 0.660400390625, 0.79248046875, 0.924560546875, 1.056640625, 1.188720703125, 1.32080078125, 1.452880859375, 1.5849609375, 1.717041015625, 1.84912109375, 1.981201171875, 2.11328125, 2.245361328125, 2.37744140625, 2.509521484375, 2.6416015625, 2.773681640625, 2.90576171875, 3.037841796875, 3.169921875, 3.302001953125, 3.43408203125, 3.566162109375, 3.6982421875, 3.830322265625, 3.96240234375, 4.094482421875, 4.2265625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 1.0, 2.0, 5.0, 4.0, 11.0, 7.0, 8.0, 14.0, 12.0, 21.0, 18.0, 27.0, 32.0, 31.0, 37.0, 37.0, 36.0, 39.0, 41.0, 51.0, 42.0, 1067.0, 41.0, 47.0, 49.0, 35.0, 48.0, 32.0, 38.0, 37.0, 23.0, 18.0, 26.0, 17.0, 19.0, 11.0, 11.0, 8.0, 7.0, 7.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.8125, -23.7919921875, -22.771484375, -21.7509765625, -20.73046875, -19.7099609375, -18.689453125, -17.6689453125, -16.6484375, -15.6279296875, -14.607421875, -13.5869140625, -12.56640625, -11.5458984375, -10.525390625, -9.5048828125, -8.484375, -7.4638671875, -6.443359375, -5.4228515625, -4.40234375, -3.3818359375, -2.361328125, -1.3408203125, -0.3203125, 0.7001953125, 1.720703125, 2.7412109375, 3.76171875, 4.7822265625, 5.802734375, 6.8232421875, 7.84375, 8.8642578125, 9.884765625, 10.9052734375, 11.92578125, 12.9462890625, 13.966796875, 14.9873046875, 16.0078125, 17.0283203125, 18.048828125, 19.0693359375, 20.08984375, 21.1103515625, 22.130859375, 23.1513671875, 24.171875, 25.1923828125, 26.212890625, 27.2333984375, 28.25390625, 29.2744140625, 30.294921875, 31.3154296875, 32.3359375, 33.3564453125, 34.376953125, 35.3974609375, 36.41796875, 37.4384765625, 38.458984375, 39.4794921875, 40.5]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 12.0, 13.0, 28.0, 23.0, 43.0, 66.0, 103.0, 143.0, 219.0, 323.0, 557.0, 878.0, 1367.0, 2179.0, 3615.0, 6280.0, 10174.0, 18275.0, 32544.0, 60119.0, 111510.0, 191309.0, 1279580.0, 167332.0, 93223.0, 50677.0, 27796.0, 15730.0, 9076.0, 5335.0, 3170.0, 2030.0, 1201.0, 823.0, 487.0, 290.0, 200.0, 133.0, 89.0, 58.0, 39.0, 32.0, 15.0, 14.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.7578125, -5.585205078125, -5.41259765625, -5.239990234375, -5.0673828125, -4.894775390625, -4.72216796875, -4.549560546875, -4.376953125, -4.204345703125, -4.03173828125, -3.859130859375, -3.6865234375, -3.513916015625, -3.34130859375, -3.168701171875, -2.99609375, -2.823486328125, -2.65087890625, -2.478271484375, -2.3056640625, -2.133056640625, -1.96044921875, -1.787841796875, -1.615234375, -1.442626953125, -1.27001953125, -1.097412109375, -0.9248046875, -0.752197265625, -0.57958984375, -0.406982421875, -0.234375, -0.061767578125, 0.11083984375, 0.283447265625, 0.4560546875, 0.628662109375, 0.80126953125, 0.973876953125, 1.146484375, 1.319091796875, 1.49169921875, 1.664306640625, 1.8369140625, 2.009521484375, 2.18212890625, 2.354736328125, 2.52734375, 2.699951171875, 2.87255859375, 3.045166015625, 3.2177734375, 3.390380859375, 3.56298828125, 3.735595703125, 3.908203125, 4.080810546875, 4.25341796875, 4.426025390625, 4.5986328125, 4.771240234375, 4.94384765625, 5.116455078125, 5.2890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 5.0, 8.0, 5.0, 10.0, 3.0, 8.0, 11.0, 12.0, 7.0, 22.0, 15.0, 24.0, 24.0, 43.0, 37.0, 61.0, 74.0, 93.0, 79.0, 76.0, 66.0, 52.0, 44.0, 41.0, 36.0, 27.0, 15.0, 18.0, 10.0, 9.0, 15.0, 13.0, 3.0, 7.0, 2.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.06610107421875, -0.06407356262207031, -0.062046051025390625, -0.06001853942871094, -0.05799102783203125, -0.05596351623535156, -0.053936004638671875, -0.05190849304199219, -0.0498809814453125, -0.04785346984863281, -0.045825958251953125, -0.04379844665527344, -0.04177093505859375, -0.03974342346191406, -0.037715911865234375, -0.03568840026855469, -0.033660888671875, -0.03163337707519531, -0.029605865478515625, -0.027578353881835938, -0.02555084228515625, -0.023523330688476562, -0.021495819091796875, -0.019468307495117188, -0.0174407958984375, -0.015413284301757812, -0.013385772705078125, -0.011358261108398438, -0.00933074951171875, -0.0073032379150390625, -0.005275726318359375, -0.0032482147216796875, -0.001220703125, 0.0008068084716796875, 0.002834320068359375, 0.0048618316650390625, 0.00688934326171875, 0.008916854858398438, 0.010944366455078125, 0.012971878051757812, 0.0149993896484375, 0.017026901245117188, 0.019054412841796875, 0.021081924438476562, 0.02310943603515625, 0.025136947631835938, 0.027164459228515625, 0.029191970825195312, 0.031219482421875, 0.03324699401855469, 0.035274505615234375, 0.03730201721191406, 0.03932952880859375, 0.04135704040527344, 0.043384552001953125, 0.04541206359863281, 0.0474395751953125, 0.04946708679199219, 0.051494598388671875, 0.05352210998535156, 0.05554962158203125, 0.05757713317871094, 0.059604644775390625, 0.06163215637207031, 0.06365966796875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 7.0, 5.0, 6.0, 4.0, 12.0, 17.0, 9.0, 17.0, 21.0, 26.0, 31.0, 28.0, 46.0, 53.0, 74.0, 80.0, 96.0, 132.0, 164.0, 244.0, 326.0, 556.0, 1035.0, 2121.0, 5079.0, 13413.0, 40509.0, 142992.0, 513543.0, 234296.0, 60817.0, 19499.0, 6974.0, 2861.0, 1247.0, 655.0, 380.0, 271.0, 172.0, 150.0, 113.0, 91.0, 74.0, 58.0, 54.0, 43.0, 37.0, 36.0, 19.0, 15.0, 13.0, 9.0, 3.0, 12.0, 9.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.36376953125, -0.3522834777832031, -0.34079742431640625, -0.3293113708496094, -0.3178253173828125, -0.3063392639160156, -0.29485321044921875, -0.2833671569824219, -0.271881103515625, -0.2603950500488281, -0.24890899658203125, -0.23742294311523438, -0.2259368896484375, -0.21445083618164062, -0.20296478271484375, -0.19147872924804688, -0.17999267578125, -0.16850662231445312, -0.15702056884765625, -0.14553451538085938, -0.1340484619140625, -0.12256240844726562, -0.11107635498046875, -0.09959030151367188, -0.088104248046875, -0.07661819458007812, -0.06513214111328125, -0.053646087646484375, -0.0421600341796875, -0.030673980712890625, -0.01918792724609375, -0.007701873779296875, 0.0037841796875, 0.015270233154296875, 0.02675628662109375, 0.038242340087890625, 0.0497283935546875, 0.061214447021484375, 0.07270050048828125, 0.08418655395507812, 0.095672607421875, 0.10715866088867188, 0.11864471435546875, 0.13013076782226562, 0.1416168212890625, 0.15310287475585938, 0.16458892822265625, 0.17607498168945312, 0.18756103515625, 0.19904708862304688, 0.21053314208984375, 0.22201919555664062, 0.2335052490234375, 0.24499130249023438, 0.25647735595703125, 0.2679634094238281, 0.279449462890625, 0.2909355163574219, 0.30242156982421875, 0.3139076232910156, 0.3253936767578125, 0.3368797302246094, 0.34836578369140625, 0.3598518371582031, 0.371337890625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 13.0, 20.0, 14.0, 31.0, 72.0, 112.0, 174.0, 165.0, 141.0, 92.0, 62.0, 37.0, 14.0, 14.0, 10.0, 13.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07205367088317871, -0.06828658282756805, -0.0645194947719574, -0.06075240299105644, -0.056985314935445786, -0.05321822315454483, -0.049451135098934174, -0.04568404704332352, -0.04191695898771286, -0.0381498709321022, -0.03438277915120125, -0.03061569109559059, -0.026848603039979935, -0.02308151312172413, -0.019314423203468323, -0.015547335147857666, -0.01178024336695671, -0.00801315438002348, -0.004246064927428961, -0.00047897547483444214, 0.003288113512098789, 0.007055202499032021, 0.010822292417287827, 0.014589380472898483, 0.01835647039115429, 0.022123560309410095, 0.025890648365020752, 0.029657738283276558, 0.033424828201532364, 0.03719191625714302, 0.040959008038043976, 0.04472609609365463, 0.04849318414926529, 0.052260272204875946, 0.0560273639857769, 0.05979445204138756, 0.06356154382228851, 0.06732863187789917, 0.07109571993350983, 0.07486280798912048, 0.07862989604473114, 0.0823969841003418, 0.08616407215595245, 0.08993116021156311, 0.09369825571775436, 0.09746534377336502, 0.10123243182897568, 0.10499951988458633, 0.10876661539077759, 0.11253370344638824, 0.1163007915019989, 0.12006787955760956, 0.12383497506380081, 0.12760205566883087, 0.13136914372444153, 0.13513624668121338, 0.13890331983566284, 0.1426704078912735, 0.14643749594688416, 0.1502045840024948, 0.15397167205810547, 0.15773876011371613, 0.16150584816932678, 0.16527295112609863, 0.1690400391817093]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 7.0, 5.0, 3.0, 4.0, 5.0, 7.0, 12.0, 10.0, 11.0, 13.0, 14.0, 16.0, 19.0, 27.0, 23.0, 27.0, 29.0, 28.0, 43.0, 31.0, 41.0, 52.0, 29.0, 39.0, 45.0, 48.0, 33.0, 45.0, 36.0, 32.0, 34.0, 24.0, 23.0, 20.0, 24.0, 23.0, 25.0, 20.0, 15.0, 14.0, 10.0, 6.0, 7.0, 3.0, 5.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.03513616323471069, -0.03407980874180794, -0.03302345424890518, -0.03196709603071213, -0.030910741537809372, -0.029854387044906616, -0.02879803068935871, -0.027741674333810806, -0.02668531984090805, -0.025628965348005295, -0.02457260899245739, -0.023516252636909485, -0.02245989814400673, -0.021403543651103973, -0.02034718729555607, -0.019290830940008163, -0.018234476447105408, -0.017178121954202652, -0.016121765598654747, -0.015065410174429417, -0.014009054750204086, -0.012952699325978756, -0.011896343901753426, -0.010839988477528095, -0.009783633053302765, -0.008727277629077435, -0.007670922204852104, -0.006614566780626774, -0.0055582113564014435, -0.004501855932176113, -0.0034455005079507828, -0.0023891450837254524, -0.001332789659500122, -0.0002764342352747917, 0.0007799211889505386, 0.001836276613175869, 0.0028926320374011993, 0.00394898746162653, 0.00500534288585186, 0.00606169831007719, 0.007118053734302521, 0.008174409158527851, 0.009230764582753181, 0.010287120006978512, 0.011343475431203842, 0.012399830855429173, 0.013456186279654503, 0.014512541703879833, 0.015568897128105164, 0.01662525162100792, 0.017681607976555824, 0.01873796433210373, 0.019794318825006485, 0.02085067331790924, 0.021907029673457146, 0.02296338602900505, 0.024019740521907806, 0.025076095014810562, 0.026132451370358467, 0.027188807725906372, 0.028245162218809128, 0.029301516711711884, 0.03035787306725979, 0.031414229422807693, 0.03247058391571045]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 7.0, 10.0, 10.0, 15.0, 10.0, 19.0, 20.0, 16.0, 20.0, 31.0, 23.0, 24.0, 30.0, 26.0, 34.0, 35.0, 42.0, 42.0, 34.0, 49.0, 31.0, 36.0, 34.0, 38.0, 39.0, 34.0, 33.0, 20.0, 34.0, 25.0, 25.0, 13.0, 20.0, 23.0, 13.0, 11.0, 7.0, 13.0, 6.0, 10.0, 10.0, 5.0, 4.0, 4.0, 2.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-42.5625, -41.20361328125, -39.8447265625, -38.48583984375, -37.126953125, -35.76806640625, -34.4091796875, -33.05029296875, -31.69140625, -30.33251953125, -28.9736328125, -27.61474609375, -26.255859375, -24.89697265625, -23.5380859375, -22.17919921875, -20.8203125, -19.46142578125, -18.1025390625, -16.74365234375, -15.384765625, -14.02587890625, -12.6669921875, -11.30810546875, -9.94921875, -8.59033203125, -7.2314453125, -5.87255859375, -4.513671875, -3.15478515625, -1.7958984375, -0.43701171875, 0.921875, 2.28076171875, 3.6396484375, 4.99853515625, 6.357421875, 7.71630859375, 9.0751953125, 10.43408203125, 11.79296875, 13.15185546875, 14.5107421875, 15.86962890625, 17.228515625, 18.58740234375, 19.9462890625, 21.30517578125, 22.6640625, 24.02294921875, 25.3818359375, 26.74072265625, 28.099609375, 29.45849609375, 30.8173828125, 32.17626953125, 33.53515625, 34.89404296875, 36.2529296875, 37.61181640625, 38.970703125, 40.32958984375, 41.6884765625, 43.04736328125, 44.40625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 4.0, 11.0, 14.0, 13.0, 15.0, 17.0, 36.0, 38.0, 59.0, 83.0, 101.0, 189.0, 305.0, 539.0, 892.0, 1645.0, 2976.0, 6207.0, 16346.0, 60693.0, 306090.0, 501120.0, 108559.0, 25467.0, 8656.0, 3762.0, 1906.0, 1052.0, 652.0, 382.0, 225.0, 145.0, 112.0, 54.0, 45.0, 39.0, 31.0, 16.0, 11.0, 13.0, 9.0, 11.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.5234375, -11.1539306640625, -10.784423828125, -10.4149169921875, -10.04541015625, -9.6759033203125, -9.306396484375, -8.9368896484375, -8.5673828125, -8.1978759765625, -7.828369140625, -7.4588623046875, -7.08935546875, -6.7198486328125, -6.350341796875, -5.9808349609375, -5.611328125, -5.2418212890625, -4.872314453125, -4.5028076171875, -4.13330078125, -3.7637939453125, -3.394287109375, -3.0247802734375, -2.6552734375, -2.2857666015625, -1.916259765625, -1.5467529296875, -1.17724609375, -0.8077392578125, -0.438232421875, -0.0687255859375, 0.30078125, 0.6702880859375, 1.039794921875, 1.4093017578125, 1.77880859375, 2.1483154296875, 2.517822265625, 2.8873291015625, 3.2568359375, 3.6263427734375, 3.995849609375, 4.3653564453125, 4.73486328125, 5.1043701171875, 5.473876953125, 5.8433837890625, 6.212890625, 6.5823974609375, 6.951904296875, 7.3214111328125, 7.69091796875, 8.0604248046875, 8.429931640625, 8.7994384765625, 9.1689453125, 9.5384521484375, 9.907958984375, 10.2774658203125, 10.64697265625, 11.0164794921875, 11.385986328125, 11.7554931640625, 12.125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 8.0, 17.0, 9.0, 25.0, 32.0, 37.0, 54.0, 67.0, 94.0, 81.0, 1971.0, 275.0, 78.0, 80.0, 59.0, 44.0, 39.0, 32.0, 14.0, 15.0, 9.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.875, -143.7626953125, -139.650390625, -135.5380859375, -131.42578125, -127.3134765625, -123.201171875, -119.0888671875, -114.9765625, -110.8642578125, -106.751953125, -102.6396484375, -98.52734375, -94.4150390625, -90.302734375, -86.1904296875, -82.078125, -77.9658203125, -73.853515625, -69.7412109375, -65.62890625, -61.5166015625, -57.404296875, -53.2919921875, -49.1796875, -45.0673828125, -40.955078125, -36.8427734375, -32.73046875, -28.6181640625, -24.505859375, -20.3935546875, -16.28125, -12.1689453125, -8.056640625, -3.9443359375, 0.16796875, 4.2802734375, 8.392578125, 12.5048828125, 16.6171875, 20.7294921875, 24.841796875, 28.9541015625, 33.06640625, 37.1787109375, 41.291015625, 45.4033203125, 49.515625, 53.6279296875, 57.740234375, 61.8525390625, 65.96484375, 70.0771484375, 74.189453125, 78.3017578125, 82.4140625, 86.5263671875, 90.638671875, 94.7509765625, 98.86328125, 102.9755859375, 107.087890625, 111.2001953125, 115.3125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 16.0, 12.0, 20.0, 24.0, 46.0, 78.0, 112.0, 254.0, 500.0, 1309.0, 4723.0, 149646.0, 2966920.0, 18150.0, 2321.0, 790.0, 343.0, 191.0, 93.0, 52.0, 36.0, 26.0, 14.0, 11.0, 5.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.40625, -30.4013671875, -29.396484375, -28.3916015625, -27.38671875, -26.3818359375, -25.376953125, -24.3720703125, -23.3671875, -22.3623046875, -21.357421875, -20.3525390625, -19.34765625, -18.3427734375, -17.337890625, -16.3330078125, -15.328125, -14.3232421875, -13.318359375, -12.3134765625, -11.30859375, -10.3037109375, -9.298828125, -8.2939453125, -7.2890625, -6.2841796875, -5.279296875, -4.2744140625, -3.26953125, -2.2646484375, -1.259765625, -0.2548828125, 0.75, 1.7548828125, 2.759765625, 3.7646484375, 4.76953125, 5.7744140625, 6.779296875, 7.7841796875, 8.7890625, 9.7939453125, 10.798828125, 11.8037109375, 12.80859375, 13.8134765625, 14.818359375, 15.8232421875, 16.828125, 17.8330078125, 18.837890625, 19.8427734375, 20.84765625, 21.8525390625, 22.857421875, 23.8623046875, 24.8671875, 25.8720703125, 26.876953125, 27.8818359375, 28.88671875, 29.8916015625, 30.896484375, 31.9013671875, 32.90625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 11.0, 24.0, 68.0, 167.0, 347.0, 225.0, 93.0, 26.0, 19.0, 8.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.62771606445312, -86.21513366699219, -78.80254364013672, -71.38995361328125, -63.97737121582031, -56.56478500366211, -49.152198791503906, -41.7396125793457, -34.3270263671875, -26.914440155029297, -19.501853942871094, -12.08926773071289, -4.6766815185546875, 2.7359046936035156, 10.148490905761719, 17.561077117919922, 24.973663330078125, 32.38624954223633, 39.79883575439453, 47.211421966552734, 54.62400817871094, 62.03659439086914, 69.44918060302734, 76.86177062988281, 84.27435302734375, 91.68693542480469, 99.09952545166016, 106.51211547851562, 113.92469787597656, 121.3372802734375, 128.7498779296875, 136.16246032714844, 143.57504272460938, 150.9876251220703, 158.40020751953125, 165.81280517578125, 173.2253875732422, 180.63796997070312, 188.05056762695312, 195.46315002441406, 202.875732421875, 210.28831481933594, 217.70089721679688, 225.11349487304688, 232.5260772705078, 239.93865966796875, 247.35125732421875, 254.7638397216797, 262.1764221191406, 269.5890197753906, 277.0015869140625, 284.4141845703125, 291.8267822265625, 299.2393493652344, 306.6519470214844, 314.06451416015625, 321.47711181640625, 328.88970947265625, 336.3022766113281, 343.7148742675781, 351.12744140625, 358.5400390625, 365.95263671875, 373.3652038574219, 380.7778015136719]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 12.0, 12.0, 19.0, 15.0, 25.0, 35.0, 29.0, 34.0, 48.0, 53.0, 53.0, 55.0, 51.0, 49.0, 43.0, 46.0, 61.0, 41.0, 42.0, 61.0, 34.0, 25.0, 19.0, 19.0, 22.0, 21.0, 8.0, 9.0, 12.0, 10.0, 3.0, 8.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-114.47296142578125, -111.21401977539062, -107.955078125, -104.69613647460938, -101.43719482421875, -98.17825317382812, -94.9193115234375, -91.66036987304688, -88.40142822265625, -85.14248657226562, -81.883544921875, -78.62460327148438, -75.36566162109375, -72.10671997070312, -68.8477783203125, -65.58883666992188, -62.32990264892578, -59.070960998535156, -55.81201934814453, -52.553077697753906, -49.29413604736328, -46.035194396972656, -42.7762565612793, -39.51731491088867, -36.25837326049805, -32.99943161010742, -29.740489959716797, -26.481550216674805, -23.22260856628418, -19.963666915893555, -16.704727172851562, -13.445785522460938, -10.186843872070312, -6.927902698516846, -3.668961524963379, -0.4100208282470703, 2.8489208221435547, 6.10786247253418, 9.366802215576172, 12.625743865966797, 15.884685516357422, 19.143627166748047, 22.402568817138672, 25.661508560180664, 28.92045021057129, 32.17938995361328, 35.438331604003906, 38.69727325439453, 41.956214904785156, 45.21515655517578, 48.474098205566406, 51.73303985595703, 54.991981506347656, 58.25092315673828, 61.50986099243164, 64.768798828125, 68.02774047851562, 71.28668212890625, 74.54562377929688, 77.8045654296875, 81.06350708007812, 84.32244873046875, 87.58139038085938, 90.84033203125, 94.09927368164062]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 8.0, 11.0, 15.0, 19.0, 28.0, 37.0, 65.0, 92.0, 131.0, 141.0, 191.0, 285.0, 343.0, 465.0, 624.0, 905.0, 1040176.0, 1711.0, 904.0, 612.0, 418.0, 344.0, 272.0, 213.0, 138.0, 121.0, 81.0, 50.0, 48.0, 22.0, 30.0, 18.0, 15.0, 10.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.43365478515625, -26.28952980041504, -25.145404815673828, -24.00128173828125, -22.85715675354004, -21.713031768798828, -20.568906784057617, -19.424781799316406, -18.280658721923828, -17.136533737182617, -15.992409706115723, -14.848284721374512, -13.704160690307617, -12.560035705566406, -11.415910720825195, -10.2717866897583, -9.127660751342773, -7.983536243438721, -6.839411735534668, -5.695286750793457, -4.551162242889404, -3.4070377349853516, -2.2629127502441406, -1.118788719177246, 0.025336265563964844, 1.1694608926773071, 2.3135855197906494, 3.4577102661132812, 4.601834774017334, 5.745959281921387, 6.890084266662598, 8.034208297729492, 9.178333282470703, 10.322458267211914, 11.466582298278809, 12.61070728302002, 13.754831314086914, 14.898956298828125, 16.043081283569336, 17.187206268310547, 18.331329345703125, 19.475454330444336, 20.619579315185547, 21.763702392578125, 22.907827377319336, 24.051952362060547, 25.196077346801758, 26.34020233154297, 27.48432731628418, 28.62845230102539, 29.7725772857666, 30.916702270507812, 32.06082534790039, 33.20494842529297, 34.34907531738281, 35.49319839477539, 36.637325286865234, 37.78144836425781, 38.925575256347656, 40.069698333740234, 41.21382522583008, 42.357948303222656, 43.5020751953125, 44.64619827270508, 45.790321350097656]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 7.0, 6.0, 6.0, 4.0, 6.0, 8.0, 10.0, 18.0, 31.0, 57.0, 153.0, 10681.0, 51451892.0, 170.0, 48.0, 18.0, 14.0, 6.0, 7.0, 3.0, 8.0, 5.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2576.9765625, -2478.245849609375, -2379.51513671875, -2280.784423828125, -2182.0537109375, -2083.322998046875, -1984.59228515625, -1885.861572265625, -1787.130859375, -1688.400146484375, -1589.66943359375, -1490.938720703125, -1392.2080078125, -1293.477294921875, -1194.74658203125, -1096.015869140625, -997.2850341796875, -898.5543212890625, -799.8236083984375, -701.0928955078125, -602.3621826171875, -503.6314392089844, -404.90069580078125, -306.16998291015625, -207.43927001953125, -108.70854949951172, -9.977828979492188, 88.75289916992188, 187.48361206054688, 286.2143249511719, 384.945068359375, 483.67578125, 582.406494140625, 681.13720703125, 779.867919921875, 878.5986328125, 977.329345703125, 1076.06005859375, 1174.790771484375, 1273.521484375, 1372.252197265625, 1470.98291015625, 1569.713623046875, 1668.4443359375, 1767.175048828125, 1865.90576171875, 1964.636474609375, 2063.3671875, 2162.09814453125, 2260.828857421875, 2359.5595703125, 2458.290283203125, 2557.02099609375, 2655.751708984375, 2754.482421875, 2853.213134765625, 2951.94384765625, 3050.674560546875, 3149.4052734375, 3248.135986328125, 3346.86669921875, 3445.597412109375, 3544.328125, 3643.058837890625, 3741.78955078125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 11.0, 7.0, 7.0, 22.0, 38.0, 42.0, 63.0, 92.0, 121.0, 151.0, 202.0, 296.0, 379.0, 493.0, 833.0, 1177.0, 1647.0, 2427.0, 3529.0, 5489.0, 8623.0, 13538.0, 22836.0, 38799.0, 68611.0, 129379.0, 244227.0, 442904.0, 2928465.0, 1457480.0, 414743.0, 226887.0, 119603.0, 64500.0, 35892.0, 21091.0, 12758.0, 8105.0, 5143.0, 3307.0, 2320.0, 1588.0, 1052.0, 706.0, 546.0, 346.0, 290.0, 201.0, 130.0, 88.0, 74.0, 60.0, 34.0, 28.0, 23.0, 19.0, 10.0, 8.0, 5.0], "bins": [-2.091796875, -2.0301666259765625, -1.968536376953125, -1.9069061279296875, -1.84527587890625, -1.7836456298828125, -1.722015380859375, -1.6603851318359375, -1.5987548828125, -1.5371246337890625, -1.475494384765625, -1.4138641357421875, -1.35223388671875, -1.2906036376953125, -1.228973388671875, -1.1673431396484375, -1.105712890625, -1.0440826416015625, -0.982452392578125, -0.9208221435546875, -0.85919189453125, -0.7975616455078125, -0.735931396484375, -0.6743011474609375, -0.6126708984375, -0.5510406494140625, -0.489410400390625, -0.4277801513671875, -0.36614990234375, -0.3045196533203125, -0.242889404296875, -0.1812591552734375, -0.11962890625, -0.0579986572265625, 0.003631591796875, 0.0652618408203125, 0.12689208984375, 0.1885223388671875, 0.250152587890625, 0.3117828369140625, 0.3734130859375, 0.4350433349609375, 0.496673583984375, 0.5583038330078125, 0.61993408203125, 0.6815643310546875, 0.743194580078125, 0.8048248291015625, 0.866455078125, 0.9280853271484375, 0.989715576171875, 1.0513458251953125, 1.11297607421875, 1.1746063232421875, 1.236236572265625, 1.2978668212890625, 1.3594970703125, 1.4211273193359375, 1.482757568359375, 1.5443878173828125, 1.60601806640625, 1.6676483154296875, 1.729278564453125, 1.7909088134765625, 1.8525390625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 9.0, 10.0, 6.0, 10.0, 15.0, 7.0, 17.0, 21.0, 14.0, 23.0, 36.0, 32.0, 34.0, 31.0, 33.0, 44.0, 37.0, 46.0, 129.0, 759.0, 244.0, 43.0, 33.0, 39.0, 45.0, 37.0, 32.0, 20.0, 25.0, 22.0, 26.0, 18.0, 20.0, 29.0, 11.0, 8.0, 13.0, 6.0, 4.0, 6.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.2890625, -8.966552734375, -8.64404296875, -8.321533203125, -7.9990234375, -7.676513671875, -7.35400390625, -7.031494140625, -6.708984375, -6.386474609375, -6.06396484375, -5.741455078125, -5.4189453125, -5.096435546875, -4.77392578125, -4.451416015625, -4.12890625, -3.806396484375, -3.48388671875, -3.161376953125, -2.8388671875, -2.516357421875, -2.19384765625, -1.871337890625, -1.548828125, -1.226318359375, -0.90380859375, -0.581298828125, -0.2587890625, 0.063720703125, 0.38623046875, 0.708740234375, 1.03125, 1.353759765625, 1.67626953125, 1.998779296875, 2.3212890625, 2.643798828125, 2.96630859375, 3.288818359375, 3.611328125, 3.933837890625, 4.25634765625, 4.578857421875, 4.9013671875, 5.223876953125, 5.54638671875, 5.868896484375, 6.19140625, 6.513916015625, 6.83642578125, 7.158935546875, 7.4814453125, 7.803955078125, 8.12646484375, 8.448974609375, 8.771484375, 9.093994140625, 9.41650390625, 9.739013671875, 10.0615234375, 10.384033203125, 10.70654296875, 11.029052734375, 11.3515625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 10.0, 10.0, 32.0, 33.0, 42.0, 73.0, 108.0, 167.0, 223.0, 294.0, 451.0, 638.0, 1065.0, 1621.0, 2474.0, 3801.0, 5940.0, 9829.0, 15979.0, 27510.0, 47915.0, 84866.0, 156282.0, 298747.0, 587823.0, 3764142.0, 606279.0, 308329.0, 160117.0, 86595.0, 48067.0, 28051.0, 16457.0, 10107.0, 6183.0, 3929.0, 2487.0, 1591.0, 1032.0, 715.0, 454.0, 325.0, 218.0, 128.0, 96.0, 68.0, 30.0, 24.0, 18.0, 25.0, 15.0, 10.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0], "bins": [-2.296875, -2.22161865234375, -2.1463623046875, -2.07110595703125, -1.995849609375, -1.92059326171875, -1.8453369140625, -1.77008056640625, -1.69482421875, -1.61956787109375, -1.5443115234375, -1.46905517578125, -1.393798828125, -1.31854248046875, -1.2432861328125, -1.16802978515625, -1.0927734375, -1.01751708984375, -0.9422607421875, -0.86700439453125, -0.791748046875, -0.71649169921875, -0.6412353515625, -0.56597900390625, -0.49072265625, -0.41546630859375, -0.3402099609375, -0.26495361328125, -0.189697265625, -0.11444091796875, -0.0391845703125, 0.03607177734375, 0.111328125, 0.18658447265625, 0.2618408203125, 0.33709716796875, 0.412353515625, 0.48760986328125, 0.5628662109375, 0.63812255859375, 0.71337890625, 0.78863525390625, 0.8638916015625, 0.93914794921875, 1.014404296875, 1.08966064453125, 1.1649169921875, 1.24017333984375, 1.3154296875, 1.39068603515625, 1.4659423828125, 1.54119873046875, 1.616455078125, 1.69171142578125, 1.7669677734375, 1.84222412109375, 1.91748046875, 1.99273681640625, 2.0679931640625, 2.14324951171875, 2.218505859375, 2.29376220703125, 2.3690185546875, 2.44427490234375, 2.51953125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 4.0, 2.0, 14.0, 13.0, 22.0, 17.0, 19.0, 12.0, 20.0, 28.0, 20.0, 37.0, 29.0, 30.0, 36.0, 31.0, 39.0, 36.0, 101.0, 681.0, 338.0, 57.0, 41.0, 42.0, 40.0, 47.0, 39.0, 23.0, 23.0, 25.0, 19.0, 21.0, 26.0, 12.0, 13.0, 11.0, 12.0, 8.0, 6.0, 9.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.90625, -7.666259765625, -7.42626953125, -7.186279296875, -6.9462890625, -6.706298828125, -6.46630859375, -6.226318359375, -5.986328125, -5.746337890625, -5.50634765625, -5.266357421875, -5.0263671875, -4.786376953125, -4.54638671875, -4.306396484375, -4.06640625, -3.826416015625, -3.58642578125, -3.346435546875, -3.1064453125, -2.866455078125, -2.62646484375, -2.386474609375, -2.146484375, -1.906494140625, -1.66650390625, -1.426513671875, -1.1865234375, -0.946533203125, -0.70654296875, -0.466552734375, -0.2265625, 0.013427734375, 0.25341796875, 0.493408203125, 0.7333984375, 0.973388671875, 1.21337890625, 1.453369140625, 1.693359375, 1.933349609375, 2.17333984375, 2.413330078125, 2.6533203125, 2.893310546875, 3.13330078125, 3.373291015625, 3.61328125, 3.853271484375, 4.09326171875, 4.333251953125, 4.5732421875, 4.813232421875, 5.05322265625, 5.293212890625, 5.533203125, 5.773193359375, 6.01318359375, 6.253173828125, 6.4931640625, 6.733154296875, 6.97314453125, 7.213134765625, 7.453125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 1.0, 5.0, 7.0, 13.0, 24.0, 26.0, 32.0, 50.0, 71.0, 72.0, 105.0, 136.0, 192.0, 289.0, 312.0, 452.0, 706.0, 965.0, 1557.0, 2628.0, 4359.0, 8559.0, 19359.0, 62235.0, 5495867.0, 595629.0, 58679.0, 18992.0, 8323.0, 4279.0, 2475.0, 1561.0, 1012.0, 672.0, 460.0, 353.0, 259.0, 159.0, 140.0, 100.0, 84.0, 61.0, 42.0, 39.0, 27.0, 21.0, 12.0, 14.0, 12.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-10.609375, -10.2877197265625, -9.966064453125, -9.6444091796875, -9.32275390625, -9.0010986328125, -8.679443359375, -8.3577880859375, -8.0361328125, -7.7144775390625, -7.392822265625, -7.0711669921875, -6.74951171875, -6.4278564453125, -6.106201171875, -5.7845458984375, -5.462890625, -5.1412353515625, -4.819580078125, -4.4979248046875, -4.17626953125, -3.8546142578125, -3.532958984375, -3.2113037109375, -2.8896484375, -2.5679931640625, -2.246337890625, -1.9246826171875, -1.60302734375, -1.2813720703125, -0.959716796875, -0.6380615234375, -0.31640625, 0.0052490234375, 0.326904296875, 0.6485595703125, 0.97021484375, 1.2918701171875, 1.613525390625, 1.9351806640625, 2.2568359375, 2.5784912109375, 2.900146484375, 3.2218017578125, 3.54345703125, 3.8651123046875, 4.186767578125, 4.5084228515625, 4.830078125, 5.1517333984375, 5.473388671875, 5.7950439453125, 6.11669921875, 6.4383544921875, 6.760009765625, 7.0816650390625, 7.4033203125, 7.7249755859375, 8.046630859375, 8.3682861328125, 8.68994140625, 9.0115966796875, 9.333251953125, 9.6549072265625, 9.9765625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 5.0, 6.0, 4.0, 5.0, 9.0, 12.0, 10.0, 9.0, 23.0, 16.0, 20.0, 18.0, 21.0, 19.0, 25.0, 31.0, 44.0, 32.0, 32.0, 38.0, 51.0, 74.0, 141.0, 505.0, 394.0, 75.0, 40.0, 30.0, 32.0, 36.0, 26.0, 31.0, 19.0, 18.0, 20.0, 19.0, 12.0, 23.0, 9.0, 16.0, 15.0, 17.0, 10.0, 7.0, 2.0, 9.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.0703125, -4.90692138671875, -4.7435302734375, -4.58013916015625, -4.416748046875, -4.25335693359375, -4.0899658203125, -3.92657470703125, -3.76318359375, -3.59979248046875, -3.4364013671875, -3.27301025390625, -3.109619140625, -2.94622802734375, -2.7828369140625, -2.61944580078125, -2.4560546875, -2.29266357421875, -2.1292724609375, -1.96588134765625, -1.802490234375, -1.63909912109375, -1.4757080078125, -1.31231689453125, -1.14892578125, -0.98553466796875, -0.8221435546875, -0.65875244140625, -0.495361328125, -0.33197021484375, -0.1685791015625, -0.00518798828125, 0.158203125, 0.32159423828125, 0.4849853515625, 0.64837646484375, 0.811767578125, 0.97515869140625, 1.1385498046875, 1.30194091796875, 1.46533203125, 1.62872314453125, 1.7921142578125, 1.95550537109375, 2.118896484375, 2.28228759765625, 2.4456787109375, 2.60906982421875, 2.7724609375, 2.93585205078125, 3.0992431640625, 3.26263427734375, 3.426025390625, 3.58941650390625, 3.7528076171875, 3.91619873046875, 4.07958984375, 4.24298095703125, 4.4063720703125, 4.56976318359375, 4.733154296875, 4.89654541015625, 5.0599365234375, 5.22332763671875, 5.38671875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 5.0, 10.0, 9.0, 37.0, 80.0, 176.0, 309.0, 233.0, 98.0, 23.0, 11.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.99706268310547, -43.09306335449219, -42.189064025878906, -41.285064697265625, -40.381065368652344, -39.47706604003906, -38.57306671142578, -37.669071197509766, -36.765071868896484, -35.8610725402832, -34.95707321166992, -34.05307388305664, -33.14907455444336, -32.245079040527344, -31.34107780456543, -30.43707847595215, -29.533079147338867, -28.629079818725586, -27.725080490112305, -26.821083068847656, -25.917083740234375, -25.013084411621094, -24.109085083007812, -23.20508575439453, -22.30108642578125, -21.39708709716797, -20.493087768554688, -19.589088439941406, -18.685091018676758, -17.781091690063477, -16.877092361450195, -15.973093032836914, -15.069096565246582, -14.1650972366333, -13.261098861694336, -12.357099533081055, -11.453100204467773, -10.549101829528809, -9.645102500915527, -8.741104125976562, -7.837104797363281, -6.933105945587158, -6.029107093811035, -5.125107765197754, -4.221108913421631, -3.317110061645508, -2.4131107330322266, -1.5091118812561035, -0.6051130294799805, 0.29888594150543213, 1.2028849124908447, 2.106884002685547, 3.01088285446167, 3.914881706237793, 4.818881034851074, 5.722879886627197, 6.62687873840332, 7.530877590179443, 8.434876441955566, 9.338875770568848, 10.242874145507812, 11.146873474121094, 12.050872802734375, 12.954872131347656, 13.858870506286621]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 17.0, 22.0, 24.0, 23.0, 38.0, 42.0, 39.0, 53.0, 70.0, 67.0, 61.0, 71.0, 77.0, 71.0, 73.0, 55.0, 48.0, 25.0, 28.0, 17.0, 14.0, 12.0, 14.0, 8.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.263928413391113, -14.757878303527832, -14.25182819366455, -13.74577808380127, -13.239728927612305, -12.733678817749023, -12.227628707885742, -11.721578598022461, -11.21552848815918, -10.709478378295898, -10.203428268432617, -9.697378158569336, -9.191328048706055, -8.685277938842773, -8.179228782653809, -7.673178672790527, -7.167128562927246, -6.661078453063965, -6.155028343200684, -5.6489787101745605, -5.142928600311279, -4.636878490447998, -4.130828857421875, -3.6247787475585938, -3.1187286376953125, -2.6126785278320312, -2.106628656387329, -1.6005786657333374, -1.0945286750793457, -0.5884785652160645, -0.0824286937713623, 0.42362117767333984, 0.9296722412109375, 1.4357222318649292, 1.941772222518921, 2.447822093963623, 2.9538722038269043, 3.4599223136901855, 3.9659721851348877, 4.47202205657959, 4.978072166442871, 5.484122276306152, 5.990172386169434, 6.496222019195557, 7.002272129058838, 7.508322238922119, 8.014371871948242, 8.520421981811523, 9.026472091674805, 9.532522201538086, 10.038572311401367, 10.544622421264648, 11.05067253112793, 11.556722640991211, 12.062771797180176, 12.568821907043457, 13.074872016906738, 13.58092212677002, 14.0869722366333, 14.593022346496582, 15.099071502685547, 15.605121612548828, 16.11117172241211, 16.61722183227539, 17.123271942138672]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 8.0, 8.0, 14.0, 10.0, 22.0, 34.0, 43.0, 51.0, 76.0, 112.0, 158.0, 208.0, 315.0, 482.0, 732.0, 1237.0, 1983.0, 3272.0, 6075.0, 12140.0, 29409.0, 105581.0, 3804638.0, 153821.0, 38835.0, 16019.0, 7727.0, 4329.0, 2527.0, 1543.0, 939.0, 611.0, 402.0, 282.0, 177.0, 130.0, 89.0, 69.0, 33.0, 42.0, 18.0, 22.0, 10.0, 16.0, 7.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.2049560546875, -0.19803237915039062, -0.19110870361328125, -0.18418502807617188, -0.1772613525390625, -0.17033767700195312, -0.16341400146484375, -0.15649032592773438, -0.149566650390625, -0.14264297485351562, -0.13571929931640625, -0.12879562377929688, -0.1218719482421875, -0.11494827270507812, -0.10802459716796875, -0.10110092163085938, -0.09417724609375, -0.08725357055664062, -0.08032989501953125, -0.07340621948242188, -0.0664825439453125, -0.059558868408203125, -0.05263519287109375, -0.045711517333984375, -0.038787841796875, -0.031864166259765625, -0.02494049072265625, -0.018016815185546875, -0.0110931396484375, -0.004169464111328125, 0.00275421142578125, 0.009677886962890625, 0.0166015625, 0.023525238037109375, 0.03044891357421875, 0.037372589111328125, 0.0442962646484375, 0.051219940185546875, 0.05814361572265625, 0.06506729125976562, 0.071990966796875, 0.07891464233398438, 0.08583831787109375, 0.09276199340820312, 0.0996856689453125, 0.10660934448242188, 0.11353302001953125, 0.12045669555664062, 0.12738037109375, 0.13430404663085938, 0.14122772216796875, 0.14815139770507812, 0.1550750732421875, 0.16199874877929688, 0.16892242431640625, 0.17584609985351562, 0.182769775390625, 0.18969345092773438, 0.19661712646484375, 0.20354080200195312, 0.2104644775390625, 0.21738815307617188, 0.22431182861328125, 0.23123550415039062, 0.2381591796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 1.0, 3.0, 8.0, 5.0, 10.0, 15.0, 19.0, 20.0, 44.0, 751.0, 19.0, 20.0, 17.0, 6.0, 8.0, 3.0, 7.0, 3.0, 5.0, 3.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06097412109375, -0.05882549285888672, -0.05667686462402344, -0.054528236389160156, -0.052379608154296875, -0.050230979919433594, -0.04808235168457031, -0.04593372344970703, -0.04378509521484375, -0.04163646697998047, -0.03948783874511719, -0.037339210510253906, -0.035190582275390625, -0.033041954040527344, -0.030893325805664062, -0.02874469757080078, -0.0265960693359375, -0.02444744110107422, -0.022298812866210938, -0.020150184631347656, -0.018001556396484375, -0.015852928161621094, -0.013704299926757812, -0.011555671691894531, -0.00940704345703125, -0.007258415222167969, -0.0051097869873046875, -0.0029611587524414062, -0.000812530517578125, 0.0013360977172851562, 0.0034847259521484375, 0.005633354187011719, 0.007781982421875, 0.009930610656738281, 0.012079238891601562, 0.014227867126464844, 0.016376495361328125, 0.018525123596191406, 0.020673751831054688, 0.02282238006591797, 0.02497100830078125, 0.02711963653564453, 0.029268264770507812, 0.031416893005371094, 0.033565521240234375, 0.035714149475097656, 0.03786277770996094, 0.04001140594482422, 0.0421600341796875, 0.04430866241455078, 0.04645729064941406, 0.048605918884277344, 0.050754547119140625, 0.052903175354003906, 0.05505180358886719, 0.05720043182373047, 0.05934906005859375, 0.06149768829345703, 0.06364631652832031, 0.0657949447631836, 0.06794357299804688, 0.07009220123291016, 0.07224082946777344, 0.07438945770263672, 0.0765380859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 3.0, 11.0, 10.0, 12.0, 28.0, 31.0, 52.0, 76.0, 145.0, 272.0, 430.0, 894.0, 1901.0, 4254.0, 10652.0, 30840.0, 106418.0, 517918.0, 2725018.0, 622595.0, 119964.0, 33609.0, 11176.0, 4300.0, 1873.0, 865.0, 380.0, 232.0, 118.0, 66.0, 49.0, 30.0, 18.0, 21.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.223876953125, -0.21757888793945312, -0.21128082275390625, -0.20498275756835938, -0.1986846923828125, -0.19238662719726562, -0.18608856201171875, -0.17979049682617188, -0.173492431640625, -0.16719436645507812, -0.16089630126953125, -0.15459823608398438, -0.1483001708984375, -0.14200210571289062, -0.13570404052734375, -0.12940597534179688, -0.12310791015625, -0.11680984497070312, -0.11051177978515625, -0.10421371459960938, -0.0979156494140625, -0.09161758422851562, -0.08531951904296875, -0.07902145385742188, -0.072723388671875, -0.06642532348632812, -0.06012725830078125, -0.053829193115234375, -0.0475311279296875, -0.041233062744140625, -0.03493499755859375, -0.028636932373046875, -0.0223388671875, -0.016040802001953125, -0.00974273681640625, -0.003444671630859375, 0.0028533935546875, 0.009151458740234375, 0.01544952392578125, 0.021747589111328125, 0.028045654296875, 0.034343719482421875, 0.04064178466796875, 0.046939849853515625, 0.0532379150390625, 0.059535980224609375, 0.06583404541015625, 0.07213211059570312, 0.07843017578125, 0.08472824096679688, 0.09102630615234375, 0.09732437133789062, 0.1036224365234375, 0.10992050170898438, 0.11621856689453125, 0.12251663208007812, 0.128814697265625, 0.13511276245117188, 0.14141082763671875, 0.14770889282226562, 0.1540069580078125, 0.16030502319335938, 0.16660308837890625, 0.17290115356445312, 0.17919921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 4.0, 7.0, 7.0, 7.0, 9.0, 18.0, 30.0, 28.0, 42.0, 44.0, 89.0, 85.0, 127.0, 205.0, 287.0, 476.0, 777.0, 656.0, 367.0, 235.0, 172.0, 97.0, 69.0, 45.0, 55.0, 32.0, 23.0, 22.0, 16.0, 11.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0823974609375, -0.08009052276611328, -0.07778358459472656, -0.07547664642333984, -0.07316970825195312, -0.0708627700805664, -0.06855583190917969, -0.06624889373779297, -0.06394195556640625, -0.06163501739501953, -0.05932807922363281, -0.057021141052246094, -0.054714202880859375, -0.052407264709472656, -0.05010032653808594, -0.04779338836669922, -0.0454864501953125, -0.04317951202392578, -0.04087257385253906, -0.038565635681152344, -0.036258697509765625, -0.033951759338378906, -0.03164482116699219, -0.02933788299560547, -0.02703094482421875, -0.02472400665283203, -0.022417068481445312, -0.020110130310058594, -0.017803192138671875, -0.015496253967285156, -0.013189315795898438, -0.010882377624511719, -0.008575439453125, -0.006268501281738281, -0.0039615631103515625, -0.0016546249389648438, 0.000652313232421875, 0.0029592514038085938, 0.0052661895751953125, 0.007573127746582031, 0.00988006591796875, 0.012187004089355469, 0.014493942260742188, 0.016800880432128906, 0.019107818603515625, 0.021414756774902344, 0.023721694946289062, 0.02602863311767578, 0.0283355712890625, 0.03064250946044922, 0.03294944763183594, 0.035256385803222656, 0.037563323974609375, 0.039870262145996094, 0.04217720031738281, 0.04448413848876953, 0.04679107666015625, 0.04909801483154297, 0.05140495300292969, 0.053711891174316406, 0.056018829345703125, 0.058325767517089844, 0.06063270568847656, 0.06293964385986328, 0.06524658203125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 14.0, 28.0, 37.0, 79.0, 143.0, 207.0, 226.0, 145.0, 58.0, 39.0, 15.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7778091430664062, -0.7519026398658752, -0.7259961366653442, -0.700089693069458, -0.674183189868927, -0.648276686668396, -0.622370183467865, -0.596463680267334, -0.5705572366714478, -0.5446507334709167, -0.5187442302703857, -0.4928377568721771, -0.4669312834739685, -0.4410247802734375, -0.4151182770729065, -0.3892117738723755, -0.3633052706718445, -0.3373987674713135, -0.31149229407310486, -0.28558579087257385, -0.25967931747436523, -0.23377281427383423, -0.20786631107330322, -0.1819598227739334, -0.1560533344745636, -0.1301468461751938, -0.10424035042524338, -0.07833385467529297, -0.05242736637592316, -0.026520878076553345, -0.0006143748760223389, 0.025292113423347473, 0.05119854211807251, 0.07710503041744232, 0.10301152616739273, 0.12891802191734314, 0.15482451021671295, 0.18073099851608276, 0.20663750171661377, 0.23254399001598358, 0.2584504783153534, 0.2843569815158844, 0.310263454914093, 0.336169958114624, 0.36207646131515503, 0.38798293471336365, 0.41388943791389465, 0.43979591131210327, 0.4657024145126343, 0.4916089177131653, 0.5175154209136963, 0.5434218645095825, 0.5693283677101135, 0.5952348709106445, 0.6211413741111755, 0.6470478773117065, 0.6729543209075928, 0.6988608241081238, 0.7247673273086548, 0.750673770904541, 0.776580274105072, 0.802486777305603, 0.828393280506134, 0.854299783706665, 0.880206286907196]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 9.0, 8.0, 19.0, 20.0, 22.0, 30.0, 36.0, 35.0, 47.0, 54.0, 61.0, 59.0, 67.0, 78.0, 70.0, 60.0, 61.0, 56.0, 56.0, 26.0, 30.0, 20.0, 21.0, 13.0, 12.0, 8.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38632452487945557, -0.37400761246681213, -0.3616907000541687, -0.34937378764152527, -0.33705687522888184, -0.3247399628162384, -0.31242305040359497, -0.30010613799095154, -0.2877892255783081, -0.2754723131656647, -0.26315540075302124, -0.2508384883403778, -0.23852157592773438, -0.22620466351509094, -0.2138877511024475, -0.20157083868980408, -0.18925391137599945, -0.17693699896335602, -0.16462008655071259, -0.15230317413806915, -0.13998626172542572, -0.1276693493127823, -0.11535242944955826, -0.10303551703691483, -0.09071860462427139, -0.07840169221162796, -0.06608477979898453, -0.053767863661050797, -0.041450951248407364, -0.02913403883576393, -0.0168171226978302, -0.004500210285186768, 0.007816702127456665, 0.020133614540100098, 0.03245052695274353, 0.04476744309067726, 0.057084355503320694, 0.06940126419067383, 0.08171818405389786, 0.09403509646654129, 0.10635200887918472, 0.11866892129182816, 0.13098584115505219, 0.14330275356769562, 0.15561966598033905, 0.16793657839298248, 0.18025349080562592, 0.19257040321826935, 0.20488731563091278, 0.2172042280435562, 0.22952114045619965, 0.24183805286884308, 0.2541549801826477, 0.26647189259529114, 0.27878880500793457, 0.291105717420578, 0.30342262983322144, 0.31573954224586487, 0.3280564546585083, 0.34037336707115173, 0.35269027948379517, 0.3650071918964386, 0.37732410430908203, 0.38964101672172546, 0.4019579291343689]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 8.0, 13.0, 5.0, 17.0, 17.0, 34.0, 44.0, 63.0, 79.0, 128.0, 180.0, 261.0, 422.0, 617.0, 890.0, 1479.0, 2346.0, 3811.0, 6338.0, 12112.0, 25601.0, 226965.0, 699391.0, 33924.0, 14625.0, 7580.0, 4351.0, 2621.0, 1639.0, 967.0, 688.0, 408.0, 286.0, 192.0, 125.0, 97.0, 66.0, 45.0, 36.0, 19.0, 25.0, 13.0, 8.0, 3.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.31787109375, -0.3079795837402344, -0.29808807373046875, -0.2881965637207031, -0.2783050537109375, -0.2684135437011719, -0.25852203369140625, -0.24863052368164062, -0.238739013671875, -0.22884750366210938, -0.21895599365234375, -0.20906448364257812, -0.1991729736328125, -0.18928146362304688, -0.17938995361328125, -0.16949844360351562, -0.15960693359375, -0.14971542358398438, -0.13982391357421875, -0.12993240356445312, -0.1200408935546875, -0.11014938354492188, -0.10025787353515625, -0.09036636352539062, -0.080474853515625, -0.07058334350585938, -0.06069183349609375, -0.050800323486328125, -0.0409088134765625, -0.031017303466796875, -0.02112579345703125, -0.011234283447265625, -0.0013427734375, 0.008548736572265625, 0.01844024658203125, 0.028331756591796875, 0.0382232666015625, 0.048114776611328125, 0.05800628662109375, 0.06789779663085938, 0.077789306640625, 0.08768081665039062, 0.09757232666015625, 0.10746383666992188, 0.1173553466796875, 0.12724685668945312, 0.13713836669921875, 0.14702987670898438, 0.15692138671875, 0.16681289672851562, 0.17670440673828125, 0.18659591674804688, 0.1964874267578125, 0.20637893676757812, 0.21627044677734375, 0.22616195678710938, 0.236053466796875, 0.24594497680664062, 0.25583648681640625, 0.2657279968261719, 0.2756195068359375, 0.2855110168457031, 0.29540252685546875, 0.3052940368652344, 0.315185546875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 12.0, 13.0, 19.0, 26.0, 181.0, 426.0, 184.0, 31.0, 15.0, 8.0, 8.0, 9.0, 2.0, 3.0, 7.0, 4.0, 5.0, 2.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0614013671875, -0.05939292907714844, -0.057384490966796875, -0.05537605285644531, -0.05336761474609375, -0.05135917663574219, -0.049350738525390625, -0.04734230041503906, -0.0453338623046875, -0.04332542419433594, -0.041316986083984375, -0.03930854797363281, -0.03730010986328125, -0.03529167175292969, -0.033283233642578125, -0.03127479553222656, -0.029266357421875, -0.027257919311523438, -0.025249481201171875, -0.023241043090820312, -0.02123260498046875, -0.019224166870117188, -0.017215728759765625, -0.015207290649414062, -0.0131988525390625, -0.011190414428710938, -0.009181976318359375, -0.0071735382080078125, -0.00516510009765625, -0.0031566619873046875, -0.001148223876953125, 0.0008602142333984375, 0.00286865234375, 0.0048770904541015625, 0.006885528564453125, 0.008893966674804688, 0.01090240478515625, 0.012910842895507812, 0.014919281005859375, 0.016927719116210938, 0.0189361572265625, 0.020944595336914062, 0.022953033447265625, 0.024961471557617188, 0.02696990966796875, 0.028978347778320312, 0.030986785888671875, 0.03299522399902344, 0.035003662109375, 0.03701210021972656, 0.039020538330078125, 0.04102897644042969, 0.04303741455078125, 0.04504585266113281, 0.047054290771484375, 0.04906272888183594, 0.0510711669921875, 0.05307960510253906, 0.055088043212890625, 0.05709648132324219, 0.05910491943359375, 0.06111335754394531, 0.06312179565429688, 0.06513023376464844, 0.067138671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 11.0, 13.0, 11.0, 19.0, 26.0, 36.0, 51.0, 86.0, 141.0, 211.0, 306.0, 557.0, 1038.0, 2093.0, 5188.0, 14830.0, 52014.0, 218862.0, 507783.0, 180027.0, 43579.0, 12728.0, 4606.0, 1982.0, 945.0, 527.0, 304.0, 165.0, 131.0, 97.0, 41.0, 45.0, 24.0, 21.0, 12.0, 5.0, 5.0, 9.0, 6.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.3056640625, -0.2967872619628906, -0.28791046142578125, -0.2790336608886719, -0.2701568603515625, -0.2612800598144531, -0.25240325927734375, -0.24352645874023438, -0.234649658203125, -0.22577285766601562, -0.21689605712890625, -0.20801925659179688, -0.1991424560546875, -0.19026565551757812, -0.18138885498046875, -0.17251205444335938, -0.16363525390625, -0.15475845336914062, -0.14588165283203125, -0.13700485229492188, -0.1281280517578125, -0.11925125122070312, -0.11037445068359375, -0.10149765014648438, -0.092620849609375, -0.08374404907226562, -0.07486724853515625, -0.06599044799804688, -0.0571136474609375, -0.048236846923828125, -0.03936004638671875, -0.030483245849609375, -0.0216064453125, -0.012729644775390625, -0.00385284423828125, 0.005023956298828125, 0.0139007568359375, 0.022777557373046875, 0.03165435791015625, 0.040531158447265625, 0.049407958984375, 0.058284759521484375, 0.06716156005859375, 0.07603836059570312, 0.0849151611328125, 0.09379196166992188, 0.10266876220703125, 0.11154556274414062, 0.12042236328125, 0.12929916381835938, 0.13817596435546875, 0.14705276489257812, 0.1559295654296875, 0.16480636596679688, 0.17368316650390625, 0.18255996704101562, 0.191436767578125, 0.20031356811523438, 0.20919036865234375, 0.21806716918945312, 0.2269439697265625, 0.23582077026367188, 0.24469757080078125, 0.2535743713378906, 0.262451171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 12.0, 11.0, 11.0, 14.0, 21.0, 25.0, 21.0, 28.0, 29.0, 31.0, 34.0, 41.0, 51.0, 46.0, 41.0, 48.0, 46.0, 52.0, 50.0, 45.0, 47.0, 27.0, 42.0, 34.0, 37.0, 34.0, 19.0, 23.0, 13.0, 15.0, 13.0, 8.0, 2.0, 9.0, 7.0, 6.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.253173828125, -0.24493789672851562, -0.23670196533203125, -0.22846603393554688, -0.2202301025390625, -0.21199417114257812, -0.20375823974609375, -0.19552230834960938, -0.187286376953125, -0.17905044555664062, -0.17081451416015625, -0.16257858276367188, -0.1543426513671875, -0.14610671997070312, -0.13787078857421875, -0.12963485717773438, -0.12139892578125, -0.11316299438476562, -0.10492706298828125, -0.09669113159179688, -0.0884552001953125, -0.08021926879882812, -0.07198333740234375, -0.06374740600585938, -0.055511474609375, -0.047275543212890625, -0.03903961181640625, -0.030803680419921875, -0.0225677490234375, -0.014331817626953125, -0.00609588623046875, 0.002140045166015625, 0.0103759765625, 0.018611907958984375, 0.02684783935546875, 0.035083770751953125, 0.0433197021484375, 0.051555633544921875, 0.05979156494140625, 0.06802749633789062, 0.076263427734375, 0.08449935913085938, 0.09273529052734375, 0.10097122192382812, 0.1092071533203125, 0.11744308471679688, 0.12567901611328125, 0.13391494750976562, 0.14215087890625, 0.15038681030273438, 0.15862274169921875, 0.16685867309570312, 0.1750946044921875, 0.18333053588867188, 0.19156646728515625, 0.19980239868164062, 0.208038330078125, 0.21627426147460938, 0.22451019287109375, 0.23274612426757812, 0.2409820556640625, 0.24921798706054688, 0.25745391845703125, 0.2656898498535156, 0.27392578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 4.0, 5.0, 11.0, 10.0, 18.0, 24.0, 52.0, 62.0, 98.0, 176.0, 272.0, 529.0, 1157.0, 2838.0, 8840.0, 60830.0, 877939.0, 80101.0, 9944.0, 3124.0, 1210.0, 544.0, 290.0, 151.0, 83.0, 72.0, 50.0, 44.0, 25.0, 18.0, 10.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.505828857421875, -0.48870849609375, -0.471588134765625, -0.4544677734375, -0.437347412109375, -0.42022705078125, -0.403106689453125, -0.385986328125, -0.368865966796875, -0.35174560546875, -0.334625244140625, -0.3175048828125, -0.300384521484375, -0.28326416015625, -0.266143798828125, -0.2490234375, -0.231903076171875, -0.21478271484375, -0.197662353515625, -0.1805419921875, -0.163421630859375, -0.14630126953125, -0.129180908203125, -0.112060546875, -0.094940185546875, -0.07781982421875, -0.060699462890625, -0.0435791015625, -0.026458740234375, -0.00933837890625, 0.007781982421875, 0.02490234375, 0.042022705078125, 0.05914306640625, 0.076263427734375, 0.0933837890625, 0.110504150390625, 0.12762451171875, 0.144744873046875, 0.161865234375, 0.178985595703125, 0.19610595703125, 0.213226318359375, 0.2303466796875, 0.247467041015625, 0.26458740234375, 0.281707763671875, 0.298828125, 0.315948486328125, 0.33306884765625, 0.350189208984375, 0.3673095703125, 0.384429931640625, 0.40155029296875, 0.418670654296875, 0.435791015625, 0.452911376953125, 0.47003173828125, 0.487152099609375, 0.5042724609375, 0.521392822265625, 0.53851318359375, 0.555633544921875, 0.57275390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 8.0, 4.0, 1.0, 8.0, 6.0, 11.0, 15.0, 18.0, 28.0, 35.0, 51.0, 46.0, 70.0, 59.0, 73.0, 58.0, 100.0, 75.0, 59.0, 51.0, 43.0, 33.0, 39.0, 24.0, 21.0, 7.0, 15.0, 9.0, 5.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.722574234008789e-05, -1.6555190086364746e-05, -1.58846378326416e-05, -1.5214085578918457e-05, -1.4543533325195312e-05, -1.3872981071472168e-05, -1.3202428817749023e-05, -1.2531876564025879e-05, -1.1861324310302734e-05, -1.119077205657959e-05, -1.0520219802856445e-05, -9.8496675491333e-06, -9.179115295410156e-06, -8.508563041687012e-06, -7.838010787963867e-06, -7.167458534240723e-06, -6.496906280517578e-06, -5.826354026794434e-06, -5.155801773071289e-06, -4.4852495193481445e-06, -3.814697265625e-06, -3.1441450119018555e-06, -2.473592758178711e-06, -1.8030405044555664e-06, -1.1324882507324219e-06, -4.6193599700927734e-07, 2.086162567138672e-07, 8.791685104370117e-07, 1.5497207641601562e-06, 2.2202730178833008e-06, 2.8908252716064453e-06, 3.56137752532959e-06, 4.231929779052734e-06, 4.902482032775879e-06, 5.5730342864990234e-06, 6.243586540222168e-06, 6.9141387939453125e-06, 7.584691047668457e-06, 8.255243301391602e-06, 8.925795555114746e-06, 9.59634780883789e-06, 1.0266900062561035e-05, 1.093745231628418e-05, 1.1608004570007324e-05, 1.2278556823730469e-05, 1.2949109077453613e-05, 1.3619661331176758e-05, 1.4290213584899902e-05, 1.4960765838623047e-05, 1.563131809234619e-05, 1.6301870346069336e-05, 1.697242259979248e-05, 1.7642974853515625e-05, 1.831352710723877e-05, 1.8984079360961914e-05, 1.965463161468506e-05, 2.0325183868408203e-05, 2.0995736122131348e-05, 2.1666288375854492e-05, 2.2336840629577637e-05, 2.300739288330078e-05, 2.3677945137023926e-05, 2.434849739074707e-05, 2.5019049644470215e-05, 2.568960189819336e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 7.0, 5.0, 17.0, 23.0, 25.0, 51.0, 62.0, 91.0, 113.0, 201.0, 291.0, 410.0, 741.0, 1351.0, 2493.0, 4686.0, 10600.0, 26936.0, 82704.0, 312472.0, 426013.0, 116963.0, 35916.0, 13589.0, 6000.0, 2900.0, 1555.0, 845.0, 516.0, 305.0, 207.0, 128.0, 97.0, 73.0, 47.0, 30.0, 22.0, 16.0, 13.0, 5.0, 5.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.23828125, -0.23109054565429688, -0.22389984130859375, -0.21670913696289062, -0.2095184326171875, -0.20232772827148438, -0.19513702392578125, -0.18794631958007812, -0.180755615234375, -0.17356491088867188, -0.16637420654296875, -0.15918350219726562, -0.1519927978515625, -0.14480209350585938, -0.13761138916015625, -0.13042068481445312, -0.12322998046875, -0.11603927612304688, -0.10884857177734375, -0.10165786743164062, -0.0944671630859375, -0.08727645874023438, -0.08008575439453125, -0.07289505004882812, -0.065704345703125, -0.058513641357421875, -0.05132293701171875, -0.044132232666015625, -0.0369415283203125, -0.029750823974609375, -0.02256011962890625, -0.015369415283203125, -0.0081787109375, -0.000988006591796875, 0.00620269775390625, 0.013393402099609375, 0.0205841064453125, 0.027774810791015625, 0.03496551513671875, 0.042156219482421875, 0.049346923828125, 0.056537628173828125, 0.06372833251953125, 0.07091903686523438, 0.0781097412109375, 0.08530044555664062, 0.09249114990234375, 0.09968185424804688, 0.10687255859375, 0.11406326293945312, 0.12125396728515625, 0.12844467163085938, 0.1356353759765625, 0.14282608032226562, 0.15001678466796875, 0.15720748901367188, 0.164398193359375, 0.17158889770507812, 0.17877960205078125, 0.18597030639648438, 0.1931610107421875, 0.20035171508789062, 0.20754241943359375, 0.21473312377929688, 0.221923828125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 5.0, 3.0, 8.0, 12.0, 16.0, 15.0, 26.0, 35.0, 28.0, 38.0, 49.0, 44.0, 62.0, 77.0, 71.0, 69.0, 56.0, 50.0, 58.0, 47.0, 48.0, 30.0, 27.0, 20.0, 35.0, 12.0, 10.0, 7.0, 9.0, 4.0, 6.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.204833984375, -0.19755172729492188, -0.19026947021484375, -0.18298721313476562, -0.1757049560546875, -0.16842269897460938, -0.16114044189453125, -0.15385818481445312, -0.146575927734375, -0.13929367065429688, -0.13201141357421875, -0.12472915649414062, -0.1174468994140625, -0.11016464233398438, -0.10288238525390625, -0.09560012817382812, -0.08831787109375, -0.08103561401367188, -0.07375335693359375, -0.06647109985351562, -0.0591888427734375, -0.051906585693359375, -0.04462432861328125, -0.037342071533203125, -0.030059814453125, -0.022777557373046875, -0.01549530029296875, -0.008213043212890625, -0.0009307861328125, 0.006351470947265625, 0.01363372802734375, 0.020915985107421875, 0.0281982421875, 0.035480499267578125, 0.04276275634765625, 0.050045013427734375, 0.0573272705078125, 0.06460952758789062, 0.07189178466796875, 0.07917404174804688, 0.086456298828125, 0.09373855590820312, 0.10102081298828125, 0.10830307006835938, 0.1155853271484375, 0.12286758422851562, 0.13014984130859375, 0.13743209838867188, 0.14471435546875, 0.15199661254882812, 0.15927886962890625, 0.16656112670898438, 0.1738433837890625, 0.18112564086914062, 0.18840789794921875, 0.19569015502929688, 0.202972412109375, 0.21025466918945312, 0.21753692626953125, 0.22481918334960938, 0.2321014404296875, 0.23938369750976562, 0.24666595458984375, 0.2539482116699219, 0.26123046875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 18.0, 25.0, 83.0, 195.0, 336.0, 200.0, 74.0, 25.0, 13.0, 6.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.972434043884277, -4.819847106933594, -4.667260646820068, -4.514673709869385, -4.362086772918701, -4.209499835968018, -4.056913375854492, -3.9043264389038086, -3.751739501953125, -3.5991528034210205, -3.446565866470337, -3.2939791679382324, -3.141392230987549, -2.9888055324554443, -2.83621883392334, -2.6836318969726562, -2.5310451984405518, -2.3784584999084473, -2.2258715629577637, -2.073284864425659, -1.9206979274749756, -1.768111228942871, -1.615524411201477, -1.462937593460083, -1.310350775718689, -1.157763957977295, -1.0051771402359009, -0.8525903820991516, -0.7000035643577576, -0.5474167466163635, -0.39482998847961426, -0.24224317073822021, -0.08965635299682617, 0.06293044984340668, 0.21551725268363953, 0.3681040406227112, 0.5206908583641052, 0.6732776761054993, 0.8258644342422485, 0.9784512519836426, 1.1310380697250366, 1.2836248874664307, 1.4362117052078247, 1.5887985229492188, 1.7413852214813232, 1.8939721584320068, 2.0465588569641113, 2.199145793914795, 2.3517324924468994, 2.504319190979004, 2.6569061279296875, 2.809492826461792, 2.9620797634124756, 3.11466646194458, 3.2672533988952637, 3.419840097427368, 3.5724267959594727, 3.725013494491577, 3.8776004314422607, 4.030187129974365, 4.182774066925049, 4.335361003875732, 4.487947463989258, 4.640534400939941, 4.793121337890625]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 5.0, 7.0, 8.0, 17.0, 23.0, 32.0, 60.0, 93.0, 153.0, 168.0, 145.0, 96.0, 52.0, 43.0, 24.0, 12.0, 10.0, 5.0, 9.0, 3.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.309418201446533, -5.1514363288879395, -4.993454933166504, -4.83547306060791, -4.677491188049316, -4.519509315490723, -4.361527442932129, -4.203546047210693, -4.0455641746521, -3.887582302093506, -3.729600667953491, -3.5716190338134766, -3.413637161254883, -3.255655288696289, -3.0976736545562744, -2.9396920204162598, -2.781710147857666, -2.6237282752990723, -2.4657466411590576, -2.307765007019043, -2.149783134460449, -1.991801381111145, -1.8338196277618408, -1.6758378744125366, -1.5178561210632324, -1.3598743677139282, -1.201892614364624, -1.0439108610153198, -0.8859291076660156, -0.7279473543167114, -0.5699656009674072, -0.411983847618103, -0.25400257110595703, -0.09602081775665283, 0.06196093559265137, 0.21994268894195557, 0.37792444229125977, 0.535906195640564, 0.6938879489898682, 0.8518697023391724, 1.0098514556884766, 1.1678332090377808, 1.325814962387085, 1.4837967157363892, 1.6417784690856934, 1.7997602224349976, 1.9577419757843018, 2.1157236099243164, 2.27370548248291, 2.431687355041504, 2.5896689891815186, 2.747650623321533, 2.905632495880127, 3.0636143684387207, 3.2215960025787354, 3.37957763671875, 3.5375595092773438, 3.6955413818359375, 3.853523015975952, 4.011504650115967, 4.1694865226745605, 4.327468395233154, 4.48544979095459, 4.643431663513184, 4.801413536071777]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 13.0, 8.0, 9.0, 7.0, 13.0, 21.0, 34.0, 82.0, 260.0, 1243.0, 9365.0, 654588.0, 3512291.0, 13534.0, 2011.0, 478.0, 156.0, 60.0, 28.0, 18.0, 14.0, 8.0, 11.0, 5.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7890625, -1.729522705078125, -1.66998291015625, -1.610443115234375, -1.5509033203125, -1.491363525390625, -1.43182373046875, -1.372283935546875, -1.312744140625, -1.253204345703125, -1.19366455078125, -1.134124755859375, -1.0745849609375, -1.015045166015625, -0.95550537109375, -0.895965576171875, -0.83642578125, -0.776885986328125, -0.71734619140625, -0.657806396484375, -0.5982666015625, -0.538726806640625, -0.47918701171875, -0.419647216796875, -0.360107421875, -0.300567626953125, -0.24102783203125, -0.181488037109375, -0.1219482421875, -0.062408447265625, -0.00286865234375, 0.056671142578125, 0.1162109375, 0.175750732421875, 0.23529052734375, 0.294830322265625, 0.3543701171875, 0.413909912109375, 0.47344970703125, 0.532989501953125, 0.592529296875, 0.652069091796875, 0.71160888671875, 0.771148681640625, 0.8306884765625, 0.890228271484375, 0.94976806640625, 1.009307861328125, 1.06884765625, 1.128387451171875, 1.18792724609375, 1.247467041015625, 1.3070068359375, 1.366546630859375, 1.42608642578125, 1.485626220703125, 1.545166015625, 1.604705810546875, 1.66424560546875, 1.723785400390625, 1.7833251953125, 1.842864990234375, 1.90240478515625, 1.961944580078125, 2.021484375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 5.0, 8.0, 8.0, 16.0, 13.0, 10.0, 29.0, 58.0, 108.0, 169.0, 191.0, 150.0, 61.0, 55.0, 16.0, 11.0, 5.0, 5.0, 13.0, 12.0, 6.0, 3.0, 2.0, 4.0, 6.0, 3.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.034820556640625, -0.033509254455566406, -0.03219795227050781, -0.03088665008544922, -0.029575347900390625, -0.02826404571533203, -0.026952743530273438, -0.025641441345214844, -0.02433013916015625, -0.023018836975097656, -0.021707534790039062, -0.02039623260498047, -0.019084930419921875, -0.01777362823486328, -0.016462326049804688, -0.015151023864746094, -0.0138397216796875, -0.012528419494628906, -0.011217117309570312, -0.009905815124511719, -0.008594512939453125, -0.007283210754394531, -0.0059719085693359375, -0.004660606384277344, -0.00334930419921875, -0.0020380020141601562, -0.0007266998291015625, 0.0005846023559570312, 0.001895904541015625, 0.0032072067260742188, 0.0045185089111328125, 0.005829811096191406, 0.00714111328125, 0.008452415466308594, 0.009763717651367188, 0.011075019836425781, 0.012386322021484375, 0.013697624206542969, 0.015008926391601562, 0.016320228576660156, 0.01763153076171875, 0.018942832946777344, 0.020254135131835938, 0.02156543731689453, 0.022876739501953125, 0.02418804168701172, 0.025499343872070312, 0.026810646057128906, 0.0281219482421875, 0.029433250427246094, 0.030744552612304688, 0.03205585479736328, 0.033367156982421875, 0.03467845916748047, 0.03598976135253906, 0.037301063537597656, 0.03861236572265625, 0.039923667907714844, 0.04123497009277344, 0.04254627227783203, 0.043857574462890625, 0.04516887664794922, 0.04648017883300781, 0.047791481018066406, 0.049102783203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 7.0, 7.0, 12.0, 7.0, 18.0, 33.0, 33.0, 72.0, 81.0, 130.0, 180.0, 306.0, 601.0, 1145.0, 2458.0, 6579.0, 21231.0, 97273.0, 1304138.0, 2593578.0, 127856.0, 25318.0, 7466.0, 2806.0, 1278.0, 670.0, 354.0, 216.0, 132.0, 104.0, 56.0, 40.0, 27.0, 20.0, 12.0, 10.0, 12.0, 6.0, 4.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.441650390625, -0.4259223937988281, -0.41019439697265625, -0.3944664001464844, -0.3787384033203125, -0.3630104064941406, -0.34728240966796875, -0.3315544128417969, -0.315826416015625, -0.3000984191894531, -0.28437042236328125, -0.2686424255371094, -0.2529144287109375, -0.23718643188476562, -0.22145843505859375, -0.20573043823242188, -0.19000244140625, -0.17427444458007812, -0.15854644775390625, -0.14281845092773438, -0.1270904541015625, -0.11136245727539062, -0.09563446044921875, -0.07990646362304688, -0.064178466796875, -0.048450469970703125, -0.03272247314453125, -0.016994476318359375, -0.0012664794921875, 0.014461517333984375, 0.03018951416015625, 0.045917510986328125, 0.0616455078125, 0.07737350463867188, 0.09310150146484375, 0.10882949829101562, 0.1245574951171875, 0.14028549194335938, 0.15601348876953125, 0.17174148559570312, 0.187469482421875, 0.20319747924804688, 0.21892547607421875, 0.23465347290039062, 0.2503814697265625, 0.2661094665527344, 0.28183746337890625, 0.2975654602050781, 0.31329345703125, 0.3290214538574219, 0.34474945068359375, 0.3604774475097656, 0.3762054443359375, 0.3919334411621094, 0.40766143798828125, 0.4233894348144531, 0.439117431640625, 0.4548454284667969, 0.47057342529296875, 0.4863014221191406, 0.5020294189453125, 0.5177574157714844, 0.5334854125976562, 0.5492134094238281, 0.56494140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 7.0, 13.0, 24.0, 15.0, 29.0, 39.0, 67.0, 97.0, 173.0, 337.0, 856.0, 1486.0, 475.0, 191.0, 92.0, 69.0, 23.0, 29.0, 14.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06597900390625, -0.06301498413085938, -0.06005096435546875, -0.057086944580078125, -0.0541229248046875, -0.051158905029296875, -0.04819488525390625, -0.045230865478515625, -0.042266845703125, -0.039302825927734375, -0.03633880615234375, -0.033374786376953125, -0.0304107666015625, -0.027446746826171875, -0.02448272705078125, -0.021518707275390625, -0.0185546875, -0.015590667724609375, -0.01262664794921875, -0.009662628173828125, -0.0066986083984375, -0.003734588623046875, -0.00077056884765625, 0.002193450927734375, 0.005157470703125, 0.008121490478515625, 0.01108551025390625, 0.014049530029296875, 0.0170135498046875, 0.019977569580078125, 0.02294158935546875, 0.025905609130859375, 0.02886962890625, 0.031833648681640625, 0.03479766845703125, 0.037761688232421875, 0.0407257080078125, 0.043689727783203125, 0.04665374755859375, 0.049617767333984375, 0.052581787109375, 0.055545806884765625, 0.05850982666015625, 0.061473846435546875, 0.0644378662109375, 0.06740188598632812, 0.07036590576171875, 0.07332992553710938, 0.0762939453125, 0.07925796508789062, 0.08222198486328125, 0.08518600463867188, 0.0881500244140625, 0.09111404418945312, 0.09407806396484375, 0.09704208374023438, 0.100006103515625, 0.10297012329101562, 0.10593414306640625, 0.10889816284179688, 0.1118621826171875, 0.11482620239257812, 0.11779022216796875, 0.12075424194335938, 0.12371826171875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 10.0, 9.0, 20.0, 57.0, 162.0, 391.0, 267.0, 58.0, 16.0, 9.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6056296825408936, -1.5581352710723877, -1.5106408596038818, -1.463146448135376, -1.4156520366668701, -1.3681575059890747, -1.3206630945205688, -1.273168683052063, -1.2256742715835571, -1.1781798601150513, -1.1306854486465454, -1.0831910371780396, -1.0356965065002441, -0.9882021546363831, -0.9407076835632324, -0.8932132720947266, -0.8457188606262207, -0.7982244491577148, -0.750730037689209, -0.7032355666160583, -0.6557411551475525, -0.6082467436790466, -0.560752272605896, -0.5132578611373901, -0.4657634496688843, -0.4182690382003784, -0.37077459692955017, -0.3232801556587219, -0.27578574419021606, -0.228291317820549, -0.18079689145088196, -0.1333024501800537, -0.08580803871154785, -0.0383136123418808, 0.009180814027786255, 0.05667524039745331, 0.10416966676712036, 0.15166409313678741, 0.19915851950645447, 0.24665296077728271, 0.2941473722457886, 0.34164178371429443, 0.3891362249851227, 0.4366306662559509, 0.4841250777244568, 0.5316194891929626, 0.5791139602661133, 0.6266083717346191, 0.674102783203125, 0.7215971946716309, 0.7690916061401367, 0.8165860772132874, 0.8640804886817932, 0.9115749001502991, 0.9590693712234497, 1.0065637826919556, 1.0540581941604614, 1.1015526056289673, 1.1490470170974731, 1.196541428565979, 1.2440359592437744, 1.2915303707122803, 1.3390247821807861, 1.386519193649292, 1.4340136051177979]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 14.0, 14.0, 19.0, 17.0, 18.0, 33.0, 32.0, 50.0, 52.0, 68.0, 74.0, 82.0, 82.0, 69.0, 64.0, 74.0, 59.0, 40.0, 38.0, 22.0, 15.0, 21.0, 18.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6058225631713867, -0.5881983637809753, -0.5705742239952087, -0.5529500246047974, -0.5353258848190308, -0.5177016854286194, -0.5000775456428528, -0.4824533462524414, -0.4648291766643524, -0.4472050070762634, -0.42958083748817444, -0.41195666790008545, -0.3943324685096741, -0.37670832872390747, -0.3590841293334961, -0.3414599597454071, -0.3238357901573181, -0.3062116205692291, -0.28858745098114014, -0.27096328139305115, -0.25333911180496216, -0.23571492731571198, -0.2180907428264618, -0.2004665732383728, -0.1828424036502838, -0.16521823406219482, -0.14759406447410583, -0.12996987998485565, -0.11234571039676666, -0.09472154080867767, -0.07709736377000809, -0.0594731867313385, -0.04184907674789429, -0.024224903434515, -0.006600730121135712, 0.011023443192243576, 0.028647616505622864, 0.04627178609371185, 0.06389596313238144, 0.08152014017105103, 0.09914430975914001, 0.116768479347229, 0.134392648935318, 0.15201683342456818, 0.16964100301265717, 0.18726517260074615, 0.20488935708999634, 0.22251352667808533, 0.24013769626617432, 0.2577618658542633, 0.2753860354423523, 0.2930102050304413, 0.3106343746185303, 0.32825857400894165, 0.34588274359703064, 0.36350691318511963, 0.3811310827732086, 0.3987552523612976, 0.4163794219493866, 0.4340035915374756, 0.45162779092788696, 0.46925193071365356, 0.48687613010406494, 0.5045002698898315, 0.5221244692802429]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 13.0, 12.0, 10.0, 19.0, 16.0, 31.0, 41.0, 60.0, 108.0, 200.0, 432.0, 1133.0, 3974.0, 21125.0, 364981.0, 620383.0, 28594.0, 4945.0, 1377.0, 502.0, 192.0, 120.0, 51.0, 41.0, 40.0, 29.0, 21.0, 13.0, 8.0, 7.0, 13.0, 8.0, 10.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8408203125, -0.814605712890625, -0.78839111328125, -0.762176513671875, -0.7359619140625, -0.709747314453125, -0.68353271484375, -0.657318115234375, -0.631103515625, -0.604888916015625, -0.57867431640625, -0.552459716796875, -0.5262451171875, -0.500030517578125, -0.47381591796875, -0.447601318359375, -0.42138671875, -0.395172119140625, -0.36895751953125, -0.342742919921875, -0.3165283203125, -0.290313720703125, -0.26409912109375, -0.237884521484375, -0.211669921875, -0.185455322265625, -0.15924072265625, -0.133026123046875, -0.1068115234375, -0.080596923828125, -0.05438232421875, -0.028167724609375, -0.001953125, 0.024261474609375, 0.05047607421875, 0.076690673828125, 0.1029052734375, 0.129119873046875, 0.15533447265625, 0.181549072265625, 0.207763671875, 0.233978271484375, 0.26019287109375, 0.286407470703125, 0.3126220703125, 0.338836669921875, 0.36505126953125, 0.391265869140625, 0.41748046875, 0.443695068359375, 0.46990966796875, 0.496124267578125, 0.5223388671875, 0.548553466796875, 0.57476806640625, 0.600982666015625, 0.627197265625, 0.653411865234375, 0.67962646484375, 0.705841064453125, 0.7320556640625, 0.758270263671875, 0.78448486328125, 0.810699462890625, 0.8369140625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 15.0, 28.0, 49.0, 76.0, 136.0, 203.0, 194.0, 117.0, 81.0, 37.0, 20.0, 13.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.1181640625, -0.11569547653198242, -0.11322689056396484, -0.11075830459594727, -0.10828971862792969, -0.10582113265991211, -0.10335254669189453, -0.10088396072387695, -0.09841537475585938, -0.0959467887878418, -0.09347820281982422, -0.09100961685180664, -0.08854103088378906, -0.08607244491577148, -0.0836038589477539, -0.08113527297973633, -0.07866668701171875, -0.07619810104370117, -0.0737295150756836, -0.07126092910766602, -0.06879234313964844, -0.06632375717163086, -0.06385517120361328, -0.0613865852355957, -0.058917999267578125, -0.05644941329956055, -0.05398082733154297, -0.05151224136352539, -0.04904365539550781, -0.046575069427490234, -0.044106483459472656, -0.04163789749145508, -0.0391693115234375, -0.03670072555541992, -0.034232139587402344, -0.031763553619384766, -0.029294967651367188, -0.02682638168334961, -0.02435779571533203, -0.021889209747314453, -0.019420623779296875, -0.016952037811279297, -0.014483451843261719, -0.01201486587524414, -0.009546279907226562, -0.007077693939208984, -0.004609107971191406, -0.002140522003173828, 0.00032806396484375, 0.002796649932861328, 0.005265235900878906, 0.007733821868896484, 0.010202407836914062, 0.01267099380493164, 0.015139579772949219, 0.017608165740966797, 0.020076751708984375, 0.022545337677001953, 0.02501392364501953, 0.02748250961303711, 0.029951095581054688, 0.032419681549072266, 0.034888267517089844, 0.03735685348510742, 0.039825439453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 10.0, 6.0, 6.0, 7.0, 12.0, 30.0, 87.0, 472.0, 7848.0, 791643.0, 244937.0, 2999.0, 312.0, 76.0, 25.0, 15.0, 3.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.1943359375, -1.1529541015625, -1.111572265625, -1.0701904296875, -1.02880859375, -0.9874267578125, -0.946044921875, -0.9046630859375, -0.86328125, -0.8218994140625, -0.780517578125, -0.7391357421875, -0.69775390625, -0.6563720703125, -0.614990234375, -0.5736083984375, -0.5322265625, -0.4908447265625, -0.449462890625, -0.4080810546875, -0.36669921875, -0.3253173828125, -0.283935546875, -0.2425537109375, -0.201171875, -0.1597900390625, -0.118408203125, -0.0770263671875, -0.03564453125, 0.0057373046875, 0.047119140625, 0.0885009765625, 0.1298828125, 0.1712646484375, 0.212646484375, 0.2540283203125, 0.29541015625, 0.3367919921875, 0.378173828125, 0.4195556640625, 0.4609375, 0.5023193359375, 0.543701171875, 0.5850830078125, 0.62646484375, 0.6678466796875, 0.709228515625, 0.7506103515625, 0.7919921875, 0.8333740234375, 0.874755859375, 0.9161376953125, 0.95751953125, 0.9989013671875, 1.040283203125, 1.0816650390625, 1.123046875, 1.1644287109375, 1.205810546875, 1.2471923828125, 1.28857421875, 1.3299560546875, 1.371337890625, 1.4127197265625, 1.4541015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 5.0, 7.0, 8.0, 15.0, 11.0, 12.0, 19.0, 22.0, 20.0, 20.0, 32.0, 33.0, 33.0, 33.0, 40.0, 42.0, 33.0, 36.0, 51.0, 46.0, 46.0, 39.0, 34.0, 47.0, 34.0, 33.0, 36.0, 33.0, 26.0, 22.0, 17.0, 21.0, 10.0, 15.0, 13.0, 10.0, 13.0, 6.0, 5.0, 10.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1451416015625, -0.14005470275878906, -0.13496780395507812, -0.1298809051513672, -0.12479400634765625, -0.11970710754394531, -0.11462020874023438, -0.10953330993652344, -0.1044464111328125, -0.09935951232910156, -0.09427261352539062, -0.08918571472167969, -0.08409881591796875, -0.07901191711425781, -0.07392501831054688, -0.06883811950683594, -0.063751220703125, -0.05866432189941406, -0.053577423095703125, -0.04849052429199219, -0.04340362548828125, -0.03831672668457031, -0.033229827880859375, -0.028142929077148438, -0.0230560302734375, -0.017969131469726562, -0.012882232666015625, -0.0077953338623046875, -0.00270843505859375, 0.0023784637451171875, 0.007465362548828125, 0.012552261352539062, 0.01763916015625, 0.022726058959960938, 0.027812957763671875, 0.03289985656738281, 0.03798675537109375, 0.04307365417480469, 0.048160552978515625, 0.05324745178222656, 0.0583343505859375, 0.06342124938964844, 0.06850814819335938, 0.07359504699707031, 0.07868194580078125, 0.08376884460449219, 0.08885574340820312, 0.09394264221191406, 0.099029541015625, 0.10411643981933594, 0.10920333862304688, 0.11429023742675781, 0.11937713623046875, 0.12446403503417969, 0.12955093383789062, 0.13463783264160156, 0.1397247314453125, 0.14481163024902344, 0.14989852905273438, 0.1549854278564453, 0.16007232666015625, 0.1651592254638672, 0.17024612426757812, 0.17533302307128906, 0.180419921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 15.0, 34.0, 127.0, 1855.0, 1044700.0, 1604.0, 119.0, 42.0, 19.0, 11.0, 8.0, 3.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.16796875, -6.84906005859375, -6.5301513671875, -6.21124267578125, -5.892333984375, -5.57342529296875, -5.2545166015625, -4.93560791015625, -4.61669921875, -4.29779052734375, -3.9788818359375, -3.65997314453125, -3.341064453125, -3.02215576171875, -2.7032470703125, -2.38433837890625, -2.0654296875, -1.74652099609375, -1.4276123046875, -1.10870361328125, -0.789794921875, -0.47088623046875, -0.1519775390625, 0.16693115234375, 0.48583984375, 0.80474853515625, 1.1236572265625, 1.44256591796875, 1.761474609375, 2.08038330078125, 2.3992919921875, 2.71820068359375, 3.037109375, 3.35601806640625, 3.6749267578125, 3.99383544921875, 4.312744140625, 4.63165283203125, 4.9505615234375, 5.26947021484375, 5.58837890625, 5.90728759765625, 6.2261962890625, 6.54510498046875, 6.864013671875, 7.18292236328125, 7.5018310546875, 7.82073974609375, 8.1396484375, 8.45855712890625, 8.7774658203125, 9.09637451171875, 9.415283203125, 9.73419189453125, 10.0531005859375, 10.37200927734375, 10.69091796875, 11.00982666015625, 11.3287353515625, 11.64764404296875, 11.966552734375, 12.28546142578125, 12.6043701171875, 12.92327880859375, 13.2421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 8.0, 10.0, 19.0, 27.0, 22.0, 36.0, 55.0, 65.0, 121.0, 129.0, 147.0, 89.0, 87.0, 53.0, 32.0, 27.0, 18.0, 12.0, 10.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.064508438110352e-05, -7.841922342777252e-05, -7.619336247444153e-05, -7.396750152111053e-05, -7.174164056777954e-05, -6.951577961444855e-05, -6.728991866111755e-05, -6.506405770778656e-05, -6.283819675445557e-05, -6.061233580112457e-05, -5.838647484779358e-05, -5.6160613894462585e-05, -5.393475294113159e-05, -5.17088919878006e-05, -4.9483031034469604e-05, -4.725717008113861e-05, -4.503130912780762e-05, -4.2805448174476624e-05, -4.057958722114563e-05, -3.8353726267814636e-05, -3.612786531448364e-05, -3.390200436115265e-05, -3.1676143407821655e-05, -2.945028245449066e-05, -2.7224421501159668e-05, -2.4998560547828674e-05, -2.277269959449768e-05, -2.0546838641166687e-05, -1.8320977687835693e-05, -1.60951167345047e-05, -1.3869255781173706e-05, -1.1643394827842712e-05, -9.417533874511719e-06, -7.191672921180725e-06, -4.9658119678497314e-06, -2.739951014518738e-06, -5.140900611877441e-07, 1.7117708921432495e-06, 3.937631845474243e-06, 6.163492798805237e-06, 8.38935375213623e-06, 1.0615214705467224e-05, 1.2841075658798218e-05, 1.5066936612129211e-05, 1.7292797565460205e-05, 1.95186585187912e-05, 2.1744519472122192e-05, 2.3970380425453186e-05, 2.619624137878418e-05, 2.8422102332115173e-05, 3.064796328544617e-05, 3.287382423877716e-05, 3.5099685192108154e-05, 3.732554614543915e-05, 3.955140709877014e-05, 4.1777268052101135e-05, 4.400312900543213e-05, 4.622898995876312e-05, 4.8454850912094116e-05, 5.068071186542511e-05, 5.2906572818756104e-05, 5.51324337720871e-05, 5.735829472541809e-05, 5.9584155678749084e-05, 6.181001663208008e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 11.0, 12.0, 13.0, 24.0, 39.0, 77.0, 84.0, 173.0, 240.0, 567.0, 1027.0, 2899.0, 9040.0, 47778.0, 896184.0, 73264.0, 11442.0, 3223.0, 1214.0, 539.0, 289.0, 164.0, 92.0, 40.0, 44.0, 27.0, 16.0, 10.0, 6.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.775390625, -1.7281494140625, -1.680908203125, -1.6336669921875, -1.58642578125, -1.5391845703125, -1.491943359375, -1.4447021484375, -1.3974609375, -1.3502197265625, -1.302978515625, -1.2557373046875, -1.20849609375, -1.1612548828125, -1.114013671875, -1.0667724609375, -1.01953125, -0.9722900390625, -0.925048828125, -0.8778076171875, -0.83056640625, -0.7833251953125, -0.736083984375, -0.6888427734375, -0.6416015625, -0.5943603515625, -0.547119140625, -0.4998779296875, -0.45263671875, -0.4053955078125, -0.358154296875, -0.3109130859375, -0.263671875, -0.2164306640625, -0.169189453125, -0.1219482421875, -0.07470703125, -0.0274658203125, 0.019775390625, 0.0670166015625, 0.1142578125, 0.1614990234375, 0.208740234375, 0.2559814453125, 0.30322265625, 0.3504638671875, 0.397705078125, 0.4449462890625, 0.4921875, 0.5394287109375, 0.586669921875, 0.6339111328125, 0.68115234375, 0.7283935546875, 0.775634765625, 0.8228759765625, 0.8701171875, 0.9173583984375, 0.964599609375, 1.0118408203125, 1.05908203125, 1.1063232421875, 1.153564453125, 1.2008056640625, 1.248046875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 4.0, 6.0, 10.0, 13.0, 13.0, 30.0, 44.0, 105.0, 213.0, 252.0, 135.0, 51.0, 28.0, 22.0, 8.0, 14.0, 14.0, 10.0, 3.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.9831161499023438, -0.9535369873046875, -0.9239578247070312, -0.894378662109375, -0.8647994995117188, -0.8352203369140625, -0.8056411743164062, -0.77606201171875, -0.7464828491210938, -0.7169036865234375, -0.6873245239257812, -0.657745361328125, -0.6281661987304688, -0.5985870361328125, -0.5690078735351562, -0.5394287109375, -0.5098495483398438, -0.4802703857421875, -0.45069122314453125, -0.421112060546875, -0.39153289794921875, -0.3619537353515625, -0.33237457275390625, -0.30279541015625, -0.27321624755859375, -0.2436370849609375, -0.21405792236328125, -0.184478759765625, -0.15489959716796875, -0.1253204345703125, -0.09574127197265625, -0.066162109375, -0.03658294677734375, -0.0070037841796875, 0.02257537841796875, 0.052154541015625, 0.08173370361328125, 0.1113128662109375, 0.14089202880859375, 0.17047119140625, 0.20005035400390625, 0.2296295166015625, 0.25920867919921875, 0.288787841796875, 0.31836700439453125, 0.3479461669921875, 0.37752532958984375, 0.4071044921875, 0.43668365478515625, 0.4662628173828125, 0.49584197998046875, 0.525421142578125, 0.5550003051757812, 0.5845794677734375, 0.6141586303710938, 0.64373779296875, 0.6733169555664062, 0.7028961181640625, 0.7324752807617188, 0.762054443359375, 0.7916336059570312, 0.8212127685546875, 0.8507919311523438, 0.88037109375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 12.0, 16.0, 28.0, 78.0, 168.0, 213.0, 242.0, 108.0, 60.0, 31.0, 16.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.424810886383057, -5.306727409362793, -5.188643932342529, -5.070559978485107, -4.952476501464844, -4.83439302444458, -4.716309547424316, -4.598226070404053, -4.480142593383789, -4.362059116363525, -4.243975639343262, -4.12589168548584, -4.007808208465576, -3.8897247314453125, -3.771641254425049, -3.653557777404785, -3.5354738235473633, -3.4173903465270996, -3.299306631088257, -3.181223154067993, -3.0631394386291504, -2.9450559616088867, -2.826972484588623, -2.7088890075683594, -2.5908052921295166, -2.472721815109253, -2.35463809967041, -2.2365546226501465, -2.118471145629883, -2.00038743019104, -1.8823039531707764, -1.7642203569412231, -1.646136999130249, -1.5280534029006958, -1.4099698066711426, -1.291886329650879, -1.1738027334213257, -1.0557191371917725, -0.937635600566864, -0.8195520639419556, -0.7014684677124023, -0.5833848714828491, -0.4653013348579407, -0.34721776843070984, -0.229134202003479, -0.11105060577392578, 0.007032930850982666, 0.1251164674758911, 0.24320006370544434, 0.36128363013267517, 0.479367196559906, 0.5974507331848145, 0.7155343294143677, 0.8336179256439209, 0.9517014622688293, 1.0697849988937378, 1.187868595123291, 1.3059521913528442, 1.4240357875823975, 1.5421192646026611, 1.6602028608322144, 1.7782864570617676, 1.8963699340820312, 2.014453411102295, 2.1325371265411377]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 7.0, 16.0, 23.0, 34.0, 36.0, 42.0, 61.0, 64.0, 79.0, 81.0, 85.0, 86.0, 70.0, 63.0, 45.0, 49.0, 40.0, 27.0, 19.0, 19.0, 9.0, 10.0, 2.0, 3.0, 7.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.428568124771118, -2.3419911861419678, -2.2554140090942383, -2.168837070465088, -2.0822601318359375, -1.995682954788208, -1.9091060161590576, -1.8225289583206177, -1.7359519004821777, -1.6493748426437378, -1.5627977848052979, -1.4762208461761475, -1.3896437883377075, -1.3030667304992676, -1.2164897918701172, -1.1299127340316772, -1.0433356761932373, -0.9567586183547974, -0.8701816201210022, -0.783604621887207, -0.6970275640487671, -0.6104505062103271, -0.523873507976532, -0.4372965097427368, -0.3507194519042969, -0.2641424238681793, -0.17756539583206177, -0.09098836779594421, -0.00441133975982666, 0.0821656882762909, 0.16874271631240845, 0.2553197145462036, 0.34189653396606445, 0.428473562002182, 0.5150505900382996, 0.6016275882720947, 0.6882046461105347, 0.7747817039489746, 0.8613587021827698, 0.9479357004165649, 1.0345127582550049, 1.1210898160934448, 1.2076668739318848, 1.2942438125610352, 1.380820870399475, 1.467397928237915, 1.5539748668670654, 1.6405519247055054, 1.7271289825439453, 1.8137060403823853, 1.9002830982208252, 1.9868600368499756, 2.073437213897705, 2.1600141525268555, 2.246591091156006, 2.3331680297851562, 2.4197452068328857, 2.506322145462036, 2.5928993225097656, 2.679476261138916, 2.7660531997680664, 2.852630376815796, 2.9392073154449463, 3.025784492492676, 3.112361431121826]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 6.0, 7.0, 13.0, 19.0, 22.0, 35.0, 47.0, 59.0, 66.0, 101.0, 115.0, 191.0, 276.0, 535.0, 906.0, 1633.0, 3404.0, 9100.0, 33407.0, 747845.0, 3329821.0, 46385.0, 11405.0, 4423.0, 1922.0, 1040.0, 573.0, 338.0, 215.0, 126.0, 69.0, 48.0, 31.0, 24.0, 19.0, 14.0, 8.0, 9.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 5.0, 0.0, 4.0, 1.0], "bins": [-1.12109375, -1.09002685546875, -1.0589599609375, -1.02789306640625, -0.996826171875, -0.96575927734375, -0.9346923828125, -0.90362548828125, -0.87255859375, -0.84149169921875, -0.8104248046875, -0.77935791015625, -0.748291015625, -0.71722412109375, -0.6861572265625, -0.65509033203125, -0.6240234375, -0.59295654296875, -0.5618896484375, -0.53082275390625, -0.499755859375, -0.46868896484375, -0.4376220703125, -0.40655517578125, -0.37548828125, -0.34442138671875, -0.3133544921875, -0.28228759765625, -0.251220703125, -0.22015380859375, -0.1890869140625, -0.15802001953125, -0.126953125, -0.09588623046875, -0.0648193359375, -0.03375244140625, -0.002685546875, 0.02838134765625, 0.0594482421875, 0.09051513671875, 0.12158203125, 0.15264892578125, 0.1837158203125, 0.21478271484375, 0.245849609375, 0.27691650390625, 0.3079833984375, 0.33905029296875, 0.3701171875, 0.40118408203125, 0.4322509765625, 0.46331787109375, 0.494384765625, 0.52545166015625, 0.5565185546875, 0.58758544921875, 0.61865234375, 0.64971923828125, 0.6807861328125, 0.71185302734375, 0.742919921875, 0.77398681640625, 0.8050537109375, 0.83612060546875, 0.8671875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 10.0, 6.0, 7.0, 13.0, 11.0, 29.0, 33.0, 56.0, 59.0, 102.0, 121.0, 114.0, 102.0, 84.0, 58.0, 46.0, 42.0, 23.0, 21.0, 18.0, 11.0, 5.0, 8.0, 7.0, 7.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054595947265625, -0.05306053161621094, -0.051525115966796875, -0.04998970031738281, -0.04845428466796875, -0.04691886901855469, -0.045383453369140625, -0.04384803771972656, -0.0423126220703125, -0.04077720642089844, -0.039241790771484375, -0.03770637512207031, -0.03617095947265625, -0.03463554382324219, -0.033100128173828125, -0.03156471252441406, -0.030029296875, -0.028493881225585938, -0.026958465576171875, -0.025423049926757812, -0.02388763427734375, -0.022352218627929688, -0.020816802978515625, -0.019281387329101562, -0.0177459716796875, -0.016210556030273438, -0.014675140380859375, -0.013139724731445312, -0.01160430908203125, -0.010068893432617188, -0.008533477783203125, -0.0069980621337890625, -0.005462646484375, -0.0039272308349609375, -0.002391815185546875, -0.0008563995361328125, 0.00067901611328125, 0.0022144317626953125, 0.003749847412109375, 0.0052852630615234375, 0.0068206787109375, 0.008356094360351562, 0.009891510009765625, 0.011426925659179688, 0.01296234130859375, 0.014497756958007812, 0.016033172607421875, 0.017568588256835938, 0.01910400390625, 0.020639419555664062, 0.022174835205078125, 0.023710250854492188, 0.02524566650390625, 0.026781082153320312, 0.028316497802734375, 0.029851913452148438, 0.0313873291015625, 0.03292274475097656, 0.034458160400390625, 0.03599357604980469, 0.03752899169921875, 0.03906440734863281, 0.040599822998046875, 0.04213523864746094, 0.043670654296875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 1.0, 5.0, 12.0, 11.0, 8.0, 19.0, 11.0, 26.0, 28.0, 57.0, 125.0, 313.0, 1183.0, 8582.0, 253006.0, 3894634.0, 32441.0, 2819.0, 550.0, 192.0, 76.0, 41.0, 44.0, 19.0, 11.0, 14.0, 14.0, 7.0, 7.0, 4.0, 2.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.875, -1.8246612548828125, -1.774322509765625, -1.7239837646484375, -1.67364501953125, -1.6233062744140625, -1.572967529296875, -1.5226287841796875, -1.4722900390625, -1.4219512939453125, -1.371612548828125, -1.3212738037109375, -1.27093505859375, -1.2205963134765625, -1.170257568359375, -1.1199188232421875, -1.069580078125, -1.0192413330078125, -0.968902587890625, -0.9185638427734375, -0.86822509765625, -0.8178863525390625, -0.767547607421875, -0.7172088623046875, -0.6668701171875, -0.6165313720703125, -0.566192626953125, -0.5158538818359375, -0.46551513671875, -0.4151763916015625, -0.364837646484375, -0.3144989013671875, -0.26416015625, -0.2138214111328125, -0.163482666015625, -0.1131439208984375, -0.06280517578125, -0.0124664306640625, 0.037872314453125, 0.0882110595703125, 0.1385498046875, 0.1888885498046875, 0.239227294921875, 0.2895660400390625, 0.33990478515625, 0.3902435302734375, 0.440582275390625, 0.4909210205078125, 0.541259765625, 0.5915985107421875, 0.641937255859375, 0.6922760009765625, 0.74261474609375, 0.7929534912109375, 0.843292236328125, 0.8936309814453125, 0.9439697265625, 0.9943084716796875, 1.044647216796875, 1.0949859619140625, 1.14532470703125, 1.1956634521484375, 1.246002197265625, 1.2963409423828125, 1.3466796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 3.0, 8.0, 13.0, 18.0, 18.0, 24.0, 42.0, 53.0, 92.0, 131.0, 254.0, 661.0, 1392.0, 633.0, 294.0, 168.0, 71.0, 62.0, 32.0, 22.0, 18.0, 13.0, 8.0, 9.0, 5.0, 1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07427978515625, -0.07125282287597656, -0.06822586059570312, -0.06519889831542969, -0.06217193603515625, -0.05914497375488281, -0.056118011474609375, -0.05309104919433594, -0.0500640869140625, -0.04703712463378906, -0.044010162353515625, -0.04098320007324219, -0.03795623779296875, -0.03492927551269531, -0.031902313232421875, -0.028875350952148438, -0.025848388671875, -0.022821426391601562, -0.019794464111328125, -0.016767501831054688, -0.01374053955078125, -0.010713577270507812, -0.007686614990234375, -0.0046596527099609375, -0.0016326904296875, 0.0013942718505859375, 0.004421234130859375, 0.0074481964111328125, 0.01047515869140625, 0.013502120971679688, 0.016529083251953125, 0.019556045532226562, 0.0225830078125, 0.025609970092773438, 0.028636932373046875, 0.03166389465332031, 0.03469085693359375, 0.03771781921386719, 0.040744781494140625, 0.04377174377441406, 0.0467987060546875, 0.04982566833496094, 0.052852630615234375, 0.05587959289550781, 0.05890655517578125, 0.06193351745605469, 0.06496047973632812, 0.06798744201660156, 0.071014404296875, 0.07404136657714844, 0.07706832885742188, 0.08009529113769531, 0.08312225341796875, 0.08614921569824219, 0.08917617797851562, 0.09220314025878906, 0.0952301025390625, 0.09825706481933594, 0.10128402709960938, 0.10431098937988281, 0.10733795166015625, 0.11036491394042969, 0.11339187622070312, 0.11641883850097656, 0.11944580078125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 18.0, 245.0, 529.0, 147.0, 43.0, 8.0, 8.0, 3.0, 1.0], "bins": [-4.585784435272217, -4.505848407745361, -4.425912380218506, -4.34597635269165, -4.266040802001953, -4.186104774475098, -4.106168746948242, -4.026232719421387, -3.9462966918945312, -3.866360664367676, -3.7864246368408203, -3.706488847732544, -3.6265528202056885, -3.546616792678833, -3.4666810035705566, -3.386744976043701, -3.3068089485168457, -3.2268729209899902, -3.1469368934631348, -3.0670011043548584, -2.987065076828003, -2.9071290493011475, -2.827193260192871, -2.7472572326660156, -2.66732120513916, -2.5873851776123047, -2.507449150085449, -2.427513360977173, -2.3475773334503174, -2.267641305923462, -2.1877055168151855, -2.10776948928833, -2.0278334617614746, -1.9478974342346191, -1.8679615259170532, -1.7880256175994873, -1.7080895900726318, -1.6281535625457764, -1.5482176542282104, -1.4682817459106445, -1.388345718383789, -1.3084096908569336, -1.2284737825393677, -1.1485378742218018, -1.0686018466949463, -0.9886658787727356, -0.9087299108505249, -0.8287939429283142, -0.7488580346107483, -0.6689220666885376, -0.5889860987663269, -0.5090501308441162, -0.4291141629219055, -0.3491781949996948, -0.26924222707748413, -0.18930625915527344, -0.10937029123306274, -0.02943432331085205, 0.05050164461135864, 0.13043761253356934, 0.21037358045578003, 0.2903095483779907, 0.3702455163002014, 0.4501814842224121, 0.5301174521446228]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 13.0, 17.0, 20.0, 50.0, 61.0, 78.0, 83.0, 105.0, 134.0, 90.0, 81.0, 79.0, 55.0, 48.0, 32.0, 18.0, 12.0, 9.0, 6.0, 1.0, 1.0, 3.0, 2.0], "bins": [-1.3663687705993652, -1.3385528326034546, -1.310736894607544, -1.2829209566116333, -1.2551050186157227, -1.2272891998291016, -1.1994731426239014, -1.1716573238372803, -1.1438413858413696, -1.116025447845459, -1.0882095098495483, -1.0603935718536377, -1.032577633857727, -1.0047616958618164, -0.9769458174705505, -0.9491298794746399, -0.9213139414787292, -0.8934980034828186, -0.865682065486908, -0.8378661870956421, -0.8100502490997314, -0.7822343111038208, -0.7544183731079102, -0.7266024351119995, -0.6987864971160889, -0.6709705591201782, -0.6431546211242676, -0.6153386831283569, -0.5875228047370911, -0.5597068667411804, -0.5318909287452698, -0.5040749907493591, -0.47625917196273804, -0.4484432339668274, -0.42062732577323914, -0.3928113877773285, -0.36499547958374023, -0.3371795415878296, -0.30936360359191895, -0.2815476655960083, -0.25373175740242004, -0.2259158343076706, -0.19809991121292114, -0.1702839732170105, -0.14246805012226105, -0.1146521270275116, -0.08683618903160095, -0.0590202659368515, -0.03120434284210205, -0.0033884160220623016, 0.024427510797977448, 0.052243441343307495, 0.08005936443805695, 0.1078752875328064, 0.13569122552871704, 0.1635071486234665, 0.19132307171821594, 0.2191389948129654, 0.24695491790771484, 0.2747708559036255, 0.30258679389953613, 0.3304027020931244, 0.35821864008903503, 0.3860345482826233, 0.41385048627853394]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 12.0, 13.0, 17.0, 19.0, 20.0, 30.0, 43.0, 38.0, 50.0, 49.0, 56.0, 61.0, 604.0, 201236.0, 844680.0, 1182.0, 87.0, 48.0, 39.0, 41.0, 39.0, 26.0, 24.0, 32.0, 22.0, 13.0, 13.0, 7.0, 9.0, 10.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.6328125, -2.54534912109375, -2.4578857421875, -2.37042236328125, -2.282958984375, -2.19549560546875, -2.1080322265625, -2.02056884765625, -1.93310546875, -1.84564208984375, -1.7581787109375, -1.67071533203125, -1.583251953125, -1.49578857421875, -1.4083251953125, -1.32086181640625, -1.2333984375, -1.14593505859375, -1.0584716796875, -0.97100830078125, -0.883544921875, -0.79608154296875, -0.7086181640625, -0.62115478515625, -0.53369140625, -0.44622802734375, -0.3587646484375, -0.27130126953125, -0.183837890625, -0.09637451171875, -0.0089111328125, 0.07855224609375, 0.166015625, 0.25347900390625, 0.3409423828125, 0.42840576171875, 0.515869140625, 0.60333251953125, 0.6907958984375, 0.77825927734375, 0.86572265625, 0.95318603515625, 1.0406494140625, 1.12811279296875, 1.215576171875, 1.30303955078125, 1.3905029296875, 1.47796630859375, 1.5654296875, 1.65289306640625, 1.7403564453125, 1.82781982421875, 1.915283203125, 2.00274658203125, 2.0902099609375, 2.17767333984375, 2.26513671875, 2.35260009765625, 2.4400634765625, 2.52752685546875, 2.614990234375, 2.70245361328125, 2.7899169921875, 2.87738037109375, 2.96484375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 16.0, 74.0, 257.0, 356.0, 224.0, 62.0, 17.0, 4.0, 1.0, 2.0], "bins": [-0.36865234375, -0.3622255325317383, -0.35579872131347656, -0.34937191009521484, -0.3429450988769531, -0.3365182876586914, -0.3300914764404297, -0.32366466522216797, -0.31723785400390625, -0.31081104278564453, -0.3043842315673828, -0.2979574203491211, -0.2915306091308594, -0.28510379791259766, -0.27867698669433594, -0.2722501754760742, -0.2658233642578125, -0.2593965530395508, -0.25296974182128906, -0.24654293060302734, -0.24011611938476562, -0.2336893081665039, -0.2272624969482422, -0.22083568572998047, -0.21440887451171875, -0.20798206329345703, -0.2015552520751953, -0.1951284408569336, -0.18870162963867188, -0.18227481842041016, -0.17584800720214844, -0.16942119598388672, -0.162994384765625, -0.15656757354736328, -0.15014076232910156, -0.14371395111083984, -0.13728713989257812, -0.1308603286743164, -0.12443351745605469, -0.11800670623779297, -0.11157989501953125, -0.10515308380126953, -0.09872627258300781, -0.0922994613647461, -0.08587265014648438, -0.07944583892822266, -0.07301902770996094, -0.06659221649169922, -0.0601654052734375, -0.05373859405517578, -0.04731178283691406, -0.040884971618652344, -0.034458160400390625, -0.028031349182128906, -0.021604537963867188, -0.015177726745605469, -0.00875091552734375, -0.0023241043090820312, 0.0041027069091796875, 0.010529518127441406, 0.016956329345703125, 0.023383140563964844, 0.029809951782226562, 0.03623676300048828, 0.04266357421875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 8.0, 15.0, 21.0, 27.0, 34.0, 54.0, 101.0, 163.0, 307.0, 705.0, 1779.0, 5795.0, 24837.0, 165652.0, 622193.0, 189517.0, 27701.0, 6169.0, 1923.0, 748.0, 370.0, 180.0, 90.0, 50.0, 34.0, 23.0, 15.0, 13.0, 4.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.79296875, -0.7706527709960938, -0.7483367919921875, -0.7260208129882812, -0.703704833984375, -0.6813888549804688, -0.6590728759765625, -0.6367568969726562, -0.61444091796875, -0.5921249389648438, -0.5698089599609375, -0.5474929809570312, -0.525177001953125, -0.5028610229492188, -0.4805450439453125, -0.45822906494140625, -0.4359130859375, -0.41359710693359375, -0.3912811279296875, -0.36896514892578125, -0.346649169921875, -0.32433319091796875, -0.3020172119140625, -0.27970123291015625, -0.25738525390625, -0.23506927490234375, -0.2127532958984375, -0.19043731689453125, -0.168121337890625, -0.14580535888671875, -0.1234893798828125, -0.10117340087890625, -0.078857421875, -0.05654144287109375, -0.0342254638671875, -0.01190948486328125, 0.010406494140625, 0.03272247314453125, 0.0550384521484375, 0.07735443115234375, 0.09967041015625, 0.12198638916015625, 0.1443023681640625, 0.16661834716796875, 0.188934326171875, 0.21125030517578125, 0.2335662841796875, 0.25588226318359375, 0.2781982421875, 0.30051422119140625, 0.3228302001953125, 0.34514617919921875, 0.367462158203125, 0.38977813720703125, 0.4120941162109375, 0.43441009521484375, 0.45672607421875, 0.47904205322265625, 0.5013580322265625, 0.5236740112304688, 0.545989990234375, 0.5683059692382812, 0.5906219482421875, 0.6129379272460938, 0.63525390625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 11.0, 7.0, 6.0, 11.0, 12.0, 19.0, 13.0, 19.0, 20.0, 26.0, 36.0, 49.0, 40.0, 42.0, 37.0, 45.0, 51.0, 45.0, 61.0, 51.0, 59.0, 41.0, 48.0, 31.0, 38.0, 31.0, 26.0, 23.0, 20.0, 16.0, 15.0, 9.0, 9.0, 7.0, 4.0, 3.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.314697265625, -0.3054008483886719, -0.29610443115234375, -0.2868080139160156, -0.2775115966796875, -0.2682151794433594, -0.25891876220703125, -0.24962234497070312, -0.240325927734375, -0.23102951049804688, -0.22173309326171875, -0.21243667602539062, -0.2031402587890625, -0.19384384155273438, -0.18454742431640625, -0.17525100708007812, -0.16595458984375, -0.15665817260742188, -0.14736175537109375, -0.13806533813476562, -0.1287689208984375, -0.11947250366210938, -0.11017608642578125, -0.10087966918945312, -0.091583251953125, -0.08228683471679688, -0.07299041748046875, -0.06369400024414062, -0.0543975830078125, -0.045101165771484375, -0.03580474853515625, -0.026508331298828125, -0.0172119140625, -0.007915496826171875, 0.00138092041015625, 0.010677337646484375, 0.0199737548828125, 0.029270172119140625, 0.03856658935546875, 0.047863006591796875, 0.057159423828125, 0.06645584106445312, 0.07575225830078125, 0.08504867553710938, 0.0943450927734375, 0.10364151000976562, 0.11293792724609375, 0.12223434448242188, 0.13153076171875, 0.14082717895507812, 0.15012359619140625, 0.15942001342773438, 0.1687164306640625, 0.17801284790039062, 0.18730926513671875, 0.19660568237304688, 0.205902099609375, 0.21519851684570312, 0.22449493408203125, 0.23379135131835938, 0.2430877685546875, 0.2523841857910156, 0.26168060302734375, 0.2709770202636719, 0.2802734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 6.0, 6.0, 10.0, 5.0, 19.0, 18.0, 30.0, 44.0, 60.0, 84.0, 146.0, 176.0, 323.0, 573.0, 1032.0, 2257.0, 5781.0, 18391.0, 83155.0, 412102.0, 411744.0, 83603.0, 18371.0, 5731.0, 2377.0, 1087.0, 550.0, 281.0, 174.0, 134.0, 96.0, 46.0, 36.0, 28.0, 19.0, 12.0, 9.0, 13.0, 5.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.556640625, -0.5419921875, -0.52734375, -0.5126953125, -0.498046875, -0.4833984375, -0.46875, -0.4541015625, -0.439453125, -0.4248046875, -0.41015625, -0.3955078125, -0.380859375, -0.3662109375, -0.3515625, -0.3369140625, -0.322265625, -0.3076171875, -0.29296875, -0.2783203125, -0.263671875, -0.2490234375, -0.234375, -0.2197265625, -0.205078125, -0.1904296875, -0.17578125, -0.1611328125, -0.146484375, -0.1318359375, -0.1171875, -0.1025390625, -0.087890625, -0.0732421875, -0.05859375, -0.0439453125, -0.029296875, -0.0146484375, 0.0, 0.0146484375, 0.029296875, 0.0439453125, 0.05859375, 0.0732421875, 0.087890625, 0.1025390625, 0.1171875, 0.1318359375, 0.146484375, 0.1611328125, 0.17578125, 0.1904296875, 0.205078125, 0.2197265625, 0.234375, 0.2490234375, 0.263671875, 0.2783203125, 0.29296875, 0.3076171875, 0.322265625, 0.3369140625, 0.3515625, 0.3662109375, 0.380859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 6.0, 2.0, 4.0, 9.0, 9.0, 13.0, 18.0, 36.0, 39.0, 60.0, 108.0, 109.0, 149.0, 123.0, 88.0, 78.0, 50.0, 31.0, 16.0, 14.0, 12.0, 10.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010305643081665039, -0.00010038074105978012, -9.770505130290985e-05, -9.502936154603958e-05, -9.235367178916931e-05, -8.967798203229904e-05, -8.700229227542877e-05, -8.43266025185585e-05, -8.165091276168823e-05, -7.897522300481796e-05, -7.629953324794769e-05, -7.362384349107742e-05, -7.094815373420715e-05, -6.827246397733688e-05, -6.559677422046661e-05, -6.292108446359634e-05, -6.0245394706726074e-05, -5.7569704949855804e-05, -5.4894015192985535e-05, -5.2218325436115265e-05, -4.9542635679244995e-05, -4.6866945922374725e-05, -4.4191256165504456e-05, -4.1515566408634186e-05, -3.8839876651763916e-05, -3.6164186894893646e-05, -3.3488497138023376e-05, -3.081280738115311e-05, -2.8137117624282837e-05, -2.5461427867412567e-05, -2.2785738110542297e-05, -2.0110048353672028e-05, -1.7434358596801758e-05, -1.4758668839931488e-05, -1.2082979083061218e-05, -9.407289326190948e-06, -6.731599569320679e-06, -4.055909812450409e-06, -1.3802200555801392e-06, 1.2954697012901306e-06, 3.9711594581604e-06, 6.64684921503067e-06, 9.32253897190094e-06, 1.199822872877121e-05, 1.467391848564148e-05, 1.734960824251175e-05, 2.002529799938202e-05, 2.270098775625229e-05, 2.537667751312256e-05, 2.805236726999283e-05, 3.07280570268631e-05, 3.340374678373337e-05, 3.607943654060364e-05, 3.875512629747391e-05, 4.143081605434418e-05, 4.410650581121445e-05, 4.678219556808472e-05, 4.9457885324954987e-05, 5.2133575081825256e-05, 5.4809264838695526e-05, 5.7484954595565796e-05, 6.0160644352436066e-05, 6.283633410930634e-05, 6.55120238661766e-05, 6.818771362304688e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 10.0, 15.0, 13.0, 26.0, 46.0, 69.0, 124.0, 221.0, 379.0, 956.0, 2553.0, 9792.0, 91500.0, 837106.0, 91716.0, 9581.0, 2611.0, 918.0, 391.0, 216.0, 115.0, 71.0, 50.0, 23.0, 21.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.125, -1.0923919677734375, -1.059783935546875, -1.0271759033203125, -0.99456787109375, -0.9619598388671875, -0.929351806640625, -0.8967437744140625, -0.8641357421875, -0.8315277099609375, -0.798919677734375, -0.7663116455078125, -0.73370361328125, -0.7010955810546875, -0.668487548828125, -0.6358795166015625, -0.603271484375, -0.5706634521484375, -0.538055419921875, -0.5054473876953125, -0.47283935546875, -0.4402313232421875, -0.407623291015625, -0.3750152587890625, -0.3424072265625, -0.3097991943359375, -0.277191162109375, -0.2445831298828125, -0.21197509765625, -0.1793670654296875, -0.146759033203125, -0.1141510009765625, -0.08154296875, -0.0489349365234375, -0.016326904296875, 0.0162811279296875, 0.04888916015625, 0.0814971923828125, 0.114105224609375, 0.1467132568359375, 0.1793212890625, 0.2119293212890625, 0.244537353515625, 0.2771453857421875, 0.30975341796875, 0.3423614501953125, 0.374969482421875, 0.4075775146484375, 0.440185546875, 0.4727935791015625, 0.505401611328125, 0.5380096435546875, 0.57061767578125, 0.6032257080078125, 0.635833740234375, 0.6684417724609375, 0.7010498046875, 0.7336578369140625, 0.766265869140625, 0.7988739013671875, 0.83148193359375, 0.8640899658203125, 0.896697998046875, 0.9293060302734375, 0.9619140625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 12.0, 13.0, 35.0, 77.0, 128.0, 187.0, 192.0, 149.0, 91.0, 53.0, 27.0, 15.0, 9.0, 5.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.6266517639160156, -0.6107254028320312, -0.5947990417480469, -0.5788726806640625, -0.5629463195800781, -0.5470199584960938, -0.5310935974121094, -0.515167236328125, -0.4992408752441406, -0.48331451416015625, -0.4673881530761719, -0.4514617919921875, -0.4355354309082031, -0.41960906982421875, -0.4036827087402344, -0.38775634765625, -0.3718299865722656, -0.35590362548828125, -0.3399772644042969, -0.3240509033203125, -0.3081245422363281, -0.29219818115234375, -0.2762718200683594, -0.260345458984375, -0.24441909790039062, -0.22849273681640625, -0.21256637573242188, -0.1966400146484375, -0.18071365356445312, -0.16478729248046875, -0.14886093139648438, -0.1329345703125, -0.11700820922851562, -0.10108184814453125, -0.08515548706054688, -0.0692291259765625, -0.053302764892578125, -0.03737640380859375, -0.021450042724609375, -0.005523681640625, 0.010402679443359375, 0.02632904052734375, 0.042255401611328125, 0.0581817626953125, 0.07410812377929688, 0.09003448486328125, 0.10596084594726562, 0.12188720703125, 0.13781356811523438, 0.15373992919921875, 0.16966629028320312, 0.1855926513671875, 0.20151901245117188, 0.21744537353515625, 0.23337173461914062, 0.249298095703125, 0.2652244567871094, 0.28115081787109375, 0.2970771789550781, 0.3130035400390625, 0.3289299011230469, 0.34485626220703125, 0.3607826232910156, 0.376708984375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 19.0, 68.0, 250.0, 356.0, 190.0, 79.0, 23.0, 7.0, 9.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.066506385803223, -3.8166847229003906, -3.5668630599975586, -3.3170413970947266, -3.0672199726104736, -2.8173983097076416, -2.5675766468048096, -2.3177552223205566, -2.0679335594177246, -1.8181118965148926, -1.56829035282135, -1.318468689918518, -1.0686471462249756, -0.8188254833221436, -0.5690038204193115, -0.31918227672576904, -0.06936049461364746, 0.180461123585701, 0.43028274178504944, 0.6801043748855591, 0.9299259781837463, 1.1797475814819336, 1.4295692443847656, 1.679390788078308, 1.9292124509811401, 2.1790339946746826, 2.4288556575775146, 2.6786773204803467, 2.9284989833831787, 3.1783204078674316, 3.4281420707702637, 3.6779637336730957, 3.9277853965759277, 4.17760705947876, 4.427428722381592, 4.677250385284424, 4.927072048187256, 5.17689323425293, 5.426714897155762, 5.676536560058594, 5.926358222961426, 6.176179885864258, 6.42600154876709, 6.675823211669922, 6.925644874572754, 7.175466537475586, 7.425288200378418, 7.675109386444092, 7.924931526184082, 8.174753189086914, 8.424574851989746, 8.674396514892578, 8.92421817779541, 9.174039840698242, 9.423861503601074, 9.673683166503906, 9.923503875732422, 10.173325538635254, 10.423147201538086, 10.672968864440918, 10.92279052734375, 11.172612190246582, 11.422433853149414, 11.672255516052246, 11.922077178955078]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 4.0, 1.0, 2.0, 7.0, 8.0, 11.0, 14.0, 21.0, 28.0, 23.0, 38.0, 29.0, 44.0, 40.0, 44.0, 45.0, 53.0, 66.0, 59.0, 59.0, 53.0, 51.0, 51.0, 43.0, 33.0, 38.0, 25.0, 27.0, 15.0, 25.0, 17.0, 8.0, 7.0, 9.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.217620849609375, -2.146178960800171, -2.074737071990967, -2.003295421600342, -1.9318535327911377, -1.8604116439819336, -1.7889697551727295, -1.7175278663635254, -1.6460860967636108, -1.5746442079544067, -1.5032024383544922, -1.431760549545288, -1.360318660736084, -1.2888768911361694, -1.2174350023269653, -1.1459932327270508, -1.0745513439178467, -1.0031094551086426, -0.931667685508728, -0.8602257966995239, -0.7887839674949646, -0.7173421382904053, -0.6459002494812012, -0.5744584202766418, -0.5030165910720825, -0.4315747618675232, -0.3601329028606415, -0.28869104385375977, -0.21724921464920044, -0.1458073854446411, -0.0743655264377594, -0.0029236674308776855, 0.06851816177368164, 0.13996000587940216, 0.21140184998512268, 0.2828437089920044, 0.3542855381965637, 0.42572736740112305, 0.49716922640800476, 0.5686110854148865, 0.6400529146194458, 0.7114947438240051, 0.7829365730285645, 0.8543784618377686, 0.9258202910423279, 0.9972621202468872, 1.0687040090560913, 1.1401457786560059, 1.21158766746521, 1.283029556274414, 1.3544713258743286, 1.4259132146835327, 1.4973549842834473, 1.5687968730926514, 1.6402387619018555, 1.7116806507110596, 1.7831224203109741, 1.8545643091201782, 1.9260060787200928, 1.9974479675292969, 2.068889856338501, 2.140331745147705, 2.21177339553833, 2.283215284347534, 2.3546571731567383]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 7.0, 9.0, 14.0, 22.0, 32.0, 60.0, 82.0, 120.0, 226.0, 474.0, 14112.0, 4177800.0, 1107.0, 139.0, 62.0, 14.0, 7.0, 3.0, 3.0], "bins": [-14.96875, -14.70281982421875, -14.4368896484375, -14.17095947265625, -13.905029296875, -13.63909912109375, -13.3731689453125, -13.10723876953125, -12.84130859375, -12.57537841796875, -12.3094482421875, -12.04351806640625, -11.777587890625, -11.51165771484375, -11.2457275390625, -10.97979736328125, -10.7138671875, -10.44793701171875, -10.1820068359375, -9.91607666015625, -9.650146484375, -9.38421630859375, -9.1182861328125, -8.85235595703125, -8.58642578125, -8.32049560546875, -8.0545654296875, -7.78863525390625, -7.522705078125, -7.25677490234375, -6.9908447265625, -6.72491455078125, -6.458984375, -6.19305419921875, -5.9271240234375, -5.66119384765625, -5.395263671875, -5.12933349609375, -4.8634033203125, -4.59747314453125, -4.33154296875, -4.06561279296875, -3.7996826171875, -3.53375244140625, -3.267822265625, -3.00189208984375, -2.7359619140625, -2.47003173828125, -2.2041015625, -1.93817138671875, -1.6722412109375, -1.40631103515625, -1.140380859375, -0.87445068359375, -0.6085205078125, -0.34259033203125, -0.07666015625, 0.18927001953125, 0.4552001953125, 0.72113037109375, 0.987060546875, 1.25299072265625, 1.5189208984375, 1.78485107421875, 2.05078125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 9.0, 28.0, 63.0, 154.0, 210.0, 235.0, 156.0, 85.0, 50.0, 8.0, 8.0, 1.0, 4.0], "bins": [-0.373046875, -0.3663954734802246, -0.3597440719604492, -0.35309267044067383, -0.34644126892089844, -0.33978986740112305, -0.33313846588134766, -0.32648706436157227, -0.3198356628417969, -0.3131842613220215, -0.3065328598022461, -0.2998814582824707, -0.2932300567626953, -0.2865786552429199, -0.27992725372314453, -0.27327585220336914, -0.26662445068359375, -0.25997304916381836, -0.25332164764404297, -0.24667024612426758, -0.2400188446044922, -0.2333674430847168, -0.2267160415649414, -0.22006464004516602, -0.21341323852539062, -0.20676183700561523, -0.20011043548583984, -0.19345903396606445, -0.18680763244628906, -0.18015623092651367, -0.17350482940673828, -0.1668534278869629, -0.1602020263671875, -0.1535506248474121, -0.14689922332763672, -0.14024782180786133, -0.13359642028808594, -0.12694501876831055, -0.12029361724853516, -0.11364221572875977, -0.10699081420898438, -0.10033941268920898, -0.0936880111694336, -0.0870366096496582, -0.08038520812988281, -0.07373380661010742, -0.06708240509033203, -0.06043100357055664, -0.05377960205078125, -0.04712820053100586, -0.04047679901123047, -0.03382539749145508, -0.027173995971679688, -0.020522594451904297, -0.013871192932128906, -0.007219791412353516, -0.000568389892578125, 0.006083011627197266, 0.012734413146972656, 0.019385814666748047, 0.026037216186523438, 0.03268861770629883, 0.03934001922607422, 0.04599142074584961, 0.052642822265625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 9.0, 6.0, 15.0, 14.0, 28.0, 49.0, 42.0, 64.0, 120.0, 171.0, 272.0, 1264.0, 202102.0, 3986110.0, 2882.0, 483.0, 216.0, 149.0, 95.0, 58.0, 40.0, 36.0, 15.0, 15.0, 9.0, 6.0, 11.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.859375, -8.658538818359375, -8.45770263671875, -8.256866455078125, -8.0560302734375, -7.855194091796875, -7.65435791015625, -7.453521728515625, -7.252685546875, -7.051849365234375, -6.85101318359375, -6.650177001953125, -6.4493408203125, -6.248504638671875, -6.04766845703125, -5.846832275390625, -5.64599609375, -5.445159912109375, -5.24432373046875, -5.043487548828125, -4.8426513671875, -4.641815185546875, -4.44097900390625, -4.240142822265625, -4.039306640625, -3.838470458984375, -3.63763427734375, -3.436798095703125, -3.2359619140625, -3.035125732421875, -2.83428955078125, -2.633453369140625, -2.4326171875, -2.231781005859375, -2.03094482421875, -1.830108642578125, -1.6292724609375, -1.428436279296875, -1.22760009765625, -1.026763916015625, -0.825927734375, -0.625091552734375, -0.42425537109375, -0.223419189453125, -0.0225830078125, 0.178253173828125, 0.37908935546875, 0.579925537109375, 0.78076171875, 0.981597900390625, 1.18243408203125, 1.383270263671875, 1.5841064453125, 1.784942626953125, 1.98577880859375, 2.186614990234375, 2.387451171875, 2.588287353515625, 2.78912353515625, 2.989959716796875, 3.1907958984375, 3.391632080078125, 3.59246826171875, 3.793304443359375, 3.994140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 5.0, 58.0, 217.0, 2496.0, 1014.0, 168.0, 65.0, 23.0, 17.0, 8.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57568359375, -0.556396484375, -0.537109375, -0.517822265625, -0.49853515625, -0.479248046875, -0.4599609375, -0.440673828125, -0.42138671875, -0.402099609375, -0.3828125, -0.363525390625, -0.34423828125, -0.324951171875, -0.3056640625, -0.286376953125, -0.26708984375, -0.247802734375, -0.228515625, -0.209228515625, -0.18994140625, -0.170654296875, -0.1513671875, -0.132080078125, -0.11279296875, -0.093505859375, -0.07421875, -0.054931640625, -0.03564453125, -0.016357421875, 0.0029296875, 0.022216796875, 0.04150390625, 0.060791015625, 0.080078125, 0.099365234375, 0.11865234375, 0.137939453125, 0.1572265625, 0.176513671875, 0.19580078125, 0.215087890625, 0.234375, 0.253662109375, 0.27294921875, 0.292236328125, 0.3115234375, 0.330810546875, 0.35009765625, 0.369384765625, 0.388671875, 0.407958984375, 0.42724609375, 0.446533203125, 0.4658203125, 0.485107421875, 0.50439453125, 0.523681640625, 0.54296875, 0.562255859375, 0.58154296875, 0.600830078125, 0.6201171875, 0.639404296875, 0.65869140625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 12.0, 24.0, 86.0, 252.0, 373.0, 178.0, 42.0, 13.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1140847206115723, -2.952277660369873, -2.790470600128174, -2.6286633014678955, -2.4668562412261963, -2.305049180984497, -2.1432418823242188, -1.9814348220825195, -1.8196277618408203, -1.657820701599121, -1.4960135221481323, -1.3342063426971436, -1.1723992824554443, -1.0105922222137451, -0.8487850427627563, -0.6869778633117676, -0.5251708030700684, -0.36336368322372437, -0.20155656337738037, -0.03974944353103638, 0.12205767631530762, 0.2838647961616516, 0.4456719160079956, 0.6074790954589844, 0.7692861557006836, 0.9310932755470276, 1.0929003953933716, 1.2547075748443604, 1.4165146350860596, 1.5783216953277588, 1.7401288747787476, 1.9019360542297363, 2.0637435913085938, 2.225550651550293, 2.387357711791992, 2.5491650104522705, 2.7109720706939697, 2.872779130935669, 3.0345864295959473, 3.1963934898376465, 3.3582005500793457, 3.520007610321045, 3.681814670562744, 3.8436219692230225, 4.005429267883301, 4.167236328125, 4.329043388366699, 4.490850448608398, 4.652657508850098, 4.814464569091797, 4.976271629333496, 5.138078689575195, 5.2998857498168945, 5.461693286895752, 5.623500347137451, 5.78530740737915, 5.94711446762085, 6.108921527862549, 6.270728588104248, 6.432535648345947, 6.594343185424805, 6.756150245666504, 6.917957305908203, 7.079764366149902, 7.241571426391602]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 17.0, 24.0, 16.0, 31.0, 35.0, 42.0, 54.0, 64.0, 62.0, 75.0, 72.0, 74.0, 64.0, 66.0, 49.0, 51.0, 47.0, 45.0, 26.0, 21.0, 16.0, 12.0, 10.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.380401849746704, -1.3349392414093018, -1.2894765138626099, -1.2440139055252075, -1.1985511779785156, -1.1530885696411133, -1.107625961303711, -1.062163233757019, -1.0167005062103271, -0.97123783826828, -0.9257751703262329, -0.8803125619888306, -0.8348498344421387, -0.7893872261047363, -0.7439245581626892, -0.6984618902206421, -0.6529992818832397, -0.6075366139411926, -0.5620739459991455, -0.5166113376617432, -0.47114863991737366, -0.42568597197532654, -0.3802233338356018, -0.3347606658935547, -0.28929799795150757, -0.24383533000946045, -0.19837267696857452, -0.1529100239276886, -0.10744735598564148, -0.06198468804359436, -0.01652204990386963, 0.02894061803817749, 0.07440328598022461, 0.11986594647169113, 0.16532860696315765, 0.21079126000404358, 0.2562539279460907, 0.3017165958881378, 0.34717923402786255, 0.39264190196990967, 0.4381045699119568, 0.4835672378540039, 0.529029905796051, 0.5744925737380981, 0.6199551820755005, 0.6654179096221924, 0.7108805179595947, 0.7563431859016418, 0.801805853843689, 0.8472685217857361, 0.8927311897277832, 0.9381937980651855, 0.9836565256118774, 1.0291191339492798, 1.0745818614959717, 1.120044469833374, 1.1655070781707764, 1.2109696865081787, 1.2564324140548706, 1.301895022392273, 1.3473577499389648, 1.3928203582763672, 1.4382829666137695, 1.4837456941604614, 1.5292084217071533]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 6.0, 12.0, 4.0, 13.0, 31.0, 26.0, 39.0, 58.0, 105.0, 206.0, 694.0, 4768.0, 166775.0, 854547.0, 18932.0, 1585.0, 359.0, 118.0, 71.0, 51.0, 35.0, 40.0, 29.0, 11.0, 9.0, 4.0, 8.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.8203125, -2.72705078125, -2.6337890625, -2.54052734375, -2.447265625, -2.35400390625, -2.2607421875, -2.16748046875, -2.07421875, -1.98095703125, -1.8876953125, -1.79443359375, -1.701171875, -1.60791015625, -1.5146484375, -1.42138671875, -1.328125, -1.23486328125, -1.1416015625, -1.04833984375, -0.955078125, -0.86181640625, -0.7685546875, -0.67529296875, -0.58203125, -0.48876953125, -0.3955078125, -0.30224609375, -0.208984375, -0.11572265625, -0.0224609375, 0.07080078125, 0.1640625, 0.25732421875, 0.3505859375, 0.44384765625, 0.537109375, 0.63037109375, 0.7236328125, 0.81689453125, 0.91015625, 1.00341796875, 1.0966796875, 1.18994140625, 1.283203125, 1.37646484375, 1.4697265625, 1.56298828125, 1.65625, 1.74951171875, 1.8427734375, 1.93603515625, 2.029296875, 2.12255859375, 2.2158203125, 2.30908203125, 2.40234375, 2.49560546875, 2.5888671875, 2.68212890625, 2.775390625, 2.86865234375, 2.9619140625, 3.05517578125, 3.1484375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 19.0, 66.0, 108.0, 186.0, 205.0, 212.0, 111.0, 65.0, 24.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39599609375, -0.3876628875732422, -0.3793296813964844, -0.37099647521972656, -0.36266326904296875, -0.35433006286621094, -0.3459968566894531, -0.3376636505126953, -0.3293304443359375, -0.3209972381591797, -0.3126640319824219, -0.30433082580566406, -0.29599761962890625, -0.28766441345214844, -0.2793312072753906, -0.2709980010986328, -0.262664794921875, -0.2543315887451172, -0.24599838256835938, -0.23766517639160156, -0.22933197021484375, -0.22099876403808594, -0.21266555786132812, -0.2043323516845703, -0.1959991455078125, -0.1876659393310547, -0.17933273315429688, -0.17099952697753906, -0.16266632080078125, -0.15433311462402344, -0.14599990844726562, -0.1376667022705078, -0.12933349609375, -0.12100028991699219, -0.11266708374023438, -0.10433387756347656, -0.09600067138671875, -0.08766746520996094, -0.07933425903320312, -0.07100105285644531, -0.0626678466796875, -0.05433464050292969, -0.046001434326171875, -0.03766822814941406, -0.02933502197265625, -0.021001815795898438, -0.012668609619140625, -0.0043354034423828125, 0.003997802734375, 0.012331008911132812, 0.020664215087890625, 0.028997421264648438, 0.03733062744140625, 0.04566383361816406, 0.053997039794921875, 0.06233024597167969, 0.0706634521484375, 0.07899665832519531, 0.08732986450195312, 0.09566307067871094, 0.10399627685546875, 0.11232948303222656, 0.12066268920898438, 0.1289958953857422, 0.1373291015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 9.0, 10.0, 6.0, 11.0, 17.0, 20.0, 31.0, 23.0, 47.0, 41.0, 79.0, 141.0, 190.0, 323.0, 527.0, 1109.0, 2520.0, 7633.0, 31246.0, 171401.0, 564230.0, 216419.0, 38059.0, 8921.0, 2869.0, 1172.0, 567.0, 321.0, 213.0, 108.0, 79.0, 58.0, 46.0, 26.0, 21.0, 23.0, 13.0, 16.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.837890625, -0.81292724609375, -0.7879638671875, -0.76300048828125, -0.738037109375, -0.71307373046875, -0.6881103515625, -0.66314697265625, -0.63818359375, -0.61322021484375, -0.5882568359375, -0.56329345703125, -0.538330078125, -0.51336669921875, -0.4884033203125, -0.46343994140625, -0.4384765625, -0.41351318359375, -0.3885498046875, -0.36358642578125, -0.338623046875, -0.31365966796875, -0.2886962890625, -0.26373291015625, -0.23876953125, -0.21380615234375, -0.1888427734375, -0.16387939453125, -0.138916015625, -0.11395263671875, -0.0889892578125, -0.06402587890625, -0.0390625, -0.01409912109375, 0.0108642578125, 0.03582763671875, 0.060791015625, 0.08575439453125, 0.1107177734375, 0.13568115234375, 0.16064453125, 0.18560791015625, 0.2105712890625, 0.23553466796875, 0.260498046875, 0.28546142578125, 0.3104248046875, 0.33538818359375, 0.3603515625, 0.38531494140625, 0.4102783203125, 0.43524169921875, 0.460205078125, 0.48516845703125, 0.5101318359375, 0.53509521484375, 0.56005859375, 0.58502197265625, 0.6099853515625, 0.63494873046875, 0.659912109375, 0.68487548828125, 0.7098388671875, 0.73480224609375, 0.759765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 3.0, 8.0, 8.0, 9.0, 10.0, 12.0, 11.0, 6.0, 28.0, 30.0, 40.0, 32.0, 40.0, 48.0, 63.0, 36.0, 52.0, 38.0, 59.0, 52.0, 49.0, 49.0, 41.0, 32.0, 38.0, 34.0, 26.0, 15.0, 24.0, 22.0, 14.0, 12.0, 9.0, 12.0, 5.0, 4.0, 6.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.4345703125, -0.422210693359375, -0.40985107421875, -0.397491455078125, -0.3851318359375, -0.372772216796875, -0.36041259765625, -0.348052978515625, -0.335693359375, -0.323333740234375, -0.31097412109375, -0.298614501953125, -0.2862548828125, -0.273895263671875, -0.26153564453125, -0.249176025390625, -0.23681640625, -0.224456787109375, -0.21209716796875, -0.199737548828125, -0.1873779296875, -0.175018310546875, -0.16265869140625, -0.150299072265625, -0.137939453125, -0.125579833984375, -0.11322021484375, -0.100860595703125, -0.0885009765625, -0.076141357421875, -0.06378173828125, -0.051422119140625, -0.0390625, -0.026702880859375, -0.01434326171875, -0.001983642578125, 0.0103759765625, 0.022735595703125, 0.03509521484375, 0.047454833984375, 0.059814453125, 0.072174072265625, 0.08453369140625, 0.096893310546875, 0.1092529296875, 0.121612548828125, 0.13397216796875, 0.146331787109375, 0.15869140625, 0.171051025390625, 0.18341064453125, 0.195770263671875, 0.2081298828125, 0.220489501953125, 0.23284912109375, 0.245208740234375, 0.257568359375, 0.269927978515625, 0.28228759765625, 0.294647216796875, 0.3070068359375, 0.319366455078125, 0.33172607421875, 0.344085693359375, 0.3564453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 4.0, 1.0, 5.0, 4.0, 10.0, 10.0, 18.0, 38.0, 33.0, 68.0, 118.0, 237.0, 493.0, 1407.0, 7410.0, 116903.0, 886979.0, 29389.0, 3751.0, 903.0, 341.0, 164.0, 104.0, 63.0, 33.0, 26.0, 14.0, 8.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6416015625, -1.5951080322265625, -1.548614501953125, -1.5021209716796875, -1.45562744140625, -1.4091339111328125, -1.362640380859375, -1.3161468505859375, -1.2696533203125, -1.2231597900390625, -1.176666259765625, -1.1301727294921875, -1.08367919921875, -1.0371856689453125, -0.990692138671875, -0.9441986083984375, -0.897705078125, -0.8512115478515625, -0.804718017578125, -0.7582244873046875, -0.71173095703125, -0.6652374267578125, -0.618743896484375, -0.5722503662109375, -0.5257568359375, -0.4792633056640625, -0.432769775390625, -0.3862762451171875, -0.33978271484375, -0.2932891845703125, -0.246795654296875, -0.2003021240234375, -0.15380859375, -0.1073150634765625, -0.060821533203125, -0.0143280029296875, 0.03216552734375, 0.0786590576171875, 0.125152587890625, 0.1716461181640625, 0.2181396484375, 0.2646331787109375, 0.311126708984375, 0.3576202392578125, 0.40411376953125, 0.4506072998046875, 0.497100830078125, 0.5435943603515625, 0.590087890625, 0.6365814208984375, 0.683074951171875, 0.7295684814453125, 0.77606201171875, 0.8225555419921875, 0.869049072265625, 0.9155426025390625, 0.9620361328125, 1.0085296630859375, 1.055023193359375, 1.1015167236328125, 1.14801025390625, 1.1945037841796875, 1.240997314453125, 1.2874908447265625, 1.333984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 13.0, 15.0, 29.0, 33.0, 44.0, 102.0, 161.0, 191.0, 164.0, 116.0, 59.0, 23.0, 17.0, 11.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012600421905517578, -0.00012107379734516144, -0.0001161433756351471, -0.00011121295392513275, -0.00010628253221511841, -0.00010135211050510406, -9.642168879508972e-05, -9.149126708507538e-05, -8.656084537506104e-05, -8.163042366504669e-05, -7.670000195503235e-05, -7.1769580245018e-05, -6.683915853500366e-05, -6.190873682498932e-05, -5.6978315114974976e-05, -5.204789340496063e-05, -4.711747169494629e-05, -4.2187049984931946e-05, -3.72566282749176e-05, -3.232620656490326e-05, -2.7395784854888916e-05, -2.2465363144874573e-05, -1.753494143486023e-05, -1.2604519724845886e-05, -7.674098014831543e-06, -2.7436763048171997e-06, 2.1867454051971436e-06, 7.117167115211487e-06, 1.204758882522583e-05, 1.6978010535240173e-05, 2.1908432245254517e-05, 2.683885395526886e-05, 3.17692756652832e-05, 3.6699697375297546e-05, 4.163011908531189e-05, 4.656054079532623e-05, 5.1490962505340576e-05, 5.642138421535492e-05, 6.135180592536926e-05, 6.62822276353836e-05, 7.121264934539795e-05, 7.614307105541229e-05, 8.107349276542664e-05, 8.600391447544098e-05, 9.093433618545532e-05, 9.586475789546967e-05, 0.00010079517960548401, 0.00010572560131549835, 0.0001106560230255127, 0.00011558644473552704, 0.00012051686644554138, 0.00012544728815555573, 0.00013037770986557007, 0.0001353081315755844, 0.00014023855328559875, 0.0001451689749956131, 0.00015009939670562744, 0.00015502981841564178, 0.00015996024012565613, 0.00016489066183567047, 0.00016982108354568481, 0.00017475150525569916, 0.0001796819269657135, 0.00018461234867572784, 0.0001895427703857422]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 8.0, 10.0, 23.0, 34.0, 49.0, 68.0, 151.0, 320.0, 806.0, 2764.0, 13564.0, 212739.0, 772559.0, 37612.0, 5510.0, 1411.0, 478.0, 187.0, 91.0, 57.0, 28.0, 18.0, 7.0, 12.0, 14.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.421875, -1.3846893310546875, -1.347503662109375, -1.3103179931640625, -1.27313232421875, -1.2359466552734375, -1.198760986328125, -1.1615753173828125, -1.1243896484375, -1.0872039794921875, -1.050018310546875, -1.0128326416015625, -0.97564697265625, -0.9384613037109375, -0.901275634765625, -0.8640899658203125, -0.826904296875, -0.7897186279296875, -0.752532958984375, -0.7153472900390625, -0.67816162109375, -0.6409759521484375, -0.603790283203125, -0.5666046142578125, -0.5294189453125, -0.4922332763671875, -0.455047607421875, -0.4178619384765625, -0.38067626953125, -0.3434906005859375, -0.306304931640625, -0.2691192626953125, -0.23193359375, -0.1947479248046875, -0.157562255859375, -0.1203765869140625, -0.08319091796875, -0.0460052490234375, -0.008819580078125, 0.0283660888671875, 0.0655517578125, 0.1027374267578125, 0.139923095703125, 0.1771087646484375, 0.21429443359375, 0.2514801025390625, 0.288665771484375, 0.3258514404296875, 0.363037109375, 0.4002227783203125, 0.437408447265625, 0.4745941162109375, 0.51177978515625, 0.5489654541015625, 0.586151123046875, 0.6233367919921875, 0.6605224609375, 0.6977081298828125, 0.734893798828125, 0.7720794677734375, 0.80926513671875, 0.8464508056640625, 0.883636474609375, 0.9208221435546875, 0.9580078125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 9.0, 0.0, 3.0, 2.0, 2.0, 6.0, 6.0, 10.0, 18.0, 46.0, 58.0, 86.0, 149.0, 157.0, 143.0, 107.0, 65.0, 51.0, 29.0, 16.0, 11.0, 7.0, 3.0, 4.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.65234375, -0.6367225646972656, -0.6211013793945312, -0.6054801940917969, -0.5898590087890625, -0.5742378234863281, -0.5586166381835938, -0.5429954528808594, -0.527374267578125, -0.5117530822753906, -0.49613189697265625, -0.4805107116699219, -0.4648895263671875, -0.4492683410644531, -0.43364715576171875, -0.4180259704589844, -0.40240478515625, -0.3867835998535156, -0.37116241455078125, -0.3555412292480469, -0.3399200439453125, -0.3242988586425781, -0.30867767333984375, -0.2930564880371094, -0.277435302734375, -0.2618141174316406, -0.24619293212890625, -0.23057174682617188, -0.2149505615234375, -0.19932937622070312, -0.18370819091796875, -0.16808700561523438, -0.1524658203125, -0.13684463500976562, -0.12122344970703125, -0.10560226440429688, -0.0899810791015625, -0.07435989379882812, -0.05873870849609375, -0.043117523193359375, -0.027496337890625, -0.011875152587890625, 0.00374603271484375, 0.019367218017578125, 0.0349884033203125, 0.050609588623046875, 0.06623077392578125, 0.08185195922851562, 0.09747314453125, 0.11309432983398438, 0.12871551513671875, 0.14433670043945312, 0.1599578857421875, 0.17557907104492188, 0.19120025634765625, 0.20682144165039062, 0.222442626953125, 0.23806381225585938, 0.25368499755859375, 0.2693061828613281, 0.2849273681640625, 0.3005485534667969, 0.31616973876953125, 0.3317909240722656, 0.347412109375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 8.0, 166.0, 696.0, 125.0, 16.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.394973754882812, -12.669388771057129, -11.943802833557129, -11.218217849731445, -10.492631912231445, -9.767046928405762, -9.041461944580078, -8.315876007080078, -7.5902910232543945, -6.864705562591553, -6.139120101928711, -5.413535118103027, -4.6879496574401855, -3.9623641967773438, -3.23677921295166, -2.5111937522888184, -1.7856082916259766, -1.0600229501724243, -0.33443760871887207, 0.3911476135253906, 1.1167330741882324, 1.8423185348510742, 2.567903518676758, 3.2934889793395996, 4.019074440002441, 4.744659900665283, 5.470245361328125, 6.195830345153809, 6.92141580581665, 7.647001266479492, 8.372586250305176, 9.09817123413086, 9.82375717163086, 10.549342155456543, 11.274928092956543, 12.000513076782227, 12.726099014282227, 13.45168399810791, 14.177268981933594, 14.902854919433594, 15.628439903259277, 16.35402488708496, 17.07961082458496, 17.805194854736328, 18.530780792236328, 19.256366729736328, 19.981952667236328, 20.707536697387695, 21.433122634887695, 22.158708572387695, 22.884292602539062, 23.609878540039062, 24.335464477539062, 25.061050415039062, 25.78663444519043, 26.51222038269043, 27.237804412841797, 27.963390350341797, 28.688974380493164, 29.414560317993164, 30.140146255493164, 30.86573028564453, 31.59131622314453, 32.31690216064453, 33.04248809814453]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 16.0, 20.0, 17.0, 28.0, 34.0, 45.0, 58.0, 57.0, 59.0, 65.0, 76.0, 87.0, 76.0, 74.0, 53.0, 49.0, 48.0, 35.0, 33.0, 23.0, 16.0, 11.0, 5.0, 9.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.332628011703491, -3.1939985752105713, -3.0553689002990723, -2.9167394638061523, -2.7781097888946533, -2.6394803524017334, -2.5008506774902344, -2.3622212409973145, -2.2235918045043945, -2.0849623680114746, -1.9463326930999756, -1.8077032566070557, -1.6690735816955566, -1.5304441452026367, -1.3918145895004272, -1.2531850337982178, -1.1145553588867188, -0.9759258031845093, -0.8372962474822998, -0.6986667513847351, -0.5600371956825256, -0.42140763998031616, -0.28277814388275146, -0.144148588180542, -0.0055190324783325195, 0.13311050832271576, 0.27174004912376404, 0.4103695750236511, 0.5489991307258606, 0.6876286864280701, 0.8262581825256348, 0.9648877382278442, 1.1035170555114746, 1.242146611213684, 1.3807761669158936, 1.5194056034088135, 1.6580352783203125, 1.7966647148132324, 1.935294270515442, 2.0739238262176514, 2.2125535011291504, 2.3511829376220703, 2.4898126125335693, 2.6284420490264893, 2.7670717239379883, 2.905701160430908, 3.044330596923828, 3.182960271835327, 3.321589708328247, 3.460219144821167, 3.598848819732666, 3.737478256225586, 3.876107931137085, 4.014737606048584, 4.153367042541504, 4.291996479034424, 4.430625915527344, 4.569255352020264, 4.707884788513184, 4.846514701843262, 4.985144138336182, 5.123773574829102, 5.2624030113220215, 5.401032447814941, 5.5396623611450195]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 9.0, 12.0, 12.0, 13.0, 22.0, 20.0, 20.0, 20.0, 40.0, 30.0, 31.0, 43.0, 66.0, 83.0, 130.0, 291.0, 831.0, 3318.0, 26825.0, 3333543.0, 804908.0, 20220.0, 2728.0, 622.0, 219.0, 102.0, 50.0, 20.0, 13.0, 11.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.46875, -3.38189697265625, -3.2950439453125, -3.20819091796875, -3.121337890625, -3.03448486328125, -2.9476318359375, -2.86077880859375, -2.77392578125, -2.68707275390625, -2.6002197265625, -2.51336669921875, -2.426513671875, -2.33966064453125, -2.2528076171875, -2.16595458984375, -2.0791015625, -1.99224853515625, -1.9053955078125, -1.81854248046875, -1.731689453125, -1.64483642578125, -1.5579833984375, -1.47113037109375, -1.38427734375, -1.29742431640625, -1.2105712890625, -1.12371826171875, -1.036865234375, -0.95001220703125, -0.8631591796875, -0.77630615234375, -0.689453125, -0.60260009765625, -0.5157470703125, -0.42889404296875, -0.342041015625, -0.25518798828125, -0.1683349609375, -0.08148193359375, 0.00537109375, 0.09222412109375, 0.1790771484375, 0.26593017578125, 0.352783203125, 0.43963623046875, 0.5264892578125, 0.61334228515625, 0.7001953125, 0.78704833984375, 0.8739013671875, 0.96075439453125, 1.047607421875, 1.13446044921875, 1.2213134765625, 1.30816650390625, 1.39501953125, 1.48187255859375, 1.5687255859375, 1.65557861328125, 1.742431640625, 1.82928466796875, 1.9161376953125, 2.00299072265625, 2.08984375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 9.0, 18.0, 38.0, 51.0, 77.0, 118.0, 153.0, 136.0, 122.0, 111.0, 77.0, 42.0, 23.0, 16.0, 12.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.33642578125, -0.32973575592041016, -0.3230457305908203, -0.31635570526123047, -0.3096656799316406, -0.3029756546020508, -0.29628562927246094, -0.2895956039428711, -0.28290557861328125, -0.2762155532836914, -0.26952552795410156, -0.2628355026245117, -0.2561454772949219, -0.24945545196533203, -0.2427654266357422, -0.23607540130615234, -0.2293853759765625, -0.22269535064697266, -0.2160053253173828, -0.20931529998779297, -0.20262527465820312, -0.19593524932861328, -0.18924522399902344, -0.1825551986694336, -0.17586517333984375, -0.1691751480102539, -0.16248512268066406, -0.15579509735107422, -0.14910507202148438, -0.14241504669189453, -0.1357250213623047, -0.12903499603271484, -0.122344970703125, -0.11565494537353516, -0.10896492004394531, -0.10227489471435547, -0.09558486938476562, -0.08889484405517578, -0.08220481872558594, -0.0755147933959961, -0.06882476806640625, -0.062134742736816406, -0.05544471740722656, -0.04875469207763672, -0.042064666748046875, -0.03537464141845703, -0.028684616088867188, -0.021994590759277344, -0.0153045654296875, -0.008614540100097656, -0.0019245147705078125, 0.004765510559082031, 0.011455535888671875, 0.01814556121826172, 0.024835586547851562, 0.031525611877441406, 0.03821563720703125, 0.044905662536621094, 0.05159568786621094, 0.05828571319580078, 0.06497573852539062, 0.07166576385498047, 0.07835578918457031, 0.08504581451416016, 0.09173583984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 16.0, 20.0, 17.0, 28.0, 70.0, 100.0, 212.0, 599.0, 2686.0, 4050738.0, 137639.0, 1523.0, 335.0, 124.0, 69.0, 40.0, 28.0, 18.0, 8.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.828125, -13.54522705078125, -13.2623291015625, -12.97943115234375, -12.696533203125, -12.41363525390625, -12.1307373046875, -11.84783935546875, -11.56494140625, -11.28204345703125, -10.9991455078125, -10.71624755859375, -10.433349609375, -10.15045166015625, -9.8675537109375, -9.58465576171875, -9.3017578125, -9.01885986328125, -8.7359619140625, -8.45306396484375, -8.170166015625, -7.88726806640625, -7.6043701171875, -7.32147216796875, -7.03857421875, -6.75567626953125, -6.4727783203125, -6.18988037109375, -5.906982421875, -5.62408447265625, -5.3411865234375, -5.05828857421875, -4.775390625, -4.49249267578125, -4.2095947265625, -3.92669677734375, -3.643798828125, -3.36090087890625, -3.0780029296875, -2.79510498046875, -2.51220703125, -2.22930908203125, -1.9464111328125, -1.66351318359375, -1.380615234375, -1.09771728515625, -0.8148193359375, -0.53192138671875, -0.2490234375, 0.03387451171875, 0.3167724609375, 0.59967041015625, 0.882568359375, 1.16546630859375, 1.4483642578125, 1.73126220703125, 2.01416015625, 2.29705810546875, 2.5799560546875, 2.86285400390625, 3.145751953125, 3.42864990234375, 3.7115478515625, 3.99444580078125, 4.27734375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 10.0, 28.0, 65.0, 268.0, 2330.0, 1071.0, 191.0, 71.0, 24.0, 8.0, 7.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2294921875, -1.2062339782714844, -1.1829757690429688, -1.1597175598144531, -1.1364593505859375, -1.1132011413574219, -1.0899429321289062, -1.0666847229003906, -1.043426513671875, -1.0201683044433594, -0.9969100952148438, -0.9736518859863281, -0.9503936767578125, -0.9271354675292969, -0.9038772583007812, -0.8806190490722656, -0.85736083984375, -0.8341026306152344, -0.8108444213867188, -0.7875862121582031, -0.7643280029296875, -0.7410697937011719, -0.7178115844726562, -0.6945533752441406, -0.671295166015625, -0.6480369567871094, -0.6247787475585938, -0.6015205383300781, -0.5782623291015625, -0.5550041198730469, -0.5317459106445312, -0.5084877014160156, -0.4852294921875, -0.4619712829589844, -0.43871307373046875, -0.4154548645019531, -0.3921966552734375, -0.3689384460449219, -0.34568023681640625, -0.3224220275878906, -0.299163818359375, -0.2759056091308594, -0.25264739990234375, -0.22938919067382812, -0.2061309814453125, -0.18287277221679688, -0.15961456298828125, -0.13635635375976562, -0.11309814453125, -0.08983993530273438, -0.06658172607421875, -0.043323516845703125, -0.0200653076171875, 0.003192901611328125, 0.02645111083984375, 0.049709320068359375, 0.072967529296875, 0.09622573852539062, 0.11948394775390625, 0.14274215698242188, 0.1660003662109375, 0.18925857543945312, 0.21251678466796875, 0.23577499389648438, 0.259033203125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 13.0, 28.0, 74.0, 208.0, 366.0, 196.0, 58.0, 28.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.702433586120605, -8.515105247497559, -8.327775955200195, -8.140447616577148, -7.953118324279785, -7.765789985656738, -7.578461170196533, -7.391132354736328, -7.203803539276123, -7.016474723815918, -6.829145908355713, -6.641817092895508, -6.454488754272461, -6.267159938812256, -6.079831123352051, -5.892502307891846, -5.705173492431641, -5.5178446769714355, -5.3305158615112305, -5.143187046051025, -4.95585823059082, -4.768529891967773, -4.581201076507568, -4.393872261047363, -4.206543445587158, -4.019214630126953, -3.831885814666748, -3.644557237625122, -3.457228422164917, -3.269899606704712, -3.082571029663086, -2.895242214202881, -2.707913637161255, -2.52058482170105, -2.333256244659424, -2.1459274291992188, -1.9585986137390137, -1.7712697982788086, -1.583941102027893, -1.3966124057769775, -1.2092835903167725, -1.0219547748565674, -0.8346260786056519, -0.6472973227500916, -0.45996856689453125, -0.27263981103897095, -0.08531105518341064, 0.10201764106750488, 0.28934645652770996, 0.47667521238327026, 0.6640039682388306, 0.8513327240943909, 1.0386614799499512, 1.2259902954101562, 1.4133189916610718, 1.6006476879119873, 1.7879765033721924, 1.9753053188323975, 2.1626338958740234, 2.3499627113342285, 2.5372915267944336, 2.7246203422546387, 2.9119491577148438, 3.0992777347564697, 3.286606550216675]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 11.0, 26.0, 33.0, 47.0, 54.0, 87.0, 95.0, 101.0, 102.0, 98.0, 96.0, 73.0, 60.0, 39.0, 32.0, 11.0, 8.0, 11.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0964064598083496, -3.000277519226074, -2.9041483402252197, -2.8080193996429443, -2.71189022064209, -2.6157612800598145, -2.519632339477539, -2.4235033988952637, -2.327374219894409, -2.231245279312134, -2.1351161003112793, -2.038987159729004, -1.942858099937439, -1.846729040145874, -1.7506000995635986, -1.6544710397720337, -1.5583419799804688, -1.4622129201889038, -1.3660838603973389, -1.2699549198150635, -1.1738258600234985, -1.0776968002319336, -0.9815678000450134, -0.8854387998580933, -0.7893097400665283, -0.6931806802749634, -0.5970516800880432, -0.500922679901123, -0.4047936201095581, -0.30866459012031555, -0.212535560131073, -0.11640655994415283, -0.020277738571166992, 0.07585129141807556, 0.17198032140731812, 0.26810935139656067, 0.3642383813858032, 0.4603674113750458, 0.5564964413642883, 0.6526254415512085, 0.7487545013427734, 0.8448835611343384, 0.9410125613212585, 1.0371415615081787, 1.1332706212997437, 1.2293996810913086, 1.325528621673584, 1.421657681465149, 1.5177867412567139, 1.6139158010482788, 1.7100448608398438, 1.8061738014221191, 1.902302861213684, 1.998431921005249, 2.0945608615875244, 2.190690040588379, 2.2868189811706543, 2.3829479217529297, 2.479077100753784, 2.5752060413360596, 2.671335220336914, 2.7674641609191895, 2.863593101501465, 2.9597220420837402, 3.0558512210845947]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 11.0, 6.0, 7.0, 14.0, 28.0, 33.0, 38.0, 76.0, 106.0, 187.0, 356.0, 872.0, 2785.0, 15452.0, 193535.0, 761857.0, 62793.0, 7264.0, 1764.0, 621.0, 282.0, 158.0, 99.0, 65.0, 44.0, 24.0, 18.0, 14.0, 11.0, 11.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.54296875, -2.468841552734375, -2.39471435546875, -2.320587158203125, -2.2464599609375, -2.172332763671875, -2.09820556640625, -2.024078369140625, -1.949951171875, -1.875823974609375, -1.80169677734375, -1.727569580078125, -1.6534423828125, -1.579315185546875, -1.50518798828125, -1.431060791015625, -1.35693359375, -1.282806396484375, -1.20867919921875, -1.134552001953125, -1.0604248046875, -0.986297607421875, -0.91217041015625, -0.838043212890625, -0.763916015625, -0.689788818359375, -0.61566162109375, -0.541534423828125, -0.4674072265625, -0.393280029296875, -0.31915283203125, -0.245025634765625, -0.1708984375, -0.096771240234375, -0.02264404296875, 0.051483154296875, 0.1256103515625, 0.199737548828125, 0.27386474609375, 0.347991943359375, 0.422119140625, 0.496246337890625, 0.57037353515625, 0.644500732421875, 0.7186279296875, 0.792755126953125, 0.86688232421875, 0.941009521484375, 1.01513671875, 1.089263916015625, 1.16339111328125, 1.237518310546875, 1.3116455078125, 1.385772705078125, 1.45989990234375, 1.534027099609375, 1.608154296875, 1.682281494140625, 1.75640869140625, 1.830535888671875, 1.9046630859375, 1.978790283203125, 2.05291748046875, 2.127044677734375, 2.201171875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 10.0, 16.0, 30.0, 46.0, 73.0, 87.0, 96.0, 136.0, 130.0, 105.0, 83.0, 71.0, 43.0, 28.0, 21.0, 10.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.38037109375, -0.3719196319580078, -0.3634681701660156, -0.35501670837402344, -0.34656524658203125, -0.33811378479003906, -0.3296623229980469, -0.3212108612060547, -0.3127593994140625, -0.3043079376220703, -0.2958564758300781, -0.28740501403808594, -0.27895355224609375, -0.27050209045410156, -0.2620506286621094, -0.2535991668701172, -0.245147705078125, -0.2366962432861328, -0.22824478149414062, -0.21979331970214844, -0.21134185791015625, -0.20289039611816406, -0.19443893432617188, -0.1859874725341797, -0.1775360107421875, -0.1690845489501953, -0.16063308715820312, -0.15218162536621094, -0.14373016357421875, -0.13527870178222656, -0.12682723999023438, -0.11837577819824219, -0.10992431640625, -0.10147285461425781, -0.09302139282226562, -0.08456993103027344, -0.07611846923828125, -0.06766700744628906, -0.059215545654296875, -0.05076408386230469, -0.0423126220703125, -0.03386116027832031, -0.025409698486328125, -0.016958236694335938, -0.00850677490234375, -5.53131103515625e-05, 0.008396148681640625, 0.016847610473632812, 0.025299072265625, 0.03375053405761719, 0.042201995849609375, 0.05065345764160156, 0.05910491943359375, 0.06755638122558594, 0.07600784301757812, 0.08445930480957031, 0.0929107666015625, 0.10136222839355469, 0.10981369018554688, 0.11826515197753906, 0.12671661376953125, 0.13516807556152344, 0.14361953735351562, 0.1520709991455078, 0.1605224609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 6.0, 6.0, 10.0, 17.0, 19.0, 23.0, 47.0, 61.0, 103.0, 194.0, 325.0, 692.0, 1595.0, 3844.0, 11491.0, 50529.0, 337455.0, 523778.0, 91606.0, 17647.0, 5247.0, 1954.0, 845.0, 403.0, 225.0, 143.0, 84.0, 57.0, 26.0, 34.0, 19.0, 14.0, 12.0, 4.0, 10.0, 4.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1435546875, -1.10906982421875, -1.0745849609375, -1.04010009765625, -1.005615234375, -0.97113037109375, -0.9366455078125, -0.90216064453125, -0.86767578125, -0.83319091796875, -0.7987060546875, -0.76422119140625, -0.729736328125, -0.69525146484375, -0.6607666015625, -0.62628173828125, -0.591796875, -0.55731201171875, -0.5228271484375, -0.48834228515625, -0.453857421875, -0.41937255859375, -0.3848876953125, -0.35040283203125, -0.31591796875, -0.28143310546875, -0.2469482421875, -0.21246337890625, -0.177978515625, -0.14349365234375, -0.1090087890625, -0.07452392578125, -0.0400390625, -0.00555419921875, 0.0289306640625, 0.06341552734375, 0.097900390625, 0.13238525390625, 0.1668701171875, 0.20135498046875, 0.23583984375, 0.27032470703125, 0.3048095703125, 0.33929443359375, 0.373779296875, 0.40826416015625, 0.4427490234375, 0.47723388671875, 0.51171875, 0.54620361328125, 0.5806884765625, 0.61517333984375, 0.649658203125, 0.68414306640625, 0.7186279296875, 0.75311279296875, 0.78759765625, 0.82208251953125, 0.8565673828125, 0.89105224609375, 0.925537109375, 0.96002197265625, 0.9945068359375, 1.02899169921875, 1.0634765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 3.0, 9.0, 13.0, 12.0, 15.0, 16.0, 14.0, 19.0, 30.0, 43.0, 37.0, 34.0, 49.0, 46.0, 54.0, 40.0, 48.0, 69.0, 48.0, 52.0, 43.0, 38.0, 36.0, 40.0, 34.0, 28.0, 19.0, 22.0, 14.0, 16.0, 10.0, 15.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.60498046875, -0.5870590209960938, -0.5691375732421875, -0.5512161254882812, -0.533294677734375, -0.5153732299804688, -0.4974517822265625, -0.47953033447265625, -0.46160888671875, -0.44368743896484375, -0.4257659912109375, -0.40784454345703125, -0.389923095703125, -0.37200164794921875, -0.3540802001953125, -0.33615875244140625, -0.3182373046875, -0.30031585693359375, -0.2823944091796875, -0.26447296142578125, -0.246551513671875, -0.22863006591796875, -0.2107086181640625, -0.19278717041015625, -0.17486572265625, -0.15694427490234375, -0.1390228271484375, -0.12110137939453125, -0.103179931640625, -0.08525848388671875, -0.0673370361328125, -0.04941558837890625, -0.031494140625, -0.01357269287109375, 0.0043487548828125, 0.02227020263671875, 0.040191650390625, 0.05811309814453125, 0.0760345458984375, 0.09395599365234375, 0.11187744140625, 0.12979888916015625, 0.1477203369140625, 0.16564178466796875, 0.183563232421875, 0.20148468017578125, 0.2194061279296875, 0.23732757568359375, 0.2552490234375, 0.27317047119140625, 0.2910919189453125, 0.30901336669921875, 0.326934814453125, 0.34485626220703125, 0.3627777099609375, 0.38069915771484375, 0.39862060546875, 0.41654205322265625, 0.4344635009765625, 0.45238494873046875, 0.470306396484375, 0.48822784423828125, 0.5061492919921875, 0.5240707397460938, 0.5419921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 10.0, 7.0, 15.0, 14.0, 19.0, 40.0, 50.0, 111.0, 193.0, 404.0, 772.0, 1910.0, 5636.0, 25856.0, 371294.0, 590955.0, 39818.0, 7196.0, 2318.0, 966.0, 447.0, 189.0, 119.0, 71.0, 50.0, 29.0, 16.0, 21.0, 9.0, 5.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8662109375, -0.8400421142578125, -0.813873291015625, -0.7877044677734375, -0.76153564453125, -0.7353668212890625, -0.709197998046875, -0.6830291748046875, -0.6568603515625, -0.6306915283203125, -0.604522705078125, -0.5783538818359375, -0.55218505859375, -0.5260162353515625, -0.499847412109375, -0.4736785888671875, -0.447509765625, -0.4213409423828125, -0.395172119140625, -0.3690032958984375, -0.34283447265625, -0.3166656494140625, -0.290496826171875, -0.2643280029296875, -0.2381591796875, -0.2119903564453125, -0.185821533203125, -0.1596527099609375, -0.13348388671875, -0.1073150634765625, -0.081146240234375, -0.0549774169921875, -0.02880859375, -0.0026397705078125, 0.023529052734375, 0.0496978759765625, 0.07586669921875, 0.1020355224609375, 0.128204345703125, 0.1543731689453125, 0.1805419921875, 0.2067108154296875, 0.232879638671875, 0.2590484619140625, 0.28521728515625, 0.3113861083984375, 0.337554931640625, 0.3637237548828125, 0.389892578125, 0.4160614013671875, 0.442230224609375, 0.4683990478515625, 0.49456787109375, 0.5207366943359375, 0.546905517578125, 0.5730743408203125, 0.5992431640625, 0.6254119873046875, 0.651580810546875, 0.6777496337890625, 0.70391845703125, 0.7300872802734375, 0.756256103515625, 0.7824249267578125, 0.80859375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 13.0, 19.0, 24.0, 28.0, 57.0, 73.0, 97.0, 120.0, 130.0, 124.0, 82.0, 57.0, 50.0, 30.0, 19.0, 14.0, 10.0, 9.0, 9.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00012421607971191406, -0.00012098532170057297, -0.00011775456368923187, -0.00011452380567789078, -0.00011129304766654968, -0.00010806228965520859, -0.00010483153164386749, -0.0001016007736325264, -9.83700156211853e-05, -9.513925760984421e-05, -9.190849959850311e-05, -8.867774158716202e-05, -8.544698357582092e-05, -8.221622556447983e-05, -7.898546755313873e-05, -7.575470954179764e-05, -7.252395153045654e-05, -6.929319351911545e-05, -6.606243550777435e-05, -6.283167749643326e-05, -5.960091948509216e-05, -5.637016147375107e-05, -5.313940346240997e-05, -4.990864545106888e-05, -4.667788743972778e-05, -4.344712942838669e-05, -4.021637141704559e-05, -3.69856134057045e-05, -3.37548553943634e-05, -3.052409738302231e-05, -2.7293339371681213e-05, -2.406258136034012e-05, -2.0831823348999023e-05, -1.760106533765793e-05, -1.4370307326316833e-05, -1.1139549314975739e-05, -7.908791303634644e-06, -4.678033292293549e-06, -1.4472752809524536e-06, 1.7834827303886414e-06, 5.014240741729736e-06, 8.244998753070831e-06, 1.1475756764411926e-05, 1.4706514775753021e-05, 1.7937272787094116e-05, 2.116803079843521e-05, 2.4398788809776306e-05, 2.76295468211174e-05, 3.0860304832458496e-05, 3.409106284379959e-05, 3.7321820855140686e-05, 4.055257886648178e-05, 4.3783336877822876e-05, 4.701409488916397e-05, 5.0244852900505066e-05, 5.347561091184616e-05, 5.6706368923187256e-05, 5.993712693452835e-05, 6.316788494586945e-05, 6.639864295721054e-05, 6.962940096855164e-05, 7.286015897989273e-05, 7.609091699123383e-05, 7.932167500257492e-05, 8.255243301391602e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 10.0, 7.0, 22.0, 23.0, 59.0, 72.0, 126.0, 258.0, 509.0, 1002.0, 2267.0, 5979.0, 20589.0, 217102.0, 721806.0, 60927.0, 10816.0, 3737.0, 1551.0, 781.0, 384.0, 177.0, 108.0, 72.0, 43.0, 33.0, 20.0, 13.0, 8.0, 7.0, 4.0, 5.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.896484375, -0.8710708618164062, -0.8456573486328125, -0.8202438354492188, -0.794830322265625, -0.7694168090820312, -0.7440032958984375, -0.7185897827148438, -0.69317626953125, -0.6677627563476562, -0.6423492431640625, -0.6169357299804688, -0.591522216796875, -0.5661087036132812, -0.5406951904296875, -0.5152816772460938, -0.4898681640625, -0.46445465087890625, -0.4390411376953125, -0.41362762451171875, -0.388214111328125, -0.36280059814453125, -0.3373870849609375, -0.31197357177734375, -0.28656005859375, -0.26114654541015625, -0.2357330322265625, -0.21031951904296875, -0.184906005859375, -0.15949249267578125, -0.1340789794921875, -0.10866546630859375, -0.083251953125, -0.05783843994140625, -0.0324249267578125, -0.00701141357421875, 0.018402099609375, 0.04381561279296875, 0.0692291259765625, 0.09464263916015625, 0.12005615234375, 0.14546966552734375, 0.1708831787109375, 0.19629669189453125, 0.221710205078125, 0.24712371826171875, 0.2725372314453125, 0.29795074462890625, 0.3233642578125, 0.34877777099609375, 0.3741912841796875, 0.39960479736328125, 0.425018310546875, 0.45043182373046875, 0.4758453369140625, 0.5012588500976562, 0.52667236328125, 0.5520858764648438, 0.5774993896484375, 0.6029129028320312, 0.628326416015625, 0.6537399291992188, 0.6791534423828125, 0.7045669555664062, 0.72998046875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 12.0, 7.0, 12.0, 12.0, 36.0, 66.0, 73.0, 125.0, 142.0, 158.0, 124.0, 87.0, 54.0, 37.0, 17.0, 11.0, 11.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.6201171875, -0.6034126281738281, -0.5867080688476562, -0.5700035095214844, -0.5532989501953125, -0.5365943908691406, -0.5198898315429688, -0.5031852722167969, -0.486480712890625, -0.4697761535644531, -0.45307159423828125, -0.4363670349121094, -0.4196624755859375, -0.4029579162597656, -0.38625335693359375, -0.3695487976074219, -0.35284423828125, -0.3361396789550781, -0.31943511962890625, -0.3027305603027344, -0.2860260009765625, -0.2693214416503906, -0.25261688232421875, -0.23591232299804688, -0.219207763671875, -0.20250320434570312, -0.18579864501953125, -0.16909408569335938, -0.1523895263671875, -0.13568496704101562, -0.11898040771484375, -0.10227584838867188, -0.0855712890625, -0.06886672973632812, -0.05216217041015625, -0.035457611083984375, -0.0187530517578125, -0.002048492431640625, 0.01465606689453125, 0.031360626220703125, 0.048065185546875, 0.06476974487304688, 0.08147430419921875, 0.09817886352539062, 0.1148834228515625, 0.13158798217773438, 0.14829254150390625, 0.16499710083007812, 0.18170166015625, 0.19840621948242188, 0.21511077880859375, 0.23181533813476562, 0.2485198974609375, 0.2652244567871094, 0.28192901611328125, 0.2986335754394531, 0.315338134765625, 0.3320426940917969, 0.34874725341796875, 0.3654518127441406, 0.3821563720703125, 0.3988609313964844, 0.41556549072265625, 0.4322700500488281, 0.448974609375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 73.0, 343.0, 463.0, 103.0, 17.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.177642822265625, -25.555749893188477, -24.93385887145996, -24.311965942382812, -23.690074920654297, -23.06818199157715, -22.4462890625, -21.824398040771484, -21.202505111694336, -20.580612182617188, -19.958721160888672, -19.336828231811523, -18.714935302734375, -18.09304428100586, -17.47115135192871, -16.849258422851562, -16.227367401123047, -15.605475425720215, -14.983583450317383, -14.361690521240234, -13.739798545837402, -13.11790657043457, -12.496013641357422, -11.87412166595459, -11.252229690551758, -10.630337715148926, -10.008445739746094, -9.386552810668945, -8.764660835266113, -8.142768859863281, -7.520876407623291, -6.898983955383301, -6.277091026306152, -5.65519905090332, -5.03330659866333, -4.41141414642334, -3.789522171020508, -3.1676299571990967, -2.5457377433776855, -1.9238452911376953, -1.3019533157348633, -0.6800611019134521, -0.058168888092041016, 0.5637233257293701, 1.1856155395507812, 1.8075077533721924, 2.4293999671936035, 3.0512924194335938, 3.673184394836426, 4.295076370239258, 4.916968822479248, 5.538861274719238, 6.16075325012207, 6.782645225524902, 7.404537677764893, 8.026430130004883, 8.648322105407715, 9.270214080810547, 9.892107009887695, 10.513998985290527, 11.13589096069336, 11.757782936096191, 12.379674911499023, 13.001567840576172, 13.623459815979004]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 9.0, 10.0, 14.0, 15.0, 26.0, 13.0, 28.0, 23.0, 30.0, 34.0, 36.0, 50.0, 50.0, 57.0, 55.0, 38.0, 50.0, 61.0, 41.0, 46.0, 43.0, 29.0, 37.0, 27.0, 22.0, 28.0, 21.0, 15.0, 14.0, 21.0, 11.0, 11.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1218209266662598, -3.0180411338806152, -2.91426157951355, -2.8104817867279053, -2.70670223236084, -2.6029224395751953, -2.49914288520813, -2.3953630924224854, -2.29158353805542, -2.1878037452697754, -2.08402419090271, -1.980244517326355, -1.87646484375, -1.7726850509643555, -1.66890549659729, -1.5651257038116455, -1.4613460302352905, -1.3575663566589355, -1.2537866830825806, -1.1500070095062256, -1.0462273359298706, -0.9424476027488708, -0.8386679291725159, -0.7348882555961609, -0.6311085820198059, -0.5273289084434509, -0.42354923486709595, -0.3197695314884186, -0.2159898579120636, -0.11221015453338623, -0.00843048095703125, 0.09534919261932373, 0.1991288661956787, 0.3029085397720337, 0.40668821334838867, 0.5104678869247437, 0.6142475605010986, 0.7180272936820984, 0.8218069672584534, 0.9255866408348083, 1.0293662548065186, 1.1331459283828735, 1.2369256019592285, 1.3407052755355835, 1.4444849491119385, 1.548264741897583, 1.6520442962646484, 1.755824089050293, 1.859603762626648, 1.963383436203003, 2.0671632289886475, 2.170942783355713, 2.2747225761413574, 2.378502130508423, 2.4822819232940674, 2.586061477661133, 2.6898412704467773, 2.793621063232422, 2.8974006175994873, 3.001180410385132, 3.1049599647521973, 3.208739757537842, 3.3125193119049072, 3.4162991046905518, 3.520078659057617]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 4.0, 7.0, 13.0, 8.0, 12.0, 17.0, 16.0, 23.0, 31.0, 33.0, 48.0, 71.0, 85.0, 126.0, 191.0, 301.0, 586.0, 1353.0, 4204.0, 18399.0, 178563.0, 3909916.0, 64907.0, 10893.0, 2754.0, 924.0, 415.0, 171.0, 109.0, 38.0, 21.0, 16.0, 7.0, 4.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.974609375, -2.89697265625, -2.8193359375, -2.74169921875, -2.6640625, -2.58642578125, -2.5087890625, -2.43115234375, -2.353515625, -2.27587890625, -2.1982421875, -2.12060546875, -2.04296875, -1.96533203125, -1.8876953125, -1.81005859375, -1.732421875, -1.65478515625, -1.5771484375, -1.49951171875, -1.421875, -1.34423828125, -1.2666015625, -1.18896484375, -1.111328125, -1.03369140625, -0.9560546875, -0.87841796875, -0.80078125, -0.72314453125, -0.6455078125, -0.56787109375, -0.490234375, -0.41259765625, -0.3349609375, -0.25732421875, -0.1796875, -0.10205078125, -0.0244140625, 0.05322265625, 0.130859375, 0.20849609375, 0.2861328125, 0.36376953125, 0.44140625, 0.51904296875, 0.5966796875, 0.67431640625, 0.751953125, 0.82958984375, 0.9072265625, 0.98486328125, 1.0625, 1.14013671875, 1.2177734375, 1.29541015625, 1.373046875, 1.45068359375, 1.5283203125, 1.60595703125, 1.68359375, 1.76123046875, 1.8388671875, 1.91650390625, 1.994140625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 9.0, 13.0, 20.0, 36.0, 46.0, 73.0, 102.0, 94.0, 135.0, 120.0, 102.0, 87.0, 65.0, 36.0, 30.0, 13.0, 10.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.402099609375, -0.3930950164794922, -0.3840904235839844, -0.37508583068847656, -0.36608123779296875, -0.35707664489746094, -0.3480720520019531, -0.3390674591064453, -0.3300628662109375, -0.3210582733154297, -0.3120536804199219, -0.30304908752441406, -0.29404449462890625, -0.28503990173339844, -0.2760353088378906, -0.2670307159423828, -0.258026123046875, -0.2490215301513672, -0.24001693725585938, -0.23101234436035156, -0.22200775146484375, -0.21300315856933594, -0.20399856567382812, -0.1949939727783203, -0.1859893798828125, -0.1769847869873047, -0.16798019409179688, -0.15897560119628906, -0.14997100830078125, -0.14096641540527344, -0.13196182250976562, -0.12295722961425781, -0.11395263671875, -0.10494804382324219, -0.09594345092773438, -0.08693885803222656, -0.07793426513671875, -0.06892967224121094, -0.059925079345703125, -0.05092048645019531, -0.0419158935546875, -0.03291130065917969, -0.023906707763671875, -0.014902114868164062, -0.00589752197265625, 0.0031070709228515625, 0.012111663818359375, 0.021116256713867188, 0.030120849609375, 0.03912544250488281, 0.048130035400390625, 0.05713462829589844, 0.06613922119140625, 0.07514381408691406, 0.08414840698242188, 0.09315299987792969, 0.1021575927734375, 0.11116218566894531, 0.12016677856445312, 0.12917137145996094, 0.13817596435546875, 0.14718055725097656, 0.15618515014648438, 0.1651897430419922, 0.1741943359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 21.0, 12.0, 23.0, 40.0, 52.0, 68.0, 124.0, 184.0, 401.0, 2177.0, 125713.0, 4058237.0, 6094.0, 636.0, 203.0, 106.0, 62.0, 38.0, 34.0, 21.0, 13.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.754241943359375, -7.57879638671875, -7.403350830078125, -7.2279052734375, -7.052459716796875, -6.87701416015625, -6.701568603515625, -6.526123046875, -6.350677490234375, -6.17523193359375, -5.999786376953125, -5.8243408203125, -5.648895263671875, -5.47344970703125, -5.298004150390625, -5.12255859375, -4.947113037109375, -4.77166748046875, -4.596221923828125, -4.4207763671875, -4.245330810546875, -4.06988525390625, -3.894439697265625, -3.718994140625, -3.543548583984375, -3.36810302734375, -3.192657470703125, -3.0172119140625, -2.841766357421875, -2.66632080078125, -2.490875244140625, -2.3154296875, -2.139984130859375, -1.96453857421875, -1.789093017578125, -1.6136474609375, -1.438201904296875, -1.26275634765625, -1.087310791015625, -0.911865234375, -0.736419677734375, -0.56097412109375, -0.385528564453125, -0.2100830078125, -0.034637451171875, 0.14080810546875, 0.316253662109375, 0.49169921875, 0.667144775390625, 0.84259033203125, 1.018035888671875, 1.1934814453125, 1.368927001953125, 1.54437255859375, 1.719818115234375, 1.895263671875, 2.070709228515625, 2.24615478515625, 2.421600341796875, 2.5970458984375, 2.772491455078125, 2.94793701171875, 3.123382568359375, 3.298828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 17.0, 52.0, 176.0, 2418.0, 1230.0, 141.0, 29.0, 10.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.7275390625, -1.6942520141601562, -1.6609649658203125, -1.6276779174804688, -1.594390869140625, -1.5611038208007812, -1.5278167724609375, -1.4945297241210938, -1.46124267578125, -1.4279556274414062, -1.3946685791015625, -1.3613815307617188, -1.328094482421875, -1.2948074340820312, -1.2615203857421875, -1.2282333374023438, -1.1949462890625, -1.1616592407226562, -1.1283721923828125, -1.0950851440429688, -1.061798095703125, -1.0285110473632812, -0.9952239990234375, -0.9619369506835938, -0.92864990234375, -0.8953628540039062, -0.8620758056640625, -0.8287887573242188, -0.795501708984375, -0.7622146606445312, -0.7289276123046875, -0.6956405639648438, -0.662353515625, -0.6290664672851562, -0.5957794189453125, -0.5624923706054688, -0.529205322265625, -0.49591827392578125, -0.4626312255859375, -0.42934417724609375, -0.39605712890625, -0.36277008056640625, -0.3294830322265625, -0.29619598388671875, -0.262908935546875, -0.22962188720703125, -0.1963348388671875, -0.16304779052734375, -0.1297607421875, -0.09647369384765625, -0.0631866455078125, -0.02989959716796875, 0.003387451171875, 0.03667449951171875, 0.0699615478515625, 0.10324859619140625, 0.13653564453125, 0.16982269287109375, 0.2031097412109375, 0.23639678955078125, 0.269683837890625, 0.30297088623046875, 0.3362579345703125, 0.36954498291015625, 0.40283203125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 14.0, 22.0, 65.0, 185.0, 290.0, 253.0, 104.0, 37.0, 11.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.470098972320557, -5.325133323669434, -5.180168151855469, -5.035202503204346, -4.890236854553223, -4.745271682739258, -4.600306034088135, -4.455340385437012, -4.310375213623047, -4.165409564971924, -4.020444393157959, -3.875478744506836, -3.730513095855713, -3.585547685623169, -3.440582275390625, -3.295616626739502, -3.150650978088379, -3.005685567855835, -2.860719919204712, -2.715754508972168, -2.570788860321045, -2.425823450088501, -2.280858039855957, -2.135892391204834, -1.99092698097229, -1.8459614515304565, -1.700995922088623, -1.556030511856079, -1.4110649824142456, -1.266099452972412, -1.1211340427398682, -0.9761685132980347, -0.8312032222747803, -0.6862376928329468, -0.5412722229957581, -0.39630672335624695, -0.25134122371673584, -0.10637569427490234, 0.03858977556228638, 0.1835552453994751, 0.3285207748413086, 0.4734862744808197, 0.6184517741203308, 0.7634172439575195, 0.908382773399353, 1.0533483028411865, 1.1983137130737305, 1.343279242515564, 1.4882447719573975, 1.633210301399231, 1.7781758308410645, 1.9231412410736084, 2.0681066513061523, 2.2130722999572754, 2.3580377101898193, 2.5030031204223633, 2.6479687690734863, 2.7929341793060303, 2.9378998279571533, 3.0828652381896973, 3.2278308868408203, 3.3727962970733643, 3.517761707305908, 3.6627273559570312, 3.807692766189575]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 5.0, 7.0, 16.0, 22.0, 32.0, 35.0, 50.0, 53.0, 84.0, 66.0, 90.0, 80.0, 88.0, 64.0, 64.0, 59.0, 40.0, 45.0, 31.0, 26.0, 11.0, 10.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3638198375701904, -2.2956786155700684, -2.2275376319885254, -2.1593964099884033, -2.0912551879882812, -2.0231142044067383, -1.9549729824066162, -1.8868317604064941, -1.8186906576156616, -1.750549554824829, -1.682408332824707, -1.6142672300338745, -1.546126127243042, -1.47798490524292, -1.4098438024520874, -1.3417026996612549, -1.2735614776611328, -1.2054203748703003, -1.1372791528701782, -1.0691380500793457, -1.0009968280792236, -0.9328557252883911, -0.8647146224975586, -0.7965734601020813, -0.728432297706604, -0.6602911353111267, -0.5921499729156494, -0.5240088701248169, -0.4558677077293396, -0.3877265453338623, -0.3195854127407074, -0.2514442801475525, -0.1833028793334961, -0.11516173183917999, -0.04702058434486389, 0.02112056314945221, 0.08926171064376831, 0.1574028730392456, 0.2255440056324005, 0.2936851382255554, 0.3618263006210327, 0.42996746301651, 0.4981085956096649, 0.5662497282028198, 0.6343908905982971, 0.7025320529937744, 0.7706731557846069, 0.8388143181800842, 0.9069554805755615, 0.9750966429710388, 1.0432378053665161, 1.1113789081573486, 1.1795201301574707, 1.2476612329483032, 1.3158023357391357, 1.3839435577392578, 1.4520846605300903, 1.5202257633209229, 1.588366985321045, 1.6565080881118774, 1.72464919090271, 1.792790412902832, 1.8609315156936646, 1.929072618484497, 1.9972138404846191]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 20.0, 34.0, 49.0, 73.0, 159.0, 310.0, 736.0, 2375.0, 16470.0, 560255.0, 450631.0, 13928.0, 2172.0, 717.0, 286.0, 146.0, 77.0, 37.0, 24.0, 17.0, 4.0, 3.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.6666259765625, -2.559814453125, -2.4530029296875, -2.34619140625, -2.2393798828125, -2.132568359375, -2.0257568359375, -1.9189453125, -1.8121337890625, -1.705322265625, -1.5985107421875, -1.49169921875, -1.3848876953125, -1.278076171875, -1.1712646484375, -1.064453125, -0.9576416015625, -0.850830078125, -0.7440185546875, -0.63720703125, -0.5303955078125, -0.423583984375, -0.3167724609375, -0.2099609375, -0.1031494140625, 0.003662109375, 0.1104736328125, 0.21728515625, 0.3240966796875, 0.430908203125, 0.5377197265625, 0.64453125, 0.7513427734375, 0.858154296875, 0.9649658203125, 1.07177734375, 1.1785888671875, 1.285400390625, 1.3922119140625, 1.4990234375, 1.6058349609375, 1.712646484375, 1.8194580078125, 1.92626953125, 2.0330810546875, 2.139892578125, 2.2467041015625, 2.353515625, 2.4603271484375, 2.567138671875, 2.6739501953125, 2.78076171875, 2.8875732421875, 2.994384765625, 3.1011962890625, 3.2080078125, 3.3148193359375, 3.421630859375, 3.5284423828125, 3.63525390625, 3.7420654296875, 3.848876953125, 3.9556884765625, 4.0625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 13.0, 13.0, 23.0, 51.0, 51.0, 73.0, 73.0, 95.0, 110.0, 107.0, 102.0, 78.0, 61.0, 40.0, 38.0, 25.0, 18.0, 7.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.40673828125, -0.3970069885253906, -0.38727569580078125, -0.3775444030761719, -0.3678131103515625, -0.3580818176269531, -0.34835052490234375, -0.3386192321777344, -0.328887939453125, -0.3191566467285156, -0.30942535400390625, -0.2996940612792969, -0.2899627685546875, -0.2802314758300781, -0.27050018310546875, -0.2607688903808594, -0.25103759765625, -0.24130630493164062, -0.23157501220703125, -0.22184371948242188, -0.2121124267578125, -0.20238113403320312, -0.19264984130859375, -0.18291854858398438, -0.173187255859375, -0.16345596313476562, -0.15372467041015625, -0.14399337768554688, -0.1342620849609375, -0.12453079223632812, -0.11479949951171875, -0.10506820678710938, -0.0953369140625, -0.08560562133789062, -0.07587432861328125, -0.06614303588867188, -0.0564117431640625, -0.046680450439453125, -0.03694915771484375, -0.027217864990234375, -0.017486572265625, -0.007755279541015625, 0.00197601318359375, 0.011707305908203125, 0.0214385986328125, 0.031169891357421875, 0.04090118408203125, 0.050632476806640625, 0.06036376953125, 0.07009506225585938, 0.07982635498046875, 0.08955764770507812, 0.0992889404296875, 0.10902023315429688, 0.11875152587890625, 0.12848281860351562, 0.138214111328125, 0.14794540405273438, 0.15767669677734375, 0.16740798950195312, 0.1771392822265625, 0.18687057495117188, 0.19660186767578125, 0.20633316040039062, 0.216064453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 5.0, 17.0, 14.0, 30.0, 58.0, 85.0, 174.0, 339.0, 879.0, 2375.0, 8723.0, 63852.0, 743702.0, 205061.0, 17218.0, 3721.0, 1271.0, 521.0, 229.0, 106.0, 68.0, 29.0, 22.0, 9.0, 10.0, 9.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.220703125, -2.156707763671875, -2.09271240234375, -2.028717041015625, -1.9647216796875, -1.900726318359375, -1.83673095703125, -1.772735595703125, -1.708740234375, -1.644744873046875, -1.58074951171875, -1.516754150390625, -1.4527587890625, -1.388763427734375, -1.32476806640625, -1.260772705078125, -1.19677734375, -1.132781982421875, -1.06878662109375, -1.004791259765625, -0.9407958984375, -0.876800537109375, -0.81280517578125, -0.748809814453125, -0.684814453125, -0.620819091796875, -0.55682373046875, -0.492828369140625, -0.4288330078125, -0.364837646484375, -0.30084228515625, -0.236846923828125, -0.1728515625, -0.108856201171875, -0.04486083984375, 0.019134521484375, 0.0831298828125, 0.147125244140625, 0.21112060546875, 0.275115966796875, 0.339111328125, 0.403106689453125, 0.46710205078125, 0.531097412109375, 0.5950927734375, 0.659088134765625, 0.72308349609375, 0.787078857421875, 0.85107421875, 0.915069580078125, 0.97906494140625, 1.043060302734375, 1.1070556640625, 1.171051025390625, 1.23504638671875, 1.299041748046875, 1.363037109375, 1.427032470703125, 1.49102783203125, 1.555023193359375, 1.6190185546875, 1.683013916015625, 1.74700927734375, 1.811004638671875, 1.875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 7.0, 7.0, 8.0, 9.0, 22.0, 28.0, 31.0, 37.0, 41.0, 53.0, 68.0, 71.0, 59.0, 72.0, 83.0, 80.0, 69.0, 47.0, 50.0, 37.0, 30.0, 20.0, 22.0, 19.0, 11.0, 4.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.240234375, -1.2054824829101562, -1.1707305908203125, -1.1359786987304688, -1.101226806640625, -1.0664749145507812, -1.0317230224609375, -0.9969711303710938, -0.96221923828125, -0.9274673461914062, -0.8927154541015625, -0.8579635620117188, -0.823211669921875, -0.7884597778320312, -0.7537078857421875, -0.7189559936523438, -0.6842041015625, -0.6494522094726562, -0.6147003173828125, -0.5799484252929688, -0.545196533203125, -0.5104446411132812, -0.4756927490234375, -0.44094085693359375, -0.40618896484375, -0.37143707275390625, -0.3366851806640625, -0.30193328857421875, -0.267181396484375, -0.23242950439453125, -0.1976776123046875, -0.16292572021484375, -0.128173828125, -0.09342193603515625, -0.0586700439453125, -0.02391815185546875, 0.010833740234375, 0.04558563232421875, 0.0803375244140625, 0.11508941650390625, 0.14984130859375, 0.18459320068359375, 0.2193450927734375, 0.25409698486328125, 0.288848876953125, 0.32360076904296875, 0.3583526611328125, 0.39310455322265625, 0.4278564453125, 0.46260833740234375, 0.4973602294921875, 0.5321121215820312, 0.566864013671875, 0.6016159057617188, 0.6363677978515625, 0.6711196899414062, 0.70587158203125, 0.7406234741210938, 0.7753753662109375, 0.8101272583007812, 0.844879150390625, 0.8796310424804688, 0.9143829345703125, 0.9491348266601562, 0.98388671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 1.0, 3.0, 7.0, 11.0, 8.0, 14.0, 13.0, 16.0, 35.0, 41.0, 47.0, 84.0, 160.0, 252.0, 415.0, 729.0, 1386.0, 2867.0, 7451.0, 23423.0, 106552.0, 497975.0, 323975.0, 58314.0, 14798.0, 5224.0, 2198.0, 1033.0, 563.0, 338.0, 189.0, 134.0, 97.0, 53.0, 40.0, 24.0, 23.0, 17.0, 12.0, 7.0, 10.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.6044921875, -0.587615966796875, -0.57073974609375, -0.553863525390625, -0.5369873046875, -0.520111083984375, -0.50323486328125, -0.486358642578125, -0.469482421875, -0.452606201171875, -0.43572998046875, -0.418853759765625, -0.4019775390625, -0.385101318359375, -0.36822509765625, -0.351348876953125, -0.33447265625, -0.317596435546875, -0.30072021484375, -0.283843994140625, -0.2669677734375, -0.250091552734375, -0.23321533203125, -0.216339111328125, -0.199462890625, -0.182586669921875, -0.16571044921875, -0.148834228515625, -0.1319580078125, -0.115081787109375, -0.09820556640625, -0.081329345703125, -0.064453125, -0.047576904296875, -0.03070068359375, -0.013824462890625, 0.0030517578125, 0.019927978515625, 0.03680419921875, 0.053680419921875, 0.070556640625, 0.087432861328125, 0.10430908203125, 0.121185302734375, 0.1380615234375, 0.154937744140625, 0.17181396484375, 0.188690185546875, 0.20556640625, 0.222442626953125, 0.23931884765625, 0.256195068359375, 0.2730712890625, 0.289947509765625, 0.30682373046875, 0.323699951171875, 0.340576171875, 0.357452392578125, 0.37432861328125, 0.391204833984375, 0.4080810546875, 0.424957275390625, 0.44183349609375, 0.458709716796875, 0.4755859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 7.0, 6.0, 5.0, 15.0, 12.0, 26.0, 26.0, 46.0, 47.0, 70.0, 91.0, 117.0, 127.0, 125.0, 83.0, 48.0, 44.0, 39.0, 23.0, 23.0, 6.0, 4.0, 7.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00017011165618896484, -0.00016617868095636368, -0.0001622457057237625, -0.00015831273049116135, -0.00015437975525856018, -0.00015044678002595901, -0.00014651380479335785, -0.00014258082956075668, -0.00013864785432815552, -0.00013471487909555435, -0.00013078190386295319, -0.00012684892863035202, -0.00012291595339775085, -0.00011898297816514969, -0.00011505000293254852, -0.00011111702769994736, -0.00010718405246734619, -0.00010325107723474503, -9.931810200214386e-05, -9.53851267695427e-05, -9.145215153694153e-05, -8.751917630434036e-05, -8.35862010717392e-05, -7.965322583913803e-05, -7.572025060653687e-05, -7.17872753739357e-05, -6.785430014133453e-05, -6.392132490873337e-05, -5.99883496761322e-05, -5.6055374443531036e-05, -5.212239921092987e-05, -4.8189423978328705e-05, -4.425644874572754e-05, -4.032347351312637e-05, -3.639049828052521e-05, -3.245752304792404e-05, -2.8524547815322876e-05, -2.459157258272171e-05, -2.0658597350120544e-05, -1.672562211751938e-05, -1.2792646884918213e-05, -8.859671652317047e-06, -4.926696419715881e-06, -9.937211871147156e-07, 2.93925404548645e-06, 6.872229278087616e-06, 1.0805204510688782e-05, 1.4738179743289948e-05, 1.8671154975891113e-05, 2.260413020849228e-05, 2.6537105441093445e-05, 3.047008067369461e-05, 3.4403055906295776e-05, 3.833603113889694e-05, 4.226900637149811e-05, 4.6201981604099274e-05, 5.013495683670044e-05, 5.4067932069301605e-05, 5.800090730190277e-05, 6.193388253450394e-05, 6.58668577671051e-05, 6.979983299970627e-05, 7.373280823230743e-05, 7.76657834649086e-05, 8.159875869750977e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 3.0, 13.0, 18.0, 40.0, 81.0, 122.0, 259.0, 428.0, 1019.0, 2616.0, 8315.0, 36580.0, 275942.0, 596525.0, 101745.0, 17181.0, 4627.0, 1637.0, 646.0, 327.0, 143.0, 89.0, 55.0, 38.0, 25.0, 16.0, 9.0, 11.0, 13.0, 1.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.70654296875, -0.6865081787109375, -0.666473388671875, -0.6464385986328125, -0.62640380859375, -0.6063690185546875, -0.586334228515625, -0.5662994384765625, -0.5462646484375, -0.5262298583984375, -0.506195068359375, -0.4861602783203125, -0.46612548828125, -0.4460906982421875, -0.426055908203125, -0.4060211181640625, -0.385986328125, -0.3659515380859375, -0.345916748046875, -0.3258819580078125, -0.30584716796875, -0.2858123779296875, -0.265777587890625, -0.2457427978515625, -0.2257080078125, -0.2056732177734375, -0.185638427734375, -0.1656036376953125, -0.14556884765625, -0.1255340576171875, -0.105499267578125, -0.0854644775390625, -0.0654296875, -0.0453948974609375, -0.025360107421875, -0.0053253173828125, 0.01470947265625, 0.0347442626953125, 0.054779052734375, 0.0748138427734375, 0.0948486328125, 0.1148834228515625, 0.134918212890625, 0.1549530029296875, 0.17498779296875, 0.1950225830078125, 0.215057373046875, 0.2350921630859375, 0.255126953125, 0.2751617431640625, 0.295196533203125, 0.3152313232421875, 0.33526611328125, 0.3553009033203125, 0.375335693359375, 0.3953704833984375, 0.4154052734375, 0.4354400634765625, 0.455474853515625, 0.4755096435546875, 0.49554443359375, 0.5155792236328125, 0.535614013671875, 0.5556488037109375, 0.57568359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 12.0, 10.0, 14.0, 26.0, 23.0, 34.0, 68.0, 73.0, 119.0, 120.0, 111.0, 92.0, 79.0, 63.0, 41.0, 32.0, 24.0, 8.0, 14.0, 6.0, 10.0, 4.0, 3.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.57470703125, -0.5596199035644531, -0.5445327758789062, -0.5294456481933594, -0.5143585205078125, -0.4992713928222656, -0.48418426513671875, -0.4690971374511719, -0.454010009765625, -0.4389228820800781, -0.42383575439453125, -0.4087486267089844, -0.3936614990234375, -0.3785743713378906, -0.36348724365234375, -0.3484001159667969, -0.33331298828125, -0.3182258605957031, -0.30313873291015625, -0.2880516052246094, -0.2729644775390625, -0.2578773498535156, -0.24279022216796875, -0.22770309448242188, -0.212615966796875, -0.19752883911132812, -0.18244171142578125, -0.16735458374023438, -0.1522674560546875, -0.13718032836914062, -0.12209320068359375, -0.10700607299804688, -0.0919189453125, -0.07683181762695312, -0.06174468994140625, -0.046657562255859375, -0.0315704345703125, -0.016483306884765625, -0.00139617919921875, 0.013690948486328125, 0.028778076171875, 0.043865203857421875, 0.05895233154296875, 0.07403945922851562, 0.0891265869140625, 0.10421371459960938, 0.11930084228515625, 0.13438796997070312, 0.14947509765625, 0.16456222534179688, 0.17964935302734375, 0.19473648071289062, 0.2098236083984375, 0.22491073608398438, 0.23999786376953125, 0.2550849914550781, 0.270172119140625, 0.2852592468261719, 0.30034637451171875, 0.3154335021972656, 0.3305206298828125, 0.3456077575683594, 0.36069488525390625, 0.3757820129394531, 0.390869140625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 19.0, 16.0, 46.0, 86.0, 135.0, 204.0, 183.0, 126.0, 62.0, 52.0, 29.0, 23.0, 4.0, 4.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.175352096557617, -11.8909912109375, -11.6066312789917, -11.322270393371582, -11.037910461425781, -10.753549575805664, -10.469188690185547, -10.184828758239746, -9.900467872619629, -9.616106986999512, -9.331747055053711, -9.047386169433594, -8.763026237487793, -8.478665351867676, -8.194305419921875, -7.909944534301758, -7.625584125518799, -7.34122371673584, -7.056863307952881, -6.772502899169922, -6.488142013549805, -6.203781604766846, -5.919421195983887, -5.635060787200928, -5.350700378417969, -5.06633996963501, -4.781979560852051, -4.497618675231934, -4.213258266448975, -3.9288978576660156, -3.6445374488830566, -3.3601770401000977, -3.0758161544799805, -2.7914557456970215, -2.5070950984954834, -2.2227346897125244, -1.9383741617202759, -1.6540136337280273, -1.3696532249450684, -1.0852926969528198, -0.8009321689605713, -0.5165716409683228, -0.232211172580719, 0.052149295806884766, 0.3365098237991333, 0.6208703517913818, 0.9052307605743408, 1.1895912885665894, 1.473951816558838, 1.7583123445510864, 2.042672872543335, 2.327033281326294, 2.611393928527832, 2.895754337310791, 3.18011474609375, 3.464475154876709, 3.748835802078247, 4.033196449279785, 4.317556858062744, 4.601917266845703, 4.886277675628662, 5.170638084411621, 5.454998970031738, 5.739359378814697, 6.023719787597656]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 10.0, 6.0, 8.0, 15.0, 11.0, 20.0, 15.0, 18.0, 24.0, 27.0, 46.0, 42.0, 42.0, 39.0, 53.0, 60.0, 48.0, 50.0, 40.0, 61.0, 47.0, 40.0, 40.0, 34.0, 32.0, 30.0, 24.0, 20.0, 12.0, 21.0, 12.0, 12.0, 10.0, 3.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-4.770001411437988, -4.629631042480469, -4.489260673522949, -4.34889030456543, -4.20851993560791, -4.068149566650391, -3.92777943611145, -3.7874090671539307, -3.647038698196411, -3.5066683292388916, -3.366297960281372, -3.2259275913238525, -3.085557460784912, -2.9451870918273926, -2.804816722869873, -2.6644463539123535, -2.524075984954834, -2.3837056159973145, -2.243335247039795, -2.1029648780822754, -1.9625946283340454, -1.8222242593765259, -1.681854009628296, -1.5414836406707764, -1.4011132717132568, -1.2607429027557373, -1.1203725337982178, -0.9800022840499878, -0.8396319150924683, -0.6992615461349487, -0.558891236782074, -0.4185209274291992, -0.2781505584716797, -0.13778021931648254, 0.0025901198387145996, 0.14296045899391174, 0.2833307981491089, 0.4237011671066284, 0.5640714764595032, 0.7044417858123779, 0.8448121547698975, 0.985182523727417, 1.1255528926849365, 1.2659231424331665, 1.406293511390686, 1.5466638803482056, 1.6870341300964355, 1.827404499053955, 1.9677748680114746, 2.108145236968994, 2.2485156059265137, 2.388885974884033, 2.5292563438415527, 2.6696267127990723, 2.8099968433380127, 2.9503672122955322, 3.0907375812530518, 3.2311079502105713, 3.371478319168091, 3.5118486881256104, 3.652218818664551, 3.7925891876220703, 3.93295955657959, 4.073329925537109, 4.213700294494629]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 5.0, 4.0, 4.0, 2.0, 10.0, 11.0, 12.0, 15.0, 18.0, 21.0, 20.0, 30.0, 36.0, 52.0, 47.0, 49.0, 79.0, 98.0, 143.0, 160.0, 232.0, 384.0, 710.0, 1235.0, 2823.0, 7460.0, 24687.0, 135258.0, 3723051.0, 245676.0, 35410.0, 10100.0, 3564.0, 1433.0, 695.0, 340.0, 172.0, 92.0, 60.0, 33.0, 21.0, 10.0, 10.0, 3.0, 3.0, 0.0, 1.0, 3.0], "bins": [-2.91796875, -2.8525543212890625, -2.787139892578125, -2.7217254638671875, -2.65631103515625, -2.5908966064453125, -2.525482177734375, -2.4600677490234375, -2.3946533203125, -2.3292388916015625, -2.263824462890625, -2.1984100341796875, -2.13299560546875, -2.0675811767578125, -2.002166748046875, -1.9367523193359375, -1.871337890625, -1.8059234619140625, -1.740509033203125, -1.6750946044921875, -1.60968017578125, -1.5442657470703125, -1.478851318359375, -1.4134368896484375, -1.3480224609375, -1.2826080322265625, -1.217193603515625, -1.1517791748046875, -1.08636474609375, -1.0209503173828125, -0.955535888671875, -0.8901214599609375, -0.82470703125, -0.7592926025390625, -0.693878173828125, -0.6284637451171875, -0.56304931640625, -0.4976348876953125, -0.432220458984375, -0.3668060302734375, -0.3013916015625, -0.2359771728515625, -0.170562744140625, -0.1051483154296875, -0.03973388671875, 0.0256805419921875, 0.091094970703125, 0.1565093994140625, 0.221923828125, 0.2873382568359375, 0.352752685546875, 0.4181671142578125, 0.48358154296875, 0.5489959716796875, 0.614410400390625, 0.6798248291015625, 0.7452392578125, 0.8106536865234375, 0.876068115234375, 0.9414825439453125, 1.00689697265625, 1.0723114013671875, 1.137725830078125, 1.2031402587890625, 1.2685546875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 11.0, 20.0, 25.0, 34.0, 52.0, 68.0, 64.0, 100.0, 109.0, 102.0, 109.0, 86.0, 64.0, 50.0, 40.0, 30.0, 13.0, 2.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4345703125, -0.42444419860839844, -0.4143180847167969, -0.4041919708251953, -0.39406585693359375, -0.3839397430419922, -0.3738136291503906, -0.36368751525878906, -0.3535614013671875, -0.34343528747558594, -0.3333091735839844, -0.3231830596923828, -0.31305694580078125, -0.3029308319091797, -0.2928047180175781, -0.28267860412597656, -0.272552490234375, -0.26242637634277344, -0.2523002624511719, -0.2421741485595703, -0.23204803466796875, -0.2219219207763672, -0.21179580688476562, -0.20166969299316406, -0.1915435791015625, -0.18141746520996094, -0.17129135131835938, -0.1611652374267578, -0.15103912353515625, -0.1409130096435547, -0.13078689575195312, -0.12066078186035156, -0.11053466796875, -0.10040855407714844, -0.09028244018554688, -0.08015632629394531, -0.07003021240234375, -0.05990409851074219, -0.049777984619140625, -0.03965187072753906, -0.0295257568359375, -0.019399642944335938, -0.009273529052734375, 0.0008525848388671875, 0.01097869873046875, 0.021104812622070312, 0.031230926513671875, 0.04135704040527344, 0.051483154296875, 0.06160926818847656, 0.07173538208007812, 0.08186149597167969, 0.09198760986328125, 0.10211372375488281, 0.11223983764648438, 0.12236595153808594, 0.1324920654296875, 0.14261817932128906, 0.15274429321289062, 0.1628704071044922, 0.17299652099609375, 0.1831226348876953, 0.19324874877929688, 0.20337486267089844, 0.2135009765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 6.0, 7.0, 13.0, 31.0, 78.0, 146.0, 294.0, 1088.0, 9091.0, 4153450.0, 27882.0, 1546.0, 381.0, 146.0, 67.0, 30.0, 16.0, 11.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.265625, -11.9117431640625, -11.557861328125, -11.2039794921875, -10.85009765625, -10.4962158203125, -10.142333984375, -9.7884521484375, -9.4345703125, -9.0806884765625, -8.726806640625, -8.3729248046875, -8.01904296875, -7.6651611328125, -7.311279296875, -6.9573974609375, -6.603515625, -6.2496337890625, -5.895751953125, -5.5418701171875, -5.18798828125, -4.8341064453125, -4.480224609375, -4.1263427734375, -3.7724609375, -3.4185791015625, -3.064697265625, -2.7108154296875, -2.35693359375, -2.0030517578125, -1.649169921875, -1.2952880859375, -0.94140625, -0.5875244140625, -0.233642578125, 0.1202392578125, 0.47412109375, 0.8280029296875, 1.181884765625, 1.5357666015625, 1.8896484375, 2.2435302734375, 2.597412109375, 2.9512939453125, 3.30517578125, 3.6590576171875, 4.012939453125, 4.3668212890625, 4.720703125, 5.0745849609375, 5.428466796875, 5.7823486328125, 6.13623046875, 6.4901123046875, 6.843994140625, 7.1978759765625, 7.5517578125, 7.9056396484375, 8.259521484375, 8.6134033203125, 8.96728515625, 9.3211669921875, 9.675048828125, 10.0289306640625, 10.3828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 7.0, 9.0, 9.0, 11.0, 20.0, 42.0, 197.0, 2614.0, 1006.0, 111.0, 31.0, 11.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.32421875, -2.255523681640625, -2.18682861328125, -2.118133544921875, -2.0494384765625, -1.980743408203125, -1.91204833984375, -1.843353271484375, -1.774658203125, -1.705963134765625, -1.63726806640625, -1.568572998046875, -1.4998779296875, -1.431182861328125, -1.36248779296875, -1.293792724609375, -1.22509765625, -1.156402587890625, -1.08770751953125, -1.019012451171875, -0.9503173828125, -0.881622314453125, -0.81292724609375, -0.744232177734375, -0.675537109375, -0.606842041015625, -0.53814697265625, -0.469451904296875, -0.4007568359375, -0.332061767578125, -0.26336669921875, -0.194671630859375, -0.1259765625, -0.057281494140625, 0.01141357421875, 0.080108642578125, 0.1488037109375, 0.217498779296875, 0.28619384765625, 0.354888916015625, 0.423583984375, 0.492279052734375, 0.56097412109375, 0.629669189453125, 0.6983642578125, 0.767059326171875, 0.83575439453125, 0.904449462890625, 0.97314453125, 1.041839599609375, 1.11053466796875, 1.179229736328125, 1.2479248046875, 1.316619873046875, 1.38531494140625, 1.454010009765625, 1.522705078125, 1.591400146484375, 1.66009521484375, 1.728790283203125, 1.7974853515625, 1.866180419921875, 1.93487548828125, 2.003570556640625, 2.072265625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 12.0, 47.0, 208.0, 500.0, 188.0, 36.0, 11.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.29140281677246, -23.809968948364258, -23.328535079956055, -22.84710121154785, -22.36566734313965, -21.884233474731445, -21.402799606323242, -20.92136573791504, -20.439931869506836, -19.958498001098633, -19.47706413269043, -18.995630264282227, -18.514196395874023, -18.03276252746582, -17.551328659057617, -17.069894790649414, -16.58846092224121, -16.107027053833008, -15.625593185424805, -15.144159317016602, -14.662725448608398, -14.181291580200195, -13.699857711791992, -13.218423843383789, -12.736989974975586, -12.255556106567383, -11.77412223815918, -11.292688369750977, -10.811254501342773, -10.32982063293457, -9.848386764526367, -9.366952896118164, -8.885518074035645, -8.404084205627441, -7.922650337219238, -7.441216468811035, -6.959782600402832, -6.478348731994629, -5.996914863586426, -5.515480995178223, -5.0340471267700195, -4.552613258361816, -4.071179389953613, -3.58974552154541, -3.108311653137207, -2.626877784729004, -2.145443916320801, -1.6640100479125977, -1.1825761795043945, -0.7011423110961914, -0.21970844268798828, 0.26172542572021484, 0.743159294128418, 1.224593162536621, 1.7060270309448242, 2.1874608993530273, 2.6688947677612305, 3.1503286361694336, 3.6317625045776367, 4.11319637298584, 4.594630241394043, 5.076064109802246, 5.557497978210449, 6.038931846618652, 6.5203657150268555]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 0.0, 6.0, 7.0, 10.0, 13.0, 35.0, 48.0, 72.0, 82.0, 94.0, 100.0, 100.0, 93.0, 77.0, 84.0, 61.0, 39.0, 22.0, 24.0, 13.0, 14.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.191410064697266, -4.041649341583252, -3.8918888568878174, -3.7421281337738037, -3.592367649078369, -3.4426069259643555, -3.292846202850342, -3.1430857181549072, -2.9933252334594727, -2.843564510345459, -2.6938040256500244, -2.5440433025360107, -2.394282817840576, -2.2445220947265625, -2.094761371612549, -1.9450008869171143, -1.7952401638031006, -1.6454795598983765, -1.4957189559936523, -1.3459582328796387, -1.196197748184204, -1.0464370250701904, -0.8966764211654663, -0.7469158172607422, -0.5971552133560181, -0.44739460945129395, -0.29763397574424744, -0.14787334203720093, 0.0018872618675231934, 0.15164786577224731, 0.3014085292816162, 0.45116913318634033, 0.6009297370910645, 0.7506903409957886, 0.9004509449005127, 1.0502116680145264, 1.199972152709961, 1.3497328758239746, 1.4994934797286987, 1.6492540836334229, 1.799014687538147, 1.948775291442871, 2.0985360145568848, 2.2482964992523193, 2.398057222366333, 2.5478177070617676, 2.6975784301757812, 2.847339153289795, 2.9970996379852295, 3.146860361099243, 3.2966208457946777, 3.4463815689086914, 3.596142053604126, 3.7459027767181396, 3.895663261413574, 4.045423984527588, 4.195184707641602, 4.344945430755615, 4.494706153869629, 4.644466400146484, 4.794227123260498, 4.943987846374512, 5.093748569488525, 5.243509292602539, 5.3932695388793945]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 7.0, 8.0, 6.0, 6.0, 11.0, 8.0, 11.0, 22.0, 28.0, 47.0, 62.0, 92.0, 132.0, 196.0, 303.0, 522.0, 980.0, 2213.0, 6578.0, 26310.0, 168298.0, 633333.0, 171528.0, 26481.0, 6655.0, 2334.0, 1025.0, 496.0, 265.0, 194.0, 113.0, 88.0, 44.0, 39.0, 34.0, 19.0, 10.0, 12.0, 9.0, 6.0, 12.0, 5.0, 2.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.87109375, -1.81524658203125, -1.7593994140625, -1.70355224609375, -1.647705078125, -1.59185791015625, -1.5360107421875, -1.48016357421875, -1.42431640625, -1.36846923828125, -1.3126220703125, -1.25677490234375, -1.200927734375, -1.14508056640625, -1.0892333984375, -1.03338623046875, -0.9775390625, -0.92169189453125, -0.8658447265625, -0.80999755859375, -0.754150390625, -0.69830322265625, -0.6424560546875, -0.58660888671875, -0.53076171875, -0.47491455078125, -0.4190673828125, -0.36322021484375, -0.307373046875, -0.25152587890625, -0.1956787109375, -0.13983154296875, -0.083984375, -0.02813720703125, 0.0277099609375, 0.08355712890625, 0.139404296875, 0.19525146484375, 0.2510986328125, 0.30694580078125, 0.36279296875, 0.41864013671875, 0.4744873046875, 0.53033447265625, 0.586181640625, 0.64202880859375, 0.6978759765625, 0.75372314453125, 0.8095703125, 0.86541748046875, 0.9212646484375, 0.97711181640625, 1.032958984375, 1.08880615234375, 1.1446533203125, 1.20050048828125, 1.25634765625, 1.31219482421875, 1.3680419921875, 1.42388916015625, 1.479736328125, 1.53558349609375, 1.5914306640625, 1.64727783203125, 1.703125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 8.0, 6.0, 15.0, 23.0, 17.0, 51.0, 69.0, 79.0, 102.0, 85.0, 115.0, 90.0, 94.0, 82.0, 53.0, 41.0, 29.0, 17.0, 9.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.44677734375, -0.4356727600097656, -0.42456817626953125, -0.4134635925292969, -0.4023590087890625, -0.3912544250488281, -0.38014984130859375, -0.3690452575683594, -0.357940673828125, -0.3468360900878906, -0.33573150634765625, -0.3246269226074219, -0.3135223388671875, -0.3024177551269531, -0.29131317138671875, -0.2802085876464844, -0.26910400390625, -0.2579994201660156, -0.24689483642578125, -0.23579025268554688, -0.2246856689453125, -0.21358108520507812, -0.20247650146484375, -0.19137191772460938, -0.180267333984375, -0.16916275024414062, -0.15805816650390625, -0.14695358276367188, -0.1358489990234375, -0.12474441528320312, -0.11363983154296875, -0.10253524780273438, -0.0914306640625, -0.08032608032226562, -0.06922149658203125, -0.058116912841796875, -0.0470123291015625, -0.035907745361328125, -0.02480316162109375, -0.013698577880859375, -0.002593994140625, 0.008510589599609375, 0.01961517333984375, 0.030719757080078125, 0.0418243408203125, 0.052928924560546875, 0.06403350830078125, 0.07513809204101562, 0.08624267578125, 0.09734725952148438, 0.10845184326171875, 0.11955642700195312, 0.1306610107421875, 0.14176559448242188, 0.15287017822265625, 0.16397476196289062, 0.175079345703125, 0.18618392944335938, 0.19728851318359375, 0.20839309692382812, 0.2194976806640625, 0.23060226440429688, 0.24170684814453125, 0.2528114318847656, 0.263916015625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 13.0, 20.0, 36.0, 39.0, 74.0, 133.0, 269.0, 669.0, 1708.0, 6191.0, 29036.0, 173133.0, 571332.0, 219030.0, 36180.0, 7260.0, 2006.0, 745.0, 297.0, 144.0, 67.0, 44.0, 23.0, 26.0, 10.0, 14.0, 12.0, 2.0, 8.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.091796875, -1.0560760498046875, -1.020355224609375, -0.9846343994140625, -0.94891357421875, -0.9131927490234375, -0.877471923828125, -0.8417510986328125, -0.8060302734375, -0.7703094482421875, -0.734588623046875, -0.6988677978515625, -0.66314697265625, -0.6274261474609375, -0.591705322265625, -0.5559844970703125, -0.520263671875, -0.4845428466796875, -0.448822021484375, -0.4131011962890625, -0.37738037109375, -0.3416595458984375, -0.305938720703125, -0.2702178955078125, -0.2344970703125, -0.1987762451171875, -0.163055419921875, -0.1273345947265625, -0.09161376953125, -0.0558929443359375, -0.020172119140625, 0.0155487060546875, 0.05126953125, 0.0869903564453125, 0.122711181640625, 0.1584320068359375, 0.19415283203125, 0.2298736572265625, 0.265594482421875, 0.3013153076171875, 0.3370361328125, 0.3727569580078125, 0.408477783203125, 0.4441986083984375, 0.47991943359375, 0.5156402587890625, 0.551361083984375, 0.5870819091796875, 0.622802734375, 0.6585235595703125, 0.694244384765625, 0.7299652099609375, 0.76568603515625, 0.8014068603515625, 0.837127685546875, 0.8728485107421875, 0.9085693359375, 0.9442901611328125, 0.980010986328125, 1.0157318115234375, 1.05145263671875, 1.0871734619140625, 1.122894287109375, 1.1586151123046875, 1.1943359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 3.0, 12.0, 14.0, 19.0, 9.0, 25.0, 26.0, 31.0, 36.0, 40.0, 38.0, 39.0, 35.0, 51.0, 54.0, 44.0, 61.0, 51.0, 47.0, 46.0, 34.0, 48.0, 29.0, 43.0, 23.0, 19.0, 27.0, 18.0, 20.0, 9.0, 9.0, 5.0, 9.0, 8.0, 2.0, 7.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.701171875, -0.6781005859375, -0.655029296875, -0.6319580078125, -0.60888671875, -0.5858154296875, -0.562744140625, -0.5396728515625, -0.5166015625, -0.4935302734375, -0.470458984375, -0.4473876953125, -0.42431640625, -0.4012451171875, -0.378173828125, -0.3551025390625, -0.33203125, -0.3089599609375, -0.285888671875, -0.2628173828125, -0.23974609375, -0.2166748046875, -0.193603515625, -0.1705322265625, -0.1474609375, -0.1243896484375, -0.101318359375, -0.0782470703125, -0.05517578125, -0.0321044921875, -0.009033203125, 0.0140380859375, 0.037109375, 0.0601806640625, 0.083251953125, 0.1063232421875, 0.12939453125, 0.1524658203125, 0.175537109375, 0.1986083984375, 0.2216796875, 0.2447509765625, 0.267822265625, 0.2908935546875, 0.31396484375, 0.3370361328125, 0.360107421875, 0.3831787109375, 0.40625, 0.4293212890625, 0.452392578125, 0.4754638671875, 0.49853515625, 0.5216064453125, 0.544677734375, 0.5677490234375, 0.5908203125, 0.6138916015625, 0.636962890625, 0.6600341796875, 0.68310546875, 0.7061767578125, 0.729248046875, 0.7523193359375, 0.775390625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 2.0, 12.0, 17.0, 24.0, 47.0, 78.0, 124.0, 228.0, 539.0, 1280.0, 4799.0, 30497.0, 387699.0, 564677.0, 49008.0, 6633.0, 1675.0, 614.0, 270.0, 162.0, 60.0, 41.0, 20.0, 12.0, 12.0, 10.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6875, -0.6601104736328125, -0.632720947265625, -0.6053314208984375, -0.57794189453125, -0.5505523681640625, -0.523162841796875, -0.4957733154296875, -0.4683837890625, -0.4409942626953125, -0.413604736328125, -0.3862152099609375, -0.35882568359375, -0.3314361572265625, -0.304046630859375, -0.2766571044921875, -0.249267578125, -0.2218780517578125, -0.194488525390625, -0.1670989990234375, -0.13970947265625, -0.1123199462890625, -0.084930419921875, -0.0575408935546875, -0.0301513671875, -0.0027618408203125, 0.024627685546875, 0.0520172119140625, 0.07940673828125, 0.1067962646484375, 0.134185791015625, 0.1615753173828125, 0.18896484375, 0.2163543701171875, 0.243743896484375, 0.2711334228515625, 0.29852294921875, 0.3259124755859375, 0.353302001953125, 0.3806915283203125, 0.4080810546875, 0.4354705810546875, 0.462860107421875, 0.4902496337890625, 0.51763916015625, 0.5450286865234375, 0.572418212890625, 0.5998077392578125, 0.627197265625, 0.6545867919921875, 0.681976318359375, 0.7093658447265625, 0.73675537109375, 0.7641448974609375, 0.791534423828125, 0.8189239501953125, 0.8463134765625, 0.8737030029296875, 0.901092529296875, 0.9284820556640625, 0.95587158203125, 0.9832611083984375, 1.010650634765625, 1.0380401611328125, 1.0654296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 8.0, 2.0, 20.0, 10.0, 22.0, 40.0, 62.0, 87.0, 97.0, 130.0, 152.0, 111.0, 98.0, 47.0, 42.0, 32.0, 14.0, 8.0, 7.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012421607971191406, -0.00011979788541793823, -0.0001153796911239624, -0.00011096149682998657, -0.00010654330253601074, -0.00010212510824203491, -9.770691394805908e-05, -9.328871965408325e-05, -8.887052536010742e-05, -8.445233106613159e-05, -8.003413677215576e-05, -7.561594247817993e-05, -7.11977481842041e-05, -6.677955389022827e-05, -6.236135959625244e-05, -5.794316530227661e-05, -5.352497100830078e-05, -4.910677671432495e-05, -4.468858242034912e-05, -4.027038812637329e-05, -3.585219383239746e-05, -3.143399953842163e-05, -2.70158052444458e-05, -2.259761095046997e-05, -1.817941665649414e-05, -1.376122236251831e-05, -9.34302806854248e-06, -4.92483377456665e-06, -5.066394805908203e-07, 3.91155481338501e-06, 8.32974910736084e-06, 1.274794340133667e-05, 1.71661376953125e-05, 2.158433198928833e-05, 2.600252628326416e-05, 3.042072057723999e-05, 3.483891487121582e-05, 3.925710916519165e-05, 4.367530345916748e-05, 4.809349775314331e-05, 5.251169204711914e-05, 5.692988634109497e-05, 6.13480806350708e-05, 6.576627492904663e-05, 7.018446922302246e-05, 7.460266351699829e-05, 7.902085781097412e-05, 8.343905210494995e-05, 8.785724639892578e-05, 9.227544069290161e-05, 9.669363498687744e-05, 0.00010111182928085327, 0.0001055300235748291, 0.00010994821786880493, 0.00011436641216278076, 0.00011878460645675659, 0.00012320280075073242, 0.00012762099504470825, 0.00013203918933868408, 0.0001364573836326599, 0.00014087557792663574, 0.00014529377222061157, 0.0001497119665145874, 0.00015413016080856323, 0.00015854835510253906]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 10.0, 7.0, 19.0, 15.0, 27.0, 52.0, 89.0, 215.0, 533.0, 2242.0, 12495.0, 133208.0, 756807.0, 127950.0, 11892.0, 2014.0, 558.0, 177.0, 84.0, 54.0, 34.0, 26.0, 18.0, 8.0, 6.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.503997802734375, -0.47674560546875, -0.449493408203125, -0.4222412109375, -0.394989013671875, -0.36773681640625, -0.340484619140625, -0.313232421875, -0.285980224609375, -0.25872802734375, -0.231475830078125, -0.2042236328125, -0.176971435546875, -0.14971923828125, -0.122467041015625, -0.09521484375, -0.067962646484375, -0.04071044921875, -0.013458251953125, 0.0137939453125, 0.041046142578125, 0.06829833984375, 0.095550537109375, 0.122802734375, 0.150054931640625, 0.17730712890625, 0.204559326171875, 0.2318115234375, 0.259063720703125, 0.28631591796875, 0.313568115234375, 0.3408203125, 0.368072509765625, 0.39532470703125, 0.422576904296875, 0.4498291015625, 0.477081298828125, 0.50433349609375, 0.531585693359375, 0.558837890625, 0.586090087890625, 0.61334228515625, 0.640594482421875, 0.6678466796875, 0.695098876953125, 0.72235107421875, 0.749603271484375, 0.77685546875, 0.804107666015625, 0.83135986328125, 0.858612060546875, 0.8858642578125, 0.913116455078125, 0.94036865234375, 0.967620849609375, 0.994873046875, 1.022125244140625, 1.04937744140625, 1.076629638671875, 1.1038818359375, 1.131134033203125, 1.15838623046875, 1.185638427734375, 1.212890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 11.0, 9.0, 12.0, 15.0, 20.0, 34.0, 41.0, 64.0, 52.0, 71.0, 100.0, 92.0, 77.0, 73.0, 66.0, 61.0, 52.0, 35.0, 19.0, 21.0, 17.0, 14.0, 11.0, 6.0, 6.0, 2.0, 7.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2420654296875, -0.23076820373535156, -0.21947097778320312, -0.2081737518310547, -0.19687652587890625, -0.1855792999267578, -0.17428207397460938, -0.16298484802246094, -0.1516876220703125, -0.14039039611816406, -0.12909317016601562, -0.11779594421386719, -0.10649871826171875, -0.09520149230957031, -0.08390426635742188, -0.07260704040527344, -0.061309814453125, -0.05001258850097656, -0.038715362548828125, -0.027418136596679688, -0.01612091064453125, -0.0048236846923828125, 0.006473541259765625, 0.017770767211914062, 0.0290679931640625, 0.04036521911621094, 0.051662445068359375, 0.06295967102050781, 0.07425689697265625, 0.08555412292480469, 0.09685134887695312, 0.10814857482910156, 0.11944580078125, 0.13074302673339844, 0.14204025268554688, 0.1533374786376953, 0.16463470458984375, 0.1759319305419922, 0.18722915649414062, 0.19852638244628906, 0.2098236083984375, 0.22112083435058594, 0.23241806030273438, 0.2437152862548828, 0.25501251220703125, 0.2663097381591797, 0.2776069641113281, 0.28890419006347656, 0.300201416015625, 0.31149864196777344, 0.3227958679199219, 0.3340930938720703, 0.34539031982421875, 0.3566875457763672, 0.3679847717285156, 0.37928199768066406, 0.3905792236328125, 0.40187644958496094, 0.4131736755371094, 0.4244709014892578, 0.43576812744140625, 0.4470653533935547, 0.4583625793457031, 0.46965980529785156, 0.48095703125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 25.0, 55.0, 144.0, 281.0, 241.0, 144.0, 72.0, 26.0, 8.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.50307846069336, -19.111434936523438, -18.71979331970215, -18.328149795532227, -17.936508178710938, -17.544864654541016, -17.153221130371094, -16.761579513549805, -16.369935989379883, -15.978293418884277, -15.586650848388672, -15.19500732421875, -14.803364753723145, -14.411722183227539, -14.020079612731934, -13.628437042236328, -13.236794471740723, -12.845151901245117, -12.453509330749512, -12.061866760253906, -11.670223236083984, -11.278580665588379, -10.886938095092773, -10.495295524597168, -10.103652954101562, -9.712010383605957, -9.320367813110352, -8.92872428894043, -8.537081718444824, -8.145439147949219, -7.753796577453613, -7.362154006958008, -6.9705095291137695, -6.578866958618164, -6.1872239112854, -5.795581340789795, -5.403938293457031, -5.012295722961426, -4.62065315246582, -4.229010581970215, -3.837367534637451, -3.4457247257232666, -3.054081916809082, -2.6624393463134766, -2.270796537399292, -1.8791537284851074, -1.487511157989502, -1.0958683490753174, -0.7042255401611328, -0.312582790851593, 0.07905995845794678, 0.4707026481628418, 0.8623454570770264, 1.253988265991211, 1.6456308364868164, 2.037273645401001, 2.4289164543151855, 2.82055926322937, 3.2122020721435547, 3.60384464263916, 3.9954874515533447, 4.387130260467529, 4.778772830963135, 5.170415878295898, 5.562058448791504]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 7.0, 10.0, 16.0, 14.0, 20.0, 24.0, 30.0, 27.0, 34.0, 43.0, 51.0, 49.0, 55.0, 48.0, 47.0, 71.0, 52.0, 48.0, 47.0, 49.0, 46.0, 23.0, 29.0, 24.0, 27.0, 14.0, 22.0, 14.0, 16.0, 13.0, 4.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.57539176940918, -4.432658672332764, -4.289925575256348, -4.147192478179932, -4.004459381103516, -3.8617262840270996, -3.7189931869506836, -3.5762600898742676, -3.4335269927978516, -3.2907938957214355, -3.1480607986450195, -3.0053277015686035, -2.8625946044921875, -2.7198615074157715, -2.5771284103393555, -2.4343953132629395, -2.2916624546051025, -2.1489293575286865, -2.0061962604522705, -1.8634631633758545, -1.7207300662994385, -1.5779969692230225, -1.435263991355896, -1.29253089427948, -1.149797797203064, -1.007064700126648, -0.8643316030502319, -0.7215985655784607, -0.5788654685020447, -0.43613237142562866, -0.2933993339538574, -0.1506662368774414, -0.00793313980102539, 0.13479994237422943, 0.27753302454948425, 0.4202660918235779, 0.5629991888999939, 0.7057322859764099, 0.8484653234481812, 0.9911984205245972, 1.1339315176010132, 1.2766646146774292, 1.4193977117538452, 1.5621306896209717, 1.7048637866973877, 1.8475968837738037, 1.9903299808502197, 2.1330630779266357, 2.2757961750030518, 2.4185292720794678, 2.561262369155884, 2.7039954662323, 2.846728563308716, 2.989461660385132, 3.1321945190429688, 3.2749276161193848, 3.417660713195801, 3.560393810272217, 3.703126907348633, 3.845860004425049, 3.988593101501465, 4.131326198577881, 4.274059295654297, 4.416792392730713, 4.559525489807129]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 7.0, 7.0, 13.0, 11.0, 11.0, 12.0, 15.0, 23.0, 34.0, 42.0, 56.0, 64.0, 100.0, 127.0, 175.0, 317.0, 573.0, 1106.0, 2593.0, 7793.0, 32349.0, 628880.0, 3455649.0, 47820.0, 10218.0, 3368.0, 1416.0, 651.0, 304.0, 216.0, 136.0, 74.0, 38.0, 28.0, 15.0, 7.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0], "bins": [-2.875, -2.809814453125, -2.74462890625, -2.679443359375, -2.6142578125, -2.549072265625, -2.48388671875, -2.418701171875, -2.353515625, -2.288330078125, -2.22314453125, -2.157958984375, -2.0927734375, -2.027587890625, -1.96240234375, -1.897216796875, -1.83203125, -1.766845703125, -1.70166015625, -1.636474609375, -1.5712890625, -1.506103515625, -1.44091796875, -1.375732421875, -1.310546875, -1.245361328125, -1.18017578125, -1.114990234375, -1.0498046875, -0.984619140625, -0.91943359375, -0.854248046875, -0.7890625, -0.723876953125, -0.65869140625, -0.593505859375, -0.5283203125, -0.463134765625, -0.39794921875, -0.332763671875, -0.267578125, -0.202392578125, -0.13720703125, -0.072021484375, -0.0068359375, 0.058349609375, 0.12353515625, 0.188720703125, 0.25390625, 0.319091796875, 0.38427734375, 0.449462890625, 0.5146484375, 0.579833984375, 0.64501953125, 0.710205078125, 0.775390625, 0.840576171875, 0.90576171875, 0.970947265625, 1.0361328125, 1.101318359375, 1.16650390625, 1.231689453125, 1.296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 16.0, 13.0, 30.0, 55.0, 56.0, 65.0, 96.0, 80.0, 96.0, 76.0, 91.0, 71.0, 60.0, 62.0, 45.0, 23.0, 18.0, 10.0, 7.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.42822265625, -0.41744232177734375, -0.4066619873046875, -0.39588165283203125, -0.385101318359375, -0.37432098388671875, -0.3635406494140625, -0.35276031494140625, -0.34197998046875, -0.33119964599609375, -0.3204193115234375, -0.30963897705078125, -0.298858642578125, -0.28807830810546875, -0.2772979736328125, -0.26651763916015625, -0.2557373046875, -0.24495697021484375, -0.2341766357421875, -0.22339630126953125, -0.212615966796875, -0.20183563232421875, -0.1910552978515625, -0.18027496337890625, -0.16949462890625, -0.15871429443359375, -0.1479339599609375, -0.13715362548828125, -0.126373291015625, -0.11559295654296875, -0.1048126220703125, -0.09403228759765625, -0.083251953125, -0.07247161865234375, -0.0616912841796875, -0.05091094970703125, -0.040130615234375, -0.02935028076171875, -0.0185699462890625, -0.00778961181640625, 0.00299072265625, 0.01377105712890625, 0.0245513916015625, 0.03533172607421875, 0.046112060546875, 0.05689239501953125, 0.0676727294921875, 0.07845306396484375, 0.0892333984375, 0.10001373291015625, 0.1107940673828125, 0.12157440185546875, 0.132354736328125, 0.14313507080078125, 0.1539154052734375, 0.16469573974609375, 0.17547607421875, 0.18625640869140625, 0.1970367431640625, 0.20781707763671875, 0.218597412109375, 0.22937774658203125, 0.2401580810546875, 0.25093841552734375, 0.26171875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 11.0, 5.0, 15.0, 10.0, 16.0, 24.0, 46.0, 43.0, 97.0, 125.0, 180.0, 346.0, 610.0, 1130.0, 2483.0, 6044.0, 18418.0, 74643.0, 1214298.0, 2741163.0, 98637.0, 22715.0, 7312.0, 2834.0, 1293.0, 676.0, 393.0, 229.0, 157.0, 93.0, 52.0, 53.0, 29.0, 30.0, 10.0, 20.0, 7.0, 2.0, 4.0, 4.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.23046875, -1.1908721923828125, -1.151275634765625, -1.1116790771484375, -1.07208251953125, -1.0324859619140625, -0.992889404296875, -0.9532928466796875, -0.9136962890625, -0.8740997314453125, -0.834503173828125, -0.7949066162109375, -0.75531005859375, -0.7157135009765625, -0.676116943359375, -0.6365203857421875, -0.596923828125, -0.5573272705078125, -0.517730712890625, -0.4781341552734375, -0.43853759765625, -0.3989410400390625, -0.359344482421875, -0.3197479248046875, -0.2801513671875, -0.2405548095703125, -0.200958251953125, -0.1613616943359375, -0.12176513671875, -0.0821685791015625, -0.042572021484375, -0.0029754638671875, 0.03662109375, 0.0762176513671875, 0.115814208984375, 0.1554107666015625, 0.19500732421875, 0.2346038818359375, 0.274200439453125, 0.3137969970703125, 0.3533935546875, 0.3929901123046875, 0.432586669921875, 0.4721832275390625, 0.51177978515625, 0.5513763427734375, 0.590972900390625, 0.6305694580078125, 0.670166015625, 0.7097625732421875, 0.749359130859375, 0.7889556884765625, 0.82855224609375, 0.8681488037109375, 0.907745361328125, 0.9473419189453125, 0.9869384765625, 1.0265350341796875, 1.066131591796875, 1.1057281494140625, 1.14532470703125, 1.1849212646484375, 1.224517822265625, 1.2641143798828125, 1.3037109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 5.0, 18.0, 14.0, 17.0, 32.0, 39.0, 61.0, 93.0, 191.0, 519.0, 1524.0, 816.0, 297.0, 149.0, 97.0, 52.0, 40.0, 28.0, 12.0, 10.0, 13.0, 12.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.378662109375, -0.3650016784667969, -0.35134124755859375, -0.3376808166503906, -0.3240203857421875, -0.3103599548339844, -0.29669952392578125, -0.2830390930175781, -0.269378662109375, -0.2557182312011719, -0.24205780029296875, -0.22839736938476562, -0.2147369384765625, -0.20107650756835938, -0.18741607666015625, -0.17375564575195312, -0.16009521484375, -0.14643478393554688, -0.13277435302734375, -0.11911392211914062, -0.1054534912109375, -0.09179306030273438, -0.07813262939453125, -0.06447219848632812, -0.050811767578125, -0.037151336669921875, -0.02349090576171875, -0.009830474853515625, 0.0038299560546875, 0.017490386962890625, 0.03115081787109375, 0.044811248779296875, 0.0584716796875, 0.07213211059570312, 0.08579254150390625, 0.09945297241210938, 0.1131134033203125, 0.12677383422851562, 0.14043426513671875, 0.15409469604492188, 0.167755126953125, 0.18141555786132812, 0.19507598876953125, 0.20873641967773438, 0.2223968505859375, 0.23605728149414062, 0.24971771240234375, 0.2633781433105469, 0.27703857421875, 0.2906990051269531, 0.30435943603515625, 0.3180198669433594, 0.3316802978515625, 0.3453407287597656, 0.35900115966796875, 0.3726615905761719, 0.386322021484375, 0.3999824523925781, 0.41364288330078125, 0.4273033142089844, 0.4409637451171875, 0.4546241760253906, 0.46828460693359375, 0.4819450378417969, 0.49560546875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 11.0, 19.0, 76.0, 303.0, 382.0, 163.0, 42.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4266514778137207, -2.1859872341156006, -1.9453227519989014, -1.7046585083007812, -1.4639941453933716, -1.223329782485962, -0.9826655387878418, -0.7420011758804321, -0.5013368129730225, -0.2606724798679352, -0.0200081467628479, 0.220656156539917, 0.46132051944732666, 0.7019848823547363, 0.9426491260528564, 1.1833134889602661, 1.4239778518676758, 1.6646422147750854, 1.9053065776824951, 2.1459708213806152, 2.3866353034973145, 2.6272995471954346, 2.8679637908935547, 3.108628273010254, 3.349292516708374, 3.589956760406494, 3.8306212425231934, 4.071285247802734, 4.311949729919434, 4.552614212036133, 4.793278694152832, 5.033942699432373, 5.274606704711914, 5.515271186828613, 5.755935192108154, 5.9965996742248535, 6.237264156341553, 6.477928161621094, 6.718592643737793, 6.959257125854492, 7.199921607971191, 7.440586090087891, 7.681250095367432, 7.921914577484131, 8.162578582763672, 8.403243064880371, 8.64390754699707, 8.88457202911377, 9.125236511230469, 9.365900993347168, 9.606565475463867, 9.84722900390625, 10.08789348602295, 10.328557968139648, 10.569222450256348, 10.809886932373047, 11.05055046081543, 11.291214942932129, 11.531879425048828, 11.772542953491211, 12.01320743560791, 12.25387191772461, 12.494536399841309, 12.735200881958008, 12.975865364074707]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 8.0, 11.0, 8.0, 11.0, 12.0, 22.0, 24.0, 28.0, 36.0, 49.0, 37.0, 49.0, 47.0, 50.0, 48.0, 54.0, 61.0, 54.0, 54.0, 52.0, 43.0, 45.0, 43.0, 26.0, 30.0, 28.0, 16.0, 19.0, 6.0, 8.0, 11.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4040803909301758, -1.3527841567993164, -1.301487922668457, -1.2501916885375977, -1.1988954544067383, -1.147599220275879, -1.09630286693573, -1.0450066328048706, -0.9937103986740112, -0.9424141645431519, -0.8911179304122925, -0.8398216366767883, -0.788525402545929, -0.7372291684150696, -0.6859328746795654, -0.634636640548706, -0.5833404064178467, -0.5320441722869873, -0.48074790835380554, -0.4294516444206238, -0.3781554102897644, -0.32685917615890503, -0.27556291222572327, -0.2242666482925415, -0.17297041416168213, -0.12167416512966156, -0.07037791609764099, -0.019081667065620422, 0.032214581966400146, 0.08351081609725952, 0.13480708003044128, 0.18610334396362305, 0.23739969730377197, 0.28869593143463135, 0.3399921953678131, 0.3912884593009949, 0.44258469343185425, 0.4938809275627136, 0.5451772212982178, 0.5964734554290771, 0.6477696895599365, 0.6990659236907959, 0.7503621578216553, 0.8016584515571594, 0.8529546856880188, 0.9042509198188782, 0.9555472135543823, 1.0068434476852417, 1.058139681816101, 1.1094359159469604, 1.1607321500778198, 1.2120283842086792, 1.2633247375488281, 1.3146209716796875, 1.3659172058105469, 1.4172134399414062, 1.4685096740722656, 1.519805908203125, 1.5711021423339844, 1.6223983764648438, 1.6736946105957031, 1.7249908447265625, 1.7762871980667114, 1.8275834321975708, 1.8788796663284302]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 13.0, 15.0, 13.0, 28.0, 45.0, 55.0, 91.0, 150.0, 277.0, 521.0, 1187.0, 3159.0, 12052.0, 77991.0, 585883.0, 321296.0, 34956.0, 6832.0, 2104.0, 866.0, 426.0, 216.0, 119.0, 72.0, 56.0, 33.0, 26.0, 15.0, 12.0, 10.0, 7.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7490234375, -1.6812591552734375, -1.613494873046875, -1.5457305908203125, -1.47796630859375, -1.4102020263671875, -1.342437744140625, -1.2746734619140625, -1.2069091796875, -1.1391448974609375, -1.071380615234375, -1.0036163330078125, -0.93585205078125, -0.8680877685546875, -0.800323486328125, -0.7325592041015625, -0.664794921875, -0.5970306396484375, -0.529266357421875, -0.4615020751953125, -0.39373779296875, -0.3259735107421875, -0.258209228515625, -0.1904449462890625, -0.1226806640625, -0.0549163818359375, 0.012847900390625, 0.0806121826171875, 0.14837646484375, 0.2161407470703125, 0.283905029296875, 0.3516693115234375, 0.41943359375, 0.4871978759765625, 0.554962158203125, 0.6227264404296875, 0.69049072265625, 0.7582550048828125, 0.826019287109375, 0.8937835693359375, 0.9615478515625, 1.0293121337890625, 1.097076416015625, 1.1648406982421875, 1.23260498046875, 1.3003692626953125, 1.368133544921875, 1.4358978271484375, 1.503662109375, 1.5714263916015625, 1.639190673828125, 1.7069549560546875, 1.77471923828125, 1.8424835205078125, 1.910247802734375, 1.9780120849609375, 2.0457763671875, 2.1135406494140625, 2.181304931640625, 2.2490692138671875, 2.31683349609375, 2.3845977783203125, 2.452362060546875, 2.5201263427734375, 2.587890625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 12.0, 12.0, 16.0, 25.0, 45.0, 60.0, 57.0, 79.0, 81.0, 92.0, 97.0, 77.0, 78.0, 76.0, 58.0, 43.0, 32.0, 20.0, 15.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.43359375, -0.4227867126464844, -0.41197967529296875, -0.4011726379394531, -0.3903656005859375, -0.3795585632324219, -0.36875152587890625, -0.3579444885253906, -0.347137451171875, -0.3363304138183594, -0.32552337646484375, -0.3147163391113281, -0.3039093017578125, -0.2931022644042969, -0.28229522705078125, -0.2714881896972656, -0.26068115234375, -0.24987411499023438, -0.23906707763671875, -0.22826004028320312, -0.2174530029296875, -0.20664596557617188, -0.19583892822265625, -0.18503189086914062, -0.174224853515625, -0.16341781616210938, -0.15261077880859375, -0.14180374145507812, -0.1309967041015625, -0.12018966674804688, -0.10938262939453125, -0.09857559204101562, -0.0877685546875, -0.07696151733398438, -0.06615447998046875, -0.055347442626953125, -0.0445404052734375, -0.033733367919921875, -0.02292633056640625, -0.012119293212890625, -0.001312255859375, 0.009494781494140625, 0.02030181884765625, 0.031108856201171875, 0.0419158935546875, 0.052722930908203125, 0.06352996826171875, 0.07433700561523438, 0.08514404296875, 0.09595108032226562, 0.10675811767578125, 0.11756515502929688, 0.1283721923828125, 0.13917922973632812, 0.14998626708984375, 0.16079330444335938, 0.171600341796875, 0.18240737915039062, 0.19321441650390625, 0.20402145385742188, 0.2148284912109375, 0.22563552856445312, 0.23644256591796875, 0.24724960327148438, 0.258056640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 7.0, 8.0, 5.0, 5.0, 8.0, 3.0, 6.0, 10.0, 10.0, 16.0, 38.0, 44.0, 82.0, 168.0, 283.0, 581.0, 1340.0, 3710.0, 11489.0, 44796.0, 206902.0, 510060.0, 206784.0, 44331.0, 11613.0, 3668.0, 1423.0, 545.0, 253.0, 132.0, 74.0, 50.0, 34.0, 20.0, 14.0, 15.0, 5.0, 8.0, 4.0, 6.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.98193359375, -0.9486465454101562, -0.9153594970703125, -0.8820724487304688, -0.848785400390625, -0.8154983520507812, -0.7822113037109375, -0.7489242553710938, -0.71563720703125, -0.6823501586914062, -0.6490631103515625, -0.6157760620117188, -0.582489013671875, -0.5492019653320312, -0.5159149169921875, -0.48262786865234375, -0.4493408203125, -0.41605377197265625, -0.3827667236328125, -0.34947967529296875, -0.316192626953125, -0.28290557861328125, -0.2496185302734375, -0.21633148193359375, -0.18304443359375, -0.14975738525390625, -0.1164703369140625, -0.08318328857421875, -0.049896240234375, -0.01660919189453125, 0.0166778564453125, 0.04996490478515625, 0.083251953125, 0.11653900146484375, 0.1498260498046875, 0.18311309814453125, 0.216400146484375, 0.24968719482421875, 0.2829742431640625, 0.31626129150390625, 0.34954833984375, 0.38283538818359375, 0.4161224365234375, 0.44940948486328125, 0.482696533203125, 0.5159835815429688, 0.5492706298828125, 0.5825576782226562, 0.6158447265625, 0.6491317749023438, 0.6824188232421875, 0.7157058715820312, 0.748992919921875, 0.7822799682617188, 0.8155670166015625, 0.8488540649414062, 0.88214111328125, 0.9154281616210938, 0.9487152099609375, 0.9820022583007812, 1.015289306640625, 1.0485763549804688, 1.0818634033203125, 1.1151504516601562, 1.1484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 0.0, 5.0, 2.0, 5.0, 5.0, 8.0, 5.0, 10.0, 14.0, 10.0, 17.0, 19.0, 19.0, 33.0, 28.0, 29.0, 26.0, 23.0, 43.0, 49.0, 35.0, 48.0, 47.0, 46.0, 41.0, 39.0, 46.0, 40.0, 43.0, 43.0, 33.0, 29.0, 24.0, 21.0, 17.0, 12.0, 18.0, 17.0, 8.0, 4.0, 12.0, 4.0, 8.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.814453125, -0.790679931640625, -0.76690673828125, -0.743133544921875, -0.7193603515625, -0.695587158203125, -0.67181396484375, -0.648040771484375, -0.624267578125, -0.600494384765625, -0.57672119140625, -0.552947998046875, -0.5291748046875, -0.505401611328125, -0.48162841796875, -0.457855224609375, -0.43408203125, -0.410308837890625, -0.38653564453125, -0.362762451171875, -0.3389892578125, -0.315216064453125, -0.29144287109375, -0.267669677734375, -0.243896484375, -0.220123291015625, -0.19635009765625, -0.172576904296875, -0.1488037109375, -0.125030517578125, -0.10125732421875, -0.077484130859375, -0.0537109375, -0.029937744140625, -0.00616455078125, 0.017608642578125, 0.0413818359375, 0.065155029296875, 0.08892822265625, 0.112701416015625, 0.136474609375, 0.160247802734375, 0.18402099609375, 0.207794189453125, 0.2315673828125, 0.255340576171875, 0.27911376953125, 0.302886962890625, 0.32666015625, 0.350433349609375, 0.37420654296875, 0.397979736328125, 0.4217529296875, 0.445526123046875, 0.46929931640625, 0.493072509765625, 0.516845703125, 0.540618896484375, 0.56439208984375, 0.588165283203125, 0.6119384765625, 0.635711669921875, 0.65948486328125, 0.683258056640625, 0.70703125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 1.0, 4.0, 4.0, 17.0, 21.0, 43.0, 60.0, 130.0, 277.0, 639.0, 1901.0, 8414.0, 70141.0, 717466.0, 226563.0, 17770.0, 3346.0, 941.0, 383.0, 167.0, 96.0, 59.0, 38.0, 25.0, 17.0, 4.0, 9.0, 9.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96875, -0.9381942749023438, -0.9076385498046875, -0.8770828247070312, -0.846527099609375, -0.8159713745117188, -0.7854156494140625, -0.7548599243164062, -0.72430419921875, -0.6937484741210938, -0.6631927490234375, -0.6326370239257812, -0.602081298828125, -0.5715255737304688, -0.5409698486328125, -0.5104141235351562, -0.4798583984375, -0.44930267333984375, -0.4187469482421875, -0.38819122314453125, -0.357635498046875, -0.32707977294921875, -0.2965240478515625, -0.26596832275390625, -0.23541259765625, -0.20485687255859375, -0.1743011474609375, -0.14374542236328125, -0.113189697265625, -0.08263397216796875, -0.0520782470703125, -0.02152252197265625, 0.009033203125, 0.03958892822265625, 0.0701446533203125, 0.10070037841796875, 0.131256103515625, 0.16181182861328125, 0.1923675537109375, 0.22292327880859375, 0.25347900390625, 0.28403472900390625, 0.3145904541015625, 0.34514617919921875, 0.375701904296875, 0.40625762939453125, 0.4368133544921875, 0.46736907958984375, 0.4979248046875, 0.5284805297851562, 0.5590362548828125, 0.5895919799804688, 0.620147705078125, 0.6507034301757812, 0.6812591552734375, 0.7118148803710938, 0.74237060546875, 0.7729263305664062, 0.8034820556640625, 0.8340377807617188, 0.864593505859375, 0.8951492309570312, 0.9257049560546875, 0.9562606811523438, 0.98681640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 7.0, 6.0, 6.0, 10.0, 12.0, 14.0, 31.0, 30.0, 50.0, 53.0, 73.0, 63.0, 84.0, 88.0, 92.0, 77.0, 74.0, 48.0, 50.0, 27.0, 22.0, 17.0, 14.0, 12.0, 11.0, 6.0, 5.0, 7.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00011146068572998047, -0.00010842457413673401, -0.00010538846254348755, -0.00010235235095024109, -9.931623935699463e-05, -9.628012776374817e-05, -9.324401617050171e-05, -9.020790457725525e-05, -8.717179298400879e-05, -8.413568139076233e-05, -8.109956979751587e-05, -7.806345820426941e-05, -7.502734661102295e-05, -7.199123501777649e-05, -6.895512342453003e-05, -6.591901183128357e-05, -6.288290023803711e-05, -5.984678864479065e-05, -5.681067705154419e-05, -5.377456545829773e-05, -5.073845386505127e-05, -4.770234227180481e-05, -4.466623067855835e-05, -4.163011908531189e-05, -3.859400749206543e-05, -3.555789589881897e-05, -3.252178430557251e-05, -2.948567271232605e-05, -2.644956111907959e-05, -2.341344952583313e-05, -2.037733793258667e-05, -1.734122633934021e-05, -1.430511474609375e-05, -1.126900315284729e-05, -8.23289155960083e-06, -5.19677996635437e-06, -2.16066837310791e-06, 8.754432201385498e-07, 3.91155481338501e-06, 6.94766640663147e-06, 9.98377799987793e-06, 1.301988959312439e-05, 1.605600118637085e-05, 1.909211277961731e-05, 2.212822437286377e-05, 2.516433596611023e-05, 2.820044755935669e-05, 3.123655915260315e-05, 3.427267074584961e-05, 3.730878233909607e-05, 4.034489393234253e-05, 4.338100552558899e-05, 4.641711711883545e-05, 4.945322871208191e-05, 5.248934030532837e-05, 5.552545189857483e-05, 5.856156349182129e-05, 6.159767508506775e-05, 6.463378667831421e-05, 6.766989827156067e-05, 7.070600986480713e-05, 7.374212145805359e-05, 7.677823305130005e-05, 7.981434464454651e-05, 8.285045623779297e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 8.0, 7.0, 14.0, 15.0, 30.0, 38.0, 61.0, 134.0, 238.0, 570.0, 1886.0, 9262.0, 107892.0, 785562.0, 129213.0, 10449.0, 2011.0, 632.0, 257.0, 109.0, 72.0, 39.0, 24.0, 13.0, 8.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60595703125, -0.5749282836914062, -0.5438995361328125, -0.5128707885742188, -0.481842041015625, -0.45081329345703125, -0.4197845458984375, -0.38875579833984375, -0.35772705078125, -0.32669830322265625, -0.2956695556640625, -0.26464080810546875, -0.233612060546875, -0.20258331298828125, -0.1715545654296875, -0.14052581787109375, -0.1094970703125, -0.07846832275390625, -0.0474395751953125, -0.01641082763671875, 0.014617919921875, 0.04564666748046875, 0.0766754150390625, 0.10770416259765625, 0.13873291015625, 0.16976165771484375, 0.2007904052734375, 0.23181915283203125, 0.262847900390625, 0.29387664794921875, 0.3249053955078125, 0.35593414306640625, 0.386962890625, 0.41799163818359375, 0.4490203857421875, 0.48004913330078125, 0.511077880859375, 0.5421066284179688, 0.5731353759765625, 0.6041641235351562, 0.63519287109375, 0.6662216186523438, 0.6972503662109375, 0.7282791137695312, 0.759307861328125, 0.7903366088867188, 0.8213653564453125, 0.8523941040039062, 0.8834228515625, 0.9144515991210938, 0.9454803466796875, 0.9765090942382812, 1.007537841796875, 1.0385665893554688, 1.0695953369140625, 1.1006240844726562, 1.13165283203125, 1.1626815795898438, 1.1937103271484375, 1.2247390747070312, 1.255767822265625, 1.2867965698242188, 1.3178253173828125, 1.3488540649414062, 1.3798828125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 5.0, 10.0, 14.0, 19.0, 16.0, 23.0, 24.0, 53.0, 45.0, 59.0, 90.0, 70.0, 87.0, 82.0, 65.0, 64.0, 61.0, 50.0, 52.0, 28.0, 18.0, 11.0, 15.0, 9.0, 8.0, 4.0, 6.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342529296875, -0.32982635498046875, -0.3171234130859375, -0.30442047119140625, -0.291717529296875, -0.27901458740234375, -0.2663116455078125, -0.25360870361328125, -0.24090576171875, -0.22820281982421875, -0.2154998779296875, -0.20279693603515625, -0.190093994140625, -0.17739105224609375, -0.1646881103515625, -0.15198516845703125, -0.1392822265625, -0.12657928466796875, -0.1138763427734375, -0.10117340087890625, -0.088470458984375, -0.07576751708984375, -0.0630645751953125, -0.05036163330078125, -0.03765869140625, -0.02495574951171875, -0.0122528076171875, 0.00045013427734375, 0.013153076171875, 0.02585601806640625, 0.0385589599609375, 0.05126190185546875, 0.06396484375, 0.07666778564453125, 0.0893707275390625, 0.10207366943359375, 0.114776611328125, 0.12747955322265625, 0.1401824951171875, 0.15288543701171875, 0.16558837890625, 0.17829132080078125, 0.1909942626953125, 0.20369720458984375, 0.216400146484375, 0.22910308837890625, 0.2418060302734375, 0.25450897216796875, 0.2672119140625, 0.27991485595703125, 0.2926177978515625, 0.30532073974609375, 0.318023681640625, 0.33072662353515625, 0.3434295654296875, 0.35613250732421875, 0.36883544921875, 0.38153839111328125, 0.3942413330078125, 0.40694427490234375, 0.419647216796875, 0.43235015869140625, 0.4450531005859375, 0.45775604248046875, 0.470458984375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 13.0, 36.0, 168.0, 315.0, 288.0, 115.0, 39.0, 10.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.353282928466797, -16.82286262512207, -16.29244041442871, -15.762019157409668, -15.231597900390625, -14.701176643371582, -14.170755386352539, -13.640335083007812, -13.109912872314453, -12.57949161529541, -12.049070358276367, -11.518649101257324, -10.988227844238281, -10.457806587219238, -9.927385330200195, -9.396965026855469, -8.866543769836426, -8.336122512817383, -7.80570125579834, -7.275279998779297, -6.744858741760254, -6.214437484741211, -5.684016704559326, -5.153595447540283, -4.62317419052124, -4.092752933502197, -3.5623316764831543, -3.0319106578826904, -2.5014894008636475, -1.9710681438446045, -1.4406471252441406, -0.9102258682250977, -0.3798046112060547, 0.1506165862083435, 0.6810377836227417, 1.2114589214324951, 1.741880178451538, 2.272301435470581, 2.802722454071045, 3.333143711090088, 3.863564968109131, 4.393986225128174, 4.924407482147217, 5.454828262329102, 5.9852495193481445, 6.5156707763671875, 7.0460920333862305, 7.576513290405273, 8.106934547424316, 8.63735580444336, 9.167777061462402, 9.698198318481445, 10.228619575500488, 10.759040832519531, 11.289461135864258, 11.819883346557617, 12.350303649902344, 12.880724906921387, 13.41114616394043, 13.941567420959473, 14.471988677978516, 15.002409934997559, 15.532831192016602, 16.063251495361328, 16.593673706054688]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 7.0, 9.0, 8.0, 10.0, 19.0, 15.0, 19.0, 22.0, 27.0, 36.0, 35.0, 43.0, 42.0, 44.0, 42.0, 59.0, 49.0, 39.0, 43.0, 48.0, 54.0, 54.0, 45.0, 31.0, 35.0, 20.0, 27.0, 15.0, 21.0, 17.0, 13.0, 14.0, 10.0, 6.0, 3.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.109270095825195, -4.95625114440918, -4.803232192993164, -4.650213241577148, -4.497194290161133, -4.344175338745117, -4.191156387329102, -4.038137435913086, -3.8851184844970703, -3.7320995330810547, -3.579080581665039, -3.4260616302490234, -3.273042678833008, -3.120023727416992, -2.9670047760009766, -2.813985824584961, -2.6609668731689453, -2.5079479217529297, -2.354928970336914, -2.2019100189208984, -2.048891067504883, -1.8958721160888672, -1.7428531646728516, -1.589834213256836, -1.4368152618408203, -1.2837963104248047, -1.130777359008789, -0.9777584075927734, -0.8247394561767578, -0.6717205047607422, -0.5187015533447266, -0.36568260192871094, -0.2126631736755371, -0.059644222259521484, 0.09337472915649414, 0.24639368057250977, 0.3994126319885254, 0.552431583404541, 0.7054505348205566, 0.8584694862365723, 1.011488437652588, 1.1645073890686035, 1.3175263404846191, 1.4705452919006348, 1.6235642433166504, 1.776583194732666, 1.9296021461486816, 2.0826210975646973, 2.235640048980713, 2.3886590003967285, 2.541677951812744, 2.6946969032287598, 2.8477158546447754, 3.000734806060791, 3.1537537574768066, 3.3067727088928223, 3.459791660308838, 3.6128106117248535, 3.765829563140869, 3.9188485145568848, 4.0718674659729, 4.224886417388916, 4.377905368804932, 4.530924320220947, 4.683943271636963]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 6.0, 10.0, 5.0, 8.0, 6.0, 13.0, 15.0, 19.0, 29.0, 36.0, 26.0, 49.0, 57.0, 79.0, 121.0, 172.0, 274.0, 452.0, 857.0, 1950.0, 4645.0, 12776.0, 53479.0, 3325528.0, 737903.0, 37828.0, 10382.0, 3959.0, 1663.0, 816.0, 439.0, 244.0, 163.0, 81.0, 63.0, 42.0, 25.0, 21.0, 10.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.779296875, -2.7129669189453125, -2.646636962890625, -2.5803070068359375, -2.51397705078125, -2.4476470947265625, -2.381317138671875, -2.3149871826171875, -2.2486572265625, -2.1823272705078125, -2.115997314453125, -2.0496673583984375, -1.98333740234375, -1.9170074462890625, -1.850677490234375, -1.7843475341796875, -1.718017578125, -1.6516876220703125, -1.585357666015625, -1.5190277099609375, -1.45269775390625, -1.3863677978515625, -1.320037841796875, -1.2537078857421875, -1.1873779296875, -1.1210479736328125, -1.054718017578125, -0.9883880615234375, -0.92205810546875, -0.8557281494140625, -0.789398193359375, -0.7230682373046875, -0.65673828125, -0.5904083251953125, -0.524078369140625, -0.4577484130859375, -0.39141845703125, -0.3250885009765625, -0.258758544921875, -0.1924285888671875, -0.1260986328125, -0.0597686767578125, 0.006561279296875, 0.0728912353515625, 0.13922119140625, 0.2055511474609375, 0.271881103515625, 0.3382110595703125, 0.404541015625, 0.4708709716796875, 0.537200927734375, 0.6035308837890625, 0.66986083984375, 0.7361907958984375, 0.802520751953125, 0.8688507080078125, 0.9351806640625, 1.0015106201171875, 1.067840576171875, 1.1341705322265625, 1.20050048828125, 1.2668304443359375, 1.333160400390625, 1.3994903564453125, 1.4658203125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 4.0, 9.0, 14.0, 15.0, 29.0, 38.0, 36.0, 39.0, 65.0, 64.0, 69.0, 71.0, 90.0, 81.0, 73.0, 53.0, 45.0, 50.0, 43.0, 35.0, 18.0, 13.0, 18.0, 9.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.3876953125, -0.377593994140625, -0.36749267578125, -0.357391357421875, -0.3472900390625, -0.337188720703125, -0.32708740234375, -0.316986083984375, -0.306884765625, -0.296783447265625, -0.28668212890625, -0.276580810546875, -0.2664794921875, -0.256378173828125, -0.24627685546875, -0.236175537109375, -0.22607421875, -0.215972900390625, -0.20587158203125, -0.195770263671875, -0.1856689453125, -0.175567626953125, -0.16546630859375, -0.155364990234375, -0.145263671875, -0.135162353515625, -0.12506103515625, -0.114959716796875, -0.1048583984375, -0.094757080078125, -0.08465576171875, -0.074554443359375, -0.064453125, -0.054351806640625, -0.04425048828125, -0.034149169921875, -0.0240478515625, -0.013946533203125, -0.00384521484375, 0.006256103515625, 0.016357421875, 0.026458740234375, 0.03656005859375, 0.046661376953125, 0.0567626953125, 0.066864013671875, 0.07696533203125, 0.087066650390625, 0.09716796875, 0.107269287109375, 0.11737060546875, 0.127471923828125, 0.1375732421875, 0.147674560546875, 0.15777587890625, 0.167877197265625, 0.177978515625, 0.188079833984375, 0.19818115234375, 0.208282470703125, 0.2183837890625, 0.228485107421875, 0.23858642578125, 0.248687744140625, 0.2587890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 10.0, 9.0, 10.0, 29.0, 42.0, 53.0, 97.0, 146.0, 261.0, 569.0, 1415.0, 4227.0, 17258.0, 161839.0, 3851704.0, 134432.0, 15570.0, 4133.0, 1331.0, 528.0, 274.0, 126.0, 74.0, 49.0, 35.0, 17.0, 13.0, 13.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.8515625, -2.782806396484375, -2.71405029296875, -2.645294189453125, -2.5765380859375, -2.507781982421875, -2.43902587890625, -2.370269775390625, -2.301513671875, -2.232757568359375, -2.16400146484375, -2.095245361328125, -2.0264892578125, -1.957733154296875, -1.88897705078125, -1.820220947265625, -1.75146484375, -1.682708740234375, -1.61395263671875, -1.545196533203125, -1.4764404296875, -1.407684326171875, -1.33892822265625, -1.270172119140625, -1.201416015625, -1.132659912109375, -1.06390380859375, -0.995147705078125, -0.9263916015625, -0.857635498046875, -0.78887939453125, -0.720123291015625, -0.6513671875, -0.582611083984375, -0.51385498046875, -0.445098876953125, -0.3763427734375, -0.307586669921875, -0.23883056640625, -0.170074462890625, -0.101318359375, -0.032562255859375, 0.03619384765625, 0.104949951171875, 0.1737060546875, 0.242462158203125, 0.31121826171875, 0.379974365234375, 0.44873046875, 0.517486572265625, 0.58624267578125, 0.654998779296875, 0.7237548828125, 0.792510986328125, 0.86126708984375, 0.930023193359375, 0.998779296875, 1.067535400390625, 1.13629150390625, 1.205047607421875, 1.2738037109375, 1.342559814453125, 1.41131591796875, 1.480072021484375, 1.548828125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 12.0, 9.0, 11.0, 12.0, 15.0, 21.0, 39.0, 61.0, 92.0, 157.0, 335.0, 939.0, 1501.0, 441.0, 171.0, 101.0, 54.0, 30.0, 16.0, 9.0, 15.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.73681640625, -0.7169952392578125, -0.697174072265625, -0.6773529052734375, -0.65753173828125, -0.6377105712890625, -0.617889404296875, -0.5980682373046875, -0.5782470703125, -0.5584259033203125, -0.538604736328125, -0.5187835693359375, -0.49896240234375, -0.4791412353515625, -0.459320068359375, -0.4394989013671875, -0.419677734375, -0.3998565673828125, -0.380035400390625, -0.3602142333984375, -0.34039306640625, -0.3205718994140625, -0.300750732421875, -0.2809295654296875, -0.2611083984375, -0.2412872314453125, -0.221466064453125, -0.2016448974609375, -0.18182373046875, -0.1620025634765625, -0.142181396484375, -0.1223602294921875, -0.1025390625, -0.0827178955078125, -0.062896728515625, -0.0430755615234375, -0.02325439453125, -0.0034332275390625, 0.016387939453125, 0.0362091064453125, 0.0560302734375, 0.0758514404296875, 0.095672607421875, 0.1154937744140625, 0.13531494140625, 0.1551361083984375, 0.174957275390625, 0.1947784423828125, 0.214599609375, 0.2344207763671875, 0.254241943359375, 0.2740631103515625, 0.29388427734375, 0.3137054443359375, 0.333526611328125, 0.3533477783203125, 0.3731689453125, 0.3929901123046875, 0.412811279296875, 0.4326324462890625, 0.45245361328125, 0.4722747802734375, 0.492095947265625, 0.5119171142578125, 0.53173828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 6.0, 16.0, 36.0, 62.0, 96.0, 186.0, 221.0, 162.0, 122.0, 45.0, 19.0, 7.0, 8.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.845273971557617, -5.666065692901611, -5.486856937408447, -5.307648658752441, -5.1284403800964355, -4.94923210144043, -4.770023345947266, -4.59081506729126, -4.411606788635254, -4.232398509979248, -4.053189754486084, -3.873981475830078, -3.6947731971740723, -3.5155646800994873, -3.3363561630249023, -3.1571478843688965, -2.9779391288757324, -2.7987306118011475, -2.6195223331451416, -2.4403138160705566, -2.261105537414551, -2.081897020339966, -1.9026885032653809, -1.7234801054000854, -1.54427170753479, -1.3650633096694946, -1.1858549118041992, -1.0066463947296143, -0.8274379968643188, -0.6482295989990234, -0.4690210819244385, -0.28981268405914307, -0.11060380935668945, 0.06860461831092834, 0.24781304597854614, 0.42702150344848633, 0.6062299013137817, 0.7854382991790771, 0.9646468162536621, 1.1438552141189575, 1.323063611984253, 1.5022720098495483, 1.6814804077148438, 1.8606889247894287, 2.0398974418640137, 2.2191057205200195, 2.3983142375946045, 2.5775227546691895, 2.7567310333251953, 2.9359395503997803, 3.115147829055786, 3.294356346130371, 3.473564624786377, 3.652773141860962, 3.831981658935547, 4.011189937591553, 4.190398216247559, 4.3696064949035645, 4.5488152503967285, 4.728023529052734, 4.90723180770874, 5.086440086364746, 5.26564884185791, 5.444857120513916, 5.62406587600708]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 3.0, 0.0, 2.0, 3.0, 13.0, 6.0, 12.0, 17.0, 21.0, 24.0, 40.0, 45.0, 49.0, 46.0, 66.0, 53.0, 62.0, 59.0, 57.0, 68.0, 76.0, 57.0, 42.0, 49.0, 43.0, 27.0, 19.0, 14.0, 13.0, 9.0, 2.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.837348222732544, -1.7499698400497437, -1.6625914573669434, -1.5752129554748535, -1.4878345727920532, -1.400456190109253, -1.3130778074264526, -1.2256994247436523, -1.1383209228515625, -1.0509425401687622, -0.9635640978813171, -0.8761857151985168, -0.7888072729110718, -0.7014288902282715, -0.6140505075454712, -0.5266720652580261, -0.4392937421798706, -0.3519153296947479, -0.26453691720962524, -0.17715853452682495, -0.08978012204170227, -0.00240170955657959, 0.0849766731262207, 0.17235511541366577, 0.25973349809646606, 0.34711191058158875, 0.4344903230667114, 0.5218687057495117, 0.609247088432312, 0.6966255307197571, 0.7840039134025574, 0.8713823556900024, 0.9587607383728027, 1.046139121055603, 1.1335175037384033, 1.2208960056304932, 1.3082743883132935, 1.3956527709960938, 1.483031153678894, 1.5704095363616943, 1.6577880382537842, 1.7451664209365845, 1.8325448036193848, 1.9199233055114746, 2.0073015689849854, 2.094680070877075, 2.182058334350586, 2.269436836242676, 2.3568153381347656, 2.4441938400268555, 2.531572103500366, 2.618950605392456, 2.706328868865967, 2.7937073707580566, 2.8810858726501465, 2.9684641361236572, 3.055842399597168, 3.143220901489258, 3.2305991649627686, 3.3179776668548584, 3.405355930328369, 3.492734432220459, 3.580112934112549, 3.6674911975860596, 3.7548696994781494]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 6.0, 7.0, 8.0, 16.0, 23.0, 35.0, 48.0, 66.0, 141.0, 323.0, 697.0, 1792.0, 6236.0, 33286.0, 455555.0, 503910.0, 36421.0, 6647.0, 1953.0, 682.0, 285.0, 157.0, 84.0, 60.0, 32.0, 28.0, 15.0, 10.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.90234375, -2.823944091796875, -2.74554443359375, -2.667144775390625, -2.5887451171875, -2.510345458984375, -2.43194580078125, -2.353546142578125, -2.275146484375, -2.196746826171875, -2.11834716796875, -2.039947509765625, -1.9615478515625, -1.883148193359375, -1.80474853515625, -1.726348876953125, -1.64794921875, -1.569549560546875, -1.49114990234375, -1.412750244140625, -1.3343505859375, -1.255950927734375, -1.17755126953125, -1.099151611328125, -1.020751953125, -0.942352294921875, -0.86395263671875, -0.785552978515625, -0.7071533203125, -0.628753662109375, -0.55035400390625, -0.471954345703125, -0.3935546875, -0.315155029296875, -0.23675537109375, -0.158355712890625, -0.0799560546875, -0.001556396484375, 0.07684326171875, 0.155242919921875, 0.233642578125, 0.312042236328125, 0.39044189453125, 0.468841552734375, 0.5472412109375, 0.625640869140625, 0.70404052734375, 0.782440185546875, 0.86083984375, 0.939239501953125, 1.01763916015625, 1.096038818359375, 1.1744384765625, 1.252838134765625, 1.33123779296875, 1.409637451171875, 1.488037109375, 1.566436767578125, 1.64483642578125, 1.723236083984375, 1.8016357421875, 1.880035400390625, 1.95843505859375, 2.036834716796875, 2.115234375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 11.0, 11.0, 13.0, 13.0, 25.0, 43.0, 45.0, 46.0, 49.0, 71.0, 55.0, 82.0, 92.0, 74.0, 77.0, 60.0, 53.0, 44.0, 46.0, 22.0, 22.0, 14.0, 11.0, 12.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.412353515625, -0.4012794494628906, -0.39020538330078125, -0.3791313171386719, -0.3680572509765625, -0.3569831848144531, -0.34590911865234375, -0.3348350524902344, -0.323760986328125, -0.3126869201660156, -0.30161285400390625, -0.2905387878417969, -0.2794647216796875, -0.2683906555175781, -0.25731658935546875, -0.24624252319335938, -0.23516845703125, -0.22409439086914062, -0.21302032470703125, -0.20194625854492188, -0.1908721923828125, -0.17979812622070312, -0.16872406005859375, -0.15764999389648438, -0.146575927734375, -0.13550186157226562, -0.12442779541015625, -0.11335372924804688, -0.1022796630859375, -0.09120559692382812, -0.08013153076171875, -0.06905746459960938, -0.0579833984375, -0.046909332275390625, -0.03583526611328125, -0.024761199951171875, -0.0136871337890625, -0.002613067626953125, 0.00846099853515625, 0.019535064697265625, 0.030609130859375, 0.041683197021484375, 0.05275726318359375, 0.06383132934570312, 0.0749053955078125, 0.08597946166992188, 0.09705352783203125, 0.10812759399414062, 0.11920166015625, 0.13027572631835938, 0.14134979248046875, 0.15242385864257812, 0.1634979248046875, 0.17457199096679688, 0.18564605712890625, 0.19672012329101562, 0.207794189453125, 0.21886825561523438, 0.22994232177734375, 0.24101638793945312, 0.2520904541015625, 0.2631645202636719, 0.27423858642578125, 0.2853126525878906, 0.29638671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 6.0, 8.0, 11.0, 21.0, 31.0, 36.0, 52.0, 110.0, 186.0, 386.0, 948.0, 2782.0, 10089.0, 54059.0, 419163.0, 480419.0, 63717.0, 11435.0, 3022.0, 1041.0, 444.0, 212.0, 98.0, 57.0, 50.0, 28.0, 21.0, 14.0, 15.0, 14.0, 10.0, 10.0, 7.0, 11.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5634765625, -1.517547607421875, -1.47161865234375, -1.425689697265625, -1.3797607421875, -1.333831787109375, -1.28790283203125, -1.241973876953125, -1.196044921875, -1.150115966796875, -1.10418701171875, -1.058258056640625, -1.0123291015625, -0.966400146484375, -0.92047119140625, -0.874542236328125, -0.82861328125, -0.782684326171875, -0.73675537109375, -0.690826416015625, -0.6448974609375, -0.598968505859375, -0.55303955078125, -0.507110595703125, -0.461181640625, -0.415252685546875, -0.36932373046875, -0.323394775390625, -0.2774658203125, -0.231536865234375, -0.18560791015625, -0.139678955078125, -0.09375, -0.047821044921875, -0.00189208984375, 0.044036865234375, 0.0899658203125, 0.135894775390625, 0.18182373046875, 0.227752685546875, 0.273681640625, 0.319610595703125, 0.36553955078125, 0.411468505859375, 0.4573974609375, 0.503326416015625, 0.54925537109375, 0.595184326171875, 0.64111328125, 0.687042236328125, 0.73297119140625, 0.778900146484375, 0.8248291015625, 0.870758056640625, 0.91668701171875, 0.962615966796875, 1.008544921875, 1.054473876953125, 1.10040283203125, 1.146331787109375, 1.1922607421875, 1.238189697265625, 1.28411865234375, 1.330047607421875, 1.3759765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 7.0, 3.0, 5.0, 11.0, 13.0, 15.0, 22.0, 28.0, 24.0, 27.0, 28.0, 30.0, 40.0, 54.0, 68.0, 48.0, 39.0, 70.0, 47.0, 74.0, 54.0, 48.0, 44.0, 38.0, 29.0, 20.0, 23.0, 16.0, 16.0, 15.0, 13.0, 5.0, 6.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.978515625, -0.9448089599609375, -0.911102294921875, -0.8773956298828125, -0.84368896484375, -0.8099822998046875, -0.776275634765625, -0.7425689697265625, -0.7088623046875, -0.6751556396484375, -0.641448974609375, -0.6077423095703125, -0.57403564453125, -0.5403289794921875, -0.506622314453125, -0.4729156494140625, -0.439208984375, -0.4055023193359375, -0.371795654296875, -0.3380889892578125, -0.30438232421875, -0.2706756591796875, -0.236968994140625, -0.2032623291015625, -0.1695556640625, -0.1358489990234375, -0.102142333984375, -0.0684356689453125, -0.03472900390625, -0.0010223388671875, 0.032684326171875, 0.0663909912109375, 0.10009765625, 0.1338043212890625, 0.167510986328125, 0.2012176513671875, 0.23492431640625, 0.2686309814453125, 0.302337646484375, 0.3360443115234375, 0.3697509765625, 0.4034576416015625, 0.437164306640625, 0.4708709716796875, 0.50457763671875, 0.5382843017578125, 0.571990966796875, 0.6056976318359375, 0.639404296875, 0.6731109619140625, 0.706817626953125, 0.7405242919921875, 0.77423095703125, 0.8079376220703125, 0.841644287109375, 0.8753509521484375, 0.9090576171875, 0.9427642822265625, 0.976470947265625, 1.0101776123046875, 1.04388427734375, 1.0775909423828125, 1.111297607421875, 1.1450042724609375, 1.1787109375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 7.0, 16.0, 44.0, 88.0, 209.0, 818.0, 17675.0, 1022860.0, 6027.0, 510.0, 158.0, 88.0, 28.0, 12.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.51171875, -3.3785400390625, -3.245361328125, -3.1121826171875, -2.97900390625, -2.8458251953125, -2.712646484375, -2.5794677734375, -2.4462890625, -2.3131103515625, -2.179931640625, -2.0467529296875, -1.91357421875, -1.7803955078125, -1.647216796875, -1.5140380859375, -1.380859375, -1.2476806640625, -1.114501953125, -0.9813232421875, -0.84814453125, -0.7149658203125, -0.581787109375, -0.4486083984375, -0.3154296875, -0.1822509765625, -0.049072265625, 0.0841064453125, 0.21728515625, 0.3504638671875, 0.483642578125, 0.6168212890625, 0.75, 0.8831787109375, 1.016357421875, 1.1495361328125, 1.28271484375, 1.4158935546875, 1.549072265625, 1.6822509765625, 1.8154296875, 1.9486083984375, 2.081787109375, 2.2149658203125, 2.34814453125, 2.4813232421875, 2.614501953125, 2.7476806640625, 2.880859375, 3.0140380859375, 3.147216796875, 3.2803955078125, 3.41357421875, 3.5467529296875, 3.679931640625, 3.8131103515625, 3.9462890625, 4.0794677734375, 4.212646484375, 4.3458251953125, 4.47900390625, 4.6121826171875, 4.745361328125, 4.8785400390625, 5.01171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 18.0, 22.0, 39.0, 72.0, 114.0, 167.0, 213.0, 135.0, 87.0, 42.0, 33.0, 22.0, 11.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002493858337402344, -0.00024287402629852295, -0.00023636221885681152, -0.0002298504114151001, -0.00022333860397338867, -0.00021682679653167725, -0.00021031498908996582, -0.0002038031816482544, -0.00019729137420654297, -0.00019077956676483154, -0.00018426775932312012, -0.0001777559518814087, -0.00017124414443969727, -0.00016473233699798584, -0.00015822052955627441, -0.000151708722114563, -0.00014519691467285156, -0.00013868510723114014, -0.0001321732997894287, -0.00012566149234771729, -0.00011914968490600586, -0.00011263787746429443, -0.00010612607002258301, -9.961426258087158e-05, -9.310245513916016e-05, -8.659064769744873e-05, -8.00788402557373e-05, -7.356703281402588e-05, -6.705522537231445e-05, -6.054341793060303e-05, -5.40316104888916e-05, -4.7519803047180176e-05, -4.100799560546875e-05, -3.4496188163757324e-05, -2.79843807220459e-05, -2.1472573280334473e-05, -1.4960765838623047e-05, -8.448958396911621e-06, -1.9371509552001953e-06, 4.5746564865112305e-06, 1.1086463928222656e-05, 1.7598271369934082e-05, 2.4110078811645508e-05, 3.0621886253356934e-05, 3.713369369506836e-05, 4.3645501136779785e-05, 5.015730857849121e-05, 5.666911602020264e-05, 6.318092346191406e-05, 6.969273090362549e-05, 7.620453834533691e-05, 8.271634578704834e-05, 8.922815322875977e-05, 9.573996067047119e-05, 0.00010225176811218262, 0.00010876357555389404, 0.00011527538299560547, 0.0001217871904373169, 0.00012829899787902832, 0.00013481080532073975, 0.00014132261276245117, 0.0001478344202041626, 0.00015434622764587402, 0.00016085803508758545, 0.00016736984252929688]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 20.0, 52.0, 80.0, 199.0, 621.0, 8565.0, 1030102.0, 7949.0, 623.0, 181.0, 69.0, 43.0, 24.0, 12.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.7421875, -4.6005859375, -4.458984375, -4.3173828125, -4.17578125, -4.0341796875, -3.892578125, -3.7509765625, -3.609375, -3.4677734375, -3.326171875, -3.1845703125, -3.04296875, -2.9013671875, -2.759765625, -2.6181640625, -2.4765625, -2.3349609375, -2.193359375, -2.0517578125, -1.91015625, -1.7685546875, -1.626953125, -1.4853515625, -1.34375, -1.2021484375, -1.060546875, -0.9189453125, -0.77734375, -0.6357421875, -0.494140625, -0.3525390625, -0.2109375, -0.0693359375, 0.072265625, 0.2138671875, 0.35546875, 0.4970703125, 0.638671875, 0.7802734375, 0.921875, 1.0634765625, 1.205078125, 1.3466796875, 1.48828125, 1.6298828125, 1.771484375, 1.9130859375, 2.0546875, 2.1962890625, 2.337890625, 2.4794921875, 2.62109375, 2.7626953125, 2.904296875, 3.0458984375, 3.1875, 3.3291015625, 3.470703125, 3.6123046875, 3.75390625, 3.8955078125, 4.037109375, 4.1787109375, 4.3203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 24.0, 96.0, 417.0, 339.0, 85.0, 26.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.513671875, -2.4324951171875, -2.351318359375, -2.2701416015625, -2.18896484375, -2.1077880859375, -2.026611328125, -1.9454345703125, -1.8642578125, -1.7830810546875, -1.701904296875, -1.6207275390625, -1.53955078125, -1.4583740234375, -1.377197265625, -1.2960205078125, -1.21484375, -1.1336669921875, -1.052490234375, -0.9713134765625, -0.89013671875, -0.8089599609375, -0.727783203125, -0.6466064453125, -0.5654296875, -0.4842529296875, -0.403076171875, -0.3218994140625, -0.24072265625, -0.1595458984375, -0.078369140625, 0.0028076171875, 0.083984375, 0.1651611328125, 0.246337890625, 0.3275146484375, 0.40869140625, 0.4898681640625, 0.571044921875, 0.6522216796875, 0.7333984375, 0.8145751953125, 0.895751953125, 0.9769287109375, 1.05810546875, 1.1392822265625, 1.220458984375, 1.3016357421875, 1.3828125, 1.4639892578125, 1.545166015625, 1.6263427734375, 1.70751953125, 1.7886962890625, 1.869873046875, 1.9510498046875, 2.0322265625, 2.1134033203125, 2.194580078125, 2.2757568359375, 2.35693359375, 2.4381103515625, 2.519287109375, 2.6004638671875, 2.681640625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 8.0, 26.0, 86.0, 277.0, 347.0, 171.0, 63.0, 17.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-37.4338264465332, -36.72834777832031, -36.02286911010742, -35.31739044189453, -34.61191177368164, -33.90643310546875, -33.200950622558594, -32.4954719543457, -31.789993286132812, -31.084514617919922, -30.37903594970703, -29.67355728149414, -28.968076705932617, -28.262598037719727, -27.557119369506836, -26.851640701293945, -26.146162033081055, -25.440683364868164, -24.735204696655273, -24.02972412109375, -23.32424545288086, -22.61876678466797, -21.913288116455078, -21.207809448242188, -20.502330780029297, -19.796852111816406, -19.091373443603516, -18.385894775390625, -17.6804141998291, -16.97493553161621, -16.26945686340332, -15.56397819519043, -14.858497619628906, -14.153018951416016, -13.447539329528809, -12.742060661315918, -12.036581039428711, -11.33110237121582, -10.62562370300293, -9.920145034790039, -9.214665412902832, -8.509186744689941, -7.803707122802734, -7.098228454589844, -6.392749309539795, -5.687270164489746, -4.9817914962768555, -4.276312351226807, -3.570833206176758, -2.865354061126709, -2.1598751544952393, -1.4543962478637695, -0.7489171028137207, -0.043437957763671875, 0.6620407104492188, 1.3675198554992676, 2.0729990005493164, 2.7784781455993652, 3.483957052230835, 4.189435958862305, 4.8949151039123535, 5.600394248962402, 6.305872917175293, 7.011352062225342, 7.716831207275391]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 3.0, 7.0, 6.0, 13.0, 17.0, 4.0, 13.0, 24.0, 17.0, 24.0, 27.0, 28.0, 30.0, 38.0, 43.0, 44.0, 50.0, 41.0, 38.0, 53.0, 36.0, 39.0, 44.0, 36.0, 36.0, 39.0, 34.0, 35.0, 27.0, 18.0, 18.0, 19.0, 16.0, 15.0, 7.0, 14.0, 11.0, 5.0, 6.0, 3.0, 3.0, 2.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.314615726470947, -5.158224582672119, -5.001832962036133, -4.845441818237305, -4.689050674438477, -4.532659530639648, -4.376267910003662, -4.219876766204834, -4.063485145568848, -3.9070937633514404, -3.7507026195526123, -3.594311237335205, -3.437920093536377, -3.2815287113189697, -3.1251373291015625, -2.9687461853027344, -2.8123550415039062, -2.655963659286499, -2.499572515487671, -2.3431811332702637, -2.1867899894714355, -2.0303986072540283, -1.874007225036621, -1.7176159620285034, -1.5612246990203857, -1.404833436012268, -1.2484421730041504, -1.0920507907867432, -0.9356595277786255, -0.7792682647705078, -0.6228769421577454, -0.4664856195449829, -0.31009387969970703, -0.15370258688926697, 0.0026887059211730957, 0.15907999873161316, 0.3154712915420532, 0.4718625545501709, 0.6282538771629333, 0.7846451997756958, 0.9410364627838135, 1.0974277257919312, 1.2538189888000488, 1.410210371017456, 1.5666016340255737, 1.7229928970336914, 1.8793842792510986, 2.035775661468506, 2.192166805267334, 2.348558187484741, 2.5049493312835693, 2.6613407135009766, 2.8177318572998047, 2.974123239517212, 3.130514621734619, 3.2869057655334473, 3.4432971477508545, 3.5996885299682617, 3.75607967376709, 3.912471055984497, 4.068862438201904, 4.225253582000732, 4.3816447257995605, 4.538036346435547, 4.694427490234375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 8.0, 11.0, 14.0, 18.0, 21.0, 35.0, 56.0, 74.0, 137.0, 215.0, 485.0, 1201.0, 3802.0, 16340.0, 201843.0, 3913791.0, 44584.0, 7808.0, 2276.0, 829.0, 335.0, 177.0, 88.0, 51.0, 31.0, 19.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.642578125, -3.554290771484375, -3.46600341796875, -3.377716064453125, -3.2894287109375, -3.201141357421875, -3.11285400390625, -3.024566650390625, -2.936279296875, -2.847991943359375, -2.75970458984375, -2.671417236328125, -2.5831298828125, -2.494842529296875, -2.40655517578125, -2.318267822265625, -2.22998046875, -2.141693115234375, -2.05340576171875, -1.965118408203125, -1.8768310546875, -1.788543701171875, -1.70025634765625, -1.611968994140625, -1.523681640625, -1.435394287109375, -1.34710693359375, -1.258819580078125, -1.1705322265625, -1.082244873046875, -0.99395751953125, -0.905670166015625, -0.8173828125, -0.729095458984375, -0.64080810546875, -0.552520751953125, -0.4642333984375, -0.375946044921875, -0.28765869140625, -0.199371337890625, -0.111083984375, -0.022796630859375, 0.06549072265625, 0.153778076171875, 0.2420654296875, 0.330352783203125, 0.41864013671875, 0.506927490234375, 0.59521484375, 0.683502197265625, 0.77178955078125, 0.860076904296875, 0.9483642578125, 1.036651611328125, 1.12493896484375, 1.213226318359375, 1.301513671875, 1.389801025390625, 1.47808837890625, 1.566375732421875, 1.6546630859375, 1.742950439453125, 1.83123779296875, 1.919525146484375, 2.0078125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 5.0, 13.0, 17.0, 21.0, 20.0, 21.0, 33.0, 42.0, 50.0, 67.0, 65.0, 57.0, 62.0, 68.0, 62.0, 70.0, 60.0, 61.0, 52.0, 30.0, 28.0, 29.0, 25.0, 11.0, 13.0, 8.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.440673828125, -0.42914581298828125, -0.4176177978515625, -0.40608978271484375, -0.394561767578125, -0.38303375244140625, -0.3715057373046875, -0.35997772216796875, -0.34844970703125, -0.33692169189453125, -0.3253936767578125, -0.31386566162109375, -0.302337646484375, -0.29080963134765625, -0.2792816162109375, -0.26775360107421875, -0.2562255859375, -0.24469757080078125, -0.2331695556640625, -0.22164154052734375, -0.210113525390625, -0.19858551025390625, -0.1870574951171875, -0.17552947998046875, -0.16400146484375, -0.15247344970703125, -0.1409454345703125, -0.12941741943359375, -0.117889404296875, -0.10636138916015625, -0.0948333740234375, -0.08330535888671875, -0.07177734375, -0.06024932861328125, -0.0487213134765625, -0.03719329833984375, -0.025665283203125, -0.01413726806640625, -0.0026092529296875, 0.00891876220703125, 0.02044677734375, 0.03197479248046875, 0.0435028076171875, 0.05503082275390625, 0.066558837890625, 0.07808685302734375, 0.0896148681640625, 0.10114288330078125, 0.1126708984375, 0.12419891357421875, 0.1357269287109375, 0.14725494384765625, 0.158782958984375, 0.17031097412109375, 0.1818389892578125, 0.19336700439453125, 0.20489501953125, 0.21642303466796875, 0.2279510498046875, 0.23947906494140625, 0.251007080078125, 0.26253509521484375, 0.2740631103515625, 0.28559112548828125, 0.297119140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 0.0, 11.0, 11.0, 11.0, 19.0, 44.0, 62.0, 82.0, 107.0, 152.0, 256.0, 636.0, 2453.0, 26626.0, 4112781.0, 46305.0, 3125.0, 748.0, 299.0, 165.0, 120.0, 84.0, 71.0, 44.0, 23.0, 25.0, 13.0, 10.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69921875, -5.52423095703125, -5.3492431640625, -5.17425537109375, -4.999267578125, -4.82427978515625, -4.6492919921875, -4.47430419921875, -4.29931640625, -4.12432861328125, -3.9493408203125, -3.77435302734375, -3.599365234375, -3.42437744140625, -3.2493896484375, -3.07440185546875, -2.8994140625, -2.72442626953125, -2.5494384765625, -2.37445068359375, -2.199462890625, -2.02447509765625, -1.8494873046875, -1.67449951171875, -1.49951171875, -1.32452392578125, -1.1495361328125, -0.97454833984375, -0.799560546875, -0.62457275390625, -0.4495849609375, -0.27459716796875, -0.099609375, 0.07537841796875, 0.2503662109375, 0.42535400390625, 0.600341796875, 0.77532958984375, 0.9503173828125, 1.12530517578125, 1.30029296875, 1.47528076171875, 1.6502685546875, 1.82525634765625, 2.000244140625, 2.17523193359375, 2.3502197265625, 2.52520751953125, 2.7001953125, 2.87518310546875, 3.0501708984375, 3.22515869140625, 3.400146484375, 3.57513427734375, 3.7501220703125, 3.92510986328125, 4.10009765625, 4.27508544921875, 4.4500732421875, 4.62506103515625, 4.800048828125, 4.97503662109375, 5.1500244140625, 5.32501220703125, 5.5]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 14.0, 38.0, 130.0, 2249.0, 1502.0, 91.0, 32.0, 13.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.930389404296875, -1.85882568359375, -1.787261962890625, -1.7156982421875, -1.644134521484375, -1.57257080078125, -1.501007080078125, -1.429443359375, -1.357879638671875, -1.28631591796875, -1.214752197265625, -1.1431884765625, -1.071624755859375, -1.00006103515625, -0.928497314453125, -0.85693359375, -0.785369873046875, -0.71380615234375, -0.642242431640625, -0.5706787109375, -0.499114990234375, -0.42755126953125, -0.355987548828125, -0.284423828125, -0.212860107421875, -0.14129638671875, -0.069732666015625, 0.0018310546875, 0.073394775390625, 0.14495849609375, 0.216522216796875, 0.2880859375, 0.359649658203125, 0.43121337890625, 0.502777099609375, 0.5743408203125, 0.645904541015625, 0.71746826171875, 0.789031982421875, 0.860595703125, 0.932159423828125, 1.00372314453125, 1.075286865234375, 1.1468505859375, 1.218414306640625, 1.28997802734375, 1.361541748046875, 1.43310546875, 1.504669189453125, 1.57623291015625, 1.647796630859375, 1.7193603515625, 1.790924072265625, 1.86248779296875, 1.934051513671875, 2.005615234375, 2.077178955078125, 2.14874267578125, 2.220306396484375, 2.2918701171875, 2.363433837890625, 2.43499755859375, 2.506561279296875, 2.578125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 6.0, 15.0, 22.0, 49.0, 141.0, 279.0, 247.0, 123.0, 66.0, 29.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.467264175415039, -6.251947402954102, -6.036631107330322, -5.821314334869385, -5.6059980392456055, -5.390681266784668, -5.175364971160889, -4.960048198699951, -4.744731903076172, -4.529415130615234, -4.314098834991455, -4.098782062530518, -3.8834657669067383, -3.668148994445801, -3.4528326988220215, -3.237515926361084, -3.0221993923187256, -2.806882858276367, -2.591566324234009, -2.3762497901916504, -2.160933256149292, -1.945616602897644, -1.7303000688552856, -1.5149835348129272, -1.2996670007705688, -1.0843504667282104, -0.869033932685852, -0.6537173390388489, -0.4384008049964905, -0.2230842113494873, -0.007767677307128906, 0.2075488567352295, 0.4228653907775879, 0.6381819248199463, 0.8534984588623047, 1.068814992904663, 1.2841315269470215, 1.4994481801986694, 1.7147647142410278, 1.9300812482833862, 2.145397663116455, 2.3607141971588135, 2.576030731201172, 2.7913472652435303, 3.0066637992858887, 3.221980571746826, 3.4372968673706055, 3.652613639831543, 3.8679301738739014, 4.08324670791626, 4.298563480377197, 4.513879776000977, 4.729196548461914, 4.944512844085693, 5.159829616546631, 5.37514591217041, 5.590462684631348, 5.805779457092285, 6.0210957527160645, 6.236412525177002, 6.451728820800781, 6.667045593261719, 6.882361888885498, 7.0976786613464355, 7.312994956970215]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 21.0, 33.0, 62.0, 83.0, 103.0, 117.0, 118.0, 126.0, 103.0, 77.0, 50.0, 27.0, 31.0, 21.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5036702156066895, -5.349239349365234, -5.194808006286621, -5.040376663208008, -4.885945796966553, -4.731514930725098, -4.577083587646484, -4.422652244567871, -4.268221378326416, -4.113790512084961, -3.9593591690063477, -3.8049280643463135, -3.6504969596862793, -3.496065855026245, -3.341634750366211, -3.1872036457061768, -3.0327725410461426, -2.8783414363861084, -2.723910331726074, -2.56947922706604, -2.415048122406006, -2.2606170177459717, -2.1061859130859375, -1.9517548084259033, -1.7973237037658691, -1.642892599105835, -1.4884614944458008, -1.3340303897857666, -1.1795992851257324, -1.0251681804656982, -0.8707370758056641, -0.7163059711456299, -0.5618753433227539, -0.4074442386627197, -0.25301313400268555, -0.09858202934265137, 0.05584907531738281, 0.210280179977417, 0.36471128463745117, 0.5191423892974854, 0.6735734939575195, 0.8280045986175537, 0.9824357032775879, 1.136866807937622, 1.2912979125976562, 1.4457290172576904, 1.6001601219177246, 1.7545912265777588, 1.909022331237793, 2.063453435897827, 2.2178845405578613, 2.3723156452178955, 2.5267467498779297, 2.681177854537964, 2.835608959197998, 2.9900400638580322, 3.1444711685180664, 3.2989022731781006, 3.4533333778381348, 3.607764482498169, 3.762195587158203, 3.9166266918182373, 4.0710577964782715, 4.225488662719727, 4.37992000579834]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 1.0, 10.0, 18.0, 27.0, 32.0, 68.0, 144.0, 266.0, 818.0, 3570.0, 35419.0, 774144.0, 220485.0, 10932.0, 1678.0, 497.0, 188.0, 105.0, 56.0, 29.0, 22.0, 15.0, 7.0, 9.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.5703125, -4.460906982421875, -4.35150146484375, -4.242095947265625, -4.1326904296875, -4.023284912109375, -3.91387939453125, -3.804473876953125, -3.695068359375, -3.585662841796875, -3.47625732421875, -3.366851806640625, -3.2574462890625, -3.148040771484375, -3.03863525390625, -2.929229736328125, -2.81982421875, -2.710418701171875, -2.60101318359375, -2.491607666015625, -2.3822021484375, -2.272796630859375, -2.16339111328125, -2.053985595703125, -1.944580078125, -1.835174560546875, -1.72576904296875, -1.616363525390625, -1.5069580078125, -1.397552490234375, -1.28814697265625, -1.178741455078125, -1.0693359375, -0.959930419921875, -0.85052490234375, -0.741119384765625, -0.6317138671875, -0.522308349609375, -0.41290283203125, -0.303497314453125, -0.194091796875, -0.084686279296875, 0.02471923828125, 0.134124755859375, 0.2435302734375, 0.352935791015625, 0.46234130859375, 0.571746826171875, 0.68115234375, 0.790557861328125, 0.89996337890625, 1.009368896484375, 1.1187744140625, 1.228179931640625, 1.33758544921875, 1.446990966796875, 1.556396484375, 1.665802001953125, 1.77520751953125, 1.884613037109375, 1.9940185546875, 2.103424072265625, 2.21282958984375, 2.322235107421875, 2.431640625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 11.0, 20.0, 18.0, 21.0, 41.0, 58.0, 69.0, 77.0, 82.0, 85.0, 85.0, 74.0, 75.0, 63.0, 63.0, 31.0, 34.0, 25.0, 23.0, 17.0, 8.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.59326171875, -0.5784912109375, -0.563720703125, -0.5489501953125, -0.5341796875, -0.5194091796875, -0.504638671875, -0.4898681640625, -0.47509765625, -0.4603271484375, -0.445556640625, -0.4307861328125, -0.416015625, -0.4012451171875, -0.386474609375, -0.3717041015625, -0.35693359375, -0.3421630859375, -0.327392578125, -0.3126220703125, -0.2978515625, -0.2830810546875, -0.268310546875, -0.2535400390625, -0.23876953125, -0.2239990234375, -0.209228515625, -0.1944580078125, -0.1796875, -0.1649169921875, -0.150146484375, -0.1353759765625, -0.12060546875, -0.1058349609375, -0.091064453125, -0.0762939453125, -0.0615234375, -0.0467529296875, -0.031982421875, -0.0172119140625, -0.00244140625, 0.0123291015625, 0.027099609375, 0.0418701171875, 0.056640625, 0.0714111328125, 0.086181640625, 0.1009521484375, 0.11572265625, 0.1304931640625, 0.145263671875, 0.1600341796875, 0.1748046875, 0.1895751953125, 0.204345703125, 0.2191162109375, 0.23388671875, 0.2486572265625, 0.263427734375, 0.2781982421875, 0.29296875, 0.3077392578125, 0.322509765625, 0.3372802734375, 0.35205078125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 5.0, 10.0, 17.0, 17.0, 9.0, 30.0, 29.0, 53.0, 73.0, 144.0, 259.0, 722.0, 2454.0, 10843.0, 66950.0, 488243.0, 411068.0, 55003.0, 9162.0, 2194.0, 653.0, 254.0, 120.0, 76.0, 46.0, 29.0, 18.0, 12.0, 10.0, 12.0, 10.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.31927490234375, -1.2684326171875, -1.21759033203125, -1.166748046875, -1.11590576171875, -1.0650634765625, -1.01422119140625, -0.96337890625, -0.91253662109375, -0.8616943359375, -0.81085205078125, -0.760009765625, -0.70916748046875, -0.6583251953125, -0.60748291015625, -0.556640625, -0.50579833984375, -0.4549560546875, -0.40411376953125, -0.353271484375, -0.30242919921875, -0.2515869140625, -0.20074462890625, -0.14990234375, -0.09906005859375, -0.0482177734375, 0.00262451171875, 0.053466796875, 0.10430908203125, 0.1551513671875, 0.20599365234375, 0.2568359375, 0.30767822265625, 0.3585205078125, 0.40936279296875, 0.460205078125, 0.51104736328125, 0.5618896484375, 0.61273193359375, 0.66357421875, 0.71441650390625, 0.7652587890625, 0.81610107421875, 0.866943359375, 0.91778564453125, 0.9686279296875, 1.01947021484375, 1.0703125, 1.12115478515625, 1.1719970703125, 1.22283935546875, 1.273681640625, 1.32452392578125, 1.3753662109375, 1.42620849609375, 1.47705078125, 1.52789306640625, 1.5787353515625, 1.62957763671875, 1.680419921875, 1.73126220703125, 1.7821044921875, 1.83294677734375, 1.8837890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 8.0, 10.0, 11.0, 8.0, 20.0, 19.0, 25.0, 30.0, 30.0, 32.0, 44.0, 35.0, 34.0, 53.0, 39.0, 47.0, 44.0, 59.0, 41.0, 49.0, 35.0, 37.0, 38.0, 38.0, 29.0, 21.0, 32.0, 23.0, 17.0, 22.0, 6.0, 16.0, 10.0, 7.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93408203125, -0.9002914428710938, -0.8665008544921875, -0.8327102661132812, -0.798919677734375, -0.7651290893554688, -0.7313385009765625, -0.6975479125976562, -0.66375732421875, -0.6299667358398438, -0.5961761474609375, -0.5623855590820312, -0.528594970703125, -0.49480438232421875, -0.4610137939453125, -0.42722320556640625, -0.3934326171875, -0.35964202880859375, -0.3258514404296875, -0.29206085205078125, -0.258270263671875, -0.22447967529296875, -0.1906890869140625, -0.15689849853515625, -0.12310791015625, -0.08931732177734375, -0.0555267333984375, -0.02173614501953125, 0.012054443359375, 0.04584503173828125, 0.0796356201171875, 0.11342620849609375, 0.147216796875, 0.18100738525390625, 0.2147979736328125, 0.24858856201171875, 0.282379150390625, 0.31616973876953125, 0.3499603271484375, 0.38375091552734375, 0.41754150390625, 0.45133209228515625, 0.4851226806640625, 0.5189132690429688, 0.552703857421875, 0.5864944458007812, 0.6202850341796875, 0.6540756225585938, 0.6878662109375, 0.7216567993164062, 0.7554473876953125, 0.7892379760742188, 0.823028564453125, 0.8568191528320312, 0.8906097412109375, 0.9244003295898438, 0.95819091796875, 0.9919815063476562, 1.0257720947265625, 1.0595626831054688, 1.093353271484375, 1.1271438598632812, 1.1609344482421875, 1.1947250366210938, 1.228515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 9.0, 12.0, 12.0, 23.0, 27.0, 45.0, 79.0, 168.0, 293.0, 620.0, 1551.0, 4887.0, 24093.0, 206654.0, 667490.0, 120611.0, 15813.0, 3740.0, 1288.0, 539.0, 271.0, 137.0, 80.0, 40.0, 27.0, 17.0, 8.0, 9.0, 2.0, 8.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.515625, -0.49745941162109375, -0.4792938232421875, -0.46112823486328125, -0.442962646484375, -0.42479705810546875, -0.4066314697265625, -0.38846588134765625, -0.37030029296875, -0.35213470458984375, -0.3339691162109375, -0.31580352783203125, -0.297637939453125, -0.27947235107421875, -0.2613067626953125, -0.24314117431640625, -0.2249755859375, -0.20680999755859375, -0.1886444091796875, -0.17047882080078125, -0.152313232421875, -0.13414764404296875, -0.1159820556640625, -0.09781646728515625, -0.07965087890625, -0.06148529052734375, -0.0433197021484375, -0.02515411376953125, -0.006988525390625, 0.01117706298828125, 0.0293426513671875, 0.04750823974609375, 0.065673828125, 0.08383941650390625, 0.1020050048828125, 0.12017059326171875, 0.138336181640625, 0.15650177001953125, 0.1746673583984375, 0.19283294677734375, 0.21099853515625, 0.22916412353515625, 0.2473297119140625, 0.26549530029296875, 0.283660888671875, 0.30182647705078125, 0.3199920654296875, 0.33815765380859375, 0.3563232421875, 0.37448883056640625, 0.3926544189453125, 0.41082000732421875, 0.428985595703125, 0.44715118408203125, 0.4653167724609375, 0.48348236083984375, 0.50164794921875, 0.5198135375976562, 0.5379791259765625, 0.5561447143554688, 0.574310302734375, 0.5924758911132812, 0.6106414794921875, 0.6288070678710938, 0.64697265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 9.0, 8.0, 17.0, 16.0, 32.0, 39.0, 51.0, 82.0, 125.0, 153.0, 138.0, 96.0, 81.0, 49.0, 34.0, 16.0, 17.0, 11.0, 10.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015926361083984375, -0.00015561282634735107, -0.0001519620418548584, -0.00014831125736236572, -0.00014466047286987305, -0.00014100968837738037, -0.0001373589038848877, -0.00013370811939239502, -0.00013005733489990234, -0.00012640655040740967, -0.000122755765914917, -0.00011910498142242432, -0.00011545419692993164, -0.00011180341243743896, -0.00010815262794494629, -0.00010450184345245361, -0.00010085105895996094, -9.720027446746826e-05, -9.354948997497559e-05, -8.989870548248291e-05, -8.624792098999023e-05, -8.259713649749756e-05, -7.894635200500488e-05, -7.529556751251221e-05, -7.164478302001953e-05, -6.799399852752686e-05, -6.434321403503418e-05, -6.0692429542541504e-05, -5.704164505004883e-05, -5.339086055755615e-05, -4.9740076065063477e-05, -4.60892915725708e-05, -4.2438507080078125e-05, -3.878772258758545e-05, -3.5136938095092773e-05, -3.14861536026001e-05, -2.7835369110107422e-05, -2.4184584617614746e-05, -2.053380012512207e-05, -1.6883015632629395e-05, -1.3232231140136719e-05, -9.581446647644043e-06, -5.930662155151367e-06, -2.2798776626586914e-06, 1.3709068298339844e-06, 5.02169132232666e-06, 8.672475814819336e-06, 1.2323260307312012e-05, 1.5974044799804688e-05, 1.9624829292297363e-05, 2.327561378479004e-05, 2.6926398277282715e-05, 3.057718276977539e-05, 3.4227967262268066e-05, 3.787875175476074e-05, 4.152953624725342e-05, 4.5180320739746094e-05, 4.883110523223877e-05, 5.2481889724731445e-05, 5.613267421722412e-05, 5.97834587097168e-05, 6.343424320220947e-05, 6.708502769470215e-05, 7.073581218719482e-05, 7.43865966796875e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 5.0, 10.0, 5.0, 10.0, 20.0, 33.0, 70.0, 161.0, 364.0, 1170.0, 4589.0, 30293.0, 412589.0, 551910.0, 39579.0, 5544.0, 1354.0, 488.0, 171.0, 77.0, 49.0, 23.0, 15.0, 9.0, 3.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.0126953125, -0.9891777038574219, -0.9656600952148438, -0.9421424865722656, -0.9186248779296875, -0.8951072692871094, -0.8715896606445312, -0.8480720520019531, -0.824554443359375, -0.8010368347167969, -0.7775192260742188, -0.7540016174316406, -0.7304840087890625, -0.7069664001464844, -0.6834487915039062, -0.6599311828613281, -0.63641357421875, -0.6128959655761719, -0.5893783569335938, -0.5658607482910156, -0.5423431396484375, -0.5188255310058594, -0.49530792236328125, -0.4717903137207031, -0.448272705078125, -0.4247550964355469, -0.40123748779296875, -0.3777198791503906, -0.3542022705078125, -0.3306846618652344, -0.30716705322265625, -0.2836494445800781, -0.2601318359375, -0.23661422729492188, -0.21309661865234375, -0.18957901000976562, -0.1660614013671875, -0.14254379272460938, -0.11902618408203125, -0.09550857543945312, -0.071990966796875, -0.048473358154296875, -0.02495574951171875, -0.001438140869140625, 0.0220794677734375, 0.045597076416015625, 0.06911468505859375, 0.09263229370117188, 0.11614990234375, 0.13966751098632812, 0.16318511962890625, 0.18670272827148438, 0.2102203369140625, 0.23373794555664062, 0.25725555419921875, 0.2807731628417969, 0.304290771484375, 0.3278083801269531, 0.35132598876953125, 0.3748435974121094, 0.3983612060546875, 0.4218788146972656, 0.44539642333984375, 0.4689140319824219, 0.492431640625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 5.0, 17.0, 12.0, 15.0, 25.0, 22.0, 49.0, 71.0, 86.0, 116.0, 114.0, 112.0, 99.0, 69.0, 55.0, 30.0, 30.0, 18.0, 15.0, 11.0, 11.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.533203125, -0.5189895629882812, -0.5047760009765625, -0.49056243896484375, -0.476348876953125, -0.46213531494140625, -0.4479217529296875, -0.43370819091796875, -0.41949462890625, -0.40528106689453125, -0.3910675048828125, -0.37685394287109375, -0.362640380859375, -0.34842681884765625, -0.3342132568359375, -0.31999969482421875, -0.3057861328125, -0.29157257080078125, -0.2773590087890625, -0.26314544677734375, -0.248931884765625, -0.23471832275390625, -0.2205047607421875, -0.20629119873046875, -0.19207763671875, -0.17786407470703125, -0.1636505126953125, -0.14943695068359375, -0.135223388671875, -0.12100982666015625, -0.1067962646484375, -0.09258270263671875, -0.078369140625, -0.06415557861328125, -0.0499420166015625, -0.03572845458984375, -0.021514892578125, -0.00730133056640625, 0.0069122314453125, 0.02112579345703125, 0.03533935546875, 0.04955291748046875, 0.0637664794921875, 0.07798004150390625, 0.092193603515625, 0.10640716552734375, 0.1206207275390625, 0.13483428955078125, 0.1490478515625, 0.16326141357421875, 0.1774749755859375, 0.19168853759765625, 0.205902099609375, 0.22011566162109375, 0.2343292236328125, 0.24854278564453125, 0.26275634765625, 0.27696990966796875, 0.2911834716796875, 0.30539703369140625, 0.319610595703125, 0.33382415771484375, 0.3480377197265625, 0.36225128173828125, 0.37646484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 13.0, 24.0, 43.0, 83.0, 110.0, 169.0, 162.0, 141.0, 121.0, 58.0, 39.0, 17.0, 5.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.583742618560791, -5.280097007751465, -4.976451396942139, -4.6728057861328125, -4.369159698486328, -4.06551456451416, -3.761868476867676, -3.4582228660583496, -3.1545772552490234, -2.8509316444396973, -2.547286033630371, -2.243640184402466, -1.9399945735931396, -1.6363489627838135, -1.3327032327651978, -1.029057502746582, -0.7254118919372559, -0.4217662215232849, -0.11812055110931396, 0.18552511930465698, 0.48917078971862793, 0.7928164005279541, 1.0964621305465698, 1.4001078605651855, 1.7037534713745117, 2.007399082183838, 2.311044692993164, 2.6146905422210693, 2.9183361530303955, 3.2219817638397217, 3.525627613067627, 3.829273223876953, 4.1329193115234375, 4.436564922332764, 4.74021053314209, 5.043856143951416, 5.347501754760742, 5.651147842407227, 5.954793453216553, 6.258439064025879, 6.562084674835205, 6.865730285644531, 7.169375896453857, 7.473021507263184, 7.776667594909668, 8.080312728881836, 8.38395881652832, 8.687604904174805, 8.991250038146973, 9.294896125793457, 9.598541259765625, 9.90218734741211, 10.205832481384277, 10.509478569030762, 10.81312370300293, 11.116769790649414, 11.420415878295898, 11.724061965942383, 12.02770709991455, 12.331353187561035, 12.634998321533203, 12.938644409179688, 13.242289543151855, 13.54593563079834, 13.849580764770508]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 7.0, 1.0, 8.0, 11.0, 14.0, 6.0, 8.0, 11.0, 16.0, 17.0, 15.0, 26.0, 27.0, 23.0, 21.0, 34.0, 27.0, 22.0, 29.0, 44.0, 36.0, 25.0, 45.0, 42.0, 42.0, 34.0, 40.0, 44.0, 29.0, 30.0, 27.0, 28.0, 25.0, 23.0, 21.0, 20.0, 15.0, 24.0, 13.0, 14.0, 5.0, 6.0, 13.0, 8.0, 4.0, 7.0, 8.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.377024173736572, -4.24040412902832, -4.103784084320068, -3.9671640396118164, -3.8305439949035645, -3.6939239501953125, -3.5573041439056396, -3.4206840991973877, -3.2840640544891357, -3.147444009780884, -3.010823965072632, -2.87420392036438, -2.737584114074707, -2.600964069366455, -2.464344024658203, -2.327723979949951, -2.191103935241699, -2.0544838905334473, -1.9178638458251953, -1.781243920326233, -1.644623875617981, -1.508003830909729, -1.3713839054107666, -1.2347638607025146, -1.0981438159942627, -0.9615237712860107, -0.8249037861824036, -0.6882838010787964, -0.5516637563705444, -0.4150437116622925, -0.2784237265586853, -0.14180374145507812, -0.005184173583984375, 0.1314358413219452, 0.26805585622787476, 0.4046758711338043, 0.5412958860397339, 0.6779159307479858, 0.814535915851593, 0.9511559009552002, 1.0877759456634521, 1.224395990371704, 1.361016035079956, 1.4976359605789185, 1.6342560052871704, 1.7708760499954224, 1.9074959754943848, 2.0441160202026367, 2.1807360649108887, 2.3173561096191406, 2.4539761543273926, 2.5905961990356445, 2.7272162437438965, 2.8638362884521484, 3.0004560947418213, 3.1370761394500732, 3.273696184158325, 3.410316228866577, 3.546936273574829, 3.683556318283081, 3.820176124572754, 3.956796169281006, 4.093416213989258, 4.23003625869751, 4.366656303405762]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 4.0, 7.0, 5.0, 15.0, 14.0, 13.0, 13.0, 23.0, 28.0, 38.0, 44.0, 69.0, 111.0, 163.0, 279.0, 555.0, 1147.0, 2822.0, 8206.0, 30196.0, 844059.0, 3257799.0, 33665.0, 8948.0, 3219.0, 1404.0, 625.0, 320.0, 196.0, 98.0, 72.0, 39.0, 34.0, 17.0, 12.0, 4.0, 9.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.237884521484375, -4.13201904296875, -4.026153564453125, -3.9202880859375, -3.814422607421875, -3.70855712890625, -3.602691650390625, -3.496826171875, -3.390960693359375, -3.28509521484375, -3.179229736328125, -3.0733642578125, -2.967498779296875, -2.86163330078125, -2.755767822265625, -2.64990234375, -2.544036865234375, -2.43817138671875, -2.332305908203125, -2.2264404296875, -2.120574951171875, -2.01470947265625, -1.908843994140625, -1.802978515625, -1.697113037109375, -1.59124755859375, -1.485382080078125, -1.3795166015625, -1.273651123046875, -1.16778564453125, -1.061920166015625, -0.9560546875, -0.850189208984375, -0.74432373046875, -0.638458251953125, -0.5325927734375, -0.426727294921875, -0.32086181640625, -0.214996337890625, -0.109130859375, -0.003265380859375, 0.10260009765625, 0.208465576171875, 0.3143310546875, 0.420196533203125, 0.52606201171875, 0.631927490234375, 0.73779296875, 0.843658447265625, 0.94952392578125, 1.055389404296875, 1.1612548828125, 1.267120361328125, 1.37298583984375, 1.478851318359375, 1.584716796875, 1.690582275390625, 1.79644775390625, 1.902313232421875, 2.0081787109375, 2.114044189453125, 2.21990966796875, 2.325775146484375, 2.431640625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 8.0, 8.0, 11.0, 9.0, 21.0, 20.0, 20.0, 43.0, 45.0, 60.0, 60.0, 69.0, 71.0, 73.0, 81.0, 60.0, 62.0, 59.0, 54.0, 32.0, 42.0, 35.0, 15.0, 14.0, 14.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.5498046875, -0.5359840393066406, -0.5221633911132812, -0.5083427429199219, -0.4945220947265625, -0.4807014465332031, -0.46688079833984375, -0.4530601501464844, -0.439239501953125, -0.4254188537597656, -0.41159820556640625, -0.3977775573730469, -0.3839569091796875, -0.3701362609863281, -0.35631561279296875, -0.3424949645996094, -0.32867431640625, -0.3148536682128906, -0.30103302001953125, -0.2872123718261719, -0.2733917236328125, -0.2595710754394531, -0.24575042724609375, -0.23192977905273438, -0.218109130859375, -0.20428848266601562, -0.19046783447265625, -0.17664718627929688, -0.1628265380859375, -0.14900588989257812, -0.13518524169921875, -0.12136459350585938, -0.1075439453125, -0.09372329711914062, -0.07990264892578125, -0.06608200073242188, -0.0522613525390625, -0.038440704345703125, -0.02462005615234375, -0.010799407958984375, 0.003021240234375, 0.016841888427734375, 0.03066253662109375, 0.044483184814453125, 0.0583038330078125, 0.07212448120117188, 0.08594512939453125, 0.09976577758789062, 0.11358642578125, 0.12740707397460938, 0.14122772216796875, 0.15504837036132812, 0.1688690185546875, 0.18268966674804688, 0.19651031494140625, 0.21033096313476562, 0.224151611328125, 0.23797225952148438, 0.25179290771484375, 0.2656135559082031, 0.2794342041015625, 0.2932548522949219, 0.30707550048828125, 0.3208961486816406, 0.334716796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 16.0, 6.0, 17.0, 31.0, 30.0, 42.0, 48.0, 79.0, 94.0, 119.0, 172.0, 251.0, 289.0, 485.0, 806.0, 1553.0, 3364.0, 8745.0, 31024.0, 252845.0, 3766816.0, 96374.0, 18960.0, 6149.0, 2509.0, 1264.0, 707.0, 400.0, 279.0, 198.0, 147.0, 96.0, 100.0, 70.0, 49.0, 35.0, 26.0, 18.0, 15.0, 9.0, 8.0, 8.0, 6.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.04736328125, -1.9775390625, -1.90771484375, -1.837890625, -1.76806640625, -1.6982421875, -1.62841796875, -1.55859375, -1.48876953125, -1.4189453125, -1.34912109375, -1.279296875, -1.20947265625, -1.1396484375, -1.06982421875, -1.0, -0.93017578125, -0.8603515625, -0.79052734375, -0.720703125, -0.65087890625, -0.5810546875, -0.51123046875, -0.44140625, -0.37158203125, -0.3017578125, -0.23193359375, -0.162109375, -0.09228515625, -0.0224609375, 0.04736328125, 0.1171875, 0.18701171875, 0.2568359375, 0.32666015625, 0.396484375, 0.46630859375, 0.5361328125, 0.60595703125, 0.67578125, 0.74560546875, 0.8154296875, 0.88525390625, 0.955078125, 1.02490234375, 1.0947265625, 1.16455078125, 1.234375, 1.30419921875, 1.3740234375, 1.44384765625, 1.513671875, 1.58349609375, 1.6533203125, 1.72314453125, 1.79296875, 1.86279296875, 1.9326171875, 2.00244140625, 2.072265625, 2.14208984375, 2.2119140625, 2.28173828125, 2.3515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 12.0, 10.0, 21.0, 29.0, 62.0, 174.0, 839.0, 2488.0, 223.0, 92.0, 45.0, 25.0, 13.0, 10.0, 6.0, 4.0, 5.0, 5.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.201171875, -1.1660003662109375, -1.130828857421875, -1.0956573486328125, -1.06048583984375, -1.0253143310546875, -0.990142822265625, -0.9549713134765625, -0.9197998046875, -0.8846282958984375, -0.849456787109375, -0.8142852783203125, -0.77911376953125, -0.7439422607421875, -0.708770751953125, -0.6735992431640625, -0.638427734375, -0.6032562255859375, -0.568084716796875, -0.5329132080078125, -0.49774169921875, -0.4625701904296875, -0.427398681640625, -0.3922271728515625, -0.3570556640625, -0.3218841552734375, -0.286712646484375, -0.2515411376953125, -0.21636962890625, -0.1811981201171875, -0.146026611328125, -0.1108551025390625, -0.07568359375, -0.0405120849609375, -0.005340576171875, 0.0298309326171875, 0.06500244140625, 0.1001739501953125, 0.135345458984375, 0.1705169677734375, 0.2056884765625, 0.2408599853515625, 0.276031494140625, 0.3112030029296875, 0.34637451171875, 0.3815460205078125, 0.416717529296875, 0.4518890380859375, 0.487060546875, 0.5222320556640625, 0.557403564453125, 0.5925750732421875, 0.62774658203125, 0.6629180908203125, 0.698089599609375, 0.7332611083984375, 0.7684326171875, 0.8036041259765625, 0.838775634765625, 0.8739471435546875, 0.90911865234375, 0.9442901611328125, 0.979461669921875, 1.0146331787109375, 1.0498046875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 8.0, 16.0, 33.0, 97.0, 300.0, 352.0, 145.0, 35.0, 12.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.955515384674072, -6.655892372131348, -6.356269359588623, -6.056646347045898, -5.757023811340332, -5.457400798797607, -5.157777786254883, -4.858155250549316, -4.558531761169434, -4.258908748626709, -3.9592859745025635, -3.659662961959839, -3.3600401878356934, -3.0604171752929688, -2.760794162750244, -2.4611713886260986, -2.161548614501953, -1.861925721168518, -1.562302827835083, -1.2626798152923584, -0.9630569219589233, -0.6634340286254883, -0.36381101608276367, -0.06418824195861816, 0.23543477058410645, 0.5350576639175415, 0.8346806168556213, 1.1343035697937012, 1.4339264631271362, 1.7335493564605713, 2.033172369003296, 2.3327951431274414, 2.632417678833008, 2.9320406913757324, 3.231663465499878, 3.5312864780426025, 3.830909252166748, 4.130532264709473, 4.430155277252197, 4.729778289794922, 5.029400825500488, 5.329023838043213, 5.6286468505859375, 5.928269386291504, 6.2278923988342285, 6.527515411376953, 6.827138423919678, 7.126761436462402, 7.426384449005127, 7.726007461547852, 8.025629997253418, 8.3252534866333, 8.624876022338867, 8.92449951171875, 9.224122047424316, 9.523744583129883, 9.823368072509766, 10.122990608215332, 10.422614097595215, 10.722236633300781, 11.021860122680664, 11.32148265838623, 11.621105194091797, 11.92072868347168, 12.220351219177246]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 13.0, 17.0, 17.0, 24.0, 38.0, 47.0, 71.0, 65.0, 70.0, 85.0, 87.0, 86.0, 84.0, 70.0, 53.0, 56.0, 26.0, 34.0, 16.0, 12.0, 5.0, 0.0, 5.0, 3.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.753364086151123, -3.634342670440674, -3.5153210163116455, -3.3962996006011963, -3.277278184890747, -3.1582565307617188, -3.0392351150512695, -2.9202136993408203, -2.801192283630371, -2.682170867919922, -2.5631492137908936, -2.4441277980804443, -2.325106382369995, -2.206084728240967, -2.0870633125305176, -1.9680418968200684, -1.8490203619003296, -1.7299988269805908, -1.6109774112701416, -1.4919558763504028, -1.3729344606399536, -1.2539129257202148, -1.1348915100097656, -1.0158699750900269, -0.8968484997749329, -0.7778270244598389, -0.6588055491447449, -0.5397840738296509, -0.4207625687122345, -0.3017410635948181, -0.18271958827972412, -0.06369811296463013, 0.05532336235046387, 0.17434483766555786, 0.29336631298065186, 0.41238781809806824, 0.5314092636108398, 0.6504307985305786, 0.7694522738456726, 0.8884737491607666, 1.0074951648712158, 1.1265166997909546, 1.2455381155014038, 1.3645596504211426, 1.4835810661315918, 1.6026026010513306, 1.7216241359710693, 1.8406455516815186, 1.9596670866012573, 2.078688621520996, 2.1977100372314453, 2.3167314529418945, 2.435753107070923, 2.554774522781372, 2.6737959384918213, 2.7928175926208496, 2.911839008331299, 3.030860424041748, 3.1498820781707764, 3.2689034938812256, 3.387924909591675, 3.506946563720703, 3.6259679794311523, 3.7449893951416016, 3.864010810852051]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 13.0, 12.0, 12.0, 20.0, 25.0, 38.0, 68.0, 119.0, 205.0, 362.0, 713.0, 1964.0, 5882.0, 24417.0, 155221.0, 633606.0, 186653.0, 28762.0, 6679.0, 2088.0, 804.0, 415.0, 180.0, 79.0, 65.0, 53.0, 23.0, 16.0, 21.0, 10.0, 6.0, 6.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.375, -2.299713134765625, -2.22442626953125, -2.149139404296875, -2.0738525390625, -1.998565673828125, -1.92327880859375, -1.847991943359375, -1.772705078125, -1.697418212890625, -1.62213134765625, -1.546844482421875, -1.4715576171875, -1.396270751953125, -1.32098388671875, -1.245697021484375, -1.17041015625, -1.095123291015625, -1.01983642578125, -0.944549560546875, -0.8692626953125, -0.793975830078125, -0.71868896484375, -0.643402099609375, -0.568115234375, -0.492828369140625, -0.41754150390625, -0.342254638671875, -0.2669677734375, -0.191680908203125, -0.11639404296875, -0.041107177734375, 0.0341796875, 0.109466552734375, 0.18475341796875, 0.260040283203125, 0.3353271484375, 0.410614013671875, 0.48590087890625, 0.561187744140625, 0.636474609375, 0.711761474609375, 0.78704833984375, 0.862335205078125, 0.9376220703125, 1.012908935546875, 1.08819580078125, 1.163482666015625, 1.23876953125, 1.314056396484375, 1.38934326171875, 1.464630126953125, 1.5399169921875, 1.615203857421875, 1.69049072265625, 1.765777587890625, 1.841064453125, 1.916351318359375, 1.99163818359375, 2.066925048828125, 2.1422119140625, 2.217498779296875, 2.29278564453125, 2.368072509765625, 2.443359375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 11.0, 16.0, 18.0, 23.0, 40.0, 50.0, 40.0, 53.0, 72.0, 74.0, 80.0, 92.0, 65.0, 79.0, 77.0, 45.0, 41.0, 30.0, 24.0, 18.0, 16.0, 10.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.62451171875, -0.60888671875, -0.59326171875, -0.57763671875, -0.56201171875, -0.54638671875, -0.53076171875, -0.51513671875, -0.49951171875, -0.48388671875, -0.46826171875, -0.45263671875, -0.43701171875, -0.42138671875, -0.40576171875, -0.39013671875, -0.37451171875, -0.35888671875, -0.34326171875, -0.32763671875, -0.31201171875, -0.29638671875, -0.28076171875, -0.26513671875, -0.24951171875, -0.23388671875, -0.21826171875, -0.20263671875, -0.18701171875, -0.17138671875, -0.15576171875, -0.14013671875, -0.12451171875, -0.10888671875, -0.09326171875, -0.07763671875, -0.06201171875, -0.04638671875, -0.03076171875, -0.01513671875, 0.00048828125, 0.01611328125, 0.03173828125, 0.04736328125, 0.06298828125, 0.07861328125, 0.09423828125, 0.10986328125, 0.12548828125, 0.14111328125, 0.15673828125, 0.17236328125, 0.18798828125, 0.20361328125, 0.21923828125, 0.23486328125, 0.25048828125, 0.26611328125, 0.28173828125, 0.29736328125, 0.31298828125, 0.32861328125, 0.34423828125, 0.35986328125, 0.37548828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 8.0, 1.0, 5.0, 6.0, 10.0, 7.0, 16.0, 27.0, 32.0, 36.0, 66.0, 89.0, 130.0, 218.0, 362.0, 640.0, 1220.0, 2454.0, 5213.0, 12005.0, 30018.0, 83844.0, 231306.0, 374153.0, 192808.0, 69160.0, 25308.0, 10255.0, 4389.0, 2100.0, 1120.0, 589.0, 324.0, 212.0, 133.0, 73.0, 54.0, 39.0, 33.0, 18.0, 20.0, 11.0, 11.0, 13.0, 2.0, 3.0, 10.0, 5.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89453125, -0.8651123046875, -0.835693359375, -0.8062744140625, -0.77685546875, -0.7474365234375, -0.718017578125, -0.6885986328125, -0.6591796875, -0.6297607421875, -0.600341796875, -0.5709228515625, -0.54150390625, -0.5120849609375, -0.482666015625, -0.4532470703125, -0.423828125, -0.3944091796875, -0.364990234375, -0.3355712890625, -0.30615234375, -0.2767333984375, -0.247314453125, -0.2178955078125, -0.1884765625, -0.1590576171875, -0.129638671875, -0.1002197265625, -0.07080078125, -0.0413818359375, -0.011962890625, 0.0174560546875, 0.046875, 0.0762939453125, 0.105712890625, 0.1351318359375, 0.16455078125, 0.1939697265625, 0.223388671875, 0.2528076171875, 0.2822265625, 0.3116455078125, 0.341064453125, 0.3704833984375, 0.39990234375, 0.4293212890625, 0.458740234375, 0.4881591796875, 0.517578125, 0.5469970703125, 0.576416015625, 0.6058349609375, 0.63525390625, 0.6646728515625, 0.694091796875, 0.7235107421875, 0.7529296875, 0.7823486328125, 0.811767578125, 0.8411865234375, 0.87060546875, 0.9000244140625, 0.929443359375, 0.9588623046875, 0.98828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 7.0, 12.0, 9.0, 11.0, 16.0, 22.0, 22.0, 13.0, 34.0, 26.0, 34.0, 36.0, 29.0, 47.0, 51.0, 48.0, 66.0, 46.0, 56.0, 30.0, 41.0, 45.0, 38.0, 31.0, 43.0, 32.0, 21.0, 16.0, 29.0, 22.0, 7.0, 12.0, 9.0, 5.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2236328125, -1.18072509765625, -1.1378173828125, -1.09490966796875, -1.052001953125, -1.00909423828125, -0.9661865234375, -0.92327880859375, -0.88037109375, -0.83746337890625, -0.7945556640625, -0.75164794921875, -0.708740234375, -0.66583251953125, -0.6229248046875, -0.58001708984375, -0.537109375, -0.49420166015625, -0.4512939453125, -0.40838623046875, -0.365478515625, -0.32257080078125, -0.2796630859375, -0.23675537109375, -0.19384765625, -0.15093994140625, -0.1080322265625, -0.06512451171875, -0.022216796875, 0.02069091796875, 0.0635986328125, 0.10650634765625, 0.1494140625, 0.19232177734375, 0.2352294921875, 0.27813720703125, 0.321044921875, 0.36395263671875, 0.4068603515625, 0.44976806640625, 0.49267578125, 0.53558349609375, 0.5784912109375, 0.62139892578125, 0.664306640625, 0.70721435546875, 0.7501220703125, 0.79302978515625, 0.8359375, 0.87884521484375, 0.9217529296875, 0.96466064453125, 1.007568359375, 1.05047607421875, 1.0933837890625, 1.13629150390625, 1.17919921875, 1.22210693359375, 1.2650146484375, 1.30792236328125, 1.350830078125, 1.39373779296875, 1.4366455078125, 1.47955322265625, 1.5224609375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 19.0, 20.0, 42.0, 49.0, 58.0, 96.0, 165.0, 216.0, 372.0, 670.0, 1408.0, 3565.0, 11993.0, 94883.0, 776643.0, 136286.0, 14642.0, 4112.0, 1531.0, 728.0, 374.0, 224.0, 151.0, 79.0, 50.0, 50.0, 40.0, 25.0, 14.0, 7.0, 7.0, 9.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.02734375, -0.9937286376953125, -0.960113525390625, -0.9264984130859375, -0.89288330078125, -0.8592681884765625, -0.825653076171875, -0.7920379638671875, -0.7584228515625, -0.7248077392578125, -0.691192626953125, -0.6575775146484375, -0.62396240234375, -0.5903472900390625, -0.556732177734375, -0.5231170654296875, -0.489501953125, -0.4558868408203125, -0.422271728515625, -0.3886566162109375, -0.35504150390625, -0.3214263916015625, -0.287811279296875, -0.2541961669921875, -0.2205810546875, -0.1869659423828125, -0.153350830078125, -0.1197357177734375, -0.08612060546875, -0.0525054931640625, -0.018890380859375, 0.0147247314453125, 0.04833984375, 0.0819549560546875, 0.115570068359375, 0.1491851806640625, 0.18280029296875, 0.2164154052734375, 0.250030517578125, 0.2836456298828125, 0.3172607421875, 0.3508758544921875, 0.384490966796875, 0.4181060791015625, 0.45172119140625, 0.4853363037109375, 0.518951416015625, 0.5525665283203125, 0.586181640625, 0.6197967529296875, 0.653411865234375, 0.6870269775390625, 0.72064208984375, 0.7542572021484375, 0.787872314453125, 0.8214874267578125, 0.8551025390625, 0.8887176513671875, 0.922332763671875, 0.9559478759765625, 0.98956298828125, 1.0231781005859375, 1.056793212890625, 1.0904083251953125, 1.1240234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 9.0, 10.0, 19.0, 32.0, 34.0, 65.0, 102.0, 172.0, 187.0, 141.0, 80.0, 71.0, 35.0, 18.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021910667419433594, -0.00021290406584739685, -0.00020670145750045776, -0.00020049884915351868, -0.0001942962408065796, -0.0001880936324596405, -0.00018189102411270142, -0.00017568841576576233, -0.00016948580741882324, -0.00016328319907188416, -0.00015708059072494507, -0.00015087798237800598, -0.0001446753740310669, -0.0001384727656841278, -0.00013227015733718872, -0.00012606754899024963, -0.00011986494064331055, -0.00011366233229637146, -0.00010745972394943237, -0.00010125711560249329, -9.50545072555542e-05, -8.885189890861511e-05, -8.264929056167603e-05, -7.644668221473694e-05, -7.024407386779785e-05, -6.404146552085876e-05, -5.783885717391968e-05, -5.163624882698059e-05, -4.5433640480041504e-05, -3.923103213310242e-05, -3.302842378616333e-05, -2.6825815439224243e-05, -2.0623207092285156e-05, -1.442059874534607e-05, -8.217990398406982e-06, -2.0153820514678955e-06, 4.187226295471191e-06, 1.0389834642410278e-05, 1.6592442989349365e-05, 2.2795051336288452e-05, 2.899765968322754e-05, 3.5200268030166626e-05, 4.140287637710571e-05, 4.76054847240448e-05, 5.380809307098389e-05, 6.0010701417922974e-05, 6.621330976486206e-05, 7.241591811180115e-05, 7.861852645874023e-05, 8.482113480567932e-05, 9.102374315261841e-05, 9.72263514995575e-05, 0.00010342895984649658, 0.00010963156819343567, 0.00011583417654037476, 0.00012203678488731384, 0.00012823939323425293, 0.00013444200158119202, 0.0001406446099281311, 0.0001468472182750702, 0.00015304982662200928, 0.00015925243496894836, 0.00016545504331588745, 0.00017165765166282654, 0.00017786026000976562]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 15.0, 18.0, 27.0, 44.0, 61.0, 98.0, 143.0, 315.0, 831.0, 2190.0, 8277.0, 76833.0, 794976.0, 147772.0, 12163.0, 2932.0, 965.0, 403.0, 177.0, 100.0, 73.0, 46.0, 31.0, 22.0, 14.0, 9.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.9881591796875, -0.947998046875, -0.9078369140625, -0.86767578125, -0.8275146484375, -0.787353515625, -0.7471923828125, -0.70703125, -0.6668701171875, -0.626708984375, -0.5865478515625, -0.54638671875, -0.5062255859375, -0.466064453125, -0.4259033203125, -0.3857421875, -0.3455810546875, -0.305419921875, -0.2652587890625, -0.22509765625, -0.1849365234375, -0.144775390625, -0.1046142578125, -0.064453125, -0.0242919921875, 0.015869140625, 0.0560302734375, 0.09619140625, 0.1363525390625, 0.176513671875, 0.2166748046875, 0.2568359375, 0.2969970703125, 0.337158203125, 0.3773193359375, 0.41748046875, 0.4576416015625, 0.497802734375, 0.5379638671875, 0.578125, 0.6182861328125, 0.658447265625, 0.6986083984375, 0.73876953125, 0.7789306640625, 0.819091796875, 0.8592529296875, 0.8994140625, 0.9395751953125, 0.979736328125, 1.0198974609375, 1.06005859375, 1.1002197265625, 1.140380859375, 1.1805419921875, 1.220703125, 1.2608642578125, 1.301025390625, 1.3411865234375, 1.38134765625, 1.4215087890625, 1.461669921875, 1.5018310546875, 1.5419921875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 3.0, 8.0, 13.0, 10.0, 31.0, 51.0, 53.0, 94.0, 119.0, 144.0, 137.0, 97.0, 84.0, 52.0, 34.0, 26.0, 14.0, 3.0, 4.0, 7.0, 4.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.12890625, -1.0980300903320312, -1.0671539306640625, -1.0362777709960938, -1.005401611328125, -0.9745254516601562, -0.9436492919921875, -0.9127731323242188, -0.88189697265625, -0.8510208129882812, -0.8201446533203125, -0.7892684936523438, -0.758392333984375, -0.7275161743164062, -0.6966400146484375, -0.6657638549804688, -0.6348876953125, -0.6040115356445312, -0.5731353759765625, -0.5422592163085938, -0.511383056640625, -0.48050689697265625, -0.4496307373046875, -0.41875457763671875, -0.38787841796875, -0.35700225830078125, -0.3261260986328125, -0.29524993896484375, -0.264373779296875, -0.23349761962890625, -0.2026214599609375, -0.17174530029296875, -0.140869140625, -0.10999298095703125, -0.0791168212890625, -0.04824066162109375, -0.017364501953125, 0.01351165771484375, 0.0443878173828125, 0.07526397705078125, 0.10614013671875, 0.13701629638671875, 0.1678924560546875, 0.19876861572265625, 0.229644775390625, 0.26052093505859375, 0.2913970947265625, 0.32227325439453125, 0.3531494140625, 0.38402557373046875, 0.4149017333984375, 0.44577789306640625, 0.476654052734375, 0.5075302124023438, 0.5384063720703125, 0.5692825317382812, 0.60015869140625, 0.6310348510742188, 0.6619110107421875, 0.6927871704101562, 0.723663330078125, 0.7545394897460938, 0.7854156494140625, 0.8162918090820312, 0.84716796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 9.0, 11.0, 16.0, 29.0, 64.0, 112.0, 142.0, 196.0, 177.0, 130.0, 59.0, 35.0, 13.0, 9.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.208967208862305, -8.721240043640137, -8.233511924743652, -7.745784282684326, -7.258056640625, -6.770329475402832, -6.282601356506348, -5.79487419128418, -5.307146072387695, -4.819418430328369, -4.331690788269043, -3.843963146209717, -3.3562355041503906, -2.8685081005096436, -2.3807804584503174, -1.8930528163909912, -1.4053254127502441, -0.917597770690918, -0.4298701882362366, 0.057857394218444824, 0.545585036277771, 1.0333125591278076, 1.5210402011871338, 2.00876784324646, 2.496495485305786, 2.9842231273651123, 3.4719507694244385, 3.9596781730651855, 4.447405815124512, 4.935133457183838, 5.422861099243164, 5.91058874130249, 6.398316383361816, 6.886044025421143, 7.373771667480469, 7.861499309539795, 8.349226951599121, 8.836954116821289, 9.324682235717773, 9.812409400939941, 10.300137519836426, 10.787864685058594, 11.275592803955078, 11.763319969177246, 12.25104808807373, 12.738775253295898, 13.226503372192383, 13.71423053741455, 14.201957702636719, 14.689684867858887, 15.177412986755371, 15.665140151977539, 16.152868270874023, 16.640596389770508, 17.12832260131836, 17.616050720214844, 18.103778839111328, 18.591506958007812, 19.079233169555664, 19.56696128845215, 20.054689407348633, 20.542417526245117, 21.03014373779297, 21.517871856689453, 22.005599975585938]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 6.0, 6.0, 5.0, 9.0, 9.0, 6.0, 8.0, 16.0, 12.0, 13.0, 14.0, 22.0, 15.0, 25.0, 24.0, 27.0, 31.0, 35.0, 15.0, 41.0, 36.0, 54.0, 43.0, 41.0, 41.0, 39.0, 25.0, 41.0, 44.0, 42.0, 37.0, 33.0, 26.0, 31.0, 19.0, 21.0, 13.0, 16.0, 14.0, 11.0, 8.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.625533580780029, -6.410942554473877, -6.196352005004883, -5.9817609786987305, -5.767169952392578, -5.552578926086426, -5.337987899780273, -5.123397350311279, -4.908806324005127, -4.694215297698975, -4.4796247482299805, -4.265033721923828, -4.050442695617676, -3.8358516693115234, -3.62126088142395, -3.406670093536377, -3.1920790672302246, -2.9774880409240723, -2.762897253036499, -2.548306465148926, -2.3337154388427734, -2.119124412536621, -1.9045336246490479, -1.689942717552185, -1.4753518104553223, -1.2607609033584595, -1.0461699962615967, -0.8315790891647339, -0.6169881820678711, -0.4023972749710083, -0.1878063678741455, 0.026784539222717285, 0.24137544631958008, 0.45596635341644287, 0.6705572605133057, 0.8851481676101685, 1.0997390747070312, 1.314329981803894, 1.5289208889007568, 1.7435117959976196, 1.9581027030944824, 2.1726937294006348, 2.387284517288208, 2.6018753051757812, 2.8164663314819336, 3.031057357788086, 3.245648145675659, 3.4602389335632324, 3.6748299598693848, 3.889420986175537, 4.104011535644531, 4.318602561950684, 4.533193588256836, 4.747784614562988, 4.962375640869141, 5.176966190338135, 5.391557216644287, 5.6061482429504395, 5.820738792419434, 6.035329818725586, 6.249920845031738, 6.464511871337891, 6.679102897644043, 6.893693447113037, 7.1082844734191895]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 6.0, 3.0, 2.0, 6.0, 8.0, 16.0, 15.0, 24.0, 30.0, 36.0, 44.0, 81.0, 125.0, 185.0, 388.0, 867.0, 2393.0, 7723.0, 40197.0, 3689287.0, 418364.0, 25093.0, 5818.0, 1962.0, 815.0, 387.0, 159.0, 104.0, 52.0, 26.0, 29.0, 9.0, 10.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0], "bins": [-5.484375, -5.362152099609375, -5.23992919921875, -5.117706298828125, -4.9954833984375, -4.873260498046875, -4.75103759765625, -4.628814697265625, -4.506591796875, -4.384368896484375, -4.26214599609375, -4.139923095703125, -4.0177001953125, -3.895477294921875, -3.77325439453125, -3.651031494140625, -3.52880859375, -3.406585693359375, -3.28436279296875, -3.162139892578125, -3.0399169921875, -2.917694091796875, -2.79547119140625, -2.673248291015625, -2.551025390625, -2.428802490234375, -2.30657958984375, -2.184356689453125, -2.0621337890625, -1.939910888671875, -1.81768798828125, -1.695465087890625, -1.5732421875, -1.451019287109375, -1.32879638671875, -1.206573486328125, -1.0843505859375, -0.962127685546875, -0.83990478515625, -0.717681884765625, -0.595458984375, -0.473236083984375, -0.35101318359375, -0.228790283203125, -0.1065673828125, 0.015655517578125, 0.13787841796875, 0.260101318359375, 0.38232421875, 0.504547119140625, 0.62677001953125, 0.748992919921875, 0.8712158203125, 0.993438720703125, 1.11566162109375, 1.237884521484375, 1.360107421875, 1.482330322265625, 1.60455322265625, 1.726776123046875, 1.8489990234375, 1.971221923828125, 2.09344482421875, 2.215667724609375, 2.337890625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 9.0, 11.0, 8.0, 19.0, 14.0, 16.0, 24.0, 35.0, 34.0, 33.0, 64.0, 54.0, 59.0, 52.0, 67.0, 60.0, 79.0, 74.0, 60.0, 37.0, 34.0, 35.0, 31.0, 19.0, 20.0, 15.0, 12.0, 10.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.58984375, -0.5746307373046875, -0.559417724609375, -0.5442047119140625, -0.52899169921875, -0.5137786865234375, -0.498565673828125, -0.4833526611328125, -0.4681396484375, -0.4529266357421875, -0.437713623046875, -0.4225006103515625, -0.40728759765625, -0.3920745849609375, -0.376861572265625, -0.3616485595703125, -0.346435546875, -0.3312225341796875, -0.316009521484375, -0.3007965087890625, -0.28558349609375, -0.2703704833984375, -0.255157470703125, -0.2399444580078125, -0.2247314453125, -0.2095184326171875, -0.194305419921875, -0.1790924072265625, -0.16387939453125, -0.1486663818359375, -0.133453369140625, -0.1182403564453125, -0.10302734375, -0.0878143310546875, -0.072601318359375, -0.0573883056640625, -0.04217529296875, -0.0269622802734375, -0.011749267578125, 0.0034637451171875, 0.0186767578125, 0.0338897705078125, 0.049102783203125, 0.0643157958984375, 0.07952880859375, 0.0947418212890625, 0.109954833984375, 0.1251678466796875, 0.140380859375, 0.1555938720703125, 0.170806884765625, 0.1860198974609375, 0.20123291015625, 0.2164459228515625, 0.231658935546875, 0.2468719482421875, 0.2620849609375, 0.2772979736328125, 0.292510986328125, 0.3077239990234375, 0.32293701171875, 0.3381500244140625, 0.353363037109375, 0.3685760498046875, 0.3837890625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 7.0, 3.0, 9.0, 6.0, 7.0, 5.0, 8.0, 18.0, 26.0, 23.0, 46.0, 67.0, 68.0, 96.0, 154.0, 269.0, 430.0, 613.0, 1069.0, 2045.0, 4390.0, 10817.0, 42055.0, 444024.0, 3554445.0, 101146.0, 19329.0, 6485.0, 2889.0, 1435.0, 809.0, 527.0, 286.0, 191.0, 140.0, 95.0, 64.0, 44.0, 26.0, 30.0, 30.0, 13.0, 8.0, 4.0, 8.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.1953125, -2.125030517578125, -2.05474853515625, -1.984466552734375, -1.9141845703125, -1.843902587890625, -1.77362060546875, -1.703338623046875, -1.633056640625, -1.562774658203125, -1.49249267578125, -1.422210693359375, -1.3519287109375, -1.281646728515625, -1.21136474609375, -1.141082763671875, -1.07080078125, -1.000518798828125, -0.93023681640625, -0.859954833984375, -0.7896728515625, -0.719390869140625, -0.64910888671875, -0.578826904296875, -0.508544921875, -0.438262939453125, -0.36798095703125, -0.297698974609375, -0.2274169921875, -0.157135009765625, -0.08685302734375, -0.016571044921875, 0.0537109375, 0.123992919921875, 0.19427490234375, 0.264556884765625, 0.3348388671875, 0.405120849609375, 0.47540283203125, 0.545684814453125, 0.615966796875, 0.686248779296875, 0.75653076171875, 0.826812744140625, 0.8970947265625, 0.967376708984375, 1.03765869140625, 1.107940673828125, 1.17822265625, 1.248504638671875, 1.31878662109375, 1.389068603515625, 1.4593505859375, 1.529632568359375, 1.59991455078125, 1.670196533203125, 1.740478515625, 1.810760498046875, 1.88104248046875, 1.951324462890625, 2.0216064453125, 2.091888427734375, 2.16217041015625, 2.232452392578125, 2.302734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 4.0, 3.0, 5.0, 13.0, 14.0, 22.0, 26.0, 54.0, 158.0, 456.0, 2427.0, 512.0, 161.0, 88.0, 37.0, 27.0, 17.0, 10.0, 12.0, 9.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.314453125, -1.2740631103515625, -1.233673095703125, -1.1932830810546875, -1.15289306640625, -1.1125030517578125, -1.072113037109375, -1.0317230224609375, -0.9913330078125, -0.9509429931640625, -0.910552978515625, -0.8701629638671875, -0.82977294921875, -0.7893829345703125, -0.748992919921875, -0.7086029052734375, -0.668212890625, -0.6278228759765625, -0.587432861328125, -0.5470428466796875, -0.50665283203125, -0.4662628173828125, -0.425872802734375, -0.3854827880859375, -0.3450927734375, -0.3047027587890625, -0.264312744140625, -0.2239227294921875, -0.18353271484375, -0.1431427001953125, -0.102752685546875, -0.0623626708984375, -0.02197265625, 0.0184173583984375, 0.058807373046875, 0.0991973876953125, 0.13958740234375, 0.1799774169921875, 0.220367431640625, 0.2607574462890625, 0.3011474609375, 0.3415374755859375, 0.381927490234375, 0.4223175048828125, 0.46270751953125, 0.5030975341796875, 0.543487548828125, 0.5838775634765625, 0.624267578125, 0.6646575927734375, 0.705047607421875, 0.7454376220703125, 0.78582763671875, 0.8262176513671875, 0.866607666015625, 0.9069976806640625, 0.9473876953125, 0.9877777099609375, 1.028167724609375, 1.0685577392578125, 1.10894775390625, 1.1493377685546875, 1.189727783203125, 1.2301177978515625, 1.2705078125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 10.0, 23.0, 72.0, 194.0, 270.0, 247.0, 94.0, 54.0, 21.0, 5.0, 3.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.648687362670898, -4.309000015258789, -3.9693121910095215, -3.629624843597412, -3.2899370193481445, -2.950249671936035, -2.6105620861053467, -2.270874500274658, -1.9311869144439697, -1.5914993286132812, -1.2518117427825928, -0.9121242761611938, -0.5724366903305054, -0.2327491044998169, 0.10693836212158203, 0.4466259479522705, 0.786313533782959, 1.1260011196136475, 1.465688705444336, 1.8053761720657349, 2.145063877105713, 2.4847512245178223, 2.8244388103485107, 3.164126396179199, 3.5038139820098877, 3.843501567840576, 4.1831889152526855, 4.522876739501953, 4.8625640869140625, 5.20225191116333, 5.5419392585754395, 5.881627082824707, 6.221314430236816, 6.561001777648926, 6.900689601898193, 7.240376949310303, 7.58006477355957, 7.91975212097168, 8.259439468383789, 8.599126815795898, 8.938815116882324, 9.278502464294434, 9.618189811706543, 9.957878112792969, 10.297565460205078, 10.637252807617188, 10.976940155029297, 11.316627502441406, 11.656314849853516, 11.996002197265625, 12.335689544677734, 12.67537784576416, 13.01506519317627, 13.354752540588379, 13.694439888000488, 14.034128189086914, 14.373815536499023, 14.713502883911133, 15.053190231323242, 15.392878532409668, 15.732565879821777, 16.072254180908203, 16.411941528320312, 16.751628875732422, 17.09131622314453]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 9.0, 8.0, 13.0, 33.0, 31.0, 39.0, 64.0, 71.0, 90.0, 75.0, 89.0, 105.0, 84.0, 68.0, 54.0, 47.0, 42.0, 26.0, 22.0, 17.0, 5.0, 7.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.562389373779297, -5.396784782409668, -5.231180191040039, -5.06557559967041, -4.899971008300781, -4.734366416931152, -4.568761825561523, -4.4031572341918945, -4.237552642822266, -4.071948051452637, -3.906343460083008, -3.740738868713379, -3.57513427734375, -3.409529685974121, -3.243924856185913, -3.078320264816284, -2.912715435028076, -2.7471108436584473, -2.5815062522888184, -2.4159016609191895, -2.2502970695495605, -2.0846924781799316, -1.9190876483917236, -1.7534830570220947, -1.5878784656524658, -1.422273874282837, -1.256669282913208, -1.0910645723342896, -0.9254599809646606, -0.7598553895950317, -0.5942507386207581, -0.4286460876464844, -0.26304149627685547, -0.09743687510490417, 0.06816774606704712, 0.2337723672389984, 0.3993769884109497, 0.5649815797805786, 0.7305862307548523, 0.896190881729126, 1.0617954730987549, 1.2274000644683838, 1.3930046558380127, 1.5586093664169312, 1.72421395778656, 1.889818549156189, 2.0554232597351074, 2.2210278511047363, 2.3866324424743652, 2.552237033843994, 2.717841625213623, 2.883446216583252, 3.049050807952881, 3.2146553993225098, 3.3802602291107178, 3.5458648204803467, 3.7114694118499756, 3.8770740032196045, 4.0426788330078125, 4.208283424377441, 4.37388801574707, 4.539492607116699, 4.705097198486328, 4.870701789855957, 5.036306381225586]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 9.0, 5.0, 5.0, 8.0, 16.0, 19.0, 34.0, 55.0, 76.0, 153.0, 306.0, 666.0, 1633.0, 4864.0, 17796.0, 84524.0, 434452.0, 403895.0, 76191.0, 16503.0, 4620.0, 1510.0, 568.0, 275.0, 145.0, 81.0, 38.0, 35.0, 18.0, 15.0, 11.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.70361328125, -2.6240234375, -2.54443359375, -2.46484375, -2.38525390625, -2.3056640625, -2.22607421875, -2.146484375, -2.06689453125, -1.9873046875, -1.90771484375, -1.828125, -1.74853515625, -1.6689453125, -1.58935546875, -1.509765625, -1.43017578125, -1.3505859375, -1.27099609375, -1.19140625, -1.11181640625, -1.0322265625, -0.95263671875, -0.873046875, -0.79345703125, -0.7138671875, -0.63427734375, -0.5546875, -0.47509765625, -0.3955078125, -0.31591796875, -0.236328125, -0.15673828125, -0.0771484375, 0.00244140625, 0.08203125, 0.16162109375, 0.2412109375, 0.32080078125, 0.400390625, 0.47998046875, 0.5595703125, 0.63916015625, 0.71875, 0.79833984375, 0.8779296875, 0.95751953125, 1.037109375, 1.11669921875, 1.1962890625, 1.27587890625, 1.35546875, 1.43505859375, 1.5146484375, 1.59423828125, 1.673828125, 1.75341796875, 1.8330078125, 1.91259765625, 1.9921875, 2.07177734375, 2.1513671875, 2.23095703125, 2.310546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 7.0, 8.0, 9.0, 15.0, 15.0, 19.0, 21.0, 44.0, 44.0, 35.0, 36.0, 40.0, 68.0, 54.0, 81.0, 67.0, 77.0, 70.0, 50.0, 44.0, 37.0, 36.0, 29.0, 22.0, 20.0, 17.0, 9.0, 6.0, 5.0, 10.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.64599609375, -0.6293830871582031, -0.6127700805664062, -0.5961570739746094, -0.5795440673828125, -0.5629310607910156, -0.5463180541992188, -0.5297050476074219, -0.513092041015625, -0.4964790344238281, -0.47986602783203125, -0.4632530212402344, -0.4466400146484375, -0.4300270080566406, -0.41341400146484375, -0.3968009948730469, -0.38018798828125, -0.3635749816894531, -0.34696197509765625, -0.3303489685058594, -0.3137359619140625, -0.2971229553222656, -0.28050994873046875, -0.2638969421386719, -0.247283935546875, -0.23067092895507812, -0.21405792236328125, -0.19744491577148438, -0.1808319091796875, -0.16421890258789062, -0.14760589599609375, -0.13099288940429688, -0.1143798828125, -0.09776687622070312, -0.08115386962890625, -0.06454086303710938, -0.0479278564453125, -0.031314849853515625, -0.01470184326171875, 0.001911163330078125, 0.018524169921875, 0.035137176513671875, 0.05175018310546875, 0.06836318969726562, 0.0849761962890625, 0.10158920288085938, 0.11820220947265625, 0.13481521606445312, 0.15142822265625, 0.16804122924804688, 0.18465423583984375, 0.20126724243164062, 0.2178802490234375, 0.23449325561523438, 0.25110626220703125, 0.2677192687988281, 0.284332275390625, 0.3009452819824219, 0.31755828857421875, 0.3341712951660156, 0.3507843017578125, 0.3673973083496094, 0.38401031494140625, 0.4006233215332031, 0.417236328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 22.0, 11.0, 15.0, 27.0, 56.0, 94.0, 109.0, 206.0, 467.0, 924.0, 1896.0, 4329.0, 10595.0, 29847.0, 109112.0, 397174.0, 356843.0, 93565.0, 26708.0, 9271.0, 3789.0, 1718.0, 825.0, 388.0, 238.0, 133.0, 59.0, 39.0, 28.0, 26.0, 19.0, 7.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.384765625, -1.331390380859375, -1.27801513671875, -1.224639892578125, -1.1712646484375, -1.117889404296875, -1.06451416015625, -1.011138916015625, -0.957763671875, -0.904388427734375, -0.85101318359375, -0.797637939453125, -0.7442626953125, -0.690887451171875, -0.63751220703125, -0.584136962890625, -0.53076171875, -0.477386474609375, -0.42401123046875, -0.370635986328125, -0.3172607421875, -0.263885498046875, -0.21051025390625, -0.157135009765625, -0.103759765625, -0.050384521484375, 0.00299072265625, 0.056365966796875, 0.1097412109375, 0.163116455078125, 0.21649169921875, 0.269866943359375, 0.3232421875, 0.376617431640625, 0.42999267578125, 0.483367919921875, 0.5367431640625, 0.590118408203125, 0.64349365234375, 0.696868896484375, 0.750244140625, 0.803619384765625, 0.85699462890625, 0.910369873046875, 0.9637451171875, 1.017120361328125, 1.07049560546875, 1.123870849609375, 1.17724609375, 1.230621337890625, 1.28399658203125, 1.337371826171875, 1.3907470703125, 1.444122314453125, 1.49749755859375, 1.550872802734375, 1.604248046875, 1.657623291015625, 1.71099853515625, 1.764373779296875, 1.8177490234375, 1.871124267578125, 1.92449951171875, 1.977874755859375, 2.03125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 9.0, 5.0, 7.0, 2.0, 11.0, 9.0, 21.0, 15.0, 17.0, 18.0, 18.0, 32.0, 25.0, 51.0, 51.0, 45.0, 55.0, 54.0, 57.0, 55.0, 47.0, 59.0, 55.0, 48.0, 40.0, 41.0, 28.0, 29.0, 19.0, 16.0, 13.0, 9.0, 8.0, 10.0, 5.0, 8.0, 2.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.034698486328125, -1.96392822265625, -1.893157958984375, -1.8223876953125, -1.751617431640625, -1.68084716796875, -1.610076904296875, -1.539306640625, -1.468536376953125, -1.39776611328125, -1.326995849609375, -1.2562255859375, -1.185455322265625, -1.11468505859375, -1.043914794921875, -0.97314453125, -0.902374267578125, -0.83160400390625, -0.760833740234375, -0.6900634765625, -0.619293212890625, -0.54852294921875, -0.477752685546875, -0.406982421875, -0.336212158203125, -0.26544189453125, -0.194671630859375, -0.1239013671875, -0.053131103515625, 0.01763916015625, 0.088409423828125, 0.1591796875, 0.229949951171875, 0.30072021484375, 0.371490478515625, 0.4422607421875, 0.513031005859375, 0.58380126953125, 0.654571533203125, 0.725341796875, 0.796112060546875, 0.86688232421875, 0.937652587890625, 1.0084228515625, 1.079193115234375, 1.14996337890625, 1.220733642578125, 1.29150390625, 1.362274169921875, 1.43304443359375, 1.503814697265625, 1.5745849609375, 1.645355224609375, 1.71612548828125, 1.786895751953125, 1.857666015625, 1.928436279296875, 1.99920654296875, 2.069976806640625, 2.1407470703125, 2.211517333984375, 2.28228759765625, 2.353057861328125, 2.423828125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 12.0, 12.0, 16.0, 36.0, 38.0, 74.0, 115.0, 220.0, 382.0, 739.0, 1682.0, 5380.0, 24594.0, 165052.0, 642676.0, 172988.0, 25366.0, 5763.0, 1801.0, 706.0, 373.0, 228.0, 106.0, 81.0, 36.0, 20.0, 19.0, 11.0, 4.0, 3.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.248046875, -1.211883544921875, -1.17572021484375, -1.139556884765625, -1.1033935546875, -1.067230224609375, -1.03106689453125, -0.994903564453125, -0.958740234375, -0.922576904296875, -0.88641357421875, -0.850250244140625, -0.8140869140625, -0.777923583984375, -0.74176025390625, -0.705596923828125, -0.66943359375, -0.633270263671875, -0.59710693359375, -0.560943603515625, -0.5247802734375, -0.488616943359375, -0.45245361328125, -0.416290283203125, -0.380126953125, -0.343963623046875, -0.30780029296875, -0.271636962890625, -0.2354736328125, -0.199310302734375, -0.16314697265625, -0.126983642578125, -0.0908203125, -0.054656982421875, -0.01849365234375, 0.017669677734375, 0.0538330078125, 0.089996337890625, 0.12615966796875, 0.162322998046875, 0.198486328125, 0.234649658203125, 0.27081298828125, 0.306976318359375, 0.3431396484375, 0.379302978515625, 0.41546630859375, 0.451629638671875, 0.48779296875, 0.523956298828125, 0.56011962890625, 0.596282958984375, 0.6324462890625, 0.668609619140625, 0.70477294921875, 0.740936279296875, 0.777099609375, 0.813262939453125, 0.84942626953125, 0.885589599609375, 0.9217529296875, 0.957916259765625, 0.99407958984375, 1.030242919921875, 1.06640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 11.0, 14.0, 16.0, 24.0, 53.0, 66.0, 75.0, 112.0, 135.0, 132.0, 104.0, 71.0, 68.0, 35.0, 27.0, 18.0, 9.0, 19.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001571178436279297, -0.0001510903239250183, -0.00014506280422210693, -0.00013903528451919556, -0.00013300776481628418, -0.0001269802451133728, -0.00012095272541046143, -0.00011492520570755005, -0.00010889768600463867, -0.0001028701663017273, -9.684264659881592e-05, -9.081512689590454e-05, -8.478760719299316e-05, -7.876008749008179e-05, -7.273256778717041e-05, -6.670504808425903e-05, -6.0677528381347656e-05, -5.465000867843628e-05, -4.86224889755249e-05, -4.2594969272613525e-05, -3.656744956970215e-05, -3.053992986679077e-05, -2.4512410163879395e-05, -1.8484890460968018e-05, -1.245737075805664e-05, -6.429851055145264e-06, -4.023313522338867e-07, 5.62518835067749e-06, 1.1652708053588867e-05, 1.7680227756500244e-05, 2.370774745941162e-05, 2.9735267162322998e-05, 3.5762786865234375e-05, 4.179030656814575e-05, 4.781782627105713e-05, 5.3845345973968506e-05, 5.987286567687988e-05, 6.590038537979126e-05, 7.192790508270264e-05, 7.795542478561401e-05, 8.398294448852539e-05, 9.001046419143677e-05, 9.603798389434814e-05, 0.00010206550359725952, 0.0001080930233001709, 0.00011412054300308228, 0.00012014806270599365, 0.00012617558240890503, 0.0001322031021118164, 0.00013823062181472778, 0.00014425814151763916, 0.00015028566122055054, 0.00015631318092346191, 0.0001623407006263733, 0.00016836822032928467, 0.00017439574003219604, 0.00018042325973510742, 0.0001864507794380188, 0.00019247829914093018, 0.00019850581884384155, 0.00020453333854675293, 0.0002105608582496643, 0.00021658837795257568, 0.00022261589765548706, 0.00022864341735839844]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 11.0, 4.0, 10.0, 4.0, 9.0, 23.0, 32.0, 35.0, 67.0, 98.0, 241.0, 464.0, 1161.0, 3943.0, 17746.0, 122127.0, 606771.0, 253001.0, 33406.0, 6367.0, 1755.0, 640.0, 271.0, 157.0, 83.0, 47.0, 36.0, 20.0, 13.0, 12.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.5205078125, -1.4840240478515625, -1.447540283203125, -1.4110565185546875, -1.37457275390625, -1.3380889892578125, -1.301605224609375, -1.2651214599609375, -1.2286376953125, -1.1921539306640625, -1.155670166015625, -1.1191864013671875, -1.08270263671875, -1.0462188720703125, -1.009735107421875, -0.9732513427734375, -0.936767578125, -0.9002838134765625, -0.863800048828125, -0.8273162841796875, -0.79083251953125, -0.7543487548828125, -0.717864990234375, -0.6813812255859375, -0.6448974609375, -0.6084136962890625, -0.571929931640625, -0.5354461669921875, -0.49896240234375, -0.4624786376953125, -0.425994873046875, -0.3895111083984375, -0.35302734375, -0.3165435791015625, -0.280059814453125, -0.2435760498046875, -0.20709228515625, -0.1706085205078125, -0.134124755859375, -0.0976409912109375, -0.0611572265625, -0.0246734619140625, 0.011810302734375, 0.0482940673828125, 0.08477783203125, 0.1212615966796875, 0.157745361328125, 0.1942291259765625, 0.230712890625, 0.2671966552734375, 0.303680419921875, 0.3401641845703125, 0.37664794921875, 0.4131317138671875, 0.449615478515625, 0.4860992431640625, 0.5225830078125, 0.5590667724609375, 0.595550537109375, 0.6320343017578125, 0.66851806640625, 0.7050018310546875, 0.741485595703125, 0.7779693603515625, 0.814453125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 11.0, 16.0, 29.0, 32.0, 32.0, 62.0, 101.0, 140.0, 163.0, 113.0, 88.0, 58.0, 39.0, 26.0, 26.0, 17.0, 6.0, 15.0, 7.0, 3.0, 8.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.826171875, -1.7821502685546875, -1.738128662109375, -1.6941070556640625, -1.65008544921875, -1.6060638427734375, -1.562042236328125, -1.5180206298828125, -1.4739990234375, -1.4299774169921875, -1.385955810546875, -1.3419342041015625, -1.29791259765625, -1.2538909912109375, -1.209869384765625, -1.1658477783203125, -1.121826171875, -1.0778045654296875, -1.033782958984375, -0.9897613525390625, -0.94573974609375, -0.9017181396484375, -0.857696533203125, -0.8136749267578125, -0.7696533203125, -0.7256317138671875, -0.681610107421875, -0.6375885009765625, -0.59356689453125, -0.5495452880859375, -0.505523681640625, -0.4615020751953125, -0.41748046875, -0.3734588623046875, -0.329437255859375, -0.2854156494140625, -0.24139404296875, -0.1973724365234375, -0.153350830078125, -0.1093292236328125, -0.0653076171875, -0.0212860107421875, 0.022735595703125, 0.0667572021484375, 0.11077880859375, 0.1548004150390625, 0.198822021484375, 0.2428436279296875, 0.286865234375, 0.3308868408203125, 0.374908447265625, 0.4189300537109375, 0.46295166015625, 0.5069732666015625, 0.550994873046875, 0.5950164794921875, 0.6390380859375, 0.6830596923828125, 0.727081298828125, 0.7711029052734375, 0.81512451171875, 0.8591461181640625, 0.903167724609375, 0.9471893310546875, 0.9912109375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 24.0, 38.0, 180.0, 330.0, 287.0, 115.0, 28.0, 10.0], "bins": [-77.53179931640625, -76.23814392089844, -74.9444808959961, -73.65082550048828, -72.35717010498047, -71.06350708007812, -69.76985168457031, -68.4761962890625, -67.18254089355469, -65.88888549804688, -64.59522247314453, -63.30156707763672, -62.007911682128906, -60.71425247192383, -59.42059326171875, -58.12693786621094, -56.833274841308594, -55.539615631103516, -54.2459602355957, -52.952301025390625, -51.65864562988281, -50.364986419677734, -49.071327209472656, -47.777671813964844, -46.484012603759766, -45.19035339355469, -43.896697998046875, -42.6030387878418, -41.30937957763672, -40.015724182128906, -38.72206497192383, -37.42840576171875, -36.13474655151367, -34.841087341308594, -33.54743194580078, -32.2537727355957, -30.960115432739258, -29.666458129882812, -28.372798919677734, -27.07914161682129, -25.785486221313477, -24.49182891845703, -23.198169708251953, -21.904512405395508, -20.610855102539062, -19.317197799682617, -18.023540496826172, -16.729881286621094, -15.436223983764648, -14.142566680908203, -12.848908424377441, -11.55525016784668, -10.261592864990234, -8.967935562133789, -7.674277305603027, -6.380619049072266, -5.086961269378662, -3.7933034896850586, -2.499645709991455, -1.2059879302978516, 0.08766984939575195, 1.3813276290893555, 2.674985408782959, 3.9686436653137207, 5.262300968170166]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 12.0, 10.0, 10.0, 27.0, 17.0, 17.0, 24.0, 34.0, 37.0, 36.0, 38.0, 57.0, 54.0, 63.0, 62.0, 51.0, 77.0, 56.0, 53.0, 35.0, 43.0, 28.0, 34.0, 28.0, 27.0, 27.0, 16.0, 18.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.77413558959961, -13.325748443603516, -12.877361297607422, -12.428975105285645, -11.98058795928955, -11.532200813293457, -11.08381462097168, -10.635427474975586, -10.187040328979492, -9.738653182983398, -9.290266036987305, -8.841879844665527, -8.393492698669434, -7.94510555267334, -7.496718883514404, -7.048332214355469, -6.599945068359375, -6.151557922363281, -5.703171253204346, -5.25478458404541, -4.806397438049316, -4.358010292053223, -3.909623622894287, -3.4612367153167725, -3.012849807739258, -2.564462900161743, -2.1160759925842285, -1.6676890850067139, -1.2193021774291992, -0.7709152698516846, -0.3225283622741699, 0.12585854530334473, 0.5742454528808594, 1.022632360458374, 1.4710192680358887, 1.9194061756134033, 2.367793083190918, 2.8161799907684326, 3.2645668983459473, 3.712953805923462, 4.161340713500977, 4.60972785949707, 5.058114528656006, 5.506501197814941, 5.954888343811035, 6.403275489807129, 6.8516621589660645, 7.300048828125, 7.748435974121094, 8.196823120117188, 8.645210266113281, 9.093596458435059, 9.541983604431152, 9.990370750427246, 10.438756942749023, 10.887144088745117, 11.335531234741211, 11.783918380737305, 12.232305526733398, 12.680691719055176, 13.12907886505127, 13.577466011047363, 14.02585220336914, 14.474239349365234, 14.922626495361328]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 8.0, 5.0, 4.0, 10.0, 9.0, 8.0, 18.0, 49.0, 71.0, 132.0, 323.0, 866.0, 2506.0, 13404.0, 4098100.0, 70732.0, 5577.0, 1454.0, 538.0, 203.0, 102.0, 71.0, 24.0, 22.0, 17.0, 9.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 4.0], "bins": [-7.82421875, -7.653289794921875, -7.48236083984375, -7.311431884765625, -7.1405029296875, -6.969573974609375, -6.79864501953125, -6.627716064453125, -6.456787109375, -6.285858154296875, -6.11492919921875, -5.944000244140625, -5.7730712890625, -5.602142333984375, -5.43121337890625, -5.260284423828125, -5.08935546875, -4.918426513671875, -4.74749755859375, -4.576568603515625, -4.4056396484375, -4.234710693359375, -4.06378173828125, -3.892852783203125, -3.721923828125, -3.550994873046875, -3.38006591796875, -3.209136962890625, -3.0382080078125, -2.867279052734375, -2.69635009765625, -2.525421142578125, -2.3544921875, -2.183563232421875, -2.01263427734375, -1.841705322265625, -1.6707763671875, -1.499847412109375, -1.32891845703125, -1.157989501953125, -0.987060546875, -0.816131591796875, -0.64520263671875, -0.474273681640625, -0.3033447265625, -0.132415771484375, 0.03851318359375, 0.209442138671875, 0.38037109375, 0.551300048828125, 0.72222900390625, 0.893157958984375, 1.0640869140625, 1.235015869140625, 1.40594482421875, 1.576873779296875, 1.747802734375, 1.918731689453125, 2.08966064453125, 2.260589599609375, 2.4315185546875, 2.602447509765625, 2.77337646484375, 2.944305419921875, 3.115234375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 7.0, 8.0, 8.0, 8.0, 14.0, 14.0, 15.0, 13.0, 21.0, 24.0, 30.0, 45.0, 51.0, 30.0, 45.0, 49.0, 50.0, 51.0, 49.0, 46.0, 46.0, 51.0, 35.0, 41.0, 45.0, 33.0, 37.0, 26.0, 22.0, 9.0, 11.0, 15.0, 11.0, 11.0, 9.0, 1.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.60986328125, -0.5930099487304688, -0.5761566162109375, -0.5593032836914062, -0.542449951171875, -0.5255966186523438, -0.5087432861328125, -0.49188995361328125, -0.47503662109375, -0.45818328857421875, -0.4413299560546875, -0.42447662353515625, -0.407623291015625, -0.39076995849609375, -0.3739166259765625, -0.35706329345703125, -0.3402099609375, -0.32335662841796875, -0.3065032958984375, -0.28964996337890625, -0.272796630859375, -0.25594329833984375, -0.2390899658203125, -0.22223663330078125, -0.20538330078125, -0.18852996826171875, -0.1716766357421875, -0.15482330322265625, -0.137969970703125, -0.12111663818359375, -0.1042633056640625, -0.08740997314453125, -0.070556640625, -0.05370330810546875, -0.0368499755859375, -0.01999664306640625, -0.003143310546875, 0.01371002197265625, 0.0305633544921875, 0.04741668701171875, 0.06427001953125, 0.08112335205078125, 0.0979766845703125, 0.11483001708984375, 0.131683349609375, 0.14853668212890625, 0.1653900146484375, 0.18224334716796875, 0.1990966796875, 0.21595001220703125, 0.2328033447265625, 0.24965667724609375, 0.266510009765625, 0.28336334228515625, 0.3002166748046875, 0.31707000732421875, 0.33392333984375, 0.35077667236328125, 0.3676300048828125, 0.38448333740234375, 0.401336669921875, 0.41819000244140625, 0.4350433349609375, 0.45189666748046875, 0.46875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 7.0, 10.0, 14.0, 12.0, 21.0, 32.0, 46.0, 62.0, 95.0, 143.0, 228.0, 416.0, 706.0, 1391.0, 3121.0, 8290.0, 31716.0, 3795295.0, 316725.0, 23716.0, 6766.0, 2604.0, 1200.0, 657.0, 341.0, 213.0, 152.0, 94.0, 47.0, 39.0, 29.0, 19.0, 6.0, 10.0, 13.0, 6.0, 6.0, 5.0, 2.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.31640625, -3.221405029296875, -3.12640380859375, -3.031402587890625, -2.9364013671875, -2.841400146484375, -2.74639892578125, -2.651397705078125, -2.556396484375, -2.461395263671875, -2.36639404296875, -2.271392822265625, -2.1763916015625, -2.081390380859375, -1.98638916015625, -1.891387939453125, -1.79638671875, -1.701385498046875, -1.60638427734375, -1.511383056640625, -1.4163818359375, -1.321380615234375, -1.22637939453125, -1.131378173828125, -1.036376953125, -0.941375732421875, -0.84637451171875, -0.751373291015625, -0.6563720703125, -0.561370849609375, -0.46636962890625, -0.371368408203125, -0.2763671875, -0.181365966796875, -0.08636474609375, 0.008636474609375, 0.1036376953125, 0.198638916015625, 0.29364013671875, 0.388641357421875, 0.483642578125, 0.578643798828125, 0.67364501953125, 0.768646240234375, 0.8636474609375, 0.958648681640625, 1.05364990234375, 1.148651123046875, 1.24365234375, 1.338653564453125, 1.43365478515625, 1.528656005859375, 1.6236572265625, 1.718658447265625, 1.81365966796875, 1.908660888671875, 2.003662109375, 2.098663330078125, 2.19366455078125, 2.288665771484375, 2.3836669921875, 2.478668212890625, 2.57366943359375, 2.668670654296875, 2.763671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 10.0, 8.0, 6.0, 5.0, 21.0, 32.0, 54.0, 215.0, 3421.0, 179.0, 51.0, 22.0, 23.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.83251953125, -0.8113784790039062, -0.7902374267578125, -0.7690963745117188, -0.747955322265625, -0.7268142700195312, -0.7056732177734375, -0.6845321655273438, -0.66339111328125, -0.6422500610351562, -0.6211090087890625, -0.5999679565429688, -0.578826904296875, -0.5576858520507812, -0.5365447998046875, -0.5154037475585938, -0.4942626953125, -0.47312164306640625, -0.4519805908203125, -0.43083953857421875, -0.409698486328125, -0.38855743408203125, -0.3674163818359375, -0.34627532958984375, -0.32513427734375, -0.30399322509765625, -0.2828521728515625, -0.26171112060546875, -0.240570068359375, -0.21942901611328125, -0.1982879638671875, -0.17714691162109375, -0.156005859375, -0.13486480712890625, -0.1137237548828125, -0.09258270263671875, -0.071441650390625, -0.05030059814453125, -0.0291595458984375, -0.00801849365234375, 0.01312255859375, 0.03426361083984375, 0.0554046630859375, 0.07654571533203125, 0.097686767578125, 0.11882781982421875, 0.1399688720703125, 0.16110992431640625, 0.1822509765625, 0.20339202880859375, 0.2245330810546875, 0.24567413330078125, 0.266815185546875, 0.28795623779296875, 0.3090972900390625, 0.33023834228515625, 0.35137939453125, 0.37252044677734375, 0.3936614990234375, 0.41480255126953125, 0.435943603515625, 0.45708465576171875, 0.4782257080078125, 0.49936676025390625, 0.5205078125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 3.0, 4.0, 6.0, 14.0, 28.0, 40.0, 60.0, 120.0, 147.0, 166.0, 134.0, 124.0, 76.0, 40.0, 22.0, 11.0, 3.0, 6.0, 6.0, 2.0, 2.0], "bins": [-4.905620574951172, -4.812600135803223, -4.719579696655273, -4.626559257507324, -4.533538341522217, -4.440517902374268, -4.347497463226318, -4.254477024078369, -4.16145658493042, -4.068436145782471, -3.9754154682159424, -3.882395029067993, -3.789374589920044, -3.6963541507720947, -3.6033334732055664, -3.510313034057617, -3.417292594909668, -3.3242721557617188, -3.2312514781951904, -3.138231039047241, -3.045210599899292, -2.9521901607513428, -2.8591694831848145, -2.7661490440368652, -2.673128366470337, -2.5801079273223877, -2.4870872497558594, -2.39406681060791, -2.301046371459961, -2.2080259323120117, -2.1150052547454834, -2.021984815597534, -1.928964376449585, -1.8359438180923462, -1.742923378944397, -1.6499028205871582, -1.556882381439209, -1.4638618230819702, -1.3708412647247314, -1.2778208255767822, -1.184800386428833, -1.0917798280715942, -0.998759388923645, -0.9057388305664062, -0.812718391418457, -0.7196978330612183, -0.6266773343086243, -0.5336568355560303, -0.4406362771987915, -0.3476157784461975, -0.2545952796936035, -0.16157475113868713, -0.06855425238609314, 0.024466246366500854, 0.11748677492141724, 0.21050727367401123, 0.3035277724266052, 0.3965482711791992, 0.4895687699317932, 0.5825892686843872, 0.675609827041626, 0.7686302661895752, 0.861650824546814, 0.954671323299408, 1.047691822052002]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 6.0, 8.0, 20.0, 10.0, 10.0, 9.0, 16.0, 23.0, 26.0, 32.0, 34.0, 29.0, 46.0, 40.0, 35.0, 34.0, 61.0, 46.0, 56.0, 40.0, 38.0, 49.0, 43.0, 30.0, 36.0, 31.0, 31.0, 23.0, 18.0, 18.0, 23.0, 18.0, 7.0, 9.0, 7.0, 5.0, 12.0, 5.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.1453073024749756, -1.1123360395431519, -1.0793648958206177, -1.046393632888794, -1.0134224891662598, -0.980451226234436, -0.9474800229072571, -0.9145088195800781, -0.8815376162528992, -0.8485664129257202, -0.8155952095985413, -0.7826240062713623, -0.7496527433395386, -0.7166815996170044, -0.6837103366851807, -0.6507391333580017, -0.6177679300308228, -0.5847967267036438, -0.5518255233764648, -0.5188543200492859, -0.48588308691978455, -0.4529118835926056, -0.41994065046310425, -0.3869694471359253, -0.35399824380874634, -0.3210270404815674, -0.2880558371543884, -0.2550846040248871, -0.22211340069770813, -0.18914219737052917, -0.15617097914218903, -0.12319976091384888, -0.09022867679595947, -0.05725746601819992, -0.02428625524044037, 0.008684955537319183, 0.041656166315078735, 0.07462736964225769, 0.10759858787059784, 0.140569806098938, 0.17354100942611694, 0.2065122127532959, 0.23948343098163605, 0.2724546492099762, 0.30542585253715515, 0.3383970558643341, 0.37136828899383545, 0.4043394923210144, 0.43731069564819336, 0.4702818989753723, 0.5032531023025513, 0.5362243056297302, 0.5691955089569092, 0.6021667718887329, 0.6351379752159119, 0.6681091785430908, 0.7010803818702698, 0.7340515851974487, 0.7670227885246277, 0.7999939918518066, 0.8329652547836304, 0.8659363985061646, 0.8989076614379883, 0.9318788647651672, 0.9648500680923462]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 6.0, 7.0, 10.0, 24.0, 23.0, 36.0, 52.0, 84.0, 195.0, 436.0, 970.0, 2413.0, 6829.0, 22070.0, 78555.0, 269174.0, 419266.0, 177908.0, 48562.0, 14148.0, 4646.0, 1737.0, 703.0, 333.0, 141.0, 89.0, 47.0, 29.0, 12.0, 13.0, 7.0, 7.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.509765625, -2.42962646484375, -2.3494873046875, -2.26934814453125, -2.189208984375, -2.10906982421875, -2.0289306640625, -1.94879150390625, -1.86865234375, -1.78851318359375, -1.7083740234375, -1.62823486328125, -1.548095703125, -1.46795654296875, -1.3878173828125, -1.30767822265625, -1.2275390625, -1.14739990234375, -1.0672607421875, -0.98712158203125, -0.906982421875, -0.82684326171875, -0.7467041015625, -0.66656494140625, -0.58642578125, -0.50628662109375, -0.4261474609375, -0.34600830078125, -0.265869140625, -0.18572998046875, -0.1055908203125, -0.02545166015625, 0.0546875, 0.13482666015625, 0.2149658203125, 0.29510498046875, 0.375244140625, 0.45538330078125, 0.5355224609375, 0.61566162109375, 0.69580078125, 0.77593994140625, 0.8560791015625, 0.93621826171875, 1.016357421875, 1.09649658203125, 1.1766357421875, 1.25677490234375, 1.3369140625, 1.41705322265625, 1.4971923828125, 1.57733154296875, 1.657470703125, 1.73760986328125, 1.8177490234375, 1.89788818359375, 1.97802734375, 2.05816650390625, 2.1383056640625, 2.21844482421875, 2.298583984375, 2.37872314453125, 2.4588623046875, 2.53900146484375, 2.619140625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 6.0, 5.0, 5.0, 9.0, 5.0, 19.0, 9.0, 17.0, 20.0, 19.0, 34.0, 29.0, 26.0, 44.0, 35.0, 44.0, 49.0, 48.0, 43.0, 46.0, 37.0, 45.0, 49.0, 40.0, 40.0, 38.0, 41.0, 29.0, 33.0, 30.0, 22.0, 14.0, 16.0, 13.0, 13.0, 10.0, 6.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6240234375, -0.6060409545898438, -0.5880584716796875, -0.5700759887695312, -0.552093505859375, -0.5341110229492188, -0.5161285400390625, -0.49814605712890625, -0.48016357421875, -0.46218109130859375, -0.4441986083984375, -0.42621612548828125, -0.408233642578125, -0.39025115966796875, -0.3722686767578125, -0.35428619384765625, -0.3363037109375, -0.31832122802734375, -0.3003387451171875, -0.28235626220703125, -0.264373779296875, -0.24639129638671875, -0.2284088134765625, -0.21042633056640625, -0.19244384765625, -0.17446136474609375, -0.1564788818359375, -0.13849639892578125, -0.120513916015625, -0.10253143310546875, -0.0845489501953125, -0.06656646728515625, -0.048583984375, -0.03060150146484375, -0.0126190185546875, 0.00536346435546875, 0.023345947265625, 0.04132843017578125, 0.0593109130859375, 0.07729339599609375, 0.09527587890625, 0.11325836181640625, 0.1312408447265625, 0.14922332763671875, 0.167205810546875, 0.18518829345703125, 0.2031707763671875, 0.22115325927734375, 0.2391357421875, 0.25711822509765625, 0.2751007080078125, 0.29308319091796875, 0.311065673828125, 0.32904815673828125, 0.3470306396484375, 0.36501312255859375, 0.38299560546875, 0.40097808837890625, 0.4189605712890625, 0.43694305419921875, 0.454925537109375, 0.47290802001953125, 0.4908905029296875, 0.5088729858398438, 0.52685546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 8.0, 13.0, 13.0, 34.0, 27.0, 67.0, 76.0, 158.0, 203.0, 385.0, 765.0, 1376.0, 2657.0, 5655.0, 12495.0, 29933.0, 76586.0, 199486.0, 374617.0, 208500.0, 79083.0, 31016.0, 13309.0, 5953.0, 2829.0, 1446.0, 758.0, 435.0, 246.0, 167.0, 94.0, 42.0, 35.0, 22.0, 13.0, 13.0, 15.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.64453125, -1.5923614501953125, -1.540191650390625, -1.4880218505859375, -1.43585205078125, -1.3836822509765625, -1.331512451171875, -1.2793426513671875, -1.2271728515625, -1.1750030517578125, -1.122833251953125, -1.0706634521484375, -1.01849365234375, -0.9663238525390625, -0.914154052734375, -0.8619842529296875, -0.809814453125, -0.7576446533203125, -0.705474853515625, -0.6533050537109375, -0.60113525390625, -0.5489654541015625, -0.496795654296875, -0.4446258544921875, -0.3924560546875, -0.3402862548828125, -0.288116455078125, -0.2359466552734375, -0.18377685546875, -0.1316070556640625, -0.079437255859375, -0.0272674560546875, 0.02490234375, 0.0770721435546875, 0.129241943359375, 0.1814117431640625, 0.23358154296875, 0.2857513427734375, 0.337921142578125, 0.3900909423828125, 0.4422607421875, 0.4944305419921875, 0.546600341796875, 0.5987701416015625, 0.65093994140625, 0.7031097412109375, 0.755279541015625, 0.8074493408203125, 0.859619140625, 0.9117889404296875, 0.963958740234375, 1.0161285400390625, 1.06829833984375, 1.1204681396484375, 1.172637939453125, 1.2248077392578125, 1.2769775390625, 1.3291473388671875, 1.381317138671875, 1.4334869384765625, 1.48565673828125, 1.5378265380859375, 1.589996337890625, 1.6421661376953125, 1.6943359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 10.0, 10.0, 15.0, 28.0, 21.0, 22.0, 21.0, 49.0, 34.0, 37.0, 58.0, 49.0, 56.0, 63.0, 51.0, 65.0, 54.0, 46.0, 42.0, 43.0, 38.0, 32.0, 24.0, 22.0, 23.0, 15.0, 8.0, 11.0, 13.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.173828125, -3.056732177734375, -2.93963623046875, -2.822540283203125, -2.7054443359375, -2.588348388671875, -2.47125244140625, -2.354156494140625, -2.237060546875, -2.119964599609375, -2.00286865234375, -1.885772705078125, -1.7686767578125, -1.651580810546875, -1.53448486328125, -1.417388916015625, -1.30029296875, -1.183197021484375, -1.06610107421875, -0.949005126953125, -0.8319091796875, -0.714813232421875, -0.59771728515625, -0.480621337890625, -0.363525390625, -0.246429443359375, -0.12933349609375, -0.012237548828125, 0.1048583984375, 0.221954345703125, 0.33905029296875, 0.456146240234375, 0.5732421875, 0.690338134765625, 0.80743408203125, 0.924530029296875, 1.0416259765625, 1.158721923828125, 1.27581787109375, 1.392913818359375, 1.510009765625, 1.627105712890625, 1.74420166015625, 1.861297607421875, 1.9783935546875, 2.095489501953125, 2.21258544921875, 2.329681396484375, 2.44677734375, 2.563873291015625, 2.68096923828125, 2.798065185546875, 2.9151611328125, 3.032257080078125, 3.14935302734375, 3.266448974609375, 3.383544921875, 3.500640869140625, 3.61773681640625, 3.734832763671875, 3.8519287109375, 3.969024658203125, 4.08612060546875, 4.203216552734375, 4.3203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 9.0, 17.0, 31.0, 53.0, 87.0, 172.0, 412.0, 1173.0, 6321.0, 199505.0, 825101.0, 12858.0, 1851.0, 494.0, 213.0, 95.0, 57.0, 48.0, 16.0, 6.0, 13.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.5078125, -4.36761474609375, -4.2274169921875, -4.08721923828125, -3.947021484375, -3.80682373046875, -3.6666259765625, -3.52642822265625, -3.38623046875, -3.24603271484375, -3.1058349609375, -2.96563720703125, -2.825439453125, -2.68524169921875, -2.5450439453125, -2.40484619140625, -2.2646484375, -2.12445068359375, -1.9842529296875, -1.84405517578125, -1.703857421875, -1.56365966796875, -1.4234619140625, -1.28326416015625, -1.14306640625, -1.00286865234375, -0.8626708984375, -0.72247314453125, -0.582275390625, -0.44207763671875, -0.3018798828125, -0.16168212890625, -0.021484375, 0.11871337890625, 0.2589111328125, 0.39910888671875, 0.539306640625, 0.67950439453125, 0.8197021484375, 0.95989990234375, 1.10009765625, 1.24029541015625, 1.3804931640625, 1.52069091796875, 1.660888671875, 1.80108642578125, 1.9412841796875, 2.08148193359375, 2.2216796875, 2.36187744140625, 2.5020751953125, 2.64227294921875, 2.782470703125, 2.92266845703125, 3.0628662109375, 3.20306396484375, 3.34326171875, 3.48345947265625, 3.6236572265625, 3.76385498046875, 3.904052734375, 4.04425048828125, 4.1844482421875, 4.32464599609375, 4.46484375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 16.0, 27.0, 25.0, 43.0, 58.0, 83.0, 91.0, 136.0, 119.0, 100.0, 104.0, 66.0, 29.0, 30.0, 24.0, 16.0, 8.0, 8.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014734268188476562, -0.00013963505625724792, -0.00013192743062973022, -0.00012421980500221252, -0.00011651217937469482, -0.00010880455374717712, -0.00010109692811965942, -9.338930249214172e-05, -8.568167686462402e-05, -7.797405123710632e-05, -7.026642560958862e-05, -6.255879998207092e-05, -5.485117435455322e-05, -4.714354872703552e-05, -3.943592309951782e-05, -3.172829747200012e-05, -2.4020671844482422e-05, -1.631304621696472e-05, -8.605420589447021e-06, -8.977949619293213e-07, 6.809830665588379e-06, 1.4517456293106079e-05, 2.222508192062378e-05, 2.993270754814148e-05, 3.764033317565918e-05, 4.534795880317688e-05, 5.305558443069458e-05, 6.076321005821228e-05, 6.847083568572998e-05, 7.617846131324768e-05, 8.388608694076538e-05, 9.159371256828308e-05, 9.930133819580078e-05, 0.00010700896382331848, 0.00011471658945083618, 0.00012242421507835388, 0.00013013184070587158, 0.00013783946633338928, 0.00014554709196090698, 0.00015325471758842468, 0.00016096234321594238, 0.00016866996884346008, 0.00017637759447097778, 0.00018408522009849548, 0.00019179284572601318, 0.00019950047135353088, 0.00020720809698104858, 0.00021491572260856628, 0.00022262334823608398, 0.00023033097386360168, 0.00023803859949111938, 0.0002457462251186371, 0.0002534538507461548, 0.0002611614763736725, 0.0002688691020011902, 0.0002765767276287079, 0.0002842843532562256, 0.0002919919788837433, 0.000299699604511261, 0.0003074072301387787, 0.0003151148557662964, 0.0003228224813938141, 0.0003305301070213318, 0.0003382377326488495, 0.0003459453582763672]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 9.0, 10.0, 27.0, 41.0, 91.0, 221.0, 678.0, 2332.0, 12879.0, 325334.0, 681136.0, 21214.0, 3222.0, 845.0, 294.0, 102.0, 62.0, 24.0, 9.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.416015625, -3.31585693359375, -3.2156982421875, -3.11553955078125, -3.015380859375, -2.91522216796875, -2.8150634765625, -2.71490478515625, -2.61474609375, -2.51458740234375, -2.4144287109375, -2.31427001953125, -2.214111328125, -2.11395263671875, -2.0137939453125, -1.91363525390625, -1.8134765625, -1.71331787109375, -1.6131591796875, -1.51300048828125, -1.412841796875, -1.31268310546875, -1.2125244140625, -1.11236572265625, -1.01220703125, -0.91204833984375, -0.8118896484375, -0.71173095703125, -0.611572265625, -0.51141357421875, -0.4112548828125, -0.31109619140625, -0.2109375, -0.11077880859375, -0.0106201171875, 0.08953857421875, 0.189697265625, 0.28985595703125, 0.3900146484375, 0.49017333984375, 0.59033203125, 0.69049072265625, 0.7906494140625, 0.89080810546875, 0.990966796875, 1.09112548828125, 1.1912841796875, 1.29144287109375, 1.3916015625, 1.49176025390625, 1.5919189453125, 1.69207763671875, 1.792236328125, 1.89239501953125, 1.9925537109375, 2.09271240234375, 2.19287109375, 2.29302978515625, 2.3931884765625, 2.49334716796875, 2.593505859375, 2.69366455078125, 2.7938232421875, 2.89398193359375, 2.994140625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 4.0, 10.0, 6.0, 9.0, 20.0, 32.0, 85.0, 142.0, 204.0, 230.0, 118.0, 61.0, 31.0, 18.0, 7.0, 7.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.546875, -4.42962646484375, -4.3123779296875, -4.19512939453125, -4.077880859375, -3.96063232421875, -3.8433837890625, -3.72613525390625, -3.60888671875, -3.49163818359375, -3.3743896484375, -3.25714111328125, -3.139892578125, -3.02264404296875, -2.9053955078125, -2.78814697265625, -2.6708984375, -2.55364990234375, -2.4364013671875, -2.31915283203125, -2.201904296875, -2.08465576171875, -1.9674072265625, -1.85015869140625, -1.73291015625, -1.61566162109375, -1.4984130859375, -1.38116455078125, -1.263916015625, -1.14666748046875, -1.0294189453125, -0.91217041015625, -0.794921875, -0.67767333984375, -0.5604248046875, -0.44317626953125, -0.325927734375, -0.20867919921875, -0.0914306640625, 0.02581787109375, 0.14306640625, 0.26031494140625, 0.3775634765625, 0.49481201171875, 0.612060546875, 0.72930908203125, 0.8465576171875, 0.96380615234375, 1.0810546875, 1.19830322265625, 1.3155517578125, 1.43280029296875, 1.550048828125, 1.66729736328125, 1.7845458984375, 1.90179443359375, 2.01904296875, 2.13629150390625, 2.2535400390625, 2.37078857421875, 2.488037109375, 2.60528564453125, 2.7225341796875, 2.83978271484375, 2.95703125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 14.0, 28.0, 74.0, 170.0, 270.0, 231.0, 144.0, 60.0, 12.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.5616569519043, -31.949108123779297, -30.336559295654297, -28.724008560180664, -27.111459732055664, -25.498910903930664, -23.88636016845703, -22.27381134033203, -20.66126251220703, -19.04871368408203, -17.43616485595703, -15.823614120483398, -14.211065292358398, -12.598516464233398, -10.985966682434082, -9.373416900634766, -7.760868072509766, -6.148318767547607, -4.535769462585449, -2.923220157623291, -1.3106708526611328, 0.3018779754638672, 1.9144277572631836, 3.5269775390625, 5.1395263671875, 6.752075672149658, 8.364624977111816, 9.977174758911133, 11.589723587036133, 13.202272415161133, 14.81482219696045, 16.427371978759766, 18.03992462158203, 19.65247344970703, 21.26502227783203, 22.877573013305664, 24.490121841430664, 26.102670669555664, 27.715221405029297, 29.327770233154297, 30.940319061279297, 32.5528678894043, 34.1654167175293, 35.7779655456543, 37.39051818847656, 39.00306701660156, 40.61561584472656, 42.22816467285156, 43.84071350097656, 45.45326232910156, 47.06581115722656, 48.67835998535156, 50.29090881347656, 51.90345764160156, 53.51601028442383, 55.12855911254883, 56.74110794067383, 58.35365676879883, 59.96620559692383, 61.57875442504883, 63.191307067871094, 64.8038558959961, 66.4164047241211, 68.0289535522461, 69.6415023803711]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 0.0, 10.0, 9.0, 7.0, 10.0, 11.0, 17.0, 15.0, 19.0, 27.0, 25.0, 17.0, 27.0, 33.0, 44.0, 52.0, 44.0, 47.0, 39.0, 48.0, 60.0, 47.0, 57.0, 43.0, 29.0, 39.0, 28.0, 22.0, 24.0, 18.0, 21.0, 28.0, 18.0, 6.0, 12.0, 10.0, 7.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-17.513343811035156, -16.96009635925293, -16.40684700012207, -15.853599548339844, -15.300352096557617, -14.747103691101074, -14.193855285644531, -13.640607833862305, -13.087359428405762, -12.534111022949219, -11.980863571166992, -11.42761516571045, -10.874366760253906, -10.32111930847168, -9.767870903015137, -9.214622497558594, -8.661375045776367, -8.108126640319824, -7.554879188537598, -7.001630783081055, -6.44838285446167, -5.895134925842285, -5.341886520385742, -4.788638591766357, -4.235390663146973, -3.682142734527588, -3.128894567489624, -2.57564640045166, -2.0223984718322754, -1.4691505432128906, -0.9159023761749268, -0.3626542091369629, 0.19059371948242188, 0.7438417673110962, 1.2970898151397705, 1.8503378629684448, 2.403585910797119, 2.956833839416504, 3.5100820064544678, 4.063330173492432, 4.616578102111816, 5.169826030731201, 5.723073959350586, 6.276322364807129, 6.829570293426514, 7.382818222045898, 7.936066627502441, 8.489315032958984, 9.042562484741211, 9.595810890197754, 10.14905834197998, 10.702306747436523, 11.25555419921875, 11.808802604675293, 12.362051010131836, 12.915298461914062, 13.468546867370605, 14.021795272827148, 14.575042724609375, 15.128291130065918, 15.681539535522461, 16.234786987304688, 16.788034439086914, 17.341283798217773, 17.89453125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 15.0, 17.0, 36.0, 69.0, 151.0, 405.0, 1382.0, 7261.0, 4007031.0, 170849.0, 5407.0, 1052.0, 340.0, 128.0, 53.0, 34.0, 14.0, 8.0, 10.0, 1.0, 8.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.453125, -13.1536865234375, -12.854248046875, -12.5548095703125, -12.25537109375, -11.9559326171875, -11.656494140625, -11.3570556640625, -11.0576171875, -10.7581787109375, -10.458740234375, -10.1593017578125, -9.85986328125, -9.5604248046875, -9.260986328125, -8.9615478515625, -8.662109375, -8.3626708984375, -8.063232421875, -7.7637939453125, -7.46435546875, -7.1649169921875, -6.865478515625, -6.5660400390625, -6.2666015625, -5.9671630859375, -5.667724609375, -5.3682861328125, -5.06884765625, -4.7694091796875, -4.469970703125, -4.1705322265625, -3.87109375, -3.5716552734375, -3.272216796875, -2.9727783203125, -2.67333984375, -2.3739013671875, -2.074462890625, -1.7750244140625, -1.4755859375, -1.1761474609375, -0.876708984375, -0.5772705078125, -0.27783203125, 0.0216064453125, 0.321044921875, 0.6204833984375, 0.919921875, 1.2193603515625, 1.518798828125, 1.8182373046875, 2.11767578125, 2.4171142578125, 2.716552734375, 3.0159912109375, 3.3154296875, 3.6148681640625, 3.914306640625, 4.2137451171875, 4.51318359375, 4.8126220703125, 5.112060546875, 5.4114990234375, 5.7109375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 1.0, 4.0, 6.0, 9.0, 4.0, 7.0, 14.0, 23.0, 22.0, 27.0, 36.0, 31.0, 32.0, 57.0, 54.0, 42.0, 45.0, 56.0, 46.0, 53.0, 60.0, 54.0, 43.0, 43.0, 48.0, 33.0, 25.0, 22.0, 20.0, 11.0, 13.0, 8.0, 12.0, 7.0, 9.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.87548828125, -0.849853515625, -0.82421875, -0.798583984375, -0.77294921875, -0.747314453125, -0.7216796875, -0.696044921875, -0.67041015625, -0.644775390625, -0.619140625, -0.593505859375, -0.56787109375, -0.542236328125, -0.5166015625, -0.490966796875, -0.46533203125, -0.439697265625, -0.4140625, -0.388427734375, -0.36279296875, -0.337158203125, -0.3115234375, -0.285888671875, -0.26025390625, -0.234619140625, -0.208984375, -0.183349609375, -0.15771484375, -0.132080078125, -0.1064453125, -0.080810546875, -0.05517578125, -0.029541015625, -0.00390625, 0.021728515625, 0.04736328125, 0.072998046875, 0.0986328125, 0.124267578125, 0.14990234375, 0.175537109375, 0.201171875, 0.226806640625, 0.25244140625, 0.278076171875, 0.3037109375, 0.329345703125, 0.35498046875, 0.380615234375, 0.40625, 0.431884765625, 0.45751953125, 0.483154296875, 0.5087890625, 0.534423828125, 0.56005859375, 0.585693359375, 0.611328125, 0.636962890625, 0.66259765625, 0.688232421875, 0.7138671875, 0.739501953125, 0.76513671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 8.0, 10.0, 23.0, 19.0, 35.0, 53.0, 71.0, 99.0, 155.0, 220.0, 320.0, 536.0, 815.0, 1297.0, 2004.0, 3446.0, 6132.0, 12130.0, 32057.0, 140761.0, 3827171.0, 112899.0, 28401.0, 11456.0, 5677.0, 3157.0, 1838.0, 1246.0, 725.0, 506.0, 306.0, 203.0, 143.0, 114.0, 74.0, 56.0, 34.0, 32.0, 18.0, 9.0, 4.0, 10.0, 1.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.46875, -2.387664794921875, -2.30657958984375, -2.225494384765625, -2.1444091796875, -2.063323974609375, -1.98223876953125, -1.901153564453125, -1.820068359375, -1.738983154296875, -1.65789794921875, -1.576812744140625, -1.4957275390625, -1.414642333984375, -1.33355712890625, -1.252471923828125, -1.17138671875, -1.090301513671875, -1.00921630859375, -0.928131103515625, -0.8470458984375, -0.765960693359375, -0.68487548828125, -0.603790283203125, -0.522705078125, -0.441619873046875, -0.36053466796875, -0.279449462890625, -0.1983642578125, -0.117279052734375, -0.03619384765625, 0.044891357421875, 0.1259765625, 0.207061767578125, 0.28814697265625, 0.369232177734375, 0.4503173828125, 0.531402587890625, 0.61248779296875, 0.693572998046875, 0.774658203125, 0.855743408203125, 0.93682861328125, 1.017913818359375, 1.0989990234375, 1.180084228515625, 1.26116943359375, 1.342254638671875, 1.42333984375, 1.504425048828125, 1.58551025390625, 1.666595458984375, 1.7476806640625, 1.828765869140625, 1.90985107421875, 1.990936279296875, 2.072021484375, 2.153106689453125, 2.23419189453125, 2.315277099609375, 2.3963623046875, 2.477447509765625, 2.55853271484375, 2.639617919921875, 2.720703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 5.0, 7.0, 10.0, 11.0, 11.0, 16.0, 18.0, 37.0, 56.0, 156.0, 2979.0, 487.0, 105.0, 56.0, 34.0, 31.0, 15.0, 4.0, 8.0, 2.0, 7.0, 7.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.984375, -0.9576873779296875, -0.930999755859375, -0.9043121337890625, -0.87762451171875, -0.8509368896484375, -0.824249267578125, -0.7975616455078125, -0.7708740234375, -0.7441864013671875, -0.717498779296875, -0.6908111572265625, -0.66412353515625, -0.6374359130859375, -0.610748291015625, -0.5840606689453125, -0.557373046875, -0.5306854248046875, -0.503997802734375, -0.4773101806640625, -0.45062255859375, -0.4239349365234375, -0.397247314453125, -0.3705596923828125, -0.3438720703125, -0.3171844482421875, -0.290496826171875, -0.2638092041015625, -0.23712158203125, -0.2104339599609375, -0.183746337890625, -0.1570587158203125, -0.13037109375, -0.1036834716796875, -0.076995849609375, -0.0503082275390625, -0.02362060546875, 0.0030670166015625, 0.029754638671875, 0.0564422607421875, 0.0831298828125, 0.1098175048828125, 0.136505126953125, 0.1631927490234375, 0.18988037109375, 0.2165679931640625, 0.243255615234375, 0.2699432373046875, 0.296630859375, 0.3233184814453125, 0.350006103515625, 0.3766937255859375, 0.40338134765625, 0.4300689697265625, 0.456756591796875, 0.4834442138671875, 0.5101318359375, 0.5368194580078125, 0.563507080078125, 0.5901947021484375, 0.61688232421875, 0.6435699462890625, 0.670257568359375, 0.6969451904296875, 0.7236328125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 11.0, 17.0, 29.0, 39.0, 64.0, 102.0, 127.0, 147.0, 131.0, 107.0, 69.0, 60.0, 36.0, 36.0, 12.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.696760654449463, -6.558041572570801, -6.419322490692139, -6.280602931976318, -6.141883850097656, -6.003164768218994, -5.864445686340332, -5.72572660446167, -5.587007522583008, -5.448288440704346, -5.309569358825684, -5.170849800109863, -5.032130718231201, -4.893411636352539, -4.754692554473877, -4.615973472595215, -4.4772539138793945, -4.338534832000732, -4.19981575012207, -4.06109619140625, -3.922377109527588, -3.783658027648926, -3.6449389457702637, -3.5062198638916016, -3.3675005435943604, -3.2287814617156982, -3.090062141418457, -2.951343059539795, -2.812623977661133, -2.6739046573638916, -2.5351855754852295, -2.3964662551879883, -2.2577476501464844, -2.1190285682678223, -1.980309247970581, -1.841590166091919, -1.7028709650039673, -1.5641517639160156, -1.4254326820373535, -1.2867134809494019, -1.1479942798614502, -1.0092750787734985, -0.8705559372901917, -0.7318367958068848, -0.5931175947189331, -0.45439839363098145, -0.31567925214767456, -0.17696011066436768, -0.038240909576416016, 0.10047826170921326, 0.23919743299484253, 0.3779166042804718, 0.5166357755661011, 0.6553549766540527, 0.7940741181373596, 0.9327932596206665, 1.0715124607086182, 1.2102316617965698, 1.3489508628845215, 1.4876699447631836, 1.6263891458511353, 1.765108346939087, 1.903827428817749, 2.0425467491149902, 2.1812658309936523]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 11.0, 13.0, 12.0, 15.0, 21.0, 17.0, 25.0, 24.0, 34.0, 23.0, 38.0, 34.0, 48.0, 47.0, 49.0, 47.0, 55.0, 40.0, 47.0, 55.0, 41.0, 39.0, 39.0, 44.0, 22.0, 23.0, 23.0, 13.0, 15.0, 15.0, 14.0, 20.0, 11.0, 3.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8557887077331543, -1.7828123569488525, -1.7098360061645508, -1.636859655380249, -1.5638831853866577, -1.490906834602356, -1.4179304838180542, -1.344954013824463, -1.2719776630401611, -1.1990013122558594, -1.1260249614715576, -1.0530486106872559, -0.9800721406936646, -0.9070957899093628, -0.834119439125061, -0.7611430287361145, -0.6881667375564575, -0.6151903867721558, -0.5422139763832092, -0.46923762559890747, -0.3962612450122833, -0.3232848644256592, -0.2503085136413574, -0.1773321032524109, -0.10435575246810913, -0.03137937933206558, 0.041596993803977966, 0.11457335948944092, 0.18754974007606506, 0.2605261206626892, 0.33350247144699097, 0.4064788818359375, 0.47945523262023926, 0.552431583404541, 0.6254079937934875, 0.6983843445777893, 0.7713607549667358, 0.8443371057510376, 0.9173134565353394, 0.9902898669242859, 1.0632662773132324, 1.1362426280975342, 1.209218978881836, 1.2821953296661377, 1.355171799659729, 1.4281481504440308, 1.5011245012283325, 1.5741009712219238, 1.647077202796936, 1.7200535535812378, 1.7930299043655396, 1.8660063743591309, 1.9389827251434326, 2.0119590759277344, 2.084935426712036, 2.157911777496338, 2.2308881282806396, 2.3038644790649414, 2.376840829849243, 2.449817180633545, 2.5227935314178467, 2.5957698822021484, 2.6687464714050293, 2.741722822189331, 2.814699172973633]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 4.0, 17.0, 12.0, 17.0, 22.0, 25.0, 58.0, 146.0, 256.0, 681.0, 1589.0, 4692.0, 15615.0, 61018.0, 257586.0, 470802.0, 177988.0, 41372.0, 10917.0, 3424.0, 1258.0, 582.0, 236.0, 96.0, 62.0, 34.0, 10.0, 14.0, 9.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.751953125, -2.658233642578125, -2.56451416015625, -2.470794677734375, -2.3770751953125, -2.283355712890625, -2.18963623046875, -2.095916748046875, -2.002197265625, -1.908477783203125, -1.81475830078125, -1.721038818359375, -1.6273193359375, -1.533599853515625, -1.43988037109375, -1.346160888671875, -1.25244140625, -1.158721923828125, -1.06500244140625, -0.971282958984375, -0.8775634765625, -0.783843994140625, -0.69012451171875, -0.596405029296875, -0.502685546875, -0.408966064453125, -0.31524658203125, -0.221527099609375, -0.1278076171875, -0.034088134765625, 0.05963134765625, 0.153350830078125, 0.2470703125, 0.340789794921875, 0.43450927734375, 0.528228759765625, 0.6219482421875, 0.715667724609375, 0.80938720703125, 0.903106689453125, 0.996826171875, 1.090545654296875, 1.18426513671875, 1.277984619140625, 1.3717041015625, 1.465423583984375, 1.55914306640625, 1.652862548828125, 1.74658203125, 1.840301513671875, 1.93402099609375, 2.027740478515625, 2.1214599609375, 2.215179443359375, 2.30889892578125, 2.402618408203125, 2.496337890625, 2.590057373046875, 2.68377685546875, 2.777496337890625, 2.8712158203125, 2.964935302734375, 3.05865478515625, 3.152374267578125, 3.24609375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 10.0, 11.0, 9.0, 11.0, 11.0, 22.0, 20.0, 26.0, 34.0, 42.0, 26.0, 49.0, 47.0, 56.0, 53.0, 51.0, 48.0, 38.0, 61.0, 61.0, 44.0, 50.0, 36.0, 36.0, 36.0, 27.0, 13.0, 7.0, 10.0, 13.0, 7.0, 10.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.95166015625, -0.924560546875, -0.8974609375, -0.870361328125, -0.84326171875, -0.816162109375, -0.7890625, -0.761962890625, -0.73486328125, -0.707763671875, -0.6806640625, -0.653564453125, -0.62646484375, -0.599365234375, -0.572265625, -0.545166015625, -0.51806640625, -0.490966796875, -0.4638671875, -0.436767578125, -0.40966796875, -0.382568359375, -0.35546875, -0.328369140625, -0.30126953125, -0.274169921875, -0.2470703125, -0.219970703125, -0.19287109375, -0.165771484375, -0.138671875, -0.111572265625, -0.08447265625, -0.057373046875, -0.0302734375, -0.003173828125, 0.02392578125, 0.051025390625, 0.078125, 0.105224609375, 0.13232421875, 0.159423828125, 0.1865234375, 0.213623046875, 0.24072265625, 0.267822265625, 0.294921875, 0.322021484375, 0.34912109375, 0.376220703125, 0.4033203125, 0.430419921875, 0.45751953125, 0.484619140625, 0.51171875, 0.538818359375, 0.56591796875, 0.593017578125, 0.6201171875, 0.647216796875, 0.67431640625, 0.701416015625, 0.728515625, 0.755615234375, 0.78271484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 15.0, 23.0, 20.0, 59.0, 86.0, 168.0, 326.0, 798.0, 2198.0, 7265.0, 33364.0, 225980.0, 622885.0, 126617.0, 20822.0, 5080.0, 1557.0, 636.0, 266.0, 158.0, 78.0, 40.0, 31.0, 13.0, 8.0, 10.0, 14.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.103546142578125, -3.98052978515625, -3.857513427734375, -3.7344970703125, -3.611480712890625, -3.48846435546875, -3.365447998046875, -3.242431640625, -3.119415283203125, -2.99639892578125, -2.873382568359375, -2.7503662109375, -2.627349853515625, -2.50433349609375, -2.381317138671875, -2.25830078125, -2.135284423828125, -2.01226806640625, -1.889251708984375, -1.7662353515625, -1.643218994140625, -1.52020263671875, -1.397186279296875, -1.274169921875, -1.151153564453125, -1.02813720703125, -0.905120849609375, -0.7821044921875, -0.659088134765625, -0.53607177734375, -0.413055419921875, -0.2900390625, -0.167022705078125, -0.04400634765625, 0.079010009765625, 0.2020263671875, 0.325042724609375, 0.44805908203125, 0.571075439453125, 0.694091796875, 0.817108154296875, 0.94012451171875, 1.063140869140625, 1.1861572265625, 1.309173583984375, 1.43218994140625, 1.555206298828125, 1.67822265625, 1.801239013671875, 1.92425537109375, 2.047271728515625, 2.1702880859375, 2.293304443359375, 2.41632080078125, 2.539337158203125, 2.662353515625, 2.785369873046875, 2.90838623046875, 3.031402587890625, 3.1544189453125, 3.277435302734375, 3.40045166015625, 3.523468017578125, 3.646484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 5.0, 9.0, 12.0, 14.0, 30.0, 25.0, 35.0, 30.0, 44.0, 55.0, 64.0, 65.0, 63.0, 67.0, 60.0, 56.0, 68.0, 59.0, 48.0, 38.0, 37.0, 28.0, 21.0, 21.0, 16.0, 4.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.6973876953125, -5.515869140625, -5.3343505859375, -5.15283203125, -4.9713134765625, -4.789794921875, -4.6082763671875, -4.4267578125, -4.2452392578125, -4.063720703125, -3.8822021484375, -3.70068359375, -3.5191650390625, -3.337646484375, -3.1561279296875, -2.974609375, -2.7930908203125, -2.611572265625, -2.4300537109375, -2.24853515625, -2.0670166015625, -1.885498046875, -1.7039794921875, -1.5224609375, -1.3409423828125, -1.159423828125, -0.9779052734375, -0.79638671875, -0.6148681640625, -0.433349609375, -0.2518310546875, -0.0703125, 0.1112060546875, 0.292724609375, 0.4742431640625, 0.65576171875, 0.8372802734375, 1.018798828125, 1.2003173828125, 1.3818359375, 1.5633544921875, 1.744873046875, 1.9263916015625, 2.10791015625, 2.2894287109375, 2.470947265625, 2.6524658203125, 2.833984375, 3.0155029296875, 3.197021484375, 3.3785400390625, 3.56005859375, 3.7415771484375, 3.923095703125, 4.1046142578125, 4.2861328125, 4.4676513671875, 4.649169921875, 4.8306884765625, 5.01220703125, 5.1937255859375, 5.375244140625, 5.5567626953125, 5.73828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 16.0, 29.0, 44.0, 98.0, 237.0, 777.0, 6991.0, 667853.0, 366382.0, 5068.0, 673.0, 197.0, 84.0, 50.0, 33.0, 5.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.52734375, -7.35205078125, -7.1767578125, -7.00146484375, -6.826171875, -6.65087890625, -6.4755859375, -6.30029296875, -6.125, -5.94970703125, -5.7744140625, -5.59912109375, -5.423828125, -5.24853515625, -5.0732421875, -4.89794921875, -4.72265625, -4.54736328125, -4.3720703125, -4.19677734375, -4.021484375, -3.84619140625, -3.6708984375, -3.49560546875, -3.3203125, -3.14501953125, -2.9697265625, -2.79443359375, -2.619140625, -2.44384765625, -2.2685546875, -2.09326171875, -1.91796875, -1.74267578125, -1.5673828125, -1.39208984375, -1.216796875, -1.04150390625, -0.8662109375, -0.69091796875, -0.515625, -0.34033203125, -0.1650390625, 0.01025390625, 0.185546875, 0.36083984375, 0.5361328125, 0.71142578125, 0.88671875, 1.06201171875, 1.2373046875, 1.41259765625, 1.587890625, 1.76318359375, 1.9384765625, 2.11376953125, 2.2890625, 2.46435546875, 2.6396484375, 2.81494140625, 2.990234375, 3.16552734375, 3.3408203125, 3.51611328125, 3.69140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 13.0, 15.0, 13.0, 22.0, 28.0, 55.0, 79.0, 98.0, 129.0, 136.0, 102.0, 86.0, 79.0, 45.0, 36.0, 20.0, 12.0, 8.0, 12.0, 5.0, 1.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002484321594238281, -0.00023790448904037476, -0.0002273768186569214, -0.00021684914827346802, -0.00020632147789001465, -0.00019579380750656128, -0.0001852661371231079, -0.00017473846673965454, -0.00016421079635620117, -0.0001536831259727478, -0.00014315545558929443, -0.00013262778520584106, -0.0001221001148223877, -0.00011157244443893433, -0.00010104477405548096, -9.051710367202759e-05, -7.998943328857422e-05, -6.946176290512085e-05, -5.893409252166748e-05, -4.840642213821411e-05, -3.787875175476074e-05, -2.7351081371307373e-05, -1.6823410987854004e-05, -6.295740604400635e-06, 4.231929779052734e-06, 1.4759600162506104e-05, 2.5287270545959473e-05, 3.581494092941284e-05, 4.634261131286621e-05, 5.687028169631958e-05, 6.739795207977295e-05, 7.792562246322632e-05, 8.845329284667969e-05, 9.898096323013306e-05, 0.00010950863361358643, 0.0001200363039970398, 0.00013056397438049316, 0.00014109164476394653, 0.0001516193151473999, 0.00016214698553085327, 0.00017267465591430664, 0.00018320232629776, 0.00019372999668121338, 0.00020425766706466675, 0.00021478533744812012, 0.00022531300783157349, 0.00023584067821502686, 0.0002463683485984802, 0.0002568960189819336, 0.00026742368936538696, 0.00027795135974884033, 0.0002884790301322937, 0.00029900670051574707, 0.00030953437089920044, 0.0003200620412826538, 0.0003305897116661072, 0.00034111738204956055, 0.0003516450524330139, 0.0003621727228164673, 0.00037270039319992065, 0.000383228063583374, 0.0003937557339668274, 0.00040428340435028076, 0.00041481107473373413, 0.0004253387451171875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 12.0, 18.0, 36.0, 77.0, 122.0, 241.0, 808.0, 7681.0, 764613.0, 269840.0, 4062.0, 619.0, 221.0, 88.0, 52.0, 22.0, 22.0, 9.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2734375, -5.10272216796875, -4.9320068359375, -4.76129150390625, -4.590576171875, -4.41986083984375, -4.2491455078125, -4.07843017578125, -3.90771484375, -3.73699951171875, -3.5662841796875, -3.39556884765625, -3.224853515625, -3.05413818359375, -2.8834228515625, -2.71270751953125, -2.5419921875, -2.37127685546875, -2.2005615234375, -2.02984619140625, -1.859130859375, -1.68841552734375, -1.5177001953125, -1.34698486328125, -1.17626953125, -1.00555419921875, -0.8348388671875, -0.66412353515625, -0.493408203125, -0.32269287109375, -0.1519775390625, 0.01873779296875, 0.189453125, 0.36016845703125, 0.5308837890625, 0.70159912109375, 0.872314453125, 1.04302978515625, 1.2137451171875, 1.38446044921875, 1.55517578125, 1.72589111328125, 1.8966064453125, 2.06732177734375, 2.238037109375, 2.40875244140625, 2.5794677734375, 2.75018310546875, 2.9208984375, 3.09161376953125, 3.2623291015625, 3.43304443359375, 3.603759765625, 3.77447509765625, 3.9451904296875, 4.11590576171875, 4.28662109375, 4.45733642578125, 4.6280517578125, 4.79876708984375, 4.969482421875, 5.14019775390625, 5.3109130859375, 5.48162841796875, 5.65234375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 22.0, 45.0, 121.0, 219.0, 258.0, 191.0, 77.0, 33.0, 16.0, 8.0, 8.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.814453125, -1.637542724609375, -1.46063232421875, -1.283721923828125, -1.1068115234375, -0.929901123046875, -0.75299072265625, -0.576080322265625, -0.399169921875, -0.222259521484375, -0.04534912109375, 0.131561279296875, 0.3084716796875, 0.485382080078125, 0.66229248046875, 0.839202880859375, 1.01611328125, 1.193023681640625, 1.36993408203125, 1.546844482421875, 1.7237548828125, 1.900665283203125, 2.07757568359375, 2.254486083984375, 2.431396484375, 2.608306884765625, 2.78521728515625, 2.962127685546875, 3.1390380859375, 3.315948486328125, 3.49285888671875, 3.669769287109375, 3.8466796875, 4.023590087890625, 4.20050048828125, 4.377410888671875, 4.5543212890625, 4.731231689453125, 4.90814208984375, 5.085052490234375, 5.261962890625, 5.438873291015625, 5.61578369140625, 5.792694091796875, 5.9696044921875, 6.146514892578125, 6.32342529296875, 6.500335693359375, 6.67724609375, 6.854156494140625, 7.03106689453125, 7.207977294921875, 7.3848876953125, 7.561798095703125, 7.73870849609375, 7.915618896484375, 8.092529296875, 8.269439697265625, 8.44635009765625, 8.623260498046875, 8.8001708984375, 8.977081298828125, 9.15399169921875, 9.330902099609375, 9.5078125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 10.0, 20.0, 50.0, 103.0, 186.0, 228.0, 183.0, 120.0, 50.0, 25.0, 10.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.940765380859375, -56.25018310546875, -54.55960464477539, -52.869022369384766, -51.178443908691406, -49.48786163330078, -47.797279357910156, -46.10669708251953, -44.41611862182617, -42.72553634643555, -41.03495788574219, -39.34437561035156, -37.65379333496094, -35.96321487426758, -34.27263259887695, -32.582054138183594, -30.89147186279297, -29.200891494750977, -27.510311126708984, -25.81972885131836, -24.129148483276367, -22.438568115234375, -20.74798583984375, -19.057405471801758, -17.366825103759766, -15.676244735717773, -13.985663414001465, -12.295082092285156, -10.604501724243164, -8.913921356201172, -7.223340034484863, -5.532758712768555, -3.8421783447265625, -2.151597499847412, -0.4610166549682617, 1.2295641899108887, 2.920145034790039, 4.610725402832031, 6.30130672454834, 7.991888046264648, 9.68246841430664, 11.373048782348633, 13.063630104064941, 14.75421142578125, 16.444791793823242, 18.135372161865234, 19.82595443725586, 21.51653480529785, 23.207115173339844, 24.897695541381836, 26.588275909423828, 28.278858184814453, 29.969438552856445, 31.660018920898438, 33.35060119628906, 35.04118347167969, 36.73176193237305, 38.42234420776367, 40.11292266845703, 41.803504943847656, 43.49408721923828, 45.18466567993164, 46.875247955322266, 48.565826416015625, 50.25640869140625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 4.0, 4.0, 10.0, 11.0, 14.0, 15.0, 16.0, 23.0, 14.0, 39.0, 36.0, 46.0, 54.0, 45.0, 42.0, 58.0, 47.0, 66.0, 64.0, 63.0, 46.0, 50.0, 37.0, 38.0, 32.0, 20.0, 24.0, 20.0, 13.0, 17.0, 9.0, 14.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.285371780395508, -25.575790405273438, -24.866209030151367, -24.156627655029297, -23.447046279907227, -22.737464904785156, -22.027883529663086, -21.318302154541016, -20.608720779418945, -19.899139404296875, -19.189558029174805, -18.479976654052734, -17.770395278930664, -17.060813903808594, -16.351232528686523, -15.641651153564453, -14.932069778442383, -14.222488403320312, -13.512907028198242, -12.803325653076172, -12.093744277954102, -11.384162902832031, -10.674581527709961, -9.96500015258789, -9.25541877746582, -8.54583740234375, -7.83625602722168, -7.126674652099609, -6.417093276977539, -5.707511901855469, -4.997930526733398, -4.288349151611328, -3.5787696838378906, -2.8691883087158203, -2.15960693359375, -1.4500255584716797, -0.7404441833496094, -0.030862808227539062, 0.6787185668945312, 1.3882999420166016, 2.097881317138672, 2.807462692260742, 3.5170440673828125, 4.226625442504883, 4.936206817626953, 5.645788192749023, 6.355369567871094, 7.064950942993164, 7.774532318115234, 8.484113693237305, 9.193695068359375, 9.903276443481445, 10.612857818603516, 11.322439193725586, 12.032020568847656, 12.741601943969727, 13.451183319091797, 14.160764694213867, 14.870346069335938, 15.579927444458008, 16.289508819580078, 16.99909019470215, 17.70867156982422, 18.41825294494629, 19.12783432006836]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 0.0, 4.0, 12.0, 7.0, 19.0, 14.0, 30.0, 72.0, 140.0, 309.0, 752.0, 2063.0, 9281.0, 4119988.0, 54457.0, 4836.0, 1347.0, 505.0, 210.0, 86.0, 56.0, 27.0, 23.0, 16.0, 9.0, 9.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -12.0096435546875, -11.683349609375, -11.3570556640625, -11.03076171875, -10.7044677734375, -10.378173828125, -10.0518798828125, -9.7255859375, -9.3992919921875, -9.072998046875, -8.7467041015625, -8.42041015625, -8.0941162109375, -7.767822265625, -7.4415283203125, -7.115234375, -6.7889404296875, -6.462646484375, -6.1363525390625, -5.81005859375, -5.4837646484375, -5.157470703125, -4.8311767578125, -4.5048828125, -4.1785888671875, -3.852294921875, -3.5260009765625, -3.19970703125, -2.8734130859375, -2.547119140625, -2.2208251953125, -1.89453125, -1.5682373046875, -1.241943359375, -0.9156494140625, -0.58935546875, -0.2630615234375, 0.063232421875, 0.3895263671875, 0.7158203125, 1.0421142578125, 1.368408203125, 1.6947021484375, 2.02099609375, 2.3472900390625, 2.673583984375, 2.9998779296875, 3.326171875, 3.6524658203125, 3.978759765625, 4.3050537109375, 4.63134765625, 4.9576416015625, 5.283935546875, 5.6102294921875, 5.9365234375, 6.2628173828125, 6.589111328125, 6.9154052734375, 7.24169921875, 7.5679931640625, 7.894287109375, 8.2205810546875, 8.546875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 4.0, 14.0, 13.0, 20.0, 24.0, 21.0, 33.0, 25.0, 53.0, 52.0, 48.0, 67.0, 58.0, 70.0, 71.0, 68.0, 66.0, 46.0, 48.0, 28.0, 32.0, 22.0, 22.0, 18.0, 12.0, 15.0, 7.0, 4.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.154296875, -1.1186676025390625, -1.083038330078125, -1.0474090576171875, -1.01177978515625, -0.9761505126953125, -0.940521240234375, -0.9048919677734375, -0.8692626953125, -0.8336334228515625, -0.798004150390625, -0.7623748779296875, -0.72674560546875, -0.6911163330078125, -0.655487060546875, -0.6198577880859375, -0.584228515625, -0.5485992431640625, -0.512969970703125, -0.4773406982421875, -0.44171142578125, -0.4060821533203125, -0.370452880859375, -0.3348236083984375, -0.2991943359375, -0.2635650634765625, -0.227935791015625, -0.1923065185546875, -0.15667724609375, -0.1210479736328125, -0.085418701171875, -0.0497894287109375, -0.01416015625, 0.0214691162109375, 0.057098388671875, 0.0927276611328125, 0.12835693359375, 0.1639862060546875, 0.199615478515625, 0.2352447509765625, 0.2708740234375, 0.3065032958984375, 0.342132568359375, 0.3777618408203125, 0.41339111328125, 0.4490203857421875, 0.484649658203125, 0.5202789306640625, 0.555908203125, 0.5915374755859375, 0.627166748046875, 0.6627960205078125, 0.69842529296875, 0.7340545654296875, 0.769683837890625, 0.8053131103515625, 0.8409423828125, 0.8765716552734375, 0.912200927734375, 0.9478302001953125, 0.98345947265625, 1.0190887451171875, 1.054718017578125, 1.0903472900390625, 1.1259765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 10.0, 10.0, 7.0, 11.0, 16.0, 31.0, 27.0, 45.0, 55.0, 68.0, 114.0, 169.0, 249.0, 512.0, 1347.0, 4498.0, 22864.0, 4058779.0, 90962.0, 10051.0, 2483.0, 889.0, 422.0, 198.0, 105.0, 96.0, 69.0, 43.0, 42.0, 32.0, 23.0, 12.0, 17.0, 9.0, 3.0, 4.0, 0.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.17578125, -6.93475341796875, -6.6937255859375, -6.45269775390625, -6.211669921875, -5.97064208984375, -5.7296142578125, -5.48858642578125, -5.24755859375, -5.00653076171875, -4.7655029296875, -4.52447509765625, -4.283447265625, -4.04241943359375, -3.8013916015625, -3.56036376953125, -3.3193359375, -3.07830810546875, -2.8372802734375, -2.59625244140625, -2.355224609375, -2.11419677734375, -1.8731689453125, -1.63214111328125, -1.39111328125, -1.15008544921875, -0.9090576171875, -0.66802978515625, -0.427001953125, -0.18597412109375, 0.0550537109375, 0.29608154296875, 0.537109375, 0.77813720703125, 1.0191650390625, 1.26019287109375, 1.501220703125, 1.74224853515625, 1.9832763671875, 2.22430419921875, 2.46533203125, 2.70635986328125, 2.9473876953125, 3.18841552734375, 3.429443359375, 3.67047119140625, 3.9114990234375, 4.15252685546875, 4.3935546875, 4.63458251953125, 4.8756103515625, 5.11663818359375, 5.357666015625, 5.59869384765625, 5.8397216796875, 6.08074951171875, 6.32177734375, 6.56280517578125, 6.8038330078125, 7.04486083984375, 7.285888671875, 7.52691650390625, 7.7679443359375, 8.00897216796875, 8.25]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 7.0, 6.0, 20.0, 34.0, 74.0, 3641.0, 197.0, 48.0, 19.0, 14.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6650390625, -1.6029510498046875, -1.540863037109375, -1.4787750244140625, -1.41668701171875, -1.3545989990234375, -1.292510986328125, -1.2304229736328125, -1.1683349609375, -1.1062469482421875, -1.044158935546875, -0.9820709228515625, -0.91998291015625, -0.8578948974609375, -0.795806884765625, -0.7337188720703125, -0.671630859375, -0.6095428466796875, -0.547454833984375, -0.4853668212890625, -0.42327880859375, -0.3611907958984375, -0.299102783203125, -0.2370147705078125, -0.1749267578125, -0.1128387451171875, -0.050750732421875, 0.0113372802734375, 0.07342529296875, 0.1355133056640625, 0.197601318359375, 0.2596893310546875, 0.32177734375, 0.3838653564453125, 0.445953369140625, 0.5080413818359375, 0.57012939453125, 0.6322174072265625, 0.694305419921875, 0.7563934326171875, 0.8184814453125, 0.8805694580078125, 0.942657470703125, 1.0047454833984375, 1.06683349609375, 1.1289215087890625, 1.191009521484375, 1.2530975341796875, 1.315185546875, 1.3772735595703125, 1.439361572265625, 1.5014495849609375, 1.56353759765625, 1.6256256103515625, 1.687713623046875, 1.7498016357421875, 1.8118896484375, 1.8739776611328125, 1.936065673828125, 1.9981536865234375, 2.06024169921875, 2.1223297119140625, 2.184417724609375, 2.2465057373046875, 2.30859375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 7.0, 4.0, 12.0, 13.0, 17.0, 24.0, 32.0, 38.0, 41.0, 57.0, 79.0, 68.0, 65.0, 73.0, 94.0, 68.0, 68.0, 59.0, 51.0, 35.0, 23.0, 14.0, 18.0, 9.0, 11.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.427734375, -3.3411476612091064, -3.254560947418213, -3.1679739952087402, -3.0813872814178467, -2.994800567626953, -2.9082138538360596, -2.821627140045166, -2.7350401878356934, -2.6484534740448, -2.5618667602539062, -2.4752798080444336, -2.38869309425354, -2.3021063804626465, -2.215519666671753, -2.1289329528808594, -2.0423460006713867, -1.9557592868804932, -1.86917245388031, -1.7825857400894165, -1.6959989070892334, -1.6094121932983398, -1.5228254795074463, -1.4362386465072632, -1.3496520519256592, -1.2630653381347656, -1.1764785051345825, -1.089891791343689, -1.0033049583435059, -0.9167182445526123, -0.830131471157074, -0.7435446977615356, -0.6569578647613525, -0.5703710913658142, -0.4837843179702759, -0.39719757437705994, -0.3106108009815216, -0.22402402758598328, -0.13743728399276733, -0.050850510597229004, 0.035736262798309326, 0.12232302874326706, 0.2089097946882248, 0.29549655318260193, 0.38208332657814026, 0.4686700999736786, 0.5552568435668945, 0.6418436169624329, 0.7284303903579712, 0.8150171637535095, 0.9016039371490479, 0.9881906509399414, 1.0747774839401245, 1.161364197731018, 1.2479510307312012, 1.3345377445220947, 1.4211244583129883, 1.5077111721038818, 1.594298005104065, 1.6808847188949585, 1.7674715518951416, 1.8540582656860352, 1.9406449794769287, 2.0272316932678223, 2.113818645477295]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 13.0, 13.0, 6.0, 12.0, 13.0, 15.0, 18.0, 22.0, 21.0, 33.0, 33.0, 40.0, 34.0, 38.0, 39.0, 42.0, 57.0, 49.0, 39.0, 38.0, 32.0, 42.0, 32.0, 44.0, 30.0, 28.0, 34.0, 21.0, 24.0, 20.0, 15.0, 18.0, 12.0, 18.0, 5.0, 12.0, 11.0, 3.0, 2.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.3478598594665527, -2.2728610038757324, -2.197861909866333, -2.1228628158569336, -2.0478639602661133, -1.9728649854660034, -1.8978660106658936, -1.8228670358657837, -1.7478680610656738, -1.672869086265564, -1.597870111465454, -1.5228711366653442, -1.4478721618652344, -1.3728731870651245, -1.2978742122650146, -1.2228752374649048, -1.147876262664795, -1.072877287864685, -0.9978783130645752, -0.9228793382644653, -0.8478803634643555, -0.7728813886642456, -0.6978824138641357, -0.6228834390640259, -0.547884464263916, -0.47288548946380615, -0.3978865146636963, -0.3228875398635864, -0.24788856506347656, -0.1728895902633667, -0.09789061546325684, -0.022891640663146973, 0.05210709571838379, 0.12710607051849365, 0.20210504531860352, 0.2771040201187134, 0.35210299491882324, 0.4271019697189331, 0.502100944519043, 0.5770999193191528, 0.6520988941192627, 0.7270978689193726, 0.8020968437194824, 0.8770958185195923, 0.9520947933197021, 1.027093768119812, 1.1020927429199219, 1.1770917177200317, 1.2520906925201416, 1.3270896673202515, 1.4020886421203613, 1.4770876169204712, 1.552086591720581, 1.627085566520691, 1.7020845413208008, 1.7770835161209106, 1.8520824909210205, 1.9270814657211304, 2.0020804405212402, 2.0770792961120605, 2.15207839012146, 2.2270774841308594, 2.3020763397216797, 2.3770751953125, 2.4520742893218994]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 1.0, 8.0, 6.0, 7.0, 7.0, 19.0, 24.0, 33.0, 64.0, 88.0, 157.0, 289.0, 590.0, 1078.0, 2492.0, 5797.0, 15155.0, 45330.0, 148427.0, 386642.0, 297648.0, 96095.0, 30043.0, 10500.0, 4199.0, 1877.0, 892.0, 481.0, 236.0, 138.0, 75.0, 60.0, 28.0, 25.0, 11.0, 13.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-3.119140625, -3.034423828125, -2.94970703125, -2.864990234375, -2.7802734375, -2.695556640625, -2.61083984375, -2.526123046875, -2.44140625, -2.356689453125, -2.27197265625, -2.187255859375, -2.1025390625, -2.017822265625, -1.93310546875, -1.848388671875, -1.763671875, -1.678955078125, -1.59423828125, -1.509521484375, -1.4248046875, -1.340087890625, -1.25537109375, -1.170654296875, -1.0859375, -1.001220703125, -0.91650390625, -0.831787109375, -0.7470703125, -0.662353515625, -0.57763671875, -0.492919921875, -0.408203125, -0.323486328125, -0.23876953125, -0.154052734375, -0.0693359375, 0.015380859375, 0.10009765625, 0.184814453125, 0.26953125, 0.354248046875, 0.43896484375, 0.523681640625, 0.6083984375, 0.693115234375, 0.77783203125, 0.862548828125, 0.947265625, 1.031982421875, 1.11669921875, 1.201416015625, 1.2861328125, 1.370849609375, 1.45556640625, 1.540283203125, 1.625, 1.709716796875, 1.79443359375, 1.879150390625, 1.9638671875, 2.048583984375, 2.13330078125, 2.218017578125, 2.302734375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 4.0, 8.0, 3.0, 3.0, 11.0, 16.0, 20.0, 11.0, 18.0, 18.0, 31.0, 32.0, 36.0, 36.0, 51.0, 48.0, 55.0, 54.0, 56.0, 54.0, 54.0, 50.0, 48.0, 40.0, 35.0, 41.0, 28.0, 30.0, 23.0, 13.0, 13.0, 10.0, 9.0, 11.0, 4.0, 2.0, 7.0, 1.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.203125, -1.168212890625, -1.13330078125, -1.098388671875, -1.0634765625, -1.028564453125, -0.99365234375, -0.958740234375, -0.923828125, -0.888916015625, -0.85400390625, -0.819091796875, -0.7841796875, -0.749267578125, -0.71435546875, -0.679443359375, -0.64453125, -0.609619140625, -0.57470703125, -0.539794921875, -0.5048828125, -0.469970703125, -0.43505859375, -0.400146484375, -0.365234375, -0.330322265625, -0.29541015625, -0.260498046875, -0.2255859375, -0.190673828125, -0.15576171875, -0.120849609375, -0.0859375, -0.051025390625, -0.01611328125, 0.018798828125, 0.0537109375, 0.088623046875, 0.12353515625, 0.158447265625, 0.193359375, 0.228271484375, 0.26318359375, 0.298095703125, 0.3330078125, 0.367919921875, 0.40283203125, 0.437744140625, 0.47265625, 0.507568359375, 0.54248046875, 0.577392578125, 0.6123046875, 0.647216796875, 0.68212890625, 0.717041015625, 0.751953125, 0.786865234375, 0.82177734375, 0.856689453125, 0.8916015625, 0.926513671875, 0.96142578125, 0.996337890625, 1.03125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 5.0, 11.0, 23.0, 28.0, 37.0, 55.0, 116.0, 212.0, 400.0, 859.0, 2287.0, 8027.0, 40721.0, 334975.0, 570693.0, 72603.0, 12197.0, 3192.0, 1084.0, 486.0, 231.0, 121.0, 64.0, 30.0, 29.0, 20.0, 13.0, 7.0, 3.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.10418701171875, -3.9583740234375, -3.81256103515625, -3.666748046875, -3.52093505859375, -3.3751220703125, -3.22930908203125, -3.08349609375, -2.93768310546875, -2.7918701171875, -2.64605712890625, -2.500244140625, -2.35443115234375, -2.2086181640625, -2.06280517578125, -1.9169921875, -1.77117919921875, -1.6253662109375, -1.47955322265625, -1.333740234375, -1.18792724609375, -1.0421142578125, -0.89630126953125, -0.75048828125, -0.60467529296875, -0.4588623046875, -0.31304931640625, -0.167236328125, -0.02142333984375, 0.1243896484375, 0.27020263671875, 0.416015625, 0.56182861328125, 0.7076416015625, 0.85345458984375, 0.999267578125, 1.14508056640625, 1.2908935546875, 1.43670654296875, 1.58251953125, 1.72833251953125, 1.8741455078125, 2.01995849609375, 2.165771484375, 2.31158447265625, 2.4573974609375, 2.60321044921875, 2.7490234375, 2.89483642578125, 3.0406494140625, 3.18646240234375, 3.332275390625, 3.47808837890625, 3.6239013671875, 3.76971435546875, 3.91552734375, 4.06134033203125, 4.2071533203125, 4.35296630859375, 4.498779296875, 4.64459228515625, 4.7904052734375, 4.93621826171875, 5.08203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 8.0, 18.0, 19.0, 23.0, 26.0, 36.0, 44.0, 46.0, 46.0, 51.0, 62.0, 58.0, 57.0, 58.0, 54.0, 50.0, 64.0, 46.0, 43.0, 32.0, 37.0, 28.0, 25.0, 19.0, 13.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6796875, -6.4505615234375, -6.221435546875, -5.9923095703125, -5.76318359375, -5.5340576171875, -5.304931640625, -5.0758056640625, -4.8466796875, -4.6175537109375, -4.388427734375, -4.1593017578125, -3.93017578125, -3.7010498046875, -3.471923828125, -3.2427978515625, -3.013671875, -2.7845458984375, -2.555419921875, -2.3262939453125, -2.09716796875, -1.8680419921875, -1.638916015625, -1.4097900390625, -1.1806640625, -0.9515380859375, -0.722412109375, -0.4932861328125, -0.26416015625, -0.0350341796875, 0.194091796875, 0.4232177734375, 0.65234375, 0.8814697265625, 1.110595703125, 1.3397216796875, 1.56884765625, 1.7979736328125, 2.027099609375, 2.2562255859375, 2.4853515625, 2.7144775390625, 2.943603515625, 3.1727294921875, 3.40185546875, 3.6309814453125, 3.860107421875, 4.0892333984375, 4.318359375, 4.5474853515625, 4.776611328125, 5.0057373046875, 5.23486328125, 5.4639892578125, 5.693115234375, 5.9222412109375, 6.1513671875, 6.3804931640625, 6.609619140625, 6.8387451171875, 7.06787109375, 7.2969970703125, 7.526123046875, 7.7552490234375, 7.984375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 12.0, 3.0, 8.0, 14.0, 16.0, 40.0, 72.0, 120.0, 212.0, 548.0, 1716.0, 11132.0, 472981.0, 546893.0, 11970.0, 1756.0, 535.0, 237.0, 124.0, 64.0, 42.0, 17.0, 13.0, 8.0, 5.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08203125, -4.92327880859375, -4.7645263671875, -4.60577392578125, -4.447021484375, -4.28826904296875, -4.1295166015625, -3.97076416015625, -3.81201171875, -3.65325927734375, -3.4945068359375, -3.33575439453125, -3.177001953125, -3.01824951171875, -2.8594970703125, -2.70074462890625, -2.5419921875, -2.38323974609375, -2.2244873046875, -2.06573486328125, -1.906982421875, -1.74822998046875, -1.5894775390625, -1.43072509765625, -1.27197265625, -1.11322021484375, -0.9544677734375, -0.79571533203125, -0.636962890625, -0.47821044921875, -0.3194580078125, -0.16070556640625, -0.001953125, 0.15679931640625, 0.3155517578125, 0.47430419921875, 0.633056640625, 0.79180908203125, 0.9505615234375, 1.10931396484375, 1.26806640625, 1.42681884765625, 1.5855712890625, 1.74432373046875, 1.903076171875, 2.06182861328125, 2.2205810546875, 2.37933349609375, 2.5380859375, 2.69683837890625, 2.8555908203125, 3.01434326171875, 3.173095703125, 3.33184814453125, 3.4906005859375, 3.64935302734375, 3.80810546875, 3.96685791015625, 4.1256103515625, 4.28436279296875, 4.443115234375, 4.60186767578125, 4.7606201171875, 4.91937255859375, 5.078125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 3.0, 6.0, 9.0, 27.0, 30.0, 50.0, 49.0, 103.0, 118.0, 128.0, 145.0, 107.0, 77.0, 49.0, 31.0, 21.0, 15.0, 9.0, 11.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005693435668945312, -0.0005553476512432098, -0.0005413517355918884, -0.000527355819940567, -0.0005133599042892456, -0.0004993639886379242, -0.0004853680729866028, -0.00047137215733528137, -0.00045737624168395996, -0.00044338032603263855, -0.00042938441038131714, -0.00041538849472999573, -0.0004013925790786743, -0.0003873966634273529, -0.0003734007477760315, -0.0003594048321247101, -0.00034540891647338867, -0.00033141300082206726, -0.00031741708517074585, -0.00030342116951942444, -0.00028942525386810303, -0.0002754293382167816, -0.0002614334225654602, -0.0002474375069141388, -0.00023344159126281738, -0.00021944567561149597, -0.00020544975996017456, -0.00019145384430885315, -0.00017745792865753174, -0.00016346201300621033, -0.00014946609735488892, -0.0001354701817035675, -0.0001214742660522461, -0.00010747835040092468, -9.348243474960327e-05, -7.948651909828186e-05, -6.549060344696045e-05, -5.149468779563904e-05, -3.749877214431763e-05, -2.3502856492996216e-05, -9.506940841674805e-06, 4.4889748096466064e-06, 1.8484890460968018e-05, 3.248080611228943e-05, 4.647672176361084e-05, 6.047263741493225e-05, 7.446855306625366e-05, 8.846446871757507e-05, 0.00010246038436889648, 0.0001164563000202179, 0.0001304522156715393, 0.00014444813132286072, 0.00015844404697418213, 0.00017243996262550354, 0.00018643587827682495, 0.00020043179392814636, 0.00021442770957946777, 0.00022842362523078918, 0.0002424195408821106, 0.000256415456533432, 0.0002704113721847534, 0.00028440728783607483, 0.00029840320348739624, 0.00031239911913871765, 0.00032639503479003906]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 6.0, 9.0, 15.0, 16.0, 48.0, 68.0, 115.0, 237.0, 450.0, 1078.0, 2924.0, 11790.0, 89217.0, 795351.0, 126864.0, 14523.0, 3607.0, 1206.0, 494.0, 239.0, 111.0, 74.0, 40.0, 28.0, 10.0, 8.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.970703125, -2.8765869140625, -2.782470703125, -2.6883544921875, -2.59423828125, -2.5001220703125, -2.406005859375, -2.3118896484375, -2.2177734375, -2.1236572265625, -2.029541015625, -1.9354248046875, -1.84130859375, -1.7471923828125, -1.653076171875, -1.5589599609375, -1.46484375, -1.3707275390625, -1.276611328125, -1.1824951171875, -1.08837890625, -0.9942626953125, -0.900146484375, -0.8060302734375, -0.7119140625, -0.6177978515625, -0.523681640625, -0.4295654296875, -0.33544921875, -0.2413330078125, -0.147216796875, -0.0531005859375, 0.041015625, 0.1351318359375, 0.229248046875, 0.3233642578125, 0.41748046875, 0.5115966796875, 0.605712890625, 0.6998291015625, 0.7939453125, 0.8880615234375, 0.982177734375, 1.0762939453125, 1.17041015625, 1.2645263671875, 1.358642578125, 1.4527587890625, 1.546875, 1.6409912109375, 1.735107421875, 1.8292236328125, 1.92333984375, 2.0174560546875, 2.111572265625, 2.2056884765625, 2.2998046875, 2.3939208984375, 2.488037109375, 2.5821533203125, 2.67626953125, 2.7703857421875, 2.864501953125, 2.9586181640625, 3.052734375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 7.0, 1.0, 6.0, 8.0, 15.0, 13.0, 20.0, 29.0, 43.0, 50.0, 75.0, 101.0, 120.0, 134.0, 109.0, 70.0, 63.0, 32.0, 25.0, 21.0, 15.0, 11.0, 9.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.40234375, -3.30487060546875, -3.2073974609375, -3.10992431640625, -3.012451171875, -2.91497802734375, -2.8175048828125, -2.72003173828125, -2.62255859375, -2.52508544921875, -2.4276123046875, -2.33013916015625, -2.232666015625, -2.13519287109375, -2.0377197265625, -1.94024658203125, -1.8427734375, -1.74530029296875, -1.6478271484375, -1.55035400390625, -1.452880859375, -1.35540771484375, -1.2579345703125, -1.16046142578125, -1.06298828125, -0.96551513671875, -0.8680419921875, -0.77056884765625, -0.673095703125, -0.57562255859375, -0.4781494140625, -0.38067626953125, -0.283203125, -0.18572998046875, -0.0882568359375, 0.00921630859375, 0.106689453125, 0.20416259765625, 0.3016357421875, 0.39910888671875, 0.49658203125, 0.59405517578125, 0.6915283203125, 0.78900146484375, 0.886474609375, 0.98394775390625, 1.0814208984375, 1.17889404296875, 1.2763671875, 1.37384033203125, 1.4713134765625, 1.56878662109375, 1.666259765625, 1.76373291015625, 1.8612060546875, 1.95867919921875, 2.05615234375, 2.15362548828125, 2.2510986328125, 2.34857177734375, 2.446044921875, 2.54351806640625, 2.6409912109375, 2.73846435546875, 2.8359375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 12.0, 14.0, 17.0, 29.0, 57.0, 94.0, 118.0, 161.0, 156.0, 96.0, 95.0, 64.0, 33.0, 20.0, 8.0, 14.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.67017364501953, -44.55193328857422, -43.433692932128906, -42.31545639038086, -41.19721603393555, -40.078975677490234, -38.96073913574219, -37.842498779296875, -36.72425842285156, -35.60601806640625, -34.48777770996094, -33.36954116821289, -32.25130081176758, -31.133060455322266, -30.014822006225586, -28.896583557128906, -27.778343200683594, -26.66010284423828, -25.5418643951416, -24.423625946044922, -23.30538558959961, -22.187145233154297, -21.068906784057617, -19.950668334960938, -18.832427978515625, -17.714187622070312, -16.595949172973633, -15.477709770202637, -14.35947036743164, -13.241230964660645, -12.122991561889648, -11.004752159118652, -9.886512756347656, -8.76827335357666, -7.650033950805664, -6.531794548034668, -5.413555145263672, -4.295315742492676, -3.1770763397216797, -2.0588369369506836, -0.9405975341796875, 0.1776418685913086, 1.2958812713623047, 2.414120674133301, 3.532360076904297, 4.650599479675293, 5.768838882446289, 6.887078285217285, 8.005317687988281, 9.123557090759277, 10.241796493530273, 11.36003589630127, 12.478275299072266, 13.596514701843262, 14.714754104614258, 15.832993507385254, 16.95123291015625, 18.069473266601562, 19.187711715698242, 20.305950164794922, 21.424190521240234, 22.542430877685547, 23.660669326782227, 24.778907775878906, 25.89714813232422]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 1.0, 7.0, 10.0, 12.0, 9.0, 18.0, 13.0, 18.0, 20.0, 24.0, 22.0, 24.0, 22.0, 36.0, 39.0, 36.0, 47.0, 52.0, 41.0, 42.0, 48.0, 43.0, 47.0, 41.0, 36.0, 40.0, 37.0, 22.0, 28.0, 25.0, 18.0, 18.0, 19.0, 9.0, 13.0, 13.0, 7.0, 6.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.017623901367188, -22.295289993286133, -21.572956085205078, -20.850622177124023, -20.12828826904297, -19.405956268310547, -18.683622360229492, -17.961288452148438, -17.238954544067383, -16.516620635986328, -15.794286727905273, -15.071953773498535, -14.34961986541748, -13.627285957336426, -12.904953002929688, -12.182619094848633, -11.460285186767578, -10.737951278686523, -10.015617370605469, -9.29328441619873, -8.570950508117676, -7.848616600036621, -7.126283168792725, -6.403949737548828, -5.681615829467773, -4.959281921386719, -4.236948490142822, -3.5146148204803467, -2.792281150817871, -2.0699474811553955, -1.34761381149292, -0.6252803802490234, 0.09705352783203125, 0.8193871974945068, 1.5417208671569824, 2.264054536819458, 2.9863882064819336, 3.708721876144409, 4.431055545806885, 5.153388977050781, 5.875722885131836, 6.598056793212891, 7.320390224456787, 8.042723655700684, 8.765057563781738, 9.487391471862793, 10.209724426269531, 10.932058334350586, 11.65439224243164, 12.376726150512695, 13.09906005859375, 13.821393013000488, 14.543726921081543, 15.266060829162598, 15.988393783569336, 16.71072769165039, 17.433061599731445, 18.1553955078125, 18.877729415893555, 19.60006332397461, 20.32239532470703, 21.044729232788086, 21.76706314086914, 22.489397048950195, 23.21173095703125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 11.0, 14.0, 22.0, 37.0, 63.0, 112.0, 216.0, 455.0, 1021.0, 3057.0, 12103.0, 148594.0, 3998169.0, 23362.0, 4563.0, 1403.0, 548.0, 269.0, 109.0, 62.0, 38.0, 25.0, 9.0, 8.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66796875, -7.46710205078125, -7.2662353515625, -7.06536865234375, -6.864501953125, -6.66363525390625, -6.4627685546875, -6.26190185546875, -6.06103515625, -5.86016845703125, -5.6593017578125, -5.45843505859375, -5.257568359375, -5.05670166015625, -4.8558349609375, -4.65496826171875, -4.4541015625, -4.25323486328125, -4.0523681640625, -3.85150146484375, -3.650634765625, -3.44976806640625, -3.2489013671875, -3.04803466796875, -2.84716796875, -2.64630126953125, -2.4454345703125, -2.24456787109375, -2.043701171875, -1.84283447265625, -1.6419677734375, -1.44110107421875, -1.240234375, -1.03936767578125, -0.8385009765625, -0.63763427734375, -0.436767578125, -0.23590087890625, -0.0350341796875, 0.16583251953125, 0.36669921875, 0.56756591796875, 0.7684326171875, 0.96929931640625, 1.170166015625, 1.37103271484375, 1.5718994140625, 1.77276611328125, 1.9736328125, 2.17449951171875, 2.3753662109375, 2.57623291015625, 2.777099609375, 2.97796630859375, 3.1788330078125, 3.37969970703125, 3.58056640625, 3.78143310546875, 3.9822998046875, 4.18316650390625, 4.384033203125, 4.58489990234375, 4.7857666015625, 4.98663330078125, 5.1875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 9.0, 10.0, 8.0, 5.0, 16.0, 27.0, 31.0, 46.0, 64.0, 79.0, 76.0, 83.0, 92.0, 84.0, 64.0, 89.0, 71.0, 37.0, 36.0, 14.0, 15.0, 9.0, 8.0, 7.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2109375, -2.153106689453125, -2.09527587890625, -2.037445068359375, -1.9796142578125, -1.921783447265625, -1.86395263671875, -1.806121826171875, -1.748291015625, -1.690460205078125, -1.63262939453125, -1.574798583984375, -1.5169677734375, -1.459136962890625, -1.40130615234375, -1.343475341796875, -1.28564453125, -1.227813720703125, -1.16998291015625, -1.112152099609375, -1.0543212890625, -0.996490478515625, -0.93865966796875, -0.880828857421875, -0.822998046875, -0.765167236328125, -0.70733642578125, -0.649505615234375, -0.5916748046875, -0.533843994140625, -0.47601318359375, -0.418182373046875, -0.3603515625, -0.302520751953125, -0.24468994140625, -0.186859130859375, -0.1290283203125, -0.071197509765625, -0.01336669921875, 0.044464111328125, 0.102294921875, 0.160125732421875, 0.21795654296875, 0.275787353515625, 0.3336181640625, 0.391448974609375, 0.44927978515625, 0.507110595703125, 0.56494140625, 0.622772216796875, 0.68060302734375, 0.738433837890625, 0.7962646484375, 0.854095458984375, 0.91192626953125, 0.969757080078125, 1.027587890625, 1.085418701171875, 1.14324951171875, 1.201080322265625, 1.2589111328125, 1.316741943359375, 1.37457275390625, 1.432403564453125, 1.490234375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 7.0, 9.0, 6.0, 3.0, 19.0, 18.0, 26.0, 29.0, 49.0, 53.0, 81.0, 189.0, 358.0, 922.0, 2764.0, 17681.0, 4051306.0, 111600.0, 6395.0, 1532.0, 561.0, 245.0, 149.0, 81.0, 61.0, 41.0, 26.0, 23.0, 12.0, 11.0, 9.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5234375, -7.1611328125, -6.798828125, -6.4365234375, -6.07421875, -5.7119140625, -5.349609375, -4.9873046875, -4.625, -4.2626953125, -3.900390625, -3.5380859375, -3.17578125, -2.8134765625, -2.451171875, -2.0888671875, -1.7265625, -1.3642578125, -1.001953125, -0.6396484375, -0.27734375, 0.0849609375, 0.447265625, 0.8095703125, 1.171875, 1.5341796875, 1.896484375, 2.2587890625, 2.62109375, 2.9833984375, 3.345703125, 3.7080078125, 4.0703125, 4.4326171875, 4.794921875, 5.1572265625, 5.51953125, 5.8818359375, 6.244140625, 6.6064453125, 6.96875, 7.3310546875, 7.693359375, 8.0556640625, 8.41796875, 8.7802734375, 9.142578125, 9.5048828125, 9.8671875, 10.2294921875, 10.591796875, 10.9541015625, 11.31640625, 11.6787109375, 12.041015625, 12.4033203125, 12.765625, 13.1279296875, 13.490234375, 13.8525390625, 14.21484375, 14.5771484375, 14.939453125, 15.3017578125, 15.6640625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 10.0, 24.0, 50.0, 210.0, 3458.0, 206.0, 60.0, 27.0, 13.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53515625, -2.381103515625, -2.22705078125, -2.072998046875, -1.9189453125, -1.764892578125, -1.61083984375, -1.456787109375, -1.302734375, -1.148681640625, -0.99462890625, -0.840576171875, -0.6865234375, -0.532470703125, -0.37841796875, -0.224365234375, -0.0703125, 0.083740234375, 0.23779296875, 0.391845703125, 0.5458984375, 0.699951171875, 0.85400390625, 1.008056640625, 1.162109375, 1.316162109375, 1.47021484375, 1.624267578125, 1.7783203125, 1.932373046875, 2.08642578125, 2.240478515625, 2.39453125, 2.548583984375, 2.70263671875, 2.856689453125, 3.0107421875, 3.164794921875, 3.31884765625, 3.472900390625, 3.626953125, 3.781005859375, 3.93505859375, 4.089111328125, 4.2431640625, 4.397216796875, 4.55126953125, 4.705322265625, 4.859375, 5.013427734375, 5.16748046875, 5.321533203125, 5.4755859375, 5.629638671875, 5.78369140625, 5.937744140625, 6.091796875, 6.245849609375, 6.39990234375, 6.553955078125, 6.7080078125, 6.862060546875, 7.01611328125, 7.170166015625, 7.32421875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 36.0, 88.0, 245.0, 348.0, 201.0, 57.0, 18.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.21238899230957, -16.321622848510742, -15.430856704711914, -14.540090560913086, -13.649324417114258, -12.75855827331543, -11.867791175842285, -10.977025032043457, -10.086258888244629, -9.1954927444458, -8.304726600646973, -7.413959980010986, -6.523193836212158, -5.63242769241333, -4.741661071777344, -3.8508949279785156, -2.9601287841796875, -2.0693626403808594, -1.1785962581634521, -0.2878298759460449, 0.6029362678527832, 1.4937024116516113, 2.3844690322875977, 3.275235176086426, 4.166001319885254, 5.056767463684082, 5.94753360748291, 6.8383002281188965, 7.729066371917725, 8.619832992553711, 9.510599136352539, 10.401365280151367, 11.292133331298828, 12.182899475097656, 13.073665618896484, 13.964431762695312, 14.85519790649414, 15.745964050292969, 16.636730194091797, 17.527496337890625, 18.418262481689453, 19.30902862548828, 20.19979476928711, 21.090560913085938, 21.981327056884766, 22.872093200683594, 23.762859344482422, 24.65362548828125, 25.54439353942871, 26.43515968322754, 27.325925827026367, 28.216691970825195, 29.107458114624023, 29.99822425842285, 30.888992309570312, 31.77975845336914, 32.67052459716797, 33.5612907409668, 34.452056884765625, 35.34282302856445, 36.23358917236328, 37.12435531616211, 38.01512145996094, 38.905887603759766, 39.796653747558594]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 7.0, 10.0, 11.0, 21.0, 29.0, 39.0, 72.0, 66.0, 82.0, 106.0, 92.0, 89.0, 96.0, 70.0, 67.0, 49.0, 33.0, 25.0, 19.0, 9.0, 4.0, 8.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.999860763549805, -12.589277267456055, -12.178694725036621, -11.768112182617188, -11.357528686523438, -10.946945190429688, -10.536362648010254, -10.12578010559082, -9.71519660949707, -9.30461311340332, -8.894030570983887, -8.483448028564453, -8.072864532470703, -7.662281513214111, -7.2516984939575195, -6.841115474700928, -6.430532455444336, -6.019949436187744, -5.609366416931152, -5.1987833976745605, -4.788200378417969, -4.377617359161377, -3.967034339904785, -3.5564513206481934, -3.1458683013916016, -2.7352852821350098, -2.324702262878418, -1.9141192436218262, -1.5035362243652344, -1.0929532051086426, -0.6823701858520508, -0.271787166595459, 0.1387948989868164, 0.5493779182434082, 0.9599609375, 1.3705439567565918, 1.7811269760131836, 2.1917099952697754, 2.602293014526367, 3.012876033782959, 3.423459053039551, 3.8340420722961426, 4.244625091552734, 4.655208110809326, 5.065791130065918, 5.47637414932251, 5.886957168579102, 6.297540187835693, 6.708123207092285, 7.118706226348877, 7.529289245605469, 7.9398722648620605, 8.350455284118652, 8.761037826538086, 9.171621322631836, 9.582204818725586, 9.99278736114502, 10.403369903564453, 10.813953399658203, 11.224536895751953, 11.635119438171387, 12.04570198059082, 12.45628547668457, 12.86686897277832, 13.277451515197754]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 4.0, 7.0, 12.0, 15.0, 24.0, 37.0, 57.0, 75.0, 113.0, 164.0, 270.0, 455.0, 808.0, 1514.0, 3023.0, 6976.0, 19208.0, 65711.0, 255612.0, 461734.0, 165517.0, 43141.0, 13476.0, 5229.0, 2456.0, 1204.0, 675.0, 389.0, 209.0, 153.0, 102.0, 62.0, 36.0, 23.0, 13.0, 15.0, 8.0, 11.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.646484375, -3.533721923828125, -3.42095947265625, -3.308197021484375, -3.1954345703125, -3.082672119140625, -2.96990966796875, -2.857147216796875, -2.744384765625, -2.631622314453125, -2.51885986328125, -2.406097412109375, -2.2933349609375, -2.180572509765625, -2.06781005859375, -1.955047607421875, -1.84228515625, -1.729522705078125, -1.61676025390625, -1.503997802734375, -1.3912353515625, -1.278472900390625, -1.16571044921875, -1.052947998046875, -0.940185546875, -0.827423095703125, -0.71466064453125, -0.601898193359375, -0.4891357421875, -0.376373291015625, -0.26361083984375, -0.150848388671875, -0.0380859375, 0.074676513671875, 0.18743896484375, 0.300201416015625, 0.4129638671875, 0.525726318359375, 0.63848876953125, 0.751251220703125, 0.864013671875, 0.976776123046875, 1.08953857421875, 1.202301025390625, 1.3150634765625, 1.427825927734375, 1.54058837890625, 1.653350830078125, 1.76611328125, 1.878875732421875, 1.99163818359375, 2.104400634765625, 2.2171630859375, 2.329925537109375, 2.44268798828125, 2.555450439453125, 2.668212890625, 2.780975341796875, 2.89373779296875, 3.006500244140625, 3.1192626953125, 3.232025146484375, 3.34478759765625, 3.457550048828125, 3.5703125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 0.0, 3.0, 6.0, 7.0, 7.0, 15.0, 15.0, 15.0, 26.0, 34.0, 30.0, 66.0, 69.0, 58.0, 77.0, 79.0, 82.0, 60.0, 61.0, 65.0, 60.0, 44.0, 30.0, 33.0, 18.0, 7.0, 10.0, 5.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.111328125, -2.052337646484375, -1.99334716796875, -1.934356689453125, -1.8753662109375, -1.816375732421875, -1.75738525390625, -1.698394775390625, -1.639404296875, -1.580413818359375, -1.52142333984375, -1.462432861328125, -1.4034423828125, -1.344451904296875, -1.28546142578125, -1.226470947265625, -1.16748046875, -1.108489990234375, -1.04949951171875, -0.990509033203125, -0.9315185546875, -0.872528076171875, -0.81353759765625, -0.754547119140625, -0.695556640625, -0.636566162109375, -0.57757568359375, -0.518585205078125, -0.4595947265625, -0.400604248046875, -0.34161376953125, -0.282623291015625, -0.2236328125, -0.164642333984375, -0.10565185546875, -0.046661376953125, 0.0123291015625, 0.071319580078125, 0.13031005859375, 0.189300537109375, 0.248291015625, 0.307281494140625, 0.36627197265625, 0.425262451171875, 0.4842529296875, 0.543243408203125, 0.60223388671875, 0.661224365234375, 0.72021484375, 0.779205322265625, 0.83819580078125, 0.897186279296875, 0.9561767578125, 1.015167236328125, 1.07415771484375, 1.133148193359375, 1.192138671875, 1.251129150390625, 1.31011962890625, 1.369110107421875, 1.4281005859375, 1.487091064453125, 1.54608154296875, 1.605072021484375, 1.6640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 10.0, 10.0, 19.0, 48.0, 93.0, 221.0, 778.0, 3417.0, 48226.0, 920596.0, 69864.0, 4043.0, 783.0, 241.0, 97.0, 40.0, 35.0, 10.0, 8.0, 5.0, 3.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.92578125, -7.57427978515625, -7.2227783203125, -6.87127685546875, -6.519775390625, -6.16827392578125, -5.8167724609375, -5.46527099609375, -5.11376953125, -4.76226806640625, -4.4107666015625, -4.05926513671875, -3.707763671875, -3.35626220703125, -3.0047607421875, -2.65325927734375, -2.3017578125, -1.95025634765625, -1.5987548828125, -1.24725341796875, -0.895751953125, -0.54425048828125, -0.1927490234375, 0.15875244140625, 0.51025390625, 0.86175537109375, 1.2132568359375, 1.56475830078125, 1.916259765625, 2.26776123046875, 2.6192626953125, 2.97076416015625, 3.322265625, 3.67376708984375, 4.0252685546875, 4.37677001953125, 4.728271484375, 5.07977294921875, 5.4312744140625, 5.78277587890625, 6.13427734375, 6.48577880859375, 6.8372802734375, 7.18878173828125, 7.540283203125, 7.89178466796875, 8.2432861328125, 8.59478759765625, 8.9462890625, 9.29779052734375, 9.6492919921875, 10.00079345703125, 10.352294921875, 10.70379638671875, 11.0552978515625, 11.40679931640625, 11.75830078125, 12.10980224609375, 12.4613037109375, 12.81280517578125, 13.164306640625, 13.51580810546875, 13.8673095703125, 14.21881103515625, 14.5703125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 11.0, 11.0, 11.0, 22.0, 30.0, 28.0, 36.0, 38.0, 55.0, 66.0, 72.0, 70.0, 83.0, 81.0, 64.0, 57.0, 52.0, 52.0, 48.0, 26.0, 20.0, 15.0, 11.0, 17.0, 7.0, 6.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.734375, -5.4593505859375, -5.184326171875, -4.9093017578125, -4.63427734375, -4.3592529296875, -4.084228515625, -3.8092041015625, -3.5341796875, -3.2591552734375, -2.984130859375, -2.7091064453125, -2.43408203125, -2.1590576171875, -1.884033203125, -1.6090087890625, -1.333984375, -1.0589599609375, -0.783935546875, -0.5089111328125, -0.23388671875, 0.0411376953125, 0.316162109375, 0.5911865234375, 0.8662109375, 1.1412353515625, 1.416259765625, 1.6912841796875, 1.96630859375, 2.2413330078125, 2.516357421875, 2.7913818359375, 3.06640625, 3.3414306640625, 3.616455078125, 3.8914794921875, 4.16650390625, 4.4415283203125, 4.716552734375, 4.9915771484375, 5.2666015625, 5.5416259765625, 5.816650390625, 6.0916748046875, 6.36669921875, 6.6417236328125, 6.916748046875, 7.1917724609375, 7.466796875, 7.7418212890625, 8.016845703125, 8.2918701171875, 8.56689453125, 8.8419189453125, 9.116943359375, 9.3919677734375, 9.6669921875, 9.9420166015625, 10.217041015625, 10.4920654296875, 10.76708984375, 11.0421142578125, 11.317138671875, 11.5921630859375, 11.8671875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 4.0, 14.0, 7.0, 8.0, 18.0, 18.0, 16.0, 30.0, 45.0, 94.0, 132.0, 181.0, 335.0, 583.0, 1237.0, 3189.0, 11082.0, 65106.0, 568168.0, 347003.0, 38894.0, 7671.0, 2411.0, 1010.0, 505.0, 268.0, 178.0, 104.0, 80.0, 41.0, 31.0, 32.0, 11.0, 6.0, 10.0, 2.0, 5.0, 5.0, 2.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.658203125, -1.607757568359375, -1.55731201171875, -1.506866455078125, -1.4564208984375, -1.405975341796875, -1.35552978515625, -1.305084228515625, -1.254638671875, -1.204193115234375, -1.15374755859375, -1.103302001953125, -1.0528564453125, -1.002410888671875, -0.95196533203125, -0.901519775390625, -0.85107421875, -0.800628662109375, -0.75018310546875, -0.699737548828125, -0.6492919921875, -0.598846435546875, -0.54840087890625, -0.497955322265625, -0.447509765625, -0.397064208984375, -0.34661865234375, -0.296173095703125, -0.2457275390625, -0.195281982421875, -0.14483642578125, -0.094390869140625, -0.0439453125, 0.006500244140625, 0.05694580078125, 0.107391357421875, 0.1578369140625, 0.208282470703125, 0.25872802734375, 0.309173583984375, 0.359619140625, 0.410064697265625, 0.46051025390625, 0.510955810546875, 0.5614013671875, 0.611846923828125, 0.66229248046875, 0.712738037109375, 0.76318359375, 0.813629150390625, 0.86407470703125, 0.914520263671875, 0.9649658203125, 1.015411376953125, 1.06585693359375, 1.116302490234375, 1.166748046875, 1.217193603515625, 1.26763916015625, 1.318084716796875, 1.3685302734375, 1.418975830078125, 1.46942138671875, 1.519866943359375, 1.5703125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 11.0, 14.0, 19.0, 22.0, 29.0, 35.0, 46.0, 45.0, 63.0, 53.0, 77.0, 79.0, 70.0, 75.0, 44.0, 59.0, 49.0, 35.0, 29.0, 20.0, 19.0, 13.0, 20.0, 11.0, 13.0, 10.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00022077560424804688, -0.0002142973244190216, -0.00020781904458999634, -0.00020134076476097107, -0.0001948624849319458, -0.00018838420510292053, -0.00018190592527389526, -0.00017542764544487, -0.00016894936561584473, -0.00016247108578681946, -0.0001559928059577942, -0.00014951452612876892, -0.00014303624629974365, -0.00013655796647071838, -0.00013007968664169312, -0.00012360140681266785, -0.00011712312698364258, -0.00011064484715461731, -0.00010416656732559204, -9.768828749656677e-05, -9.12100076675415e-05, -8.473172783851624e-05, -7.825344800949097e-05, -7.17751681804657e-05, -6.529688835144043e-05, -5.881860852241516e-05, -5.234032869338989e-05, -4.5862048864364624e-05, -3.9383769035339355e-05, -3.290548920631409e-05, -2.642720937728882e-05, -1.994892954826355e-05, -1.3470649719238281e-05, -6.992369890213013e-06, -5.140900611877441e-07, 5.964189767837524e-06, 1.2442469596862793e-05, 1.892074942588806e-05, 2.539902925491333e-05, 3.18773090839386e-05, 3.835558891296387e-05, 4.4833868741989136e-05, 5.1312148571014404e-05, 5.779042840003967e-05, 6.426870822906494e-05, 7.074698805809021e-05, 7.722526788711548e-05, 8.370354771614075e-05, 9.018182754516602e-05, 9.666010737419128e-05, 0.00010313838720321655, 0.00010961666703224182, 0.00011609494686126709, 0.00012257322669029236, 0.00012905150651931763, 0.0001355297863483429, 0.00014200806617736816, 0.00014848634600639343, 0.0001549646258354187, 0.00016144290566444397, 0.00016792118549346924, 0.0001743994653224945, 0.00018087774515151978, 0.00018735602498054504, 0.0001938343048095703]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 12.0, 12.0, 21.0, 45.0, 99.0, 192.0, 522.0, 1704.0, 11326.0, 523906.0, 497016.0, 11021.0, 1735.0, 555.0, 227.0, 77.0, 36.0, 26.0, 9.0, 7.0, 3.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.20562744140625, -3.0987548828125, -2.99188232421875, -2.885009765625, -2.77813720703125, -2.6712646484375, -2.56439208984375, -2.45751953125, -2.35064697265625, -2.2437744140625, -2.13690185546875, -2.030029296875, -1.92315673828125, -1.8162841796875, -1.70941162109375, -1.6025390625, -1.49566650390625, -1.3887939453125, -1.28192138671875, -1.175048828125, -1.06817626953125, -0.9613037109375, -0.85443115234375, -0.74755859375, -0.64068603515625, -0.5338134765625, -0.42694091796875, -0.320068359375, -0.21319580078125, -0.1063232421875, 0.00054931640625, 0.107421875, 0.21429443359375, 0.3211669921875, 0.42803955078125, 0.534912109375, 0.64178466796875, 0.7486572265625, 0.85552978515625, 0.96240234375, 1.06927490234375, 1.1761474609375, 1.28302001953125, 1.389892578125, 1.49676513671875, 1.6036376953125, 1.71051025390625, 1.8173828125, 1.92425537109375, 2.0311279296875, 2.13800048828125, 2.244873046875, 2.35174560546875, 2.4586181640625, 2.56549072265625, 2.67236328125, 2.77923583984375, 2.8861083984375, 2.99298095703125, 3.099853515625, 3.20672607421875, 3.3135986328125, 3.42047119140625, 3.52734375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 3.0, 10.0, 9.0, 20.0, 32.0, 45.0, 61.0, 91.0, 98.0, 145.0, 105.0, 107.0, 86.0, 74.0, 34.0, 32.0, 19.0, 12.0, 11.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2646484375, -1.1865386962890625, -1.108428955078125, -1.0303192138671875, -0.95220947265625, -0.8740997314453125, -0.795989990234375, -0.7178802490234375, -0.6397705078125, -0.5616607666015625, -0.483551025390625, -0.4054412841796875, -0.32733154296875, -0.2492218017578125, -0.171112060546875, -0.0930023193359375, -0.014892578125, 0.0632171630859375, 0.141326904296875, 0.2194366455078125, 0.29754638671875, 0.3756561279296875, 0.453765869140625, 0.5318756103515625, 0.6099853515625, 0.6880950927734375, 0.766204833984375, 0.8443145751953125, 0.92242431640625, 1.0005340576171875, 1.078643798828125, 1.1567535400390625, 1.23486328125, 1.3129730224609375, 1.391082763671875, 1.4691925048828125, 1.54730224609375, 1.6254119873046875, 1.703521728515625, 1.7816314697265625, 1.8597412109375, 1.9378509521484375, 2.015960693359375, 2.0940704345703125, 2.17218017578125, 2.2502899169921875, 2.328399658203125, 2.4065093994140625, 2.484619140625, 2.5627288818359375, 2.640838623046875, 2.7189483642578125, 2.79705810546875, 2.8751678466796875, 2.953277587890625, 3.0313873291015625, 3.1094970703125, 3.1876068115234375, 3.265716552734375, 3.3438262939453125, 3.42193603515625, 3.5000457763671875, 3.578155517578125, 3.6562652587890625, 3.734375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 5.0, 36.0, 75.0, 122.0, 226.0, 228.0, 134.0, 91.0, 46.0, 18.0, 7.0, 6.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.32183074951172, -56.514591217041016, -54.70735168457031, -52.900108337402344, -51.09286880493164, -49.28562927246094, -47.478389739990234, -45.67115020751953, -43.86390686035156, -42.05666732788086, -40.249427795410156, -38.44218444824219, -36.634944915771484, -34.82770538330078, -33.02046585083008, -31.213226318359375, -29.405986785888672, -27.59874725341797, -25.791505813598633, -23.98426628112793, -22.177024841308594, -20.36978530883789, -18.562545776367188, -16.755306243896484, -14.948064804077148, -13.140824317932129, -11.33358383178711, -9.526344299316406, -7.719103813171387, -5.911863327026367, -4.104623794555664, -2.2973833084106445, -0.490142822265625, 1.3170974254608154, 3.124337673187256, 4.931577682495117, 6.738818168640137, 8.546058654785156, 10.35329818725586, 12.160538673400879, 13.967779159545898, 15.775019645690918, 17.582260131835938, 19.38949966430664, 21.196739196777344, 23.00398063659668, 24.811220169067383, 26.61846160888672, 28.425701141357422, 30.232940673828125, 32.04018020629883, 33.84741973876953, 35.6546630859375, 37.4619026184082, 39.269142150878906, 41.07638168334961, 42.88362121582031, 44.690860748291016, 46.49810028076172, 48.30534362792969, 50.11258316040039, 51.919822692871094, 53.7270622253418, 55.5343017578125, 57.34154510498047]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 3.0, 6.0, 9.0, 12.0, 13.0, 20.0, 16.0, 25.0, 16.0, 27.0, 37.0, 40.0, 40.0, 34.0, 62.0, 65.0, 62.0, 58.0, 69.0, 50.0, 52.0, 43.0, 46.0, 32.0, 37.0, 19.0, 25.0, 17.0, 22.0, 11.0, 7.0, 6.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-34.696685791015625, -33.67158889770508, -32.64649200439453, -31.62139129638672, -30.596294403076172, -29.571197509765625, -28.546098709106445, -27.520999908447266, -26.49590301513672, -25.470806121826172, -24.445707321166992, -23.420608520507812, -22.395511627197266, -21.37041473388672, -20.34531593322754, -19.32021713256836, -18.295120239257812, -17.270023345947266, -16.244924545288086, -15.219826698303223, -14.19472885131836, -13.169631004333496, -12.144533157348633, -11.11943531036377, -10.094337463378906, -9.069239616394043, -8.04414176940918, -7.019043922424316, -5.993946075439453, -4.96884822845459, -3.9437503814697266, -2.9186525344848633, -1.8935585021972656, -0.8684606552124023, 0.15663719177246094, 1.1817350387573242, 2.2068328857421875, 3.231930732727051, 4.257028579711914, 5.282126426696777, 6.307224273681641, 7.332322120666504, 8.357419967651367, 9.38251781463623, 10.407615661621094, 11.432713508605957, 12.45781135559082, 13.482909202575684, 14.508007049560547, 15.53310489654541, 16.558202743530273, 17.583301544189453, 18.6083984375, 19.633495330810547, 20.658594131469727, 21.683692932128906, 22.708789825439453, 23.73388671875, 24.75898551940918, 25.78408432006836, 26.809181213378906, 27.834278106689453, 28.859376907348633, 29.884475708007812, 30.90957260131836]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 11.0, 15.0, 20.0, 10.0, 23.0, 49.0, 59.0, 86.0, 166.0, 271.0, 590.0, 1344.0, 3577.0, 12022.0, 62283.0, 2812317.0, 1236787.0, 49023.0, 10328.0, 3156.0, 1163.0, 495.0, 214.0, 134.0, 57.0, 35.0, 13.0, 12.0, 5.0, 4.0, 2.0, 1.0, 1.0], "bins": [-6.15234375, -6.021240234375, -5.89013671875, -5.759033203125, -5.6279296875, -5.496826171875, -5.36572265625, -5.234619140625, -5.103515625, -4.972412109375, -4.84130859375, -4.710205078125, -4.5791015625, -4.447998046875, -4.31689453125, -4.185791015625, -4.0546875, -3.923583984375, -3.79248046875, -3.661376953125, -3.5302734375, -3.399169921875, -3.26806640625, -3.136962890625, -3.005859375, -2.874755859375, -2.74365234375, -2.612548828125, -2.4814453125, -2.350341796875, -2.21923828125, -2.088134765625, -1.95703125, -1.825927734375, -1.69482421875, -1.563720703125, -1.4326171875, -1.301513671875, -1.17041015625, -1.039306640625, -0.908203125, -0.777099609375, -0.64599609375, -0.514892578125, -0.3837890625, -0.252685546875, -0.12158203125, 0.009521484375, 0.140625, 0.271728515625, 0.40283203125, 0.533935546875, 0.6650390625, 0.796142578125, 0.92724609375, 1.058349609375, 1.189453125, 1.320556640625, 1.45166015625, 1.582763671875, 1.7138671875, 1.844970703125, 1.97607421875, 2.107177734375, 2.23828125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 10.0, 3.0, 8.0, 6.0, 14.0, 19.0, 17.0, 33.0, 30.0, 30.0, 44.0, 49.0, 57.0, 75.0, 58.0, 64.0, 56.0, 65.0, 60.0, 47.0, 48.0, 37.0, 45.0, 27.0, 25.0, 27.0, 10.0, 16.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4951171875, -1.45074462890625, -1.4063720703125, -1.36199951171875, -1.317626953125, -1.27325439453125, -1.2288818359375, -1.18450927734375, -1.14013671875, -1.09576416015625, -1.0513916015625, -1.00701904296875, -0.962646484375, -0.91827392578125, -0.8739013671875, -0.82952880859375, -0.78515625, -0.74078369140625, -0.6964111328125, -0.65203857421875, -0.607666015625, -0.56329345703125, -0.5189208984375, -0.47454833984375, -0.43017578125, -0.38580322265625, -0.3414306640625, -0.29705810546875, -0.252685546875, -0.20831298828125, -0.1639404296875, -0.11956787109375, -0.0751953125, -0.03082275390625, 0.0135498046875, 0.05792236328125, 0.102294921875, 0.14666748046875, 0.1910400390625, 0.23541259765625, 0.27978515625, 0.32415771484375, 0.3685302734375, 0.41290283203125, 0.457275390625, 0.50164794921875, 0.5460205078125, 0.59039306640625, 0.634765625, 0.67913818359375, 0.7235107421875, 0.76788330078125, 0.812255859375, 0.85662841796875, 0.9010009765625, 0.94537353515625, 0.98974609375, 1.03411865234375, 1.0784912109375, 1.12286376953125, 1.167236328125, 1.21160888671875, 1.2559814453125, 1.30035400390625, 1.3447265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 6.0, 4.0, 5.0, 4.0, 5.0, 8.0, 14.0, 22.0, 25.0, 37.0, 58.0, 107.0, 154.0, 291.0, 490.0, 1049.0, 2151.0, 5176.0, 15101.0, 58055.0, 503586.0, 3390864.0, 167979.0, 32564.0, 9694.0, 3566.0, 1567.0, 742.0, 368.0, 226.0, 151.0, 81.0, 41.0, 23.0, 24.0, 11.0, 12.0, 10.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-4.203125, -4.090423583984375, -3.97772216796875, -3.865020751953125, -3.7523193359375, -3.639617919921875, -3.52691650390625, -3.414215087890625, -3.301513671875, -3.188812255859375, -3.07611083984375, -2.963409423828125, -2.8507080078125, -2.738006591796875, -2.62530517578125, -2.512603759765625, -2.39990234375, -2.287200927734375, -2.17449951171875, -2.061798095703125, -1.9490966796875, -1.836395263671875, -1.72369384765625, -1.610992431640625, -1.498291015625, -1.385589599609375, -1.27288818359375, -1.160186767578125, -1.0474853515625, -0.934783935546875, -0.82208251953125, -0.709381103515625, -0.5966796875, -0.483978271484375, -0.37127685546875, -0.258575439453125, -0.1458740234375, -0.033172607421875, 0.07952880859375, 0.192230224609375, 0.304931640625, 0.417633056640625, 0.53033447265625, 0.643035888671875, 0.7557373046875, 0.868438720703125, 0.98114013671875, 1.093841552734375, 1.20654296875, 1.319244384765625, 1.43194580078125, 1.544647216796875, 1.6573486328125, 1.770050048828125, 1.88275146484375, 1.995452880859375, 2.108154296875, 2.220855712890625, 2.33355712890625, 2.446258544921875, 2.5589599609375, 2.671661376953125, 2.78436279296875, 2.897064208984375, 3.009765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 3.0, 6.0, 7.0, 5.0, 14.0, 7.0, 16.0, 31.0, 34.0, 43.0, 71.0, 117.0, 188.0, 408.0, 846.0, 1104.0, 501.0, 215.0, 129.0, 85.0, 55.0, 37.0, 42.0, 23.0, 19.0, 11.0, 13.0, 11.0, 4.0, 5.0, 3.0, 6.0, 0.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.171875, -4.056671142578125, -3.94146728515625, -3.826263427734375, -3.7110595703125, -3.595855712890625, -3.48065185546875, -3.365447998046875, -3.250244140625, -3.135040283203125, -3.01983642578125, -2.904632568359375, -2.7894287109375, -2.674224853515625, -2.55902099609375, -2.443817138671875, -2.32861328125, -2.213409423828125, -2.09820556640625, -1.983001708984375, -1.8677978515625, -1.752593994140625, -1.63739013671875, -1.522186279296875, -1.406982421875, -1.291778564453125, -1.17657470703125, -1.061370849609375, -0.9461669921875, -0.830963134765625, -0.71575927734375, -0.600555419921875, -0.4853515625, -0.370147705078125, -0.25494384765625, -0.139739990234375, -0.0245361328125, 0.090667724609375, 0.20587158203125, 0.321075439453125, 0.436279296875, 0.551483154296875, 0.66668701171875, 0.781890869140625, 0.8970947265625, 1.012298583984375, 1.12750244140625, 1.242706298828125, 1.35791015625, 1.473114013671875, 1.58831787109375, 1.703521728515625, 1.8187255859375, 1.933929443359375, 2.04913330078125, 2.164337158203125, 2.279541015625, 2.394744873046875, 2.50994873046875, 2.625152587890625, 2.7403564453125, 2.855560302734375, 2.97076416015625, 3.085968017578125, 3.201171875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 18.0, 34.0, 58.0, 107.0, 173.0, 203.0, 149.0, 115.0, 55.0, 29.0, 18.0, 5.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.90979766845703, -41.7921257019043, -40.67445373535156, -39.55678176879883, -38.439109802246094, -37.321441650390625, -36.203765869140625, -35.086097717285156, -33.96842575073242, -32.85075378417969, -31.733081817626953, -30.61540985107422, -29.497739791870117, -28.380067825317383, -27.26239585876465, -26.144723892211914, -25.02705192565918, -23.909379959106445, -22.79170799255371, -21.67403793334961, -20.556365966796875, -19.43869400024414, -18.321022033691406, -17.203350067138672, -16.085678100585938, -14.968006134033203, -13.850335121154785, -12.73266315460205, -11.614992141723633, -10.497320175170898, -9.379648208618164, -8.26197624206543, -7.144306182861328, -6.026634693145752, -4.908963203430176, -3.7912912368774414, -2.6736197471618652, -1.555948257446289, -0.4382762908935547, 0.6793951988220215, 1.7970666885375977, 2.914738178253174, 4.03240966796875, 5.150081634521484, 6.2677531242370605, 7.385424613952637, 8.503096580505371, 9.620767593383789, 10.738439559936523, 11.856111526489258, 12.973782539367676, 14.09145450592041, 15.209125518798828, 16.326797485351562, 17.444469451904297, 18.56214141845703, 19.679813385009766, 20.7974853515625, 21.915157318115234, 23.03282928466797, 24.15049934387207, 25.268171310424805, 26.38584327697754, 27.503515243530273, 28.621185302734375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 7.0, 10.0, 8.0, 14.0, 7.0, 25.0, 13.0, 31.0, 27.0, 41.0, 39.0, 36.0, 46.0, 56.0, 40.0, 77.0, 52.0, 53.0, 46.0, 43.0, 47.0, 39.0, 30.0, 34.0, 26.0, 33.0, 26.0, 9.0, 12.0, 15.0, 9.0, 13.0, 11.0, 4.0, 2.0, 6.0, 4.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.761592864990234, -18.23255157470703, -17.70351219177246, -17.174470901489258, -16.645431518554688, -16.116390228271484, -15.587348937988281, -15.058308601379395, -14.529268264770508, -14.000227928161621, -13.471187591552734, -12.942146301269531, -12.413105964660645, -11.884065628051758, -11.355024337768555, -10.825984001159668, -10.296943664550781, -9.767903327941895, -9.238862991333008, -8.709821701049805, -8.180781364440918, -7.651741027832031, -7.122700214385986, -6.593659400939941, -6.064619064331055, -5.535578727722168, -5.006537914276123, -4.477497100830078, -3.9484567642211914, -3.4194161891937256, -2.8903756141662598, -2.361335039138794, -1.832296371459961, -1.3032557964324951, -0.7742152214050293, -0.24517464637756348, 0.28386592864990234, 0.8129065036773682, 1.341947078704834, 1.8709876537322998, 2.4000282287597656, 2.9290688037872314, 3.4581093788146973, 3.987149953842163, 4.516190528869629, 5.045230865478516, 5.5742716789245605, 6.1033124923706055, 6.632352828979492, 7.161393165588379, 7.690433979034424, 8.219474792480469, 8.748515129089355, 9.277555465698242, 9.806596755981445, 10.335637092590332, 10.864677429199219, 11.393717765808105, 11.922758102416992, 12.451799392700195, 12.980839729309082, 13.509880065917969, 14.038921356201172, 14.567961692810059, 15.097002029418945]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 4.0, 9.0, 13.0, 14.0, 39.0, 44.0, 57.0, 87.0, 136.0, 225.0, 372.0, 611.0, 1027.0, 1745.0, 2925.0, 5218.0, 10125.0, 20121.0, 41219.0, 86659.0, 171492.0, 259526.0, 215197.0, 117379.0, 57169.0, 27396.0, 13557.0, 7027.0, 3845.0, 2116.0, 1196.0, 734.0, 435.0, 279.0, 188.0, 119.0, 89.0, 60.0, 33.0, 22.0, 17.0, 4.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0], "bins": [-1.9013671875, -1.8509521484375, -1.800537109375, -1.7501220703125, -1.69970703125, -1.6492919921875, -1.598876953125, -1.5484619140625, -1.498046875, -1.4476318359375, -1.397216796875, -1.3468017578125, -1.29638671875, -1.2459716796875, -1.195556640625, -1.1451416015625, -1.0947265625, -1.0443115234375, -0.993896484375, -0.9434814453125, -0.89306640625, -0.8426513671875, -0.792236328125, -0.7418212890625, -0.69140625, -0.6409912109375, -0.590576171875, -0.5401611328125, -0.48974609375, -0.4393310546875, -0.388916015625, -0.3385009765625, -0.2880859375, -0.2376708984375, -0.187255859375, -0.1368408203125, -0.08642578125, -0.0360107421875, 0.014404296875, 0.0648193359375, 0.115234375, 0.1656494140625, 0.216064453125, 0.2664794921875, 0.31689453125, 0.3673095703125, 0.417724609375, 0.4681396484375, 0.5185546875, 0.5689697265625, 0.619384765625, 0.6697998046875, 0.72021484375, 0.7706298828125, 0.821044921875, 0.8714599609375, 0.921875, 0.9722900390625, 1.022705078125, 1.0731201171875, 1.12353515625, 1.1739501953125, 1.224365234375, 1.2747802734375, 1.3251953125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 2.0, 7.0, 11.0, 13.0, 23.0, 20.0, 24.0, 24.0, 22.0, 25.0, 50.0, 56.0, 42.0, 44.0, 46.0, 51.0, 46.0, 52.0, 46.0, 44.0, 50.0, 42.0, 33.0, 36.0, 36.0, 23.0, 23.0, 29.0, 13.0, 10.0, 16.0, 10.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0185546875, -0.983154296875, -0.94775390625, -0.912353515625, -0.876953125, -0.841552734375, -0.80615234375, -0.770751953125, -0.7353515625, -0.699951171875, -0.66455078125, -0.629150390625, -0.59375, -0.558349609375, -0.52294921875, -0.487548828125, -0.4521484375, -0.416748046875, -0.38134765625, -0.345947265625, -0.310546875, -0.275146484375, -0.23974609375, -0.204345703125, -0.1689453125, -0.133544921875, -0.09814453125, -0.062744140625, -0.02734375, 0.008056640625, 0.04345703125, 0.078857421875, 0.1142578125, 0.149658203125, 0.18505859375, 0.220458984375, 0.255859375, 0.291259765625, 0.32666015625, 0.362060546875, 0.3974609375, 0.432861328125, 0.46826171875, 0.503662109375, 0.5390625, 0.574462890625, 0.60986328125, 0.645263671875, 0.6806640625, 0.716064453125, 0.75146484375, 0.786865234375, 0.822265625, 0.857666015625, 0.89306640625, 0.928466796875, 0.9638671875, 0.999267578125, 1.03466796875, 1.070068359375, 1.10546875, 1.140869140625, 1.17626953125, 1.211669921875, 1.2470703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 6.0, 9.0, 8.0, 14.0, 16.0, 43.0, 57.0, 97.0, 159.0, 232.0, 373.0, 622.0, 1161.0, 2628.0, 7727.0, 35589.0, 243117.0, 623211.0, 106751.0, 17871.0, 4677.0, 1900.0, 929.0, 529.0, 293.0, 192.0, 103.0, 75.0, 59.0, 38.0, 23.0, 13.0, 11.0, 6.0, 1.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.82421875, -4.701446533203125, -4.57867431640625, -4.455902099609375, -4.3331298828125, -4.210357666015625, -4.08758544921875, -3.964813232421875, -3.842041015625, -3.719268798828125, -3.59649658203125, -3.473724365234375, -3.3509521484375, -3.228179931640625, -3.10540771484375, -2.982635498046875, -2.85986328125, -2.737091064453125, -2.61431884765625, -2.491546630859375, -2.3687744140625, -2.246002197265625, -2.12322998046875, -2.000457763671875, -1.877685546875, -1.754913330078125, -1.63214111328125, -1.509368896484375, -1.3865966796875, -1.263824462890625, -1.14105224609375, -1.018280029296875, -0.8955078125, -0.772735595703125, -0.64996337890625, -0.527191162109375, -0.4044189453125, -0.281646728515625, -0.15887451171875, -0.036102294921875, 0.086669921875, 0.209442138671875, 0.33221435546875, 0.454986572265625, 0.5777587890625, 0.700531005859375, 0.82330322265625, 0.946075439453125, 1.06884765625, 1.191619873046875, 1.31439208984375, 1.437164306640625, 1.5599365234375, 1.682708740234375, 1.80548095703125, 1.928253173828125, 2.051025390625, 2.173797607421875, 2.29656982421875, 2.419342041015625, 2.5421142578125, 2.664886474609375, 2.78765869140625, 2.910430908203125, 3.033203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 12.0, 9.0, 15.0, 16.0, 20.0, 21.0, 33.0, 34.0, 34.0, 36.0, 48.0, 46.0, 65.0, 50.0, 53.0, 50.0, 60.0, 47.0, 59.0, 41.0, 40.0, 36.0, 30.0, 30.0, 22.0, 24.0, 13.0, 13.0, 5.0, 12.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.671875, -5.50421142578125, -5.3365478515625, -5.16888427734375, -5.001220703125, -4.83355712890625, -4.6658935546875, -4.49822998046875, -4.33056640625, -4.16290283203125, -3.9952392578125, -3.82757568359375, -3.659912109375, -3.49224853515625, -3.3245849609375, -3.15692138671875, -2.9892578125, -2.82159423828125, -2.6539306640625, -2.48626708984375, -2.318603515625, -2.15093994140625, -1.9832763671875, -1.81561279296875, -1.64794921875, -1.48028564453125, -1.3126220703125, -1.14495849609375, -0.977294921875, -0.80963134765625, -0.6419677734375, -0.47430419921875, -0.306640625, -0.13897705078125, 0.0286865234375, 0.19635009765625, 0.364013671875, 0.53167724609375, 0.6993408203125, 0.86700439453125, 1.03466796875, 1.20233154296875, 1.3699951171875, 1.53765869140625, 1.705322265625, 1.87298583984375, 2.0406494140625, 2.20831298828125, 2.3759765625, 2.54364013671875, 2.7113037109375, 2.87896728515625, 3.046630859375, 3.21429443359375, 3.3819580078125, 3.54962158203125, 3.71728515625, 3.88494873046875, 4.0526123046875, 4.22027587890625, 4.387939453125, 4.55560302734375, 4.7232666015625, 4.89093017578125, 5.05859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 10.0, 7.0, 16.0, 11.0, 22.0, 33.0, 57.0, 81.0, 154.0, 307.0, 710.0, 1911.0, 7896.0, 63118.0, 802604.0, 153452.0, 13506.0, 2884.0, 962.0, 365.0, 180.0, 99.0, 62.0, 31.0, 29.0, 19.0, 14.0, 6.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9207763671875, -1.851318359375, -1.7818603515625, -1.71240234375, -1.6429443359375, -1.573486328125, -1.5040283203125, -1.4345703125, -1.3651123046875, -1.295654296875, -1.2261962890625, -1.15673828125, -1.0872802734375, -1.017822265625, -0.9483642578125, -0.87890625, -0.8094482421875, -0.739990234375, -0.6705322265625, -0.60107421875, -0.5316162109375, -0.462158203125, -0.3927001953125, -0.3232421875, -0.2537841796875, -0.184326171875, -0.1148681640625, -0.04541015625, 0.0240478515625, 0.093505859375, 0.1629638671875, 0.232421875, 0.3018798828125, 0.371337890625, 0.4407958984375, 0.51025390625, 0.5797119140625, 0.649169921875, 0.7186279296875, 0.7880859375, 0.8575439453125, 0.927001953125, 0.9964599609375, 1.06591796875, 1.1353759765625, 1.204833984375, 1.2742919921875, 1.34375, 1.4132080078125, 1.482666015625, 1.5521240234375, 1.62158203125, 1.6910400390625, 1.760498046875, 1.8299560546875, 1.8994140625, 1.9688720703125, 2.038330078125, 2.1077880859375, 2.17724609375, 2.2467041015625, 2.316162109375, 2.3856201171875, 2.455078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 8.0, 8.0, 16.0, 12.0, 27.0, 51.0, 64.0, 108.0, 128.0, 141.0, 130.0, 105.0, 63.0, 38.0, 33.0, 24.0, 10.0, 15.0, 6.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005822181701660156, -0.0005674064159393311, -0.0005525946617126465, -0.0005377829074859619, -0.0005229711532592773, -0.0005081593990325928, -0.0004933476448059082, -0.00047853589057922363, -0.00046372413635253906, -0.0004489123821258545, -0.0004341006278991699, -0.00041928887367248535, -0.0004044771194458008, -0.0003896653652191162, -0.00037485361099243164, -0.00036004185676574707, -0.0003452301025390625, -0.00033041834831237793, -0.00031560659408569336, -0.0003007948398590088, -0.0002859830856323242, -0.00027117133140563965, -0.0002563595771789551, -0.0002415478229522705, -0.00022673606872558594, -0.00021192431449890137, -0.0001971125602722168, -0.00018230080604553223, -0.00016748905181884766, -0.00015267729759216309, -0.00013786554336547852, -0.00012305378913879395, -0.00010824203491210938, -9.34302806854248e-05, -7.861852645874023e-05, -6.380677223205566e-05, -4.8995018005371094e-05, -3.4183263778686523e-05, -1.9371509552001953e-05, -4.559755325317383e-06, 1.0251998901367188e-05, 2.5063753128051758e-05, 3.987550735473633e-05, 5.46872615814209e-05, 6.949901580810547e-05, 8.431077003479004e-05, 9.912252426147461e-05, 0.00011393427848815918, 0.00012874603271484375, 0.00014355778694152832, 0.0001583695411682129, 0.00017318129539489746, 0.00018799304962158203, 0.0002028048038482666, 0.00021761655807495117, 0.00023242831230163574, 0.0002472400665283203, 0.0002620518207550049, 0.00027686357498168945, 0.000291675329208374, 0.0003064870834350586, 0.00032129883766174316, 0.00033611059188842773, 0.0003509223461151123, 0.0003657341003417969]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 9.0, 16.0, 12.0, 30.0, 44.0, 50.0, 115.0, 166.0, 295.0, 508.0, 1032.0, 2471.0, 7251.0, 33325.0, 305636.0, 616634.0, 63603.0, 11193.0, 3291.0, 1327.0, 677.0, 337.0, 202.0, 108.0, 73.0, 49.0, 26.0, 23.0, 11.0, 8.0, 5.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2021484375, -1.1523895263671875, -1.102630615234375, -1.0528717041015625, -1.00311279296875, -0.9533538818359375, -0.903594970703125, -0.8538360595703125, -0.8040771484375, -0.7543182373046875, -0.704559326171875, -0.6548004150390625, -0.60504150390625, -0.5552825927734375, -0.505523681640625, -0.4557647705078125, -0.406005859375, -0.3562469482421875, -0.306488037109375, -0.2567291259765625, -0.20697021484375, -0.1572113037109375, -0.107452392578125, -0.0576934814453125, -0.0079345703125, 0.0418243408203125, 0.091583251953125, 0.1413421630859375, 0.19110107421875, 0.2408599853515625, 0.290618896484375, 0.3403778076171875, 0.39013671875, 0.4398956298828125, 0.489654541015625, 0.5394134521484375, 0.58917236328125, 0.6389312744140625, 0.688690185546875, 0.7384490966796875, 0.7882080078125, 0.8379669189453125, 0.887725830078125, 0.9374847412109375, 0.98724365234375, 1.0370025634765625, 1.086761474609375, 1.1365203857421875, 1.186279296875, 1.2360382080078125, 1.285797119140625, 1.3355560302734375, 1.38531494140625, 1.4350738525390625, 1.484832763671875, 1.5345916748046875, 1.5843505859375, 1.6341094970703125, 1.683868408203125, 1.7336273193359375, 1.78338623046875, 1.8331451416015625, 1.882904052734375, 1.9326629638671875, 1.982421875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 4.0, 3.0, 3.0, 11.0, 27.0, 24.0, 45.0, 46.0, 71.0, 93.0, 126.0, 118.0, 110.0, 85.0, 73.0, 43.0, 36.0, 26.0, 16.0, 15.0, 7.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.03863525390625, -1.9718017578125, -1.90496826171875, -1.838134765625, -1.77130126953125, -1.7044677734375, -1.63763427734375, -1.57080078125, -1.50396728515625, -1.4371337890625, -1.37030029296875, -1.303466796875, -1.23663330078125, -1.1697998046875, -1.10296630859375, -1.0361328125, -0.96929931640625, -0.9024658203125, -0.83563232421875, -0.768798828125, -0.70196533203125, -0.6351318359375, -0.56829833984375, -0.50146484375, -0.43463134765625, -0.3677978515625, -0.30096435546875, -0.234130859375, -0.16729736328125, -0.1004638671875, -0.03363037109375, 0.033203125, 0.10003662109375, 0.1668701171875, 0.23370361328125, 0.300537109375, 0.36737060546875, 0.4342041015625, 0.50103759765625, 0.56787109375, 0.63470458984375, 0.7015380859375, 0.76837158203125, 0.835205078125, 0.90203857421875, 0.9688720703125, 1.03570556640625, 1.1025390625, 1.16937255859375, 1.2362060546875, 1.30303955078125, 1.369873046875, 1.43670654296875, 1.5035400390625, 1.57037353515625, 1.63720703125, 1.70404052734375, 1.7708740234375, 1.83770751953125, 1.904541015625, 1.97137451171875, 2.0382080078125, 2.10504150390625, 2.171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 20.0, 27.0, 108.0, 183.0, 302.0, 211.0, 91.0, 34.0, 15.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.68215942382812, -68.04549407958984, -66.40882110595703, -64.77215576171875, -63.13548278808594, -61.49881362915039, -59.862144470214844, -58.22547912597656, -56.58880615234375, -54.9521369934082, -53.315467834472656, -51.67879867553711, -50.04212951660156, -48.405460357666016, -46.76879119873047, -45.13212585449219, -43.49545669555664, -41.858787536621094, -40.22211837768555, -38.58544921875, -36.94878005981445, -35.312110900878906, -33.675445556640625, -32.03877258300781, -30.4021053314209, -28.76543617248535, -27.128767013549805, -25.49209976196289, -23.855430603027344, -22.218761444091797, -20.58209228515625, -18.945423126220703, -17.308757781982422, -15.672088623046875, -14.035419464111328, -12.398751258850098, -10.76208209991455, -9.125412940979004, -7.488744735717773, -5.852075576782227, -4.21540641784668, -2.578737497329712, -0.9420685768127441, 0.6946001052856445, 2.3312692642211914, 3.9679384231567383, 5.604606628417969, 7.241275787353516, 8.877944946289062, 10.51461410522461, 12.151283264160156, 13.787951469421387, 15.424620628356934, 17.061290740966797, 18.69795799255371, 20.334627151489258, 21.971296310424805, 23.60796546936035, 25.2446346282959, 26.881301879882812, 28.51797103881836, 30.154640197753906, 31.791309356689453, 33.427978515625, 35.06464767456055]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 7.0, 6.0, 13.0, 13.0, 16.0, 20.0, 22.0, 33.0, 29.0, 52.0, 41.0, 51.0, 51.0, 64.0, 81.0, 81.0, 66.0, 68.0, 61.0, 43.0, 30.0, 35.0, 22.0, 22.0, 21.0, 17.0, 10.0, 8.0, 7.0, 1.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.02332305908203, -28.27657127380371, -27.52981948852539, -26.78306770324707, -26.03631591796875, -25.289566040039062, -24.542814254760742, -23.796062469482422, -23.0493106842041, -22.30255889892578, -21.55580711364746, -20.80905532836914, -20.062305450439453, -19.315553665161133, -18.568801879882812, -17.822050094604492, -17.075298309326172, -16.32854652404785, -15.581794738769531, -14.835043907165527, -14.088292121887207, -13.341540336608887, -12.594789505004883, -11.848037719726562, -11.101285934448242, -10.354534149169922, -9.607782363891602, -8.861031532287598, -8.114279747009277, -7.367527961730957, -6.620776653289795, -5.874025344848633, -5.1272735595703125, -4.380521774291992, -3.63377046585083, -2.887018918991089, -2.1402673721313477, -1.3935158252716064, -0.6467642784118652, 0.09998703002929688, 0.8467388153076172, 1.5934903621673584, 2.3402419090270996, 3.086993455886841, 3.833745002746582, 4.580496788024902, 5.3272480964660645, 6.073999404907227, 6.820751190185547, 7.567502975463867, 8.314254760742188, 9.061005592346191, 9.807757377624512, 10.554509162902832, 11.301259994506836, 12.048011779785156, 12.794763565063477, 13.541515350341797, 14.288267135620117, 15.035017967224121, 15.781769752502441, 16.528520584106445, 17.275272369384766, 18.022024154663086, 18.768775939941406]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 5.0, 9.0, 12.0, 25.0, 31.0, 40.0, 74.0, 105.0, 204.0, 504.0, 1642.0, 7166.0, 51631.0, 3670771.0, 436626.0, 19822.0, 3949.0, 969.0, 332.0, 120.0, 69.0, 58.0, 21.0, 31.0, 7.0, 8.0, 7.0, 4.0, 12.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.890625, -4.753936767578125, -4.61724853515625, -4.480560302734375, -4.3438720703125, -4.207183837890625, -4.07049560546875, -3.933807373046875, -3.797119140625, -3.660430908203125, -3.52374267578125, -3.387054443359375, -3.2503662109375, -3.113677978515625, -2.97698974609375, -2.840301513671875, -2.70361328125, -2.566925048828125, -2.43023681640625, -2.293548583984375, -2.1568603515625, -2.020172119140625, -1.88348388671875, -1.746795654296875, -1.610107421875, -1.473419189453125, -1.33673095703125, -1.200042724609375, -1.0633544921875, -0.926666259765625, -0.78997802734375, -0.653289794921875, -0.5166015625, -0.379913330078125, -0.24322509765625, -0.106536865234375, 0.0301513671875, 0.166839599609375, 0.30352783203125, 0.440216064453125, 0.576904296875, 0.713592529296875, 0.85028076171875, 0.986968994140625, 1.1236572265625, 1.260345458984375, 1.39703369140625, 1.533721923828125, 1.67041015625, 1.807098388671875, 1.94378662109375, 2.080474853515625, 2.2171630859375, 2.353851318359375, 2.49053955078125, 2.627227783203125, 2.763916015625, 2.900604248046875, 3.03729248046875, 3.173980712890625, 3.3106689453125, 3.447357177734375, 3.58404541015625, 3.720733642578125, 3.857421875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 9.0, 15.0, 17.0, 36.0, 57.0, 54.0, 76.0, 102.0, 103.0, 109.0, 98.0, 82.0, 80.0, 51.0, 45.0, 31.0, 21.0, 11.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.08984375, -3.0200958251953125, -2.950347900390625, -2.8805999755859375, -2.81085205078125, -2.7411041259765625, -2.671356201171875, -2.6016082763671875, -2.5318603515625, -2.4621124267578125, -2.392364501953125, -2.3226165771484375, -2.25286865234375, -2.1831207275390625, -2.113372802734375, -2.0436248779296875, -1.973876953125, -1.9041290283203125, -1.834381103515625, -1.7646331787109375, -1.69488525390625, -1.6251373291015625, -1.555389404296875, -1.4856414794921875, -1.4158935546875, -1.3461456298828125, -1.276397705078125, -1.2066497802734375, -1.13690185546875, -1.0671539306640625, -0.997406005859375, -0.9276580810546875, -0.85791015625, -0.7881622314453125, -0.718414306640625, -0.6486663818359375, -0.57891845703125, -0.5091705322265625, -0.439422607421875, -0.3696746826171875, -0.2999267578125, -0.2301788330078125, -0.160430908203125, -0.0906829833984375, -0.02093505859375, 0.0488128662109375, 0.118560791015625, 0.1883087158203125, 0.258056640625, 0.3278045654296875, 0.397552490234375, 0.4673004150390625, 0.53704833984375, 0.6067962646484375, 0.676544189453125, 0.7462921142578125, 0.8160400390625, 0.8857879638671875, 0.955535888671875, 1.0252838134765625, 1.09503173828125, 1.1647796630859375, 1.234527587890625, 1.3042755126953125, 1.3740234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 13.0, 19.0, 16.0, 36.0, 54.0, 102.0, 203.0, 372.0, 863.0, 1899.0, 4603.0, 12051.0, 35270.0, 153371.0, 2743889.0, 1107364.0, 93040.0, 25451.0, 8954.0, 3487.0, 1555.0, 765.0, 398.0, 222.0, 115.0, 65.0, 35.0, 31.0, 12.0, 8.0, 4.0, 4.0, 7.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.740234375, -2.656829833984375, -2.57342529296875, -2.490020751953125, -2.4066162109375, -2.323211669921875, -2.23980712890625, -2.156402587890625, -2.072998046875, -1.989593505859375, -1.90618896484375, -1.822784423828125, -1.7393798828125, -1.655975341796875, -1.57257080078125, -1.489166259765625, -1.40576171875, -1.322357177734375, -1.23895263671875, -1.155548095703125, -1.0721435546875, -0.988739013671875, -0.90533447265625, -0.821929931640625, -0.738525390625, -0.655120849609375, -0.57171630859375, -0.488311767578125, -0.4049072265625, -0.321502685546875, -0.23809814453125, -0.154693603515625, -0.0712890625, 0.012115478515625, 0.09552001953125, 0.178924560546875, 0.2623291015625, 0.345733642578125, 0.42913818359375, 0.512542724609375, 0.595947265625, 0.679351806640625, 0.76275634765625, 0.846160888671875, 0.9295654296875, 1.012969970703125, 1.09637451171875, 1.179779052734375, 1.26318359375, 1.346588134765625, 1.42999267578125, 1.513397216796875, 1.5968017578125, 1.680206298828125, 1.76361083984375, 1.847015380859375, 1.930419921875, 2.013824462890625, 2.09722900390625, 2.180633544921875, 2.2640380859375, 2.347442626953125, 2.43084716796875, 2.514251708984375, 2.59765625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 10.0, 5.0, 7.0, 4.0, 10.0, 15.0, 14.0, 19.0, 12.0, 35.0, 32.0, 67.0, 86.0, 137.0, 288.0, 529.0, 858.0, 783.0, 458.0, 237.0, 158.0, 88.0, 60.0, 28.0, 23.0, 27.0, 14.0, 24.0, 9.0, 3.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.01348876953125, -1.9293212890625, -1.84515380859375, -1.760986328125, -1.67681884765625, -1.5926513671875, -1.50848388671875, -1.42431640625, -1.34014892578125, -1.2559814453125, -1.17181396484375, -1.087646484375, -1.00347900390625, -0.9193115234375, -0.83514404296875, -0.7509765625, -0.66680908203125, -0.5826416015625, -0.49847412109375, -0.414306640625, -0.33013916015625, -0.2459716796875, -0.16180419921875, -0.07763671875, 0.00653076171875, 0.0906982421875, 0.17486572265625, 0.259033203125, 0.34320068359375, 0.4273681640625, 0.51153564453125, 0.595703125, 0.67987060546875, 0.7640380859375, 0.84820556640625, 0.932373046875, 1.01654052734375, 1.1007080078125, 1.18487548828125, 1.26904296875, 1.35321044921875, 1.4373779296875, 1.52154541015625, 1.605712890625, 1.68988037109375, 1.7740478515625, 1.85821533203125, 1.9423828125, 2.02655029296875, 2.1107177734375, 2.19488525390625, 2.279052734375, 2.36322021484375, 2.4473876953125, 2.53155517578125, 2.61572265625, 2.69989013671875, 2.7840576171875, 2.86822509765625, 2.952392578125, 3.03656005859375, 3.1207275390625, 3.20489501953125, 3.2890625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 14.0, 93.0, 186.0, 314.0, 224.0, 100.0, 34.0, 10.0, 8.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.85332489013672, -39.42203903198242, -37.990753173828125, -36.55946350097656, -35.128177642822266, -33.69689178466797, -32.26560592651367, -30.834320068359375, -29.403032302856445, -27.97174644470215, -26.54045867919922, -25.109172821044922, -23.677886962890625, -22.246599197387695, -20.8153133392334, -19.38402557373047, -17.952739715576172, -16.521453857421875, -15.090166091918945, -13.658880233764648, -12.227593421936035, -10.796306610107422, -9.365020751953125, -7.933733940124512, -6.502447128295898, -5.071160316467285, -3.63987398147583, -2.208587646484375, -0.7773008346557617, 0.6539859771728516, 2.0852718353271484, 3.5165586471557617, 4.947845458984375, 6.379132270812988, 7.810418605804443, 9.241704940795898, 10.672991752624512, 12.104278564453125, 13.535564422607422, 14.966851234436035, 16.39813804626465, 17.829423904418945, 19.260711669921875, 20.691997528076172, 22.12328338623047, 23.5545711517334, 24.985857009887695, 26.417144775390625, 27.848430633544922, 29.27971649169922, 30.71100425720215, 32.14228820800781, 33.573577880859375, 35.00486373901367, 36.43614959716797, 37.867435455322266, 39.29872131347656, 40.73000717163086, 42.161293029785156, 43.59258270263672, 45.023868560791016, 46.45515441894531, 47.88644027709961, 49.317726135253906, 50.74901580810547]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 7.0, 4.0, 2.0, 5.0, 10.0, 15.0, 12.0, 15.0, 24.0, 24.0, 24.0, 46.0, 30.0, 47.0, 55.0, 56.0, 48.0, 60.0, 62.0, 55.0, 58.0, 49.0, 47.0, 51.0, 33.0, 29.0, 32.0, 18.0, 25.0, 15.0, 13.0, 10.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.802183151245117, -14.299299240112305, -13.796415328979492, -13.29353141784668, -12.790647506713867, -12.287763595581055, -11.784880638122559, -11.281996726989746, -10.779112815856934, -10.276228904724121, -9.773344993591309, -9.270461082458496, -8.767578125, -8.264694213867188, -7.761810302734375, -7.2589263916015625, -6.75604248046875, -6.2531585693359375, -5.750274658203125, -5.247391223907471, -4.744507312774658, -4.241623401641846, -3.7387397289276123, -3.235856056213379, -2.7329721450805664, -2.230088233947754, -1.7272045612335205, -1.2243207693099976, -0.7214369773864746, -0.2185530662536621, 0.2843306064605713, 0.7872142791748047, 1.29010009765625, 1.792983889579773, 2.295867681503296, 2.7987513542175293, 3.301635265350342, 3.8045191764831543, 4.307402610778809, 4.810286521911621, 5.313170433044434, 5.816054344177246, 6.318938255310059, 6.821821689605713, 7.324705600738525, 7.827589511871338, 8.330472946166992, 8.833356857299805, 9.336240768432617, 9.83912467956543, 10.342008590698242, 10.844892501831055, 11.347776412963867, 11.85066032409668, 12.353543281555176, 12.856427192687988, 13.3593111038208, 13.862195014953613, 14.365078926086426, 14.867962837219238, 15.370845794677734, 15.873729705810547, 16.37661361694336, 16.879497528076172, 17.382381439208984]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 0.0, 6.0, 5.0, 9.0, 9.0, 15.0, 24.0, 47.0, 70.0, 130.0, 190.0, 298.0, 532.0, 945.0, 1740.0, 3162.0, 6097.0, 12525.0, 26576.0, 59283.0, 135082.0, 275526.0, 277093.0, 136126.0, 59832.0, 27211.0, 12598.0, 6323.0, 3127.0, 1728.0, 945.0, 535.0, 294.0, 180.0, 104.0, 59.0, 40.0, 36.0, 13.0, 8.0, 12.0, 9.0, 2.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.828125, -1.7691650390625, -1.710205078125, -1.6512451171875, -1.59228515625, -1.5333251953125, -1.474365234375, -1.4154052734375, -1.3564453125, -1.2974853515625, -1.238525390625, -1.1795654296875, -1.12060546875, -1.0616455078125, -1.002685546875, -0.9437255859375, -0.884765625, -0.8258056640625, -0.766845703125, -0.7078857421875, -0.64892578125, -0.5899658203125, -0.531005859375, -0.4720458984375, -0.4130859375, -0.3541259765625, -0.295166015625, -0.2362060546875, -0.17724609375, -0.1182861328125, -0.059326171875, -0.0003662109375, 0.05859375, 0.1175537109375, 0.176513671875, 0.2354736328125, 0.29443359375, 0.3533935546875, 0.412353515625, 0.4713134765625, 0.5302734375, 0.5892333984375, 0.648193359375, 0.7071533203125, 0.76611328125, 0.8250732421875, 0.884033203125, 0.9429931640625, 1.001953125, 1.0609130859375, 1.119873046875, 1.1788330078125, 1.23779296875, 1.2967529296875, 1.355712890625, 1.4146728515625, 1.4736328125, 1.5325927734375, 1.591552734375, 1.6505126953125, 1.70947265625, 1.7684326171875, 1.827392578125, 1.8863525390625, 1.9453125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 15.0, 19.0, 25.0, 28.0, 31.0, 40.0, 52.0, 55.0, 65.0, 83.0, 62.0, 71.0, 75.0, 70.0, 49.0, 61.0, 38.0, 31.0, 30.0, 25.0, 24.0, 22.0, 10.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.515625, -1.465087890625, -1.41455078125, -1.364013671875, -1.3134765625, -1.262939453125, -1.21240234375, -1.161865234375, -1.111328125, -1.060791015625, -1.01025390625, -0.959716796875, -0.9091796875, -0.858642578125, -0.80810546875, -0.757568359375, -0.70703125, -0.656494140625, -0.60595703125, -0.555419921875, -0.5048828125, -0.454345703125, -0.40380859375, -0.353271484375, -0.302734375, -0.252197265625, -0.20166015625, -0.151123046875, -0.1005859375, -0.050048828125, 0.00048828125, 0.051025390625, 0.1015625, 0.152099609375, 0.20263671875, 0.253173828125, 0.3037109375, 0.354248046875, 0.40478515625, 0.455322265625, 0.505859375, 0.556396484375, 0.60693359375, 0.657470703125, 0.7080078125, 0.758544921875, 0.80908203125, 0.859619140625, 0.91015625, 0.960693359375, 1.01123046875, 1.061767578125, 1.1123046875, 1.162841796875, 1.21337890625, 1.263916015625, 1.314453125, 1.364990234375, 1.41552734375, 1.466064453125, 1.5166015625, 1.567138671875, 1.61767578125, 1.668212890625, 1.71875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 7.0, 14.0, 13.0, 25.0, 13.0, 32.0, 54.0, 62.0, 117.0, 136.0, 238.0, 430.0, 743.0, 1473.0, 3575.0, 11269.0, 45617.0, 236241.0, 583365.0, 126492.0, 26365.0, 7127.0, 2532.0, 1137.0, 589.0, 302.0, 187.0, 120.0, 71.0, 55.0, 31.0, 26.0, 14.0, 15.0, 13.0, 13.0, 3.0, 7.0, 8.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.62109375, -3.505462646484375, -3.38983154296875, -3.274200439453125, -3.1585693359375, -3.042938232421875, -2.92730712890625, -2.811676025390625, -2.696044921875, -2.580413818359375, -2.46478271484375, -2.349151611328125, -2.2335205078125, -2.117889404296875, -2.00225830078125, -1.886627197265625, -1.77099609375, -1.655364990234375, -1.53973388671875, -1.424102783203125, -1.3084716796875, -1.192840576171875, -1.07720947265625, -0.961578369140625, -0.845947265625, -0.730316162109375, -0.61468505859375, -0.499053955078125, -0.3834228515625, -0.267791748046875, -0.15216064453125, -0.036529541015625, 0.0791015625, 0.194732666015625, 0.31036376953125, 0.425994873046875, 0.5416259765625, 0.657257080078125, 0.77288818359375, 0.888519287109375, 1.004150390625, 1.119781494140625, 1.23541259765625, 1.351043701171875, 1.4666748046875, 1.582305908203125, 1.69793701171875, 1.813568115234375, 1.92919921875, 2.044830322265625, 2.16046142578125, 2.276092529296875, 2.3917236328125, 2.507354736328125, 2.62298583984375, 2.738616943359375, 2.854248046875, 2.969879150390625, 3.08551025390625, 3.201141357421875, 3.3167724609375, 3.432403564453125, 3.54803466796875, 3.663665771484375, 3.779296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 4.0, 8.0, 13.0, 13.0, 16.0, 19.0, 23.0, 42.0, 25.0, 36.0, 44.0, 46.0, 52.0, 46.0, 52.0, 60.0, 52.0, 57.0, 53.0, 56.0, 40.0, 46.0, 39.0, 30.0, 27.0, 20.0, 12.0, 15.0, 13.0, 12.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8125, -4.646484375, -4.48046875, -4.314453125, -4.1484375, -3.982421875, -3.81640625, -3.650390625, -3.484375, -3.318359375, -3.15234375, -2.986328125, -2.8203125, -2.654296875, -2.48828125, -2.322265625, -2.15625, -1.990234375, -1.82421875, -1.658203125, -1.4921875, -1.326171875, -1.16015625, -0.994140625, -0.828125, -0.662109375, -0.49609375, -0.330078125, -0.1640625, 0.001953125, 0.16796875, 0.333984375, 0.5, 0.666015625, 0.83203125, 0.998046875, 1.1640625, 1.330078125, 1.49609375, 1.662109375, 1.828125, 1.994140625, 2.16015625, 2.326171875, 2.4921875, 2.658203125, 2.82421875, 2.990234375, 3.15625, 3.322265625, 3.48828125, 3.654296875, 3.8203125, 3.986328125, 4.15234375, 4.318359375, 4.484375, 4.650390625, 4.81640625, 4.982421875, 5.1484375, 5.314453125, 5.48046875, 5.646484375, 5.8125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 6.0, 9.0, 7.0, 6.0, 7.0, 28.0, 32.0, 42.0, 66.0, 128.0, 269.0, 565.0, 1528.0, 5034.0, 31448.0, 666628.0, 317664.0, 19111.0, 3725.0, 1185.0, 523.0, 210.0, 126.0, 72.0, 34.0, 32.0, 14.0, 11.0, 9.0, 8.0, 7.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94921875, -2.86468505859375, -2.7801513671875, -2.69561767578125, -2.611083984375, -2.52655029296875, -2.4420166015625, -2.35748291015625, -2.27294921875, -2.18841552734375, -2.1038818359375, -2.01934814453125, -1.934814453125, -1.85028076171875, -1.7657470703125, -1.68121337890625, -1.5966796875, -1.51214599609375, -1.4276123046875, -1.34307861328125, -1.258544921875, -1.17401123046875, -1.0894775390625, -1.00494384765625, -0.92041015625, -0.83587646484375, -0.7513427734375, -0.66680908203125, -0.582275390625, -0.49774169921875, -0.4132080078125, -0.32867431640625, -0.244140625, -0.15960693359375, -0.0750732421875, 0.00946044921875, 0.093994140625, 0.17852783203125, 0.2630615234375, 0.34759521484375, 0.43212890625, 0.51666259765625, 0.6011962890625, 0.68572998046875, 0.770263671875, 0.85479736328125, 0.9393310546875, 1.02386474609375, 1.1083984375, 1.19293212890625, 1.2774658203125, 1.36199951171875, 1.446533203125, 1.53106689453125, 1.6156005859375, 1.70013427734375, 1.78466796875, 1.86920166015625, 1.9537353515625, 2.03826904296875, 2.122802734375, 2.20733642578125, 2.2918701171875, 2.37640380859375, 2.4609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 5.0, 3.0, 6.0, 13.0, 20.0, 19.0, 17.0, 61.0, 59.0, 75.0, 92.0, 106.0, 117.0, 94.0, 78.0, 59.0, 40.0, 44.0, 18.0, 14.0, 13.0, 7.0, 5.0, 11.0, 3.0, 3.0, 8.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00039124488830566406, -0.0003782697021961212, -0.00036529451608657837, -0.0003523193299770355, -0.0003393441438674927, -0.00032636895775794983, -0.000313393771648407, -0.00030041858553886414, -0.0002874433994293213, -0.00027446821331977844, -0.0002614930272102356, -0.00024851784110069275, -0.0002355426549911499, -0.00022256746888160706, -0.0002095922827720642, -0.00019661709666252136, -0.00018364191055297852, -0.00017066672444343567, -0.00015769153833389282, -0.00014471635222434998, -0.00013174116611480713, -0.00011876598000526428, -0.00010579079389572144, -9.281560778617859e-05, -7.984042167663574e-05, -6.68652355670929e-05, -5.389004945755005e-05, -4.09148633480072e-05, -2.7939677238464355e-05, -1.4964491128921509e-05, -1.989305019378662e-06, 1.0985881090164185e-05, 2.396106719970703e-05, 3.693625330924988e-05, 4.9911439418792725e-05, 6.288662552833557e-05, 7.586181163787842e-05, 8.883699774742126e-05, 0.00010181218385696411, 0.00011478736996650696, 0.0001277625560760498, 0.00014073774218559265, 0.0001537129282951355, 0.00016668811440467834, 0.0001796633005142212, 0.00019263848662376404, 0.00020561367273330688, 0.00021858885884284973, 0.00023156404495239258, 0.0002445392310619354, 0.00025751441717147827, 0.0002704896032810211, 0.00028346478939056396, 0.0002964399755001068, 0.00030941516160964966, 0.0003223903477191925, 0.00033536553382873535, 0.0003483407199382782, 0.00036131590604782104, 0.0003742910921573639, 0.00038726627826690674, 0.0004002414643764496, 0.00041321665048599243, 0.0004261918365955353, 0.0004391670227050781]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 11.0, 16.0, 21.0, 30.0, 55.0, 75.0, 153.0, 271.0, 595.0, 1427.0, 4605.0, 24619.0, 282303.0, 668993.0, 54128.0, 7587.0, 2047.0, 814.0, 353.0, 162.0, 102.0, 67.0, 38.0, 22.0, 15.0, 11.0, 7.0, 6.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.115234375, -2.051483154296875, -1.98773193359375, -1.923980712890625, -1.8602294921875, -1.796478271484375, -1.73272705078125, -1.668975830078125, -1.605224609375, -1.541473388671875, -1.47772216796875, -1.413970947265625, -1.3502197265625, -1.286468505859375, -1.22271728515625, -1.158966064453125, -1.09521484375, -1.031463623046875, -0.96771240234375, -0.903961181640625, -0.8402099609375, -0.776458740234375, -0.71270751953125, -0.648956298828125, -0.585205078125, -0.521453857421875, -0.45770263671875, -0.393951416015625, -0.3302001953125, -0.266448974609375, -0.20269775390625, -0.138946533203125, -0.0751953125, -0.011444091796875, 0.05230712890625, 0.116058349609375, 0.1798095703125, 0.243560791015625, 0.30731201171875, 0.371063232421875, 0.434814453125, 0.498565673828125, 0.56231689453125, 0.626068115234375, 0.6898193359375, 0.753570556640625, 0.81732177734375, 0.881072998046875, 0.94482421875, 1.008575439453125, 1.07232666015625, 1.136077880859375, 1.1998291015625, 1.263580322265625, 1.32733154296875, 1.391082763671875, 1.454833984375, 1.518585205078125, 1.58233642578125, 1.646087646484375, 1.7098388671875, 1.773590087890625, 1.83734130859375, 1.901092529296875, 1.96484375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 4.0, 6.0, 6.0, 8.0, 21.0, 25.0, 26.0, 30.0, 37.0, 56.0, 61.0, 69.0, 79.0, 80.0, 88.0, 73.0, 80.0, 63.0, 45.0, 35.0, 26.0, 22.0, 18.0, 10.0, 13.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7666015625, -1.7126007080078125, -1.658599853515625, -1.6045989990234375, -1.55059814453125, -1.4965972900390625, -1.442596435546875, -1.3885955810546875, -1.3345947265625, -1.2805938720703125, -1.226593017578125, -1.1725921630859375, -1.11859130859375, -1.0645904541015625, -1.010589599609375, -0.9565887451171875, -0.902587890625, -0.8485870361328125, -0.794586181640625, -0.7405853271484375, -0.68658447265625, -0.6325836181640625, -0.578582763671875, -0.5245819091796875, -0.4705810546875, -0.4165802001953125, -0.362579345703125, -0.3085784912109375, -0.25457763671875, -0.2005767822265625, -0.146575927734375, -0.0925750732421875, -0.03857421875, 0.0154266357421875, 0.069427490234375, 0.1234283447265625, 0.17742919921875, 0.2314300537109375, 0.285430908203125, 0.3394317626953125, 0.3934326171875, 0.4474334716796875, 0.501434326171875, 0.5554351806640625, 0.60943603515625, 0.6634368896484375, 0.717437744140625, 0.7714385986328125, 0.825439453125, 0.8794403076171875, 0.933441162109375, 0.9874420166015625, 1.04144287109375, 1.0954437255859375, 1.149444580078125, 1.2034454345703125, 1.2574462890625, 1.3114471435546875, 1.365447998046875, 1.4194488525390625, 1.47344970703125, 1.5274505615234375, 1.581451416015625, 1.6354522705078125, 1.689453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 19.0, 45.0, 112.0, 216.0, 265.0, 172.0, 85.0, 35.0, 21.0, 6.0, 6.0, 5.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.83061981201172, -35.3729133605957, -33.91520690917969, -32.45750427246094, -30.999797821044922, -29.542091369628906, -28.084386825561523, -26.62668228149414, -25.168975830078125, -23.71126937866211, -22.253564834594727, -20.795860290527344, -19.338153839111328, -17.880447387695312, -16.42274284362793, -14.96503734588623, -13.507331848144531, -12.049626350402832, -10.591920852661133, -9.134215354919434, -7.676509857177734, -6.218804359436035, -4.761098861694336, -3.3033933639526367, -1.8456878662109375, -0.3879823684692383, 1.069723129272461, 2.52742862701416, 3.9851341247558594, 5.442839622497559, 6.900545120239258, 8.358250617980957, 9.815959930419922, 11.273665428161621, 12.73137092590332, 14.18907642364502, 15.646781921386719, 17.104488372802734, 18.562192916870117, 20.0198974609375, 21.477603912353516, 22.93531036376953, 24.393014907836914, 25.850719451904297, 27.308425903320312, 28.766132354736328, 30.22383689880371, 31.681541442871094, 33.13924789428711, 34.596954345703125, 36.054656982421875, 37.51236343383789, 38.970069885253906, 40.42777633666992, 41.88548278808594, 43.34318542480469, 44.8008918762207, 46.25859832763672, 47.71630096435547, 49.174007415771484, 50.6317138671875, 52.089420318603516, 53.54712677001953, 55.00482940673828, 56.4625358581543]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 6.0, 14.0, 14.0, 23.0, 30.0, 27.0, 32.0, 46.0, 43.0, 56.0, 50.0, 64.0, 79.0, 88.0, 75.0, 61.0, 52.0, 54.0, 33.0, 37.0, 30.0, 16.0, 14.0, 14.0, 10.0, 8.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.305660247802734, -35.44225311279297, -34.5788459777832, -33.71543502807617, -32.852027893066406, -31.98862075805664, -31.125213623046875, -30.261804580688477, -29.398395538330078, -28.534988403320312, -27.671579360961914, -26.80817222595215, -25.94476318359375, -25.081356048583984, -24.21794891357422, -23.35453987121582, -22.491132736206055, -21.62772560119629, -20.76431655883789, -19.900909423828125, -19.037500381469727, -18.17409324645996, -17.310684204101562, -16.447277069091797, -15.583868980407715, -14.720460891723633, -13.85705280303955, -12.993644714355469, -12.130237579345703, -11.266828536987305, -10.403421401977539, -9.540013313293457, -8.676603317260742, -7.81319522857666, -6.949787139892578, -6.086379528045654, -5.222971439361572, -4.35956335067749, -3.4961557388305664, -2.6327476501464844, -1.7693395614624023, -0.9059315919876099, -0.04252362251281738, 0.8208842277526855, 1.6842923164367676, 2.5477004051208496, 3.4111080169677734, 4.2745161056518555, 5.1379241943359375, 6.0013322830200195, 6.864740371704102, 7.728147983551025, 8.591556549072266, 9.454963684082031, 10.318371772766113, 11.181779861450195, 12.045187950134277, 12.90859603881836, 13.772004127502441, 14.635412216186523, 15.498819351196289, 16.362228393554688, 17.225635528564453, 18.08904266357422, 18.952451705932617]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 5.0, 12.0, 16.0, 16.0, 25.0, 47.0, 47.0, 106.0, 224.0, 413.0, 902.0, 2046.0, 5131.0, 14957.0, 56694.0, 404992.0, 2827975.0, 760279.0, 86581.0, 21477.0, 7269.0, 2852.0, 1193.0, 525.0, 240.0, 112.0, 58.0, 38.0, 8.0, 15.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2734375, -2.216064453125, -2.15869140625, -2.101318359375, -2.0439453125, -1.986572265625, -1.92919921875, -1.871826171875, -1.814453125, -1.757080078125, -1.69970703125, -1.642333984375, -1.5849609375, -1.527587890625, -1.47021484375, -1.412841796875, -1.35546875, -1.298095703125, -1.24072265625, -1.183349609375, -1.1259765625, -1.068603515625, -1.01123046875, -0.953857421875, -0.896484375, -0.839111328125, -0.78173828125, -0.724365234375, -0.6669921875, -0.609619140625, -0.55224609375, -0.494873046875, -0.4375, -0.380126953125, -0.32275390625, -0.265380859375, -0.2080078125, -0.150634765625, -0.09326171875, -0.035888671875, 0.021484375, 0.078857421875, 0.13623046875, 0.193603515625, 0.2509765625, 0.308349609375, 0.36572265625, 0.423095703125, 0.48046875, 0.537841796875, 0.59521484375, 0.652587890625, 0.7099609375, 0.767333984375, 0.82470703125, 0.882080078125, 0.939453125, 0.996826171875, 1.05419921875, 1.111572265625, 1.1689453125, 1.226318359375, 1.28369140625, 1.341064453125, 1.3984375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 9.0, 19.0, 23.0, 34.0, 34.0, 66.0, 59.0, 97.0, 85.0, 89.0, 93.0, 99.0, 77.0, 74.0, 49.0, 41.0, 22.0, 20.0, 11.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.11328125, -3.0492782592773438, -2.9852752685546875, -2.9212722778320312, -2.857269287109375, -2.7932662963867188, -2.7292633056640625, -2.6652603149414062, -2.60125732421875, -2.5372543334960938, -2.4732513427734375, -2.4092483520507812, -2.345245361328125, -2.2812423706054688, -2.2172393798828125, -2.1532363891601562, -2.0892333984375, -2.0252304077148438, -1.9612274169921875, -1.8972244262695312, -1.833221435546875, -1.7692184448242188, -1.7052154541015625, -1.6412124633789062, -1.57720947265625, -1.5132064819335938, -1.4492034912109375, -1.3852005004882812, -1.321197509765625, -1.2571945190429688, -1.1931915283203125, -1.1291885375976562, -1.065185546875, -1.0011825561523438, -0.9371795654296875, -0.8731765747070312, -0.809173583984375, -0.7451705932617188, -0.6811676025390625, -0.6171646118164062, -0.55316162109375, -0.48915863037109375, -0.4251556396484375, -0.36115264892578125, -0.297149658203125, -0.23314666748046875, -0.1691436767578125, -0.10514068603515625, -0.0411376953125, 0.02286529541015625, 0.0868682861328125, 0.15087127685546875, 0.214874267578125, 0.27887725830078125, 0.3428802490234375, 0.40688323974609375, 0.47088623046875, 0.5348892211914062, 0.5988922119140625, 0.6628952026367188, 0.726898193359375, 0.7909011840820312, 0.8549041748046875, 0.9189071655273438, 0.98291015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 17.0, 12.0, 20.0, 24.0, 28.0, 54.0, 92.0, 156.0, 272.0, 488.0, 1014.0, 2345.0, 6415.0, 20541.0, 94655.0, 1299692.0, 2568616.0, 153942.0, 30748.0, 9033.0, 3234.0, 1338.0, 645.0, 337.0, 205.0, 110.0, 60.0, 46.0, 39.0, 31.0, 14.0, 15.0, 6.0, 6.0, 10.0, 6.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.578125, -2.48956298828125, -2.4010009765625, -2.31243896484375, -2.223876953125, -2.13531494140625, -2.0467529296875, -1.95819091796875, -1.86962890625, -1.78106689453125, -1.6925048828125, -1.60394287109375, -1.515380859375, -1.42681884765625, -1.3382568359375, -1.24969482421875, -1.1611328125, -1.07257080078125, -0.9840087890625, -0.89544677734375, -0.806884765625, -0.71832275390625, -0.6297607421875, -0.54119873046875, -0.45263671875, -0.36407470703125, -0.2755126953125, -0.18695068359375, -0.098388671875, -0.00982666015625, 0.0787353515625, 0.16729736328125, 0.255859375, 0.34442138671875, 0.4329833984375, 0.52154541015625, 0.610107421875, 0.69866943359375, 0.7872314453125, 0.87579345703125, 0.96435546875, 1.05291748046875, 1.1414794921875, 1.23004150390625, 1.318603515625, 1.40716552734375, 1.4957275390625, 1.58428955078125, 1.6728515625, 1.76141357421875, 1.8499755859375, 1.93853759765625, 2.027099609375, 2.11566162109375, 2.2042236328125, 2.29278564453125, 2.38134765625, 2.46990966796875, 2.5584716796875, 2.64703369140625, 2.735595703125, 2.82415771484375, 2.9127197265625, 3.00128173828125, 3.08984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 2.0, 6.0, 5.0, 5.0, 8.0, 18.0, 20.0, 21.0, 34.0, 47.0, 64.0, 105.0, 206.0, 321.0, 553.0, 825.0, 678.0, 404.0, 246.0, 130.0, 97.0, 63.0, 61.0, 42.0, 25.0, 19.0, 17.0, 10.0, 11.0, 7.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.2421875, -3.14324951171875, -3.0443115234375, -2.94537353515625, -2.846435546875, -2.74749755859375, -2.6485595703125, -2.54962158203125, -2.45068359375, -2.35174560546875, -2.2528076171875, -2.15386962890625, -2.054931640625, -1.95599365234375, -1.8570556640625, -1.75811767578125, -1.6591796875, -1.56024169921875, -1.4613037109375, -1.36236572265625, -1.263427734375, -1.16448974609375, -1.0655517578125, -0.96661376953125, -0.86767578125, -0.76873779296875, -0.6697998046875, -0.57086181640625, -0.471923828125, -0.37298583984375, -0.2740478515625, -0.17510986328125, -0.076171875, 0.02276611328125, 0.1217041015625, 0.22064208984375, 0.319580078125, 0.41851806640625, 0.5174560546875, 0.61639404296875, 0.71533203125, 0.81427001953125, 0.9132080078125, 1.01214599609375, 1.111083984375, 1.21002197265625, 1.3089599609375, 1.40789794921875, 1.5068359375, 1.60577392578125, 1.7047119140625, 1.80364990234375, 1.902587890625, 2.00152587890625, 2.1004638671875, 2.19940185546875, 2.29833984375, 2.39727783203125, 2.4962158203125, 2.59515380859375, 2.694091796875, 2.79302978515625, 2.8919677734375, 2.99090576171875, 3.08984375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 17.0, 38.0, 90.0, 217.0, 273.0, 204.0, 87.0, 39.0, 16.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.38591766357422, -22.97064208984375, -21.55536651611328, -20.140090942382812, -18.724817276000977, -17.309541702270508, -15.894266128540039, -14.478991508483887, -13.063715934753418, -11.64844036102295, -10.233165740966797, -8.817890167236328, -7.402615070343018, -5.987339973449707, -4.572064399719238, -3.156789779663086, -1.7415142059326172, -0.3262389898300171, 1.089036226272583, 2.5043115615844727, 3.919586658477783, 5.334861755371094, 6.7501373291015625, 8.165411949157715, 9.580687522888184, 10.995963096618652, 12.411237716674805, 13.826513290405273, 15.241788864135742, 16.657062530517578, 18.072338104248047, 19.487613677978516, 20.902889251708984, 22.318164825439453, 23.733440399169922, 25.14871597290039, 26.563989639282227, 27.979265213012695, 29.394540786743164, 30.809814453125, 32.22509002685547, 33.64036560058594, 35.055641174316406, 36.470916748046875, 37.886192321777344, 39.30146789550781, 40.71674346923828, 42.132015228271484, 43.54729461669922, 44.96257019042969, 46.377845764160156, 47.793121337890625, 49.208396911621094, 50.62367248535156, 52.03894805908203, 53.454219818115234, 54.8694953918457, 56.28477096557617, 57.70004653930664, 59.11532211303711, 60.53059768676758, 61.94586944580078, 63.36114501953125, 64.77642059326172, 66.19169616699219]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 10.0, 8.0, 11.0, 12.0, 8.0, 21.0, 22.0, 25.0, 25.0, 32.0, 30.0, 26.0, 39.0, 46.0, 47.0, 43.0, 49.0, 47.0, 45.0, 63.0, 52.0, 41.0, 41.0, 30.0, 28.0, 24.0, 20.0, 30.0, 20.0, 21.0, 13.0, 21.0, 11.0, 6.0, 6.0, 10.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.254129409790039, -13.804848670959473, -13.355567932128906, -12.90628719329834, -12.457006454467773, -12.00772476196289, -11.558444023132324, -11.109163284301758, -10.659882545471191, -10.210601806640625, -9.761321067810059, -9.312040328979492, -8.86275863647461, -8.41347885131836, -7.964197158813477, -7.51491641998291, -7.065635681152344, -6.616354942321777, -6.167074203491211, -5.717792987823486, -5.26851224899292, -4.8192315101623535, -4.369950294494629, -3.9206695556640625, -3.471388816833496, -3.0221080780029297, -2.572827100753784, -2.1235461235046387, -1.6742653846740723, -1.2249846458435059, -0.7757036685943604, -0.32642269134521484, 0.12285804748535156, 0.5721389055252075, 1.0214197635650635, 1.4707006216049194, 1.9199814796447754, 2.369262218475342, 2.8185431957244873, 3.267824172973633, 3.717104911804199, 4.166385650634766, 4.615666389465332, 5.064947605133057, 5.514228343963623, 5.9635090827941895, 6.412790298461914, 6.8620710372924805, 7.311351776123047, 7.760632514953613, 8.20991325378418, 8.659193992614746, 9.108474731445312, 9.557756423950195, 10.007037162780762, 10.456317901611328, 10.905598640441895, 11.354879379272461, 11.804160118103027, 12.253440856933594, 12.702722549438477, 13.152002334594727, 13.60128402709961, 14.050564765930176, 14.499845504760742]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 10.0, 7.0, 12.0, 31.0, 28.0, 45.0, 71.0, 152.0, 261.0, 457.0, 965.0, 1932.0, 4115.0, 9190.0, 21442.0, 49233.0, 110050.0, 214552.0, 276413.0, 191381.0, 93646.0, 41402.0, 18134.0, 7990.0, 3547.0, 1696.0, 754.0, 443.0, 225.0, 142.0, 82.0, 44.0, 28.0, 30.0, 26.0, 10.0, 4.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8544921875, -1.8035430908203125, -1.752593994140625, -1.7016448974609375, -1.65069580078125, -1.5997467041015625, -1.548797607421875, -1.4978485107421875, -1.4468994140625, -1.3959503173828125, -1.345001220703125, -1.2940521240234375, -1.24310302734375, -1.1921539306640625, -1.141204833984375, -1.0902557373046875, -1.039306640625, -0.9883575439453125, -0.937408447265625, -0.8864593505859375, -0.83551025390625, -0.7845611572265625, -0.733612060546875, -0.6826629638671875, -0.6317138671875, -0.5807647705078125, -0.529815673828125, -0.4788665771484375, -0.42791748046875, -0.3769683837890625, -0.326019287109375, -0.2750701904296875, -0.22412109375, -0.1731719970703125, -0.122222900390625, -0.0712738037109375, -0.02032470703125, 0.0306243896484375, 0.081573486328125, 0.1325225830078125, 0.1834716796875, 0.2344207763671875, 0.285369873046875, 0.3363189697265625, 0.38726806640625, 0.4382171630859375, 0.489166259765625, 0.5401153564453125, 0.591064453125, 0.6420135498046875, 0.692962646484375, 0.7439117431640625, 0.79486083984375, 0.8458099365234375, 0.896759033203125, 0.9477081298828125, 0.9986572265625, 1.0496063232421875, 1.100555419921875, 1.1515045166015625, 1.20245361328125, 1.2534027099609375, 1.304351806640625, 1.3553009033203125, 1.40625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 4.0, 9.0, 18.0, 10.0, 14.0, 27.0, 30.0, 32.0, 37.0, 55.0, 55.0, 54.0, 65.0, 61.0, 51.0, 42.0, 58.0, 52.0, 47.0, 51.0, 46.0, 30.0, 32.0, 34.0, 27.0, 18.0, 10.0, 9.0, 9.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.7373046875, -1.6965789794921875, -1.655853271484375, -1.6151275634765625, -1.57440185546875, -1.5336761474609375, -1.492950439453125, -1.4522247314453125, -1.4114990234375, -1.3707733154296875, -1.330047607421875, -1.2893218994140625, -1.24859619140625, -1.2078704833984375, -1.167144775390625, -1.1264190673828125, -1.085693359375, -1.0449676513671875, -1.004241943359375, -0.9635162353515625, -0.92279052734375, -0.8820648193359375, -0.841339111328125, -0.8006134033203125, -0.7598876953125, -0.7191619873046875, -0.678436279296875, -0.6377105712890625, -0.59698486328125, -0.5562591552734375, -0.515533447265625, -0.4748077392578125, -0.43408203125, -0.3933563232421875, -0.352630615234375, -0.3119049072265625, -0.27117919921875, -0.2304534912109375, -0.189727783203125, -0.1490020751953125, -0.1082763671875, -0.0675506591796875, -0.026824951171875, 0.0139007568359375, 0.05462646484375, 0.0953521728515625, 0.136077880859375, 0.1768035888671875, 0.217529296875, 0.2582550048828125, 0.298980712890625, 0.3397064208984375, 0.38043212890625, 0.4211578369140625, 0.461883544921875, 0.5026092529296875, 0.5433349609375, 0.5840606689453125, 0.624786376953125, 0.6655120849609375, 0.70623779296875, 0.7469635009765625, 0.787689208984375, 0.8284149169921875, 0.869140625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 13.0, 20.0, 21.0, 30.0, 42.0, 53.0, 85.0, 124.0, 199.0, 270.0, 449.0, 775.0, 1290.0, 2792.0, 8073.0, 41757.0, 310263.0, 591143.0, 71719.0, 11867.0, 3512.0, 1586.0, 879.0, 534.0, 357.0, 224.0, 141.0, 111.0, 60.0, 43.0, 37.0, 24.0, 16.0, 11.0, 4.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.47265625, -4.355377197265625, -4.23809814453125, -4.120819091796875, -4.0035400390625, -3.886260986328125, -3.76898193359375, -3.651702880859375, -3.534423828125, -3.417144775390625, -3.29986572265625, -3.182586669921875, -3.0653076171875, -2.948028564453125, -2.83074951171875, -2.713470458984375, -2.59619140625, -2.478912353515625, -2.36163330078125, -2.244354248046875, -2.1270751953125, -2.009796142578125, -1.89251708984375, -1.775238037109375, -1.657958984375, -1.540679931640625, -1.42340087890625, -1.306121826171875, -1.1888427734375, -1.071563720703125, -0.95428466796875, -0.837005615234375, -0.7197265625, -0.602447509765625, -0.48516845703125, -0.367889404296875, -0.2506103515625, -0.133331298828125, -0.01605224609375, 0.101226806640625, 0.218505859375, 0.335784912109375, 0.45306396484375, 0.570343017578125, 0.6876220703125, 0.804901123046875, 0.92218017578125, 1.039459228515625, 1.15673828125, 1.274017333984375, 1.39129638671875, 1.508575439453125, 1.6258544921875, 1.743133544921875, 1.86041259765625, 1.977691650390625, 2.094970703125, 2.212249755859375, 2.32952880859375, 2.446807861328125, 2.5640869140625, 2.681365966796875, 2.79864501953125, 2.915924072265625, 3.033203125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 7.0, 4.0, 7.0, 11.0, 13.0, 26.0, 30.0, 35.0, 35.0, 37.0, 43.0, 52.0, 61.0, 67.0, 52.0, 87.0, 65.0, 61.0, 62.0, 45.0, 43.0, 31.0, 29.0, 25.0, 21.0, 24.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.54296875, -7.35833740234375, -7.1737060546875, -6.98907470703125, -6.804443359375, -6.61981201171875, -6.4351806640625, -6.25054931640625, -6.06591796875, -5.88128662109375, -5.6966552734375, -5.51202392578125, -5.327392578125, -5.14276123046875, -4.9581298828125, -4.77349853515625, -4.5888671875, -4.40423583984375, -4.2196044921875, -4.03497314453125, -3.850341796875, -3.66571044921875, -3.4810791015625, -3.29644775390625, -3.11181640625, -2.92718505859375, -2.7425537109375, -2.55792236328125, -2.373291015625, -2.18865966796875, -2.0040283203125, -1.81939697265625, -1.634765625, -1.45013427734375, -1.2655029296875, -1.08087158203125, -0.896240234375, -0.71160888671875, -0.5269775390625, -0.34234619140625, -0.15771484375, 0.02691650390625, 0.2115478515625, 0.39617919921875, 0.580810546875, 0.76544189453125, 0.9500732421875, 1.13470458984375, 1.3193359375, 1.50396728515625, 1.6885986328125, 1.87322998046875, 2.057861328125, 2.24249267578125, 2.4271240234375, 2.61175537109375, 2.79638671875, 2.98101806640625, 3.1656494140625, 3.35028076171875, 3.534912109375, 3.71954345703125, 3.9041748046875, 4.08880615234375, 4.2734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 16.0, 13.0, 31.0, 90.0, 168.0, 557.0, 2035.0, 19816.0, 876368.0, 142508.0, 5368.0, 1024.0, 313.0, 121.0, 52.0, 29.0, 15.0, 8.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.044921875, -2.957305908203125, -2.86968994140625, -2.782073974609375, -2.6944580078125, -2.606842041015625, -2.51922607421875, -2.431610107421875, -2.343994140625, -2.256378173828125, -2.16876220703125, -2.081146240234375, -1.9935302734375, -1.905914306640625, -1.81829833984375, -1.730682373046875, -1.64306640625, -1.555450439453125, -1.46783447265625, -1.380218505859375, -1.2926025390625, -1.204986572265625, -1.11737060546875, -1.029754638671875, -0.942138671875, -0.854522705078125, -0.76690673828125, -0.679290771484375, -0.5916748046875, -0.504058837890625, -0.41644287109375, -0.328826904296875, -0.2412109375, -0.153594970703125, -0.06597900390625, 0.021636962890625, 0.1092529296875, 0.196868896484375, 0.28448486328125, 0.372100830078125, 0.459716796875, 0.547332763671875, 0.63494873046875, 0.722564697265625, 0.8101806640625, 0.897796630859375, 0.98541259765625, 1.073028564453125, 1.16064453125, 1.248260498046875, 1.33587646484375, 1.423492431640625, 1.5111083984375, 1.598724365234375, 1.68634033203125, 1.773956298828125, 1.861572265625, 1.949188232421875, 2.03680419921875, 2.124420166015625, 2.2120361328125, 2.299652099609375, 2.38726806640625, 2.474884033203125, 2.5625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 3.0, 2.0, 3.0, 13.0, 13.0, 10.0, 21.0, 19.0, 22.0, 28.0, 31.0, 47.0, 54.0, 52.0, 85.0, 67.0, 83.0, 90.0, 60.0, 50.0, 43.0, 46.0, 39.0, 30.0, 19.0, 13.0, 15.0, 9.0, 7.0, 9.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021457672119140625, -0.00020572543144226074, -0.00019687414169311523, -0.00018802285194396973, -0.00017917156219482422, -0.0001703202724456787, -0.0001614689826965332, -0.0001526176929473877, -0.0001437664031982422, -0.00013491511344909668, -0.00012606382369995117, -0.00011721253395080566, -0.00010836124420166016, -9.950995445251465e-05, -9.065866470336914e-05, -8.180737495422363e-05, -7.295608520507812e-05, -6.410479545593262e-05, -5.525350570678711e-05, -4.64022159576416e-05, -3.7550926208496094e-05, -2.8699636459350586e-05, -1.9848346710205078e-05, -1.099705696105957e-05, -2.1457672119140625e-06, 6.705522537231445e-06, 1.5556812286376953e-05, 2.440810203552246e-05, 3.325939178466797e-05, 4.2110681533813477e-05, 5.0961971282958984e-05, 5.981326103210449e-05, 6.866455078125e-05, 7.751584053039551e-05, 8.636713027954102e-05, 9.521842002868652e-05, 0.00010406970977783203, 0.00011292099952697754, 0.00012177228927612305, 0.00013062357902526855, 0.00013947486877441406, 0.00014832615852355957, 0.00015717744827270508, 0.00016602873802185059, 0.0001748800277709961, 0.0001837313175201416, 0.0001925826072692871, 0.00020143389701843262, 0.00021028518676757812, 0.00021913647651672363, 0.00022798776626586914, 0.00023683905601501465, 0.00024569034576416016, 0.00025454163551330566, 0.00026339292526245117, 0.0002722442150115967, 0.0002810955047607422, 0.0002899467945098877, 0.0002987980842590332, 0.0003076493740081787, 0.0003165006637573242, 0.0003253519535064697, 0.00033420324325561523, 0.00034305453300476074, 0.00035190582275390625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 5.0, 9.0, 9.0, 11.0, 21.0, 24.0, 49.0, 70.0, 85.0, 182.0, 265.0, 424.0, 777.0, 1589.0, 3690.0, 11771.0, 57742.0, 528702.0, 374913.0, 50672.0, 10681.0, 3495.0, 1510.0, 725.0, 404.0, 241.0, 148.0, 93.0, 61.0, 51.0, 30.0, 33.0, 14.0, 16.0, 12.0, 6.0, 5.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.9940032958984375, -0.959686279296875, -0.9253692626953125, -0.89105224609375, -0.8567352294921875, -0.822418212890625, -0.7881011962890625, -0.7537841796875, -0.7194671630859375, -0.685150146484375, -0.6508331298828125, -0.61651611328125, -0.5821990966796875, -0.547882080078125, -0.5135650634765625, -0.479248046875, -0.4449310302734375, -0.410614013671875, -0.3762969970703125, -0.34197998046875, -0.3076629638671875, -0.273345947265625, -0.2390289306640625, -0.2047119140625, -0.1703948974609375, -0.136077880859375, -0.1017608642578125, -0.06744384765625, -0.0331268310546875, 0.001190185546875, 0.0355072021484375, 0.06982421875, 0.1041412353515625, 0.138458251953125, 0.1727752685546875, 0.20709228515625, 0.2414093017578125, 0.275726318359375, 0.3100433349609375, 0.3443603515625, 0.3786773681640625, 0.412994384765625, 0.4473114013671875, 0.48162841796875, 0.5159454345703125, 0.550262451171875, 0.5845794677734375, 0.618896484375, 0.6532135009765625, 0.687530517578125, 0.7218475341796875, 0.75616455078125, 0.7904815673828125, 0.824798583984375, 0.8591156005859375, 0.8934326171875, 0.9277496337890625, 0.962066650390625, 0.9963836669921875, 1.03070068359375, 1.0650177001953125, 1.099334716796875, 1.1336517333984375, 1.16796875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 2.0, 8.0, 6.0, 12.0, 8.0, 12.0, 20.0, 20.0, 26.0, 31.0, 43.0, 37.0, 52.0, 61.0, 58.0, 75.0, 66.0, 56.0, 59.0, 49.0, 49.0, 45.0, 43.0, 39.0, 21.0, 28.0, 15.0, 16.0, 10.0, 2.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91015625, -0.8780517578125, -0.845947265625, -0.8138427734375, -0.78173828125, -0.7496337890625, -0.717529296875, -0.6854248046875, -0.6533203125, -0.6212158203125, -0.589111328125, -0.5570068359375, -0.52490234375, -0.4927978515625, -0.460693359375, -0.4285888671875, -0.396484375, -0.3643798828125, -0.332275390625, -0.3001708984375, -0.26806640625, -0.2359619140625, -0.203857421875, -0.1717529296875, -0.1396484375, -0.1075439453125, -0.075439453125, -0.0433349609375, -0.01123046875, 0.0208740234375, 0.052978515625, 0.0850830078125, 0.1171875, 0.1492919921875, 0.181396484375, 0.2135009765625, 0.24560546875, 0.2777099609375, 0.309814453125, 0.3419189453125, 0.3740234375, 0.4061279296875, 0.438232421875, 0.4703369140625, 0.50244140625, 0.5345458984375, 0.566650390625, 0.5987548828125, 0.630859375, 0.6629638671875, 0.695068359375, 0.7271728515625, 0.75927734375, 0.7913818359375, 0.823486328125, 0.8555908203125, 0.8876953125, 0.9197998046875, 0.951904296875, 0.9840087890625, 1.01611328125, 1.0482177734375, 1.080322265625, 1.1124267578125, 1.14453125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 4.0, 4.0, 2.0, 7.0, 16.0, 36.0, 57.0, 87.0, 119.0, 222.0, 169.0, 121.0, 74.0, 40.0, 21.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.81401824951172, -31.917997360229492, -31.021976470947266, -30.12595558166504, -29.229934692382812, -28.333913803100586, -27.43789291381836, -26.541872024536133, -25.645851135253906, -24.74983024597168, -23.853809356689453, -22.957788467407227, -22.061767578125, -21.165746688842773, -20.269725799560547, -19.37370491027832, -18.477684020996094, -17.581663131713867, -16.68564224243164, -15.789621353149414, -14.893600463867188, -13.997579574584961, -13.101558685302734, -12.205537796020508, -11.309516906738281, -10.413496017456055, -9.517475128173828, -8.621454238891602, -7.725433349609375, -6.829412460327148, -5.933391571044922, -5.037370681762695, -4.141349792480469, -3.245328903198242, -2.3493080139160156, -1.453287124633789, -0.5572662353515625, 0.33875465393066406, 1.2347755432128906, 2.130796432495117, 3.0268173217773438, 3.9228382110595703, 4.818859100341797, 5.714879989624023, 6.61090087890625, 7.506921768188477, 8.402942657470703, 9.29896354675293, 10.194984436035156, 11.091005325317383, 11.98702621459961, 12.883047103881836, 13.779067993164062, 14.675088882446289, 15.571109771728516, 16.467130661010742, 17.36315155029297, 18.259172439575195, 19.155193328857422, 20.05121421813965, 20.947235107421875, 21.8432559967041, 22.739276885986328, 23.635297775268555, 24.53131866455078]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 7.0, 5.0, 8.0, 3.0, 12.0, 19.0, 25.0, 28.0, 22.0, 22.0, 28.0, 33.0, 37.0, 37.0, 43.0, 55.0, 63.0, 67.0, 64.0, 64.0, 46.0, 34.0, 36.0, 27.0, 26.0, 35.0, 19.0, 25.0, 14.0, 15.0, 16.0, 8.0, 10.0, 10.0, 6.0, 8.0, 3.0, 2.0, 4.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.392358779907227, -16.842315673828125, -16.292272567749023, -15.742228507995605, -15.192185401916504, -14.642142295837402, -14.092098236083984, -13.542055130004883, -12.992012023925781, -12.44196891784668, -11.891925811767578, -11.34188175201416, -10.791838645935059, -10.241795539855957, -9.691751480102539, -9.141708374023438, -8.591665267944336, -8.041622161865234, -7.491578578948975, -6.941534996032715, -6.391491889953613, -5.841448783874512, -5.291405200958252, -4.741361618041992, -4.191318511962891, -3.64127516746521, -3.0912318229675293, -2.5411884784698486, -1.991145133972168, -1.4411017894744873, -0.8910584449768066, -0.341015100479126, 0.20902633666992188, 0.7590696811676025, 1.3091130256652832, 1.8591563701629639, 2.4091997146606445, 2.959243059158325, 3.509286403656006, 4.059329986572266, 4.609373092651367, 5.159416198730469, 5.7094597816467285, 6.259503364562988, 6.80954647064209, 7.359589576721191, 7.909633159637451, 8.459676742553711, 9.009719848632812, 9.559762954711914, 10.109806060791016, 10.659850120544434, 11.209893226623535, 11.759936332702637, 12.309980392456055, 12.860023498535156, 13.410066604614258, 13.96010971069336, 14.510152816772461, 15.060196876525879, 15.61023998260498, 16.1602840423584, 16.7103271484375, 17.2603702545166, 17.810413360595703]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 5.0, 14.0, 19.0, 23.0, 24.0, 46.0, 60.0, 96.0, 179.0, 303.0, 519.0, 947.0, 1550.0, 2999.0, 5851.0, 11603.0, 26092.0, 67307.0, 224594.0, 862959.0, 1826528.0, 832502.0, 214093.0, 65896.0, 25592.0, 11738.0, 5784.0, 3055.0, 1640.0, 930.0, 580.0, 280.0, 178.0, 112.0, 67.0, 58.0, 19.0, 18.0, 7.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0693359375, -1.0408096313476562, -1.0122833251953125, -0.9837570190429688, -0.955230712890625, -0.9267044067382812, -0.8981781005859375, -0.8696517944335938, -0.84112548828125, -0.8125991821289062, -0.7840728759765625, -0.7555465698242188, -0.727020263671875, -0.6984939575195312, -0.6699676513671875, -0.6414413452148438, -0.6129150390625, -0.5843887329101562, -0.5558624267578125, -0.5273361206054688, -0.498809814453125, -0.47028350830078125, -0.4417572021484375, -0.41323089599609375, -0.38470458984375, -0.35617828369140625, -0.3276519775390625, -0.29912567138671875, -0.270599365234375, -0.24207305908203125, -0.2135467529296875, -0.18502044677734375, -0.156494140625, -0.12796783447265625, -0.0994415283203125, -0.07091522216796875, -0.042388916015625, -0.01386260986328125, 0.0146636962890625, 0.04319000244140625, 0.07171630859375, 0.10024261474609375, 0.1287689208984375, 0.15729522705078125, 0.185821533203125, 0.21434783935546875, 0.2428741455078125, 0.27140045166015625, 0.2999267578125, 0.32845306396484375, 0.3569793701171875, 0.38550567626953125, 0.414031982421875, 0.44255828857421875, 0.4710845947265625, 0.49961090087890625, 0.52813720703125, 0.5566635131835938, 0.5851898193359375, 0.6137161254882812, 0.642242431640625, 0.6707687377929688, 0.6992950439453125, 0.7278213500976562, 0.75634765625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 10.0, 7.0, 6.0, 8.0, 10.0, 11.0, 12.0, 12.0, 16.0, 15.0, 21.0, 29.0, 34.0, 38.0, 35.0, 38.0, 35.0, 40.0, 33.0, 49.0, 44.0, 41.0, 46.0, 30.0, 33.0, 45.0, 36.0, 38.0, 25.0, 30.0, 24.0, 16.0, 18.0, 9.0, 15.0, 15.0, 16.0, 10.0, 13.0, 10.0, 6.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.8359375, -0.81036376953125, -0.7847900390625, -0.75921630859375, -0.733642578125, -0.70806884765625, -0.6824951171875, -0.65692138671875, -0.63134765625, -0.60577392578125, -0.5802001953125, -0.55462646484375, -0.529052734375, -0.50347900390625, -0.4779052734375, -0.45233154296875, -0.4267578125, -0.40118408203125, -0.3756103515625, -0.35003662109375, -0.324462890625, -0.29888916015625, -0.2733154296875, -0.24774169921875, -0.22216796875, -0.19659423828125, -0.1710205078125, -0.14544677734375, -0.119873046875, -0.09429931640625, -0.0687255859375, -0.04315185546875, -0.017578125, 0.00799560546875, 0.0335693359375, 0.05914306640625, 0.084716796875, 0.11029052734375, 0.1358642578125, 0.16143798828125, 0.18701171875, 0.21258544921875, 0.2381591796875, 0.26373291015625, 0.289306640625, 0.31488037109375, 0.3404541015625, 0.36602783203125, 0.3916015625, 0.41717529296875, 0.4427490234375, 0.46832275390625, 0.493896484375, 0.51947021484375, 0.5450439453125, 0.57061767578125, 0.59619140625, 0.62176513671875, 0.6473388671875, 0.67291259765625, 0.698486328125, 0.72406005859375, 0.7496337890625, 0.77520751953125, 0.80078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 9.0, 6.0, 9.0, 15.0, 26.0, 22.0, 42.0, 38.0, 74.0, 116.0, 164.0, 327.0, 630.0, 1498.0, 4174.0, 13982.0, 58478.0, 435522.0, 3220498.0, 381593.0, 55331.0, 13750.0, 4434.0, 1747.0, 777.0, 414.0, 221.0, 133.0, 71.0, 60.0, 39.0, 26.0, 16.0, 10.0, 5.0, 9.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.39453125, -2.322998046875, -2.25146484375, -2.179931640625, -2.1083984375, -2.036865234375, -1.96533203125, -1.893798828125, -1.822265625, -1.750732421875, -1.67919921875, -1.607666015625, -1.5361328125, -1.464599609375, -1.39306640625, -1.321533203125, -1.25, -1.178466796875, -1.10693359375, -1.035400390625, -0.9638671875, -0.892333984375, -0.82080078125, -0.749267578125, -0.677734375, -0.606201171875, -0.53466796875, -0.463134765625, -0.3916015625, -0.320068359375, -0.24853515625, -0.177001953125, -0.10546875, -0.033935546875, 0.03759765625, 0.109130859375, 0.1806640625, 0.252197265625, 0.32373046875, 0.395263671875, 0.466796875, 0.538330078125, 0.60986328125, 0.681396484375, 0.7529296875, 0.824462890625, 0.89599609375, 0.967529296875, 1.0390625, 1.110595703125, 1.18212890625, 1.253662109375, 1.3251953125, 1.396728515625, 1.46826171875, 1.539794921875, 1.611328125, 1.682861328125, 1.75439453125, 1.825927734375, 1.8974609375, 1.968994140625, 2.04052734375, 2.112060546875, 2.18359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 9.0, 18.0, 15.0, 25.0, 29.0, 36.0, 51.0, 103.0, 138.0, 269.0, 486.0, 668.0, 768.0, 536.0, 357.0, 166.0, 116.0, 80.0, 55.0, 36.0, 23.0, 15.0, 17.0, 14.0, 8.0, 6.0, 3.0, 2.0, 6.0, 1.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.615234375, -2.5286865234375, -2.442138671875, -2.3555908203125, -2.26904296875, -2.1824951171875, -2.095947265625, -2.0093994140625, -1.9228515625, -1.8363037109375, -1.749755859375, -1.6632080078125, -1.57666015625, -1.4901123046875, -1.403564453125, -1.3170166015625, -1.23046875, -1.1439208984375, -1.057373046875, -0.9708251953125, -0.88427734375, -0.7977294921875, -0.711181640625, -0.6246337890625, -0.5380859375, -0.4515380859375, -0.364990234375, -0.2784423828125, -0.19189453125, -0.1053466796875, -0.018798828125, 0.0677490234375, 0.154296875, 0.2408447265625, 0.327392578125, 0.4139404296875, 0.50048828125, 0.5870361328125, 0.673583984375, 0.7601318359375, 0.8466796875, 0.9332275390625, 1.019775390625, 1.1063232421875, 1.19287109375, 1.2794189453125, 1.365966796875, 1.4525146484375, 1.5390625, 1.6256103515625, 1.712158203125, 1.7987060546875, 1.88525390625, 1.9718017578125, 2.058349609375, 2.1448974609375, 2.2314453125, 2.3179931640625, 2.404541015625, 2.4910888671875, 2.57763671875, 2.6641845703125, 2.750732421875, 2.8372802734375, 2.923828125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 11.0, 35.0, 74.0, 259.0, 284.0, 220.0, 57.0, 26.0, 20.0, 2.0, 7.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.636878967285156, -43.29689025878906, -41.9568977355957, -40.616905212402344, -39.27691650390625, -37.936927795410156, -36.5969352722168, -35.25694274902344, -33.916954040527344, -32.57696533203125, -31.23697280883789, -29.896982192993164, -28.556991577148438, -27.21700096130371, -25.877010345458984, -24.537019729614258, -23.19702911376953, -21.857038497924805, -20.517047882080078, -19.17705726623535, -17.837066650390625, -16.4970760345459, -15.157085418701172, -13.817094802856445, -12.477104187011719, -11.137113571166992, -9.797122955322266, -8.457132339477539, -7.1171417236328125, -5.777151107788086, -4.437160491943359, -3.097169876098633, -1.7571754455566406, -0.41718482971191406, 0.9228057861328125, 2.262796401977539, 3.6027870178222656, 4.942777633666992, 6.282768249511719, 7.622758865356445, 8.962749481201172, 10.302740097045898, 11.642730712890625, 12.982721328735352, 14.322711944580078, 15.662702560424805, 17.00269317626953, 18.342683792114258, 19.682674407958984, 21.02266502380371, 22.362655639648438, 23.702646255493164, 25.04263687133789, 26.382627487182617, 27.722618103027344, 29.06260871887207, 30.402599334716797, 31.742589950561523, 33.08258056640625, 34.422569274902344, 35.7625617980957, 37.10255432128906, 38.442543029785156, 39.78253173828125, 41.12252426147461]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 12.0, 10.0, 8.0, 8.0, 10.0, 13.0, 15.0, 18.0, 23.0, 27.0, 33.0, 38.0, 39.0, 55.0, 46.0, 54.0, 54.0, 64.0, 58.0, 58.0, 59.0, 46.0, 45.0, 40.0, 29.0, 29.0, 20.0, 21.0, 13.0, 10.0, 16.0, 7.0, 8.0, 2.0, 8.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.405157089233398, -10.970491409301758, -10.535825729370117, -10.101160049438477, -9.666494369506836, -9.231828689575195, -8.797163009643555, -8.362497329711914, -7.927831649780273, -7.493165969848633, -7.058500289916992, -6.623834609985352, -6.189168930053711, -5.75450325012207, -5.31983757019043, -4.885171890258789, -4.45050573348999, -4.01584005355835, -3.581174373626709, -3.1465086936950684, -2.7118430137634277, -2.277177095413208, -1.8425114154815674, -1.4078457355499268, -0.9731800556182861, -0.5385143756866455, -0.10384863615036011, 0.3308171033859253, 0.7654827833175659, 1.200148582458496, 1.6348142623901367, 2.0694799423217773, 2.504145622253418, 2.9388113021850586, 3.373476982116699, 3.80814266204834, 4.2428083419799805, 4.677474021911621, 5.112139701843262, 5.546805381774902, 5.981471061706543, 6.416136741638184, 6.850802421569824, 7.285468101501465, 7.7201337814331055, 8.154799461364746, 8.589465141296387, 9.024130821228027, 9.458797454833984, 9.893463134765625, 10.328128814697266, 10.762794494628906, 11.197460174560547, 11.632125854492188, 12.066791534423828, 12.501457214355469, 12.93612289428711, 13.37078857421875, 13.80545425415039, 14.240119934082031, 14.674785614013672, 15.109451293945312, 15.544116973876953, 15.978782653808594, 16.413448333740234]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 2.0, 6.0, 11.0, 17.0, 22.0, 41.0, 47.0, 86.0, 120.0, 200.0, 296.0, 450.0, 721.0, 1266.0, 2099.0, 3736.0, 6752.0, 12405.0, 23564.0, 44899.0, 85543.0, 155699.0, 230588.0, 208434.0, 126814.0, 67570.0, 35239.0, 18756.0, 9957.0, 5443.0, 3106.0, 1803.0, 1105.0, 606.0, 402.0, 261.0, 161.0, 105.0, 76.0, 44.0, 36.0, 20.0, 13.0, 8.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.3134765625, -1.2708587646484375, -1.228240966796875, -1.1856231689453125, -1.14300537109375, -1.1003875732421875, -1.057769775390625, -1.0151519775390625, -0.9725341796875, -0.9299163818359375, -0.887298583984375, -0.8446807861328125, -0.80206298828125, -0.7594451904296875, -0.716827392578125, -0.6742095947265625, -0.631591796875, -0.5889739990234375, -0.546356201171875, -0.5037384033203125, -0.46112060546875, -0.4185028076171875, -0.375885009765625, -0.3332672119140625, -0.2906494140625, -0.2480316162109375, -0.205413818359375, -0.1627960205078125, -0.12017822265625, -0.0775604248046875, -0.034942626953125, 0.0076751708984375, 0.05029296875, 0.0929107666015625, 0.135528564453125, 0.1781463623046875, 0.22076416015625, 0.2633819580078125, 0.305999755859375, 0.3486175537109375, 0.3912353515625, 0.4338531494140625, 0.476470947265625, 0.5190887451171875, 0.56170654296875, 0.6043243408203125, 0.646942138671875, 0.6895599365234375, 0.732177734375, 0.7747955322265625, 0.817413330078125, 0.8600311279296875, 0.90264892578125, 0.9452667236328125, 0.987884521484375, 1.0305023193359375, 1.0731201171875, 1.1157379150390625, 1.158355712890625, 1.2009735107421875, 1.24359130859375, 1.2862091064453125, 1.328826904296875, 1.3714447021484375, 1.4140625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 7.0, 8.0, 9.0, 21.0, 19.0, 15.0, 26.0, 42.0, 39.0, 61.0, 69.0, 48.0, 61.0, 70.0, 59.0, 66.0, 54.0, 49.0, 55.0, 47.0, 36.0, 30.0, 31.0, 30.0, 15.0, 17.0, 5.0, 9.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-1.875, -1.8325729370117188, -1.7901458740234375, -1.7477188110351562, -1.705291748046875, -1.6628646850585938, -1.6204376220703125, -1.5780105590820312, -1.53558349609375, -1.4931564331054688, -1.4507293701171875, -1.4083023071289062, -1.365875244140625, -1.3234481811523438, -1.2810211181640625, -1.2385940551757812, -1.1961669921875, -1.1537399291992188, -1.1113128662109375, -1.0688858032226562, -1.026458740234375, -0.9840316772460938, -0.9416046142578125, -0.8991775512695312, -0.85675048828125, -0.8143234252929688, -0.7718963623046875, -0.7294692993164062, -0.687042236328125, -0.6446151733398438, -0.6021881103515625, -0.5597610473632812, -0.517333984375, -0.47490692138671875, -0.4324798583984375, -0.39005279541015625, -0.347625732421875, -0.30519866943359375, -0.2627716064453125, -0.22034454345703125, -0.17791748046875, -0.13549041748046875, -0.0930633544921875, -0.05063629150390625, -0.008209228515625, 0.03421783447265625, 0.0766448974609375, 0.11907196044921875, 0.1614990234375, 0.20392608642578125, 0.2463531494140625, 0.28878021240234375, 0.331207275390625, 0.37363433837890625, 0.4160614013671875, 0.45848846435546875, 0.50091552734375, 0.5433425903320312, 0.5857696533203125, 0.6281967163085938, 0.670623779296875, 0.7130508422851562, 0.7554779052734375, 0.7979049682617188, 0.84033203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 6.0, 6.0, 13.0, 23.0, 38.0, 43.0, 69.0, 100.0, 152.0, 238.0, 347.0, 548.0, 983.0, 2066.0, 5989.0, 26861.0, 182314.0, 683409.0, 117714.0, 18917.0, 4567.0, 1736.0, 864.0, 547.0, 318.0, 202.0, 147.0, 111.0, 67.0, 37.0, 41.0, 27.0, 24.0, 14.0, 6.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.527923583984375, -4.40350341796875, -4.279083251953125, -4.1546630859375, -4.030242919921875, -3.90582275390625, -3.781402587890625, -3.656982421875, -3.532562255859375, -3.40814208984375, -3.283721923828125, -3.1593017578125, -3.034881591796875, -2.91046142578125, -2.786041259765625, -2.66162109375, -2.537200927734375, -2.41278076171875, -2.288360595703125, -2.1639404296875, -2.039520263671875, -1.91510009765625, -1.790679931640625, -1.666259765625, -1.541839599609375, -1.41741943359375, -1.292999267578125, -1.1685791015625, -1.044158935546875, -0.91973876953125, -0.795318603515625, -0.6708984375, -0.546478271484375, -0.42205810546875, -0.297637939453125, -0.1732177734375, -0.048797607421875, 0.07562255859375, 0.200042724609375, 0.324462890625, 0.448883056640625, 0.57330322265625, 0.697723388671875, 0.8221435546875, 0.946563720703125, 1.07098388671875, 1.195404052734375, 1.31982421875, 1.444244384765625, 1.56866455078125, 1.693084716796875, 1.8175048828125, 1.941925048828125, 2.06634521484375, 2.190765380859375, 2.315185546875, 2.439605712890625, 2.56402587890625, 2.688446044921875, 2.8128662109375, 2.937286376953125, 3.06170654296875, 3.186126708984375, 3.310546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 8.0, 9.0, 11.0, 8.0, 16.0, 24.0, 16.0, 31.0, 33.0, 35.0, 41.0, 37.0, 42.0, 43.0, 43.0, 62.0, 51.0, 58.0, 46.0, 43.0, 39.0, 34.0, 36.0, 36.0, 32.0, 23.0, 15.0, 22.0, 21.0, 11.0, 16.0, 15.0, 10.0, 7.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.75, -4.618988037109375, -4.48797607421875, -4.356964111328125, -4.2259521484375, -4.094940185546875, -3.96392822265625, -3.832916259765625, -3.701904296875, -3.570892333984375, -3.43988037109375, -3.308868408203125, -3.1778564453125, -3.046844482421875, -2.91583251953125, -2.784820556640625, -2.65380859375, -2.522796630859375, -2.39178466796875, -2.260772705078125, -2.1297607421875, -1.998748779296875, -1.86773681640625, -1.736724853515625, -1.605712890625, -1.474700927734375, -1.34368896484375, -1.212677001953125, -1.0816650390625, -0.950653076171875, -0.81964111328125, -0.688629150390625, -0.5576171875, -0.426605224609375, -0.29559326171875, -0.164581298828125, -0.0335693359375, 0.097442626953125, 0.22845458984375, 0.359466552734375, 0.490478515625, 0.621490478515625, 0.75250244140625, 0.883514404296875, 1.0145263671875, 1.145538330078125, 1.27655029296875, 1.407562255859375, 1.53857421875, 1.669586181640625, 1.80059814453125, 1.931610107421875, 2.0626220703125, 2.193634033203125, 2.32464599609375, 2.455657958984375, 2.586669921875, 2.717681884765625, 2.84869384765625, 2.979705810546875, 3.1107177734375, 3.241729736328125, 3.37274169921875, 3.503753662109375, 3.634765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 7.0, 12.0, 13.0, 14.0, 14.0, 36.0, 50.0, 91.0, 140.0, 234.0, 458.0, 993.0, 2229.0, 6090.0, 19832.0, 88664.0, 562350.0, 288725.0, 56948.0, 13766.0, 4508.0, 1714.0, 754.0, 366.0, 198.0, 125.0, 75.0, 38.0, 25.0, 24.0, 15.0, 17.0, 10.0, 10.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86962890625, -0.8346481323242188, -0.7996673583984375, -0.7646865844726562, -0.729705810546875, -0.6947250366210938, -0.6597442626953125, -0.6247634887695312, -0.58978271484375, -0.5548019409179688, -0.5198211669921875, -0.48484039306640625, -0.449859619140625, -0.41487884521484375, -0.3798980712890625, -0.34491729736328125, -0.3099365234375, -0.27495574951171875, -0.2399749755859375, -0.20499420166015625, -0.170013427734375, -0.13503265380859375, -0.1000518798828125, -0.06507110595703125, -0.03009033203125, 0.00489044189453125, 0.0398712158203125, 0.07485198974609375, 0.109832763671875, 0.14481353759765625, 0.1797943115234375, 0.21477508544921875, 0.249755859375, 0.28473663330078125, 0.3197174072265625, 0.35469818115234375, 0.389678955078125, 0.42465972900390625, 0.4596405029296875, 0.49462127685546875, 0.52960205078125, 0.5645828247070312, 0.5995635986328125, 0.6345443725585938, 0.669525146484375, 0.7045059204101562, 0.7394866943359375, 0.7744674682617188, 0.8094482421875, 0.8444290161132812, 0.8794097900390625, 0.9143905639648438, 0.949371337890625, 0.9843521118164062, 1.0193328857421875, 1.0543136596679688, 1.08929443359375, 1.1242752075195312, 1.1592559814453125, 1.1942367553710938, 1.229217529296875, 1.2641983032226562, 1.2991790771484375, 1.3341598510742188, 1.369140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 13.0, 9.0, 14.0, 12.0, 23.0, 23.0, 28.0, 47.0, 53.0, 77.0, 82.0, 89.0, 95.0, 77.0, 67.0, 44.0, 51.0, 46.0, 26.0, 29.0, 16.0, 23.0, 8.0, 7.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031495094299316406, -0.00030369311571121216, -0.00029243528842926025, -0.00028117746114730835, -0.00026991963386535645, -0.00025866180658340454, -0.00024740397930145264, -0.00023614615201950073, -0.00022488832473754883, -0.00021363049745559692, -0.00020237267017364502, -0.00019111484289169312, -0.0001798570156097412, -0.0001685991883277893, -0.0001573413610458374, -0.0001460835337638855, -0.0001348257064819336, -0.0001235678791999817, -0.00011231005191802979, -0.00010105222463607788, -8.979439735412598e-05, -7.853657007217407e-05, -6.727874279022217e-05, -5.6020915508270264e-05, -4.476308822631836e-05, -3.3505260944366455e-05, -2.224743366241455e-05, -1.0989606380462646e-05, 2.682209014892578e-07, 1.1526048183441162e-05, 2.2783875465393066e-05, 3.404170274734497e-05, 4.5299530029296875e-05, 5.655735731124878e-05, 6.781518459320068e-05, 7.907301187515259e-05, 9.033083915710449e-05, 0.0001015886664390564, 0.0001128464937210083, 0.0001241043210029602, 0.0001353621482849121, 0.00014661997556686401, 0.00015787780284881592, 0.00016913563013076782, 0.00018039345741271973, 0.00019165128469467163, 0.00020290911197662354, 0.00021416693925857544, 0.00022542476654052734, 0.00023668259382247925, 0.00024794042110443115, 0.00025919824838638306, 0.00027045607566833496, 0.00028171390295028687, 0.00029297173023223877, 0.0003042295575141907, 0.0003154873847961426, 0.0003267452120780945, 0.0003380030393600464, 0.0003492608666419983, 0.0003605186939239502, 0.0003717765212059021, 0.000383034348487854, 0.0003942921757698059, 0.0004055500030517578]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 6.0, 7.0, 17.0, 21.0, 26.0, 34.0, 45.0, 73.0, 146.0, 217.0, 444.0, 725.0, 1355.0, 3186.0, 8419.0, 30212.0, 150035.0, 621420.0, 180160.0, 35455.0, 9616.0, 3558.0, 1555.0, 745.0, 416.0, 249.0, 135.0, 88.0, 63.0, 31.0, 19.0, 18.0, 10.0, 16.0, 10.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.0302734375, -0.998626708984375, -0.96697998046875, -0.935333251953125, -0.9036865234375, -0.872039794921875, -0.84039306640625, -0.808746337890625, -0.777099609375, -0.745452880859375, -0.71380615234375, -0.682159423828125, -0.6505126953125, -0.618865966796875, -0.58721923828125, -0.555572509765625, -0.52392578125, -0.492279052734375, -0.46063232421875, -0.428985595703125, -0.3973388671875, -0.365692138671875, -0.33404541015625, -0.302398681640625, -0.270751953125, -0.239105224609375, -0.20745849609375, -0.175811767578125, -0.1441650390625, -0.112518310546875, -0.08087158203125, -0.049224853515625, -0.017578125, 0.014068603515625, 0.04571533203125, 0.077362060546875, 0.1090087890625, 0.140655517578125, 0.17230224609375, 0.203948974609375, 0.235595703125, 0.267242431640625, 0.29888916015625, 0.330535888671875, 0.3621826171875, 0.393829345703125, 0.42547607421875, 0.457122802734375, 0.48876953125, 0.520416259765625, 0.55206298828125, 0.583709716796875, 0.6153564453125, 0.647003173828125, 0.67864990234375, 0.710296630859375, 0.741943359375, 0.773590087890625, 0.80523681640625, 0.836883544921875, 0.8685302734375, 0.900177001953125, 0.93182373046875, 0.963470458984375, 0.9951171875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 10.0, 12.0, 15.0, 34.0, 46.0, 64.0, 63.0, 92.0, 108.0, 109.0, 101.0, 78.0, 79.0, 57.0, 39.0, 31.0, 21.0, 16.0, 12.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.58203125, -1.533416748046875, -1.48480224609375, -1.436187744140625, -1.3875732421875, -1.338958740234375, -1.29034423828125, -1.241729736328125, -1.193115234375, -1.144500732421875, -1.09588623046875, -1.047271728515625, -0.9986572265625, -0.950042724609375, -0.90142822265625, -0.852813720703125, -0.80419921875, -0.755584716796875, -0.70697021484375, -0.658355712890625, -0.6097412109375, -0.561126708984375, -0.51251220703125, -0.463897705078125, -0.415283203125, -0.366668701171875, -0.31805419921875, -0.269439697265625, -0.2208251953125, -0.172210693359375, -0.12359619140625, -0.074981689453125, -0.0263671875, 0.022247314453125, 0.07086181640625, 0.119476318359375, 0.1680908203125, 0.216705322265625, 0.26531982421875, 0.313934326171875, 0.362548828125, 0.411163330078125, 0.45977783203125, 0.508392333984375, 0.5570068359375, 0.605621337890625, 0.65423583984375, 0.702850341796875, 0.75146484375, 0.800079345703125, 0.84869384765625, 0.897308349609375, 0.9459228515625, 0.994537353515625, 1.04315185546875, 1.091766357421875, 1.140380859375, 1.188995361328125, 1.23760986328125, 1.286224365234375, 1.3348388671875, 1.383453369140625, 1.43206787109375, 1.480682373046875, 1.529296875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 10.0, 42.0, 178.0, 431.0, 220.0, 77.0, 23.0, 10.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.16886138916016, -67.41625213623047, -65.66364288330078, -63.91102981567383, -62.15842056274414, -60.40580749511719, -58.6531982421875, -56.90058898925781, -55.147979736328125, -53.39537048339844, -51.642757415771484, -49.8901481628418, -48.13753890991211, -46.384925842285156, -44.63231658935547, -42.87970733642578, -41.12709426879883, -39.37448501586914, -37.62187194824219, -35.8692626953125, -34.11665344238281, -32.364044189453125, -30.611431121826172, -28.858821868896484, -27.106210708618164, -25.353599548339844, -23.600990295410156, -21.848379135131836, -20.095767974853516, -18.343158721923828, -16.590547561645508, -14.837937355041504, -13.0853271484375, -11.332716941833496, -9.580106735229492, -7.827495574951172, -6.074885368347168, -4.322275161743164, -2.5696640014648438, -0.8170537948608398, 0.9355564117431641, 2.688166856765747, 4.44077730178833, 6.193387985229492, 7.945998191833496, 9.6986083984375, 11.45121955871582, 13.203829765319824, 14.956439971923828, 16.70905113220215, 18.461660385131836, 20.214271545410156, 21.966880798339844, 23.719491958618164, 25.472103118896484, 27.224712371826172, 28.977323532104492, 30.729934692382812, 32.4825439453125, 34.23515319824219, 35.98776626586914, 37.74037551879883, 39.49298858642578, 41.24559783935547, 42.998207092285156]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 2.0, 3.0, 5.0, 10.0, 8.0, 8.0, 10.0, 10.0, 7.0, 17.0, 19.0, 18.0, 33.0, 28.0, 25.0, 27.0, 35.0, 37.0, 38.0, 58.0, 66.0, 75.0, 67.0, 52.0, 41.0, 38.0, 37.0, 31.0, 35.0, 24.0, 22.0, 16.0, 17.0, 13.0, 9.0, 9.0, 8.0, 7.0, 7.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-16.460195541381836, -15.962446212768555, -15.46469783782959, -14.966948509216309, -14.469200134277344, -13.971450805664062, -13.473701477050781, -12.975953102111816, -12.478204727172852, -11.98045539855957, -11.482707023620605, -10.984957695007324, -10.48720932006836, -9.989459991455078, -9.491710662841797, -8.993962287902832, -8.49621295928955, -7.998464107513428, -7.500715255737305, -7.002965927124023, -6.505217552185059, -6.007468223571777, -5.509719371795654, -5.011970520019531, -4.514221668243408, -4.016472816467285, -3.518723964691162, -3.02097487449646, -2.523226022720337, -2.025477170944214, -1.5277280807495117, -1.0299792289733887, -0.5322303771972656, -0.0344814658164978, 0.46326744556427, 0.9610164165496826, 1.4587652683258057, 1.9565141201019287, 2.454263210296631, 2.952012062072754, 3.449760913848877, 3.947509765625, 4.445258617401123, 4.943007469177246, 5.440756797790527, 5.938505172729492, 6.436254501342773, 6.9340033531188965, 7.4317522048950195, 7.929501056671143, 8.427249908447266, 8.924999237060547, 9.422747611999512, 9.920496940612793, 10.418245315551758, 10.915994644165039, 11.41374397277832, 11.911493301391602, 12.409241676330566, 12.906991004943848, 13.404739379882812, 13.902488708496094, 14.400238037109375, 14.89798641204834, 15.395734786987305]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 8.0, 6.0, 10.0, 17.0, 22.0, 27.0, 39.0, 64.0, 67.0, 119.0, 181.0, 291.0, 538.0, 1126.0, 2732.0, 7454.0, 27860.0, 167471.0, 1375864.0, 2209801.0, 334879.0, 47436.0, 11390.0, 3616.0, 1487.0, 721.0, 386.0, 210.0, 112.0, 103.0, 53.0, 37.0, 37.0, 26.0, 25.0, 21.0, 12.0, 11.0, 3.0, 8.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.396484375, -1.350189208984375, -1.30389404296875, -1.257598876953125, -1.2113037109375, -1.165008544921875, -1.11871337890625, -1.072418212890625, -1.026123046875, -0.979827880859375, -0.93353271484375, -0.887237548828125, -0.8409423828125, -0.794647216796875, -0.74835205078125, -0.702056884765625, -0.65576171875, -0.609466552734375, -0.56317138671875, -0.516876220703125, -0.4705810546875, -0.424285888671875, -0.37799072265625, -0.331695556640625, -0.285400390625, -0.239105224609375, -0.19281005859375, -0.146514892578125, -0.1002197265625, -0.053924560546875, -0.00762939453125, 0.038665771484375, 0.0849609375, 0.131256103515625, 0.17755126953125, 0.223846435546875, 0.2701416015625, 0.316436767578125, 0.36273193359375, 0.409027099609375, 0.455322265625, 0.501617431640625, 0.54791259765625, 0.594207763671875, 0.6405029296875, 0.686798095703125, 0.73309326171875, 0.779388427734375, 0.82568359375, 0.871978759765625, 0.91827392578125, 0.964569091796875, 1.0108642578125, 1.057159423828125, 1.10345458984375, 1.149749755859375, 1.196044921875, 1.242340087890625, 1.28863525390625, 1.334930419921875, 1.3812255859375, 1.427520751953125, 1.47381591796875, 1.520111083984375, 1.56640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 6.0, 5.0, 8.0, 9.0, 10.0, 11.0, 11.0, 19.0, 26.0, 31.0, 26.0, 35.0, 33.0, 39.0, 40.0, 40.0, 37.0, 45.0, 52.0, 43.0, 46.0, 42.0, 39.0, 33.0, 43.0, 44.0, 39.0, 28.0, 24.0, 19.0, 16.0, 22.0, 19.0, 12.0, 11.0, 9.0, 5.0, 7.0, 2.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.978515625, -0.95013427734375, -0.9217529296875, -0.89337158203125, -0.864990234375, -0.83660888671875, -0.8082275390625, -0.77984619140625, -0.75146484375, -0.72308349609375, -0.6947021484375, -0.66632080078125, -0.637939453125, -0.60955810546875, -0.5811767578125, -0.55279541015625, -0.5244140625, -0.49603271484375, -0.4676513671875, -0.43927001953125, -0.410888671875, -0.38250732421875, -0.3541259765625, -0.32574462890625, -0.29736328125, -0.26898193359375, -0.2406005859375, -0.21221923828125, -0.183837890625, -0.15545654296875, -0.1270751953125, -0.09869384765625, -0.0703125, -0.04193115234375, -0.0135498046875, 0.01483154296875, 0.043212890625, 0.07159423828125, 0.0999755859375, 0.12835693359375, 0.15673828125, 0.18511962890625, 0.2135009765625, 0.24188232421875, 0.270263671875, 0.29864501953125, 0.3270263671875, 0.35540771484375, 0.3837890625, 0.41217041015625, 0.4405517578125, 0.46893310546875, 0.497314453125, 0.52569580078125, 0.5540771484375, 0.58245849609375, 0.61083984375, 0.63922119140625, 0.6676025390625, 0.69598388671875, 0.724365234375, 0.75274658203125, 0.7811279296875, 0.80950927734375, 0.837890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 17.0, 34.0, 81.0, 115.0, 283.0, 670.0, 2470.0, 22823.0, 3594306.0, 561182.0, 9383.0, 1703.0, 633.0, 279.0, 126.0, 77.0, 44.0, 18.0, 11.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4609375, -6.27001953125, -6.0791015625, -5.88818359375, -5.697265625, -5.50634765625, -5.3154296875, -5.12451171875, -4.93359375, -4.74267578125, -4.5517578125, -4.36083984375, -4.169921875, -3.97900390625, -3.7880859375, -3.59716796875, -3.40625, -3.21533203125, -3.0244140625, -2.83349609375, -2.642578125, -2.45166015625, -2.2607421875, -2.06982421875, -1.87890625, -1.68798828125, -1.4970703125, -1.30615234375, -1.115234375, -0.92431640625, -0.7333984375, -0.54248046875, -0.3515625, -0.16064453125, 0.0302734375, 0.22119140625, 0.412109375, 0.60302734375, 0.7939453125, 0.98486328125, 1.17578125, 1.36669921875, 1.5576171875, 1.74853515625, 1.939453125, 2.13037109375, 2.3212890625, 2.51220703125, 2.703125, 2.89404296875, 3.0849609375, 3.27587890625, 3.466796875, 3.65771484375, 3.8486328125, 4.03955078125, 4.23046875, 4.42138671875, 4.6123046875, 4.80322265625, 4.994140625, 5.18505859375, 5.3759765625, 5.56689453125, 5.7578125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 9.0, 10.0, 16.0, 34.0, 50.0, 98.0, 218.0, 524.0, 1061.0, 1029.0, 544.0, 225.0, 111.0, 59.0, 31.0, 13.0, 11.0, 9.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.06640625, -2.93280029296875, -2.7991943359375, -2.66558837890625, -2.531982421875, -2.39837646484375, -2.2647705078125, -2.13116455078125, -1.99755859375, -1.86395263671875, -1.7303466796875, -1.59674072265625, -1.463134765625, -1.32952880859375, -1.1959228515625, -1.06231689453125, -0.9287109375, -0.79510498046875, -0.6614990234375, -0.52789306640625, -0.394287109375, -0.26068115234375, -0.1270751953125, 0.00653076171875, 0.14013671875, 0.27374267578125, 0.4073486328125, 0.54095458984375, 0.674560546875, 0.80816650390625, 0.9417724609375, 1.07537841796875, 1.208984375, 1.34259033203125, 1.4761962890625, 1.60980224609375, 1.743408203125, 1.87701416015625, 2.0106201171875, 2.14422607421875, 2.27783203125, 2.41143798828125, 2.5450439453125, 2.67864990234375, 2.812255859375, 2.94586181640625, 3.0794677734375, 3.21307373046875, 3.3466796875, 3.48028564453125, 3.6138916015625, 3.74749755859375, 3.881103515625, 4.01470947265625, 4.1483154296875, 4.28192138671875, 4.41552734375, 4.54913330078125, 4.6827392578125, 4.81634521484375, 4.949951171875, 5.08355712890625, 5.2171630859375, 5.35076904296875, 5.484375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 12.0, 45.0, 103.0, 221.0, 259.0, 200.0, 87.0, 34.0, 13.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.412261962890625, -32.137489318847656, -30.862712860107422, -29.58793830871582, -28.31316375732422, -27.03839111328125, -25.76361656188965, -24.488842010498047, -23.214067459106445, -21.939292907714844, -20.664518356323242, -19.38974380493164, -18.114971160888672, -16.840194702148438, -15.565422058105469, -14.290647506713867, -13.015872955322266, -11.741098403930664, -10.466323852539062, -9.191550254821777, -7.916775703430176, -6.642001152038574, -5.367227077484131, -4.0924530029296875, -2.817678451538086, -1.5429041385650635, -0.268129825592041, 1.0066444873809814, 2.281418800354004, 3.5561933517456055, 4.830967426300049, 6.105741500854492, 7.380516052246094, 8.655290603637695, 9.930065155029297, 11.204838752746582, 12.479613304138184, 13.754387855529785, 15.02916145324707, 16.303936004638672, 17.578710556030273, 18.853485107421875, 20.128259658813477, 21.403034210205078, 22.677806854248047, 23.95258331298828, 25.22735595703125, 26.50213050842285, 27.776905059814453, 29.051679611206055, 30.326454162597656, 31.601228713989258, 32.87600326538086, 34.15077590942383, 35.42555236816406, 36.70032501220703, 37.97509765625, 39.24987030029297, 40.5246467590332, 41.79941940307617, 43.074195861816406, 44.348968505859375, 45.62374496459961, 46.89851760864258, 48.17329406738281]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 4.0, 10.0, 6.0, 8.0, 17.0, 16.0, 15.0, 28.0, 44.0, 38.0, 39.0, 34.0, 49.0, 44.0, 59.0, 49.0, 51.0, 62.0, 53.0, 36.0, 37.0, 38.0, 37.0, 28.0, 31.0, 33.0, 30.0, 28.0, 12.0, 14.0, 8.0, 7.0, 11.0, 6.0, 7.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0], "bins": [-19.158945083618164, -18.691299438476562, -18.223655700683594, -17.756010055541992, -17.28836441040039, -16.820720672607422, -16.35307502746582, -15.885429382324219, -15.417784690856934, -14.950139999389648, -14.482494354248047, -14.014849662780762, -13.54720401763916, -13.079559326171875, -12.611913681030273, -12.144268989562988, -11.676624298095703, -11.208979606628418, -10.741333961486816, -10.273689270019531, -9.80604362487793, -9.338398933410645, -8.87075424194336, -8.403108596801758, -7.935462951660156, -7.467817783355713, -7.0001726150512695, -6.532527923583984, -6.064882755279541, -5.597237586975098, -5.129592418670654, -4.661947250366211, -4.194302558898926, -3.7266573905944824, -3.259012460708618, -2.791367292404175, -2.3237223625183105, -1.8560771942138672, -1.3884320259094238, -0.9207870960235596, -0.4531419277191162, 0.014503151178359985, 0.4821482300758362, 0.9497933387756348, 1.4174383878707886, 1.8850834369659424, 2.3527286052703857, 2.82037353515625, 3.2880187034606934, 3.7556638717651367, 4.22330904006958, 4.690954208374023, 5.158598899841309, 5.626244068145752, 6.093889236450195, 6.5615339279174805, 7.029179573059082, 7.496824741363525, 7.964469909667969, 8.432114601135254, 8.899760246276855, 9.36740493774414, 9.835050582885742, 10.302695274353027, 10.770339965820312]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 4.0, 11.0, 17.0, 30.0, 49.0, 66.0, 106.0, 178.0, 272.0, 429.0, 700.0, 1180.0, 2054.0, 3451.0, 6181.0, 11094.0, 20851.0, 40623.0, 77849.0, 139837.0, 209286.0, 212577.0, 146584.0, 82073.0, 43111.0, 22495.0, 12027.0, 6441.0, 3629.0, 2088.0, 1279.0, 765.0, 440.0, 289.0, 190.0, 104.0, 69.0, 44.0, 34.0, 15.0, 9.0, 12.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.3310546875, -1.2930755615234375, -1.255096435546875, -1.2171173095703125, -1.17913818359375, -1.1411590576171875, -1.103179931640625, -1.0652008056640625, -1.0272216796875, -0.9892425537109375, -0.951263427734375, -0.9132843017578125, -0.87530517578125, -0.8373260498046875, -0.799346923828125, -0.7613677978515625, -0.723388671875, -0.6854095458984375, -0.647430419921875, -0.6094512939453125, -0.57147216796875, -0.5334930419921875, -0.495513916015625, -0.4575347900390625, -0.4195556640625, -0.3815765380859375, -0.343597412109375, -0.3056182861328125, -0.26763916015625, -0.2296600341796875, -0.191680908203125, -0.1537017822265625, -0.11572265625, -0.0777435302734375, -0.039764404296875, -0.0017852783203125, 0.03619384765625, 0.0741729736328125, 0.112152099609375, 0.1501312255859375, 0.1881103515625, 0.2260894775390625, 0.264068603515625, 0.3020477294921875, 0.34002685546875, 0.3780059814453125, 0.415985107421875, 0.4539642333984375, 0.491943359375, 0.5299224853515625, 0.567901611328125, 0.6058807373046875, 0.64385986328125, 0.6818389892578125, 0.719818115234375, 0.7577972412109375, 0.7957763671875, 0.8337554931640625, 0.871734619140625, 0.9097137451171875, 0.94769287109375, 0.9856719970703125, 1.023651123046875, 1.0616302490234375, 1.099609375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 9.0, 9.0, 12.0, 18.0, 13.0, 18.0, 21.0, 20.0, 32.0, 20.0, 23.0, 39.0, 25.0, 39.0, 33.0, 39.0, 37.0, 46.0, 42.0, 51.0, 44.0, 41.0, 42.0, 34.0, 36.0, 32.0, 25.0, 30.0, 21.0, 23.0, 15.0, 18.0, 12.0, 7.0, 15.0, 11.0, 9.0, 5.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.875, -0.8453826904296875, -0.815765380859375, -0.7861480712890625, -0.75653076171875, -0.7269134521484375, -0.697296142578125, -0.6676788330078125, -0.6380615234375, -0.6084442138671875, -0.578826904296875, -0.5492095947265625, -0.51959228515625, -0.4899749755859375, -0.460357666015625, -0.4307403564453125, -0.401123046875, -0.3715057373046875, -0.341888427734375, -0.3122711181640625, -0.28265380859375, -0.2530364990234375, -0.223419189453125, -0.1938018798828125, -0.1641845703125, -0.1345672607421875, -0.104949951171875, -0.0753326416015625, -0.04571533203125, -0.0160980224609375, 0.013519287109375, 0.0431365966796875, 0.07275390625, 0.1023712158203125, 0.131988525390625, 0.1616058349609375, 0.19122314453125, 0.2208404541015625, 0.250457763671875, 0.2800750732421875, 0.3096923828125, 0.3393096923828125, 0.368927001953125, 0.3985443115234375, 0.42816162109375, 0.4577789306640625, 0.487396240234375, 0.5170135498046875, 0.546630859375, 0.5762481689453125, 0.605865478515625, 0.6354827880859375, 0.66510009765625, 0.6947174072265625, 0.724334716796875, 0.7539520263671875, 0.7835693359375, 0.8131866455078125, 0.842803955078125, 0.8724212646484375, 0.90203857421875, 0.9316558837890625, 0.961273193359375, 0.9908905029296875, 1.0205078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 8.0, 6.0, 13.0, 17.0, 20.0, 26.0, 50.0, 66.0, 98.0, 162.0, 250.0, 542.0, 1159.0, 2776.0, 8227.0, 30427.0, 142338.0, 600271.0, 201791.0, 43146.0, 10742.0, 3499.0, 1400.0, 653.0, 359.0, 157.0, 103.0, 68.0, 47.0, 27.0, 28.0, 20.0, 16.0, 10.0, 9.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.31640625, -3.225830078125, -3.13525390625, -3.044677734375, -2.9541015625, -2.863525390625, -2.77294921875, -2.682373046875, -2.591796875, -2.501220703125, -2.41064453125, -2.320068359375, -2.2294921875, -2.138916015625, -2.04833984375, -1.957763671875, -1.8671875, -1.776611328125, -1.68603515625, -1.595458984375, -1.5048828125, -1.414306640625, -1.32373046875, -1.233154296875, -1.142578125, -1.052001953125, -0.96142578125, -0.870849609375, -0.7802734375, -0.689697265625, -0.59912109375, -0.508544921875, -0.41796875, -0.327392578125, -0.23681640625, -0.146240234375, -0.0556640625, 0.034912109375, 0.12548828125, 0.216064453125, 0.306640625, 0.397216796875, 0.48779296875, 0.578369140625, 0.6689453125, 0.759521484375, 0.85009765625, 0.940673828125, 1.03125, 1.121826171875, 1.21240234375, 1.302978515625, 1.3935546875, 1.484130859375, 1.57470703125, 1.665283203125, 1.755859375, 1.846435546875, 1.93701171875, 2.027587890625, 2.1181640625, 2.208740234375, 2.29931640625, 2.389892578125, 2.48046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 13.0, 6.0, 7.0, 14.0, 12.0, 18.0, 21.0, 23.0, 29.0, 25.0, 34.0, 37.0, 38.0, 44.0, 49.0, 45.0, 54.0, 59.0, 59.0, 54.0, 51.0, 43.0, 38.0, 40.0, 36.0, 22.0, 18.0, 15.0, 18.0, 10.0, 12.0, 10.0, 8.0, 8.0, 8.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.01953125, -3.89141845703125, -3.7633056640625, -3.63519287109375, -3.507080078125, -3.37896728515625, -3.2508544921875, -3.12274169921875, -2.99462890625, -2.86651611328125, -2.7384033203125, -2.61029052734375, -2.482177734375, -2.35406494140625, -2.2259521484375, -2.09783935546875, -1.9697265625, -1.84161376953125, -1.7135009765625, -1.58538818359375, -1.457275390625, -1.32916259765625, -1.2010498046875, -1.07293701171875, -0.94482421875, -0.81671142578125, -0.6885986328125, -0.56048583984375, -0.432373046875, -0.30426025390625, -0.1761474609375, -0.04803466796875, 0.080078125, 0.20819091796875, 0.3363037109375, 0.46441650390625, 0.592529296875, 0.72064208984375, 0.8487548828125, 0.97686767578125, 1.10498046875, 1.23309326171875, 1.3612060546875, 1.48931884765625, 1.617431640625, 1.74554443359375, 1.8736572265625, 2.00177001953125, 2.1298828125, 2.25799560546875, 2.3861083984375, 2.51422119140625, 2.642333984375, 2.77044677734375, 2.8985595703125, 3.02667236328125, 3.15478515625, 3.28289794921875, 3.4110107421875, 3.53912353515625, 3.667236328125, 3.79534912109375, 3.9234619140625, 4.05157470703125, 4.1796875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 10.0, 13.0, 19.0, 22.0, 22.0, 36.0, 44.0, 75.0, 111.0, 174.0, 306.0, 434.0, 778.0, 1471.0, 3102.0, 7457.0, 23093.0, 100536.0, 620508.0, 223931.0, 44608.0, 12501.0, 4582.0, 2033.0, 1070.0, 616.0, 320.0, 218.0, 141.0, 85.0, 70.0, 40.0, 37.0, 17.0, 20.0, 15.0, 12.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0], "bins": [-1.2744140625, -1.2387542724609375, -1.203094482421875, -1.1674346923828125, -1.13177490234375, -1.0961151123046875, -1.060455322265625, -1.0247955322265625, -0.9891357421875, -0.9534759521484375, -0.917816162109375, -0.8821563720703125, -0.84649658203125, -0.8108367919921875, -0.775177001953125, -0.7395172119140625, -0.703857421875, -0.6681976318359375, -0.632537841796875, -0.5968780517578125, -0.56121826171875, -0.5255584716796875, -0.489898681640625, -0.4542388916015625, -0.4185791015625, -0.3829193115234375, -0.347259521484375, -0.3115997314453125, -0.27593994140625, -0.2402801513671875, -0.204620361328125, -0.1689605712890625, -0.13330078125, -0.0976409912109375, -0.061981201171875, -0.0263214111328125, 0.00933837890625, 0.0449981689453125, 0.080657958984375, 0.1163177490234375, 0.1519775390625, 0.1876373291015625, 0.223297119140625, 0.2589569091796875, 0.29461669921875, 0.3302764892578125, 0.365936279296875, 0.4015960693359375, 0.437255859375, 0.4729156494140625, 0.508575439453125, 0.5442352294921875, 0.57989501953125, 0.6155548095703125, 0.651214599609375, 0.6868743896484375, 0.7225341796875, 0.7581939697265625, 0.793853759765625, 0.8295135498046875, 0.86517333984375, 0.9008331298828125, 0.936492919921875, 0.9721527099609375, 1.0078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 16.0, 35.0, 99.0, 186.0, 288.0, 174.0, 101.0, 39.0, 23.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009074211120605469, -0.0008755847811698914, -0.0008437484502792358, -0.0008119121193885803, -0.0007800757884979248, -0.0007482394576072693, -0.0007164031267166138, -0.0006845667958259583, -0.0006527304649353027, -0.0006208941340446472, -0.0005890578031539917, -0.0005572214722633362, -0.0005253851413726807, -0.0004935488104820251, -0.00046171247959136963, -0.0004298761487007141, -0.0003980398178100586, -0.0003662034869194031, -0.00033436715602874756, -0.00030253082513809204, -0.0002706944942474365, -0.000238858163356781, -0.0002070218324661255, -0.00017518550157546997, -0.00014334917068481445, -0.00011151283979415894, -7.967650890350342e-05, -4.78401780128479e-05, -1.6003847122192383e-05, 1.5832483768463135e-05, 4.766881465911865e-05, 7.950514554977417e-05, 0.00011134147644042969, 0.0001431778073310852, 0.00017501413822174072, 0.00020685046911239624, 0.00023868680000305176, 0.0002705231308937073, 0.0003023594617843628, 0.0003341957926750183, 0.00036603212356567383, 0.00039786845445632935, 0.00042970478534698486, 0.0004615411162376404, 0.0004933774471282959, 0.0005252137780189514, 0.0005570501089096069, 0.0005888864398002625, 0.000620722770690918, 0.0006525591015815735, 0.000684395432472229, 0.0007162317633628845, 0.00074806809425354, 0.0007799044251441956, 0.0008117407560348511, 0.0008435770869255066, 0.0008754134178161621, 0.0009072497487068176, 0.0009390860795974731, 0.0009709224104881287, 0.0010027587413787842, 0.0010345950722694397, 0.0010664314031600952, 0.0010982677340507507, 0.0011301040649414062]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 12.0, 13.0, 7.0, 21.0, 38.0, 61.0, 113.0, 259.0, 637.0, 1681.0, 5895.0, 25898.0, 172151.0, 710633.0, 106804.0, 17611.0, 4286.0, 1466.0, 489.0, 202.0, 120.0, 57.0, 49.0, 20.0, 11.0, 5.0, 7.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1884765625, -1.1434326171875, -1.098388671875, -1.0533447265625, -1.00830078125, -0.9632568359375, -0.918212890625, -0.8731689453125, -0.828125, -0.7830810546875, -0.738037109375, -0.6929931640625, -0.64794921875, -0.6029052734375, -0.557861328125, -0.5128173828125, -0.4677734375, -0.4227294921875, -0.377685546875, -0.3326416015625, -0.28759765625, -0.2425537109375, -0.197509765625, -0.1524658203125, -0.107421875, -0.0623779296875, -0.017333984375, 0.0277099609375, 0.07275390625, 0.1177978515625, 0.162841796875, 0.2078857421875, 0.2529296875, 0.2979736328125, 0.343017578125, 0.3880615234375, 0.43310546875, 0.4781494140625, 0.523193359375, 0.5682373046875, 0.61328125, 0.6583251953125, 0.703369140625, 0.7484130859375, 0.79345703125, 0.8385009765625, 0.883544921875, 0.9285888671875, 0.9736328125, 1.0186767578125, 1.063720703125, 1.1087646484375, 1.15380859375, 1.1988525390625, 1.243896484375, 1.2889404296875, 1.333984375, 1.3790283203125, 1.424072265625, 1.4691162109375, 1.51416015625, 1.5592041015625, 1.604248046875, 1.6492919921875, 1.6943359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 2.0, 6.0, 8.0, 10.0, 13.0, 18.0, 17.0, 24.0, 25.0, 31.0, 33.0, 38.0, 58.0, 56.0, 66.0, 67.0, 78.0, 58.0, 60.0, 52.0, 51.0, 41.0, 27.0, 34.0, 12.0, 17.0, 18.0, 15.0, 8.0, 5.0, 10.0, 12.0, 6.0, 7.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.931640625, -0.90252685546875, -0.8734130859375, -0.84429931640625, -0.815185546875, -0.78607177734375, -0.7569580078125, -0.72784423828125, -0.69873046875, -0.66961669921875, -0.6405029296875, -0.61138916015625, -0.582275390625, -0.55316162109375, -0.5240478515625, -0.49493408203125, -0.4658203125, -0.43670654296875, -0.4075927734375, -0.37847900390625, -0.349365234375, -0.32025146484375, -0.2911376953125, -0.26202392578125, -0.23291015625, -0.20379638671875, -0.1746826171875, -0.14556884765625, -0.116455078125, -0.08734130859375, -0.0582275390625, -0.02911376953125, 0.0, 0.02911376953125, 0.0582275390625, 0.08734130859375, 0.116455078125, 0.14556884765625, 0.1746826171875, 0.20379638671875, 0.23291015625, 0.26202392578125, 0.2911376953125, 0.32025146484375, 0.349365234375, 0.37847900390625, 0.4075927734375, 0.43670654296875, 0.4658203125, 0.49493408203125, 0.5240478515625, 0.55316162109375, 0.582275390625, 0.61138916015625, 0.6405029296875, 0.66961669921875, 0.69873046875, 0.72784423828125, 0.7569580078125, 0.78607177734375, 0.815185546875, 0.84429931640625, 0.8734130859375, 0.90252685546875, 0.931640625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 17.0, 16.0, 26.0, 43.0, 74.0, 97.0, 129.0, 197.0, 112.0, 97.0, 58.0, 37.0, 27.0, 15.0, 12.0, 5.0, 2.0, 2.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.30418586730957, -17.682147979736328, -17.06011199951172, -16.438074111938477, -15.816036224365234, -15.193998336791992, -14.571961402893066, -13.94992446899414, -13.327886581420898, -12.705848693847656, -12.08381175994873, -11.461774826049805, -10.839736938476562, -10.21769905090332, -9.595662117004395, -8.973625183105469, -8.351587295532227, -7.729549884796143, -7.107512474060059, -6.485475063323975, -5.863437652587891, -5.241400241851807, -4.619362831115723, -3.9973254203796387, -3.3752880096435547, -2.7532505989074707, -2.1312131881713867, -1.5091757774353027, -0.8871383666992188, -0.26510095596313477, 0.3569364547729492, 0.9789738655090332, 1.6010093688964844, 2.2230467796325684, 2.8450841903686523, 3.4671216011047363, 4.08915901184082, 4.711196422576904, 5.333233833312988, 5.955271244049072, 6.577308654785156, 7.19934606552124, 7.821383476257324, 8.44342041015625, 9.065458297729492, 9.687496185302734, 10.30953311920166, 10.931570053100586, 11.553607940673828, 12.17564582824707, 12.797682762145996, 13.419719696044922, 14.041757583618164, 14.663795471191406, 15.285832405090332, 15.907869338989258, 16.5299072265625, 17.151945114135742, 17.773983001708984, 18.396018981933594, 19.018056869506836, 19.640094757080078, 20.262130737304688, 20.88416862487793, 21.506206512451172]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 5.0, 8.0, 8.0, 10.0, 10.0, 21.0, 15.0, 25.0, 22.0, 29.0, 28.0, 37.0, 33.0, 40.0, 55.0, 79.0, 97.0, 81.0, 40.0, 42.0, 40.0, 30.0, 23.0, 38.0, 29.0, 25.0, 19.0, 18.0, 20.0, 14.0, 13.0, 9.0, 7.0, 4.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.516998291015625, -17.951467514038086, -17.38593864440918, -16.82040786743164, -16.254878997802734, -15.689349174499512, -15.123819351196289, -14.55828857421875, -13.992759704589844, -13.427229881286621, -12.861700057983398, -12.296170234680176, -11.730640411376953, -11.16511058807373, -10.599580764770508, -10.034049987792969, -9.468520164489746, -8.902990341186523, -8.3374605178833, -7.771930694580078, -7.2064008712768555, -6.640871047973633, -6.075340747833252, -5.509810924530029, -4.944281101226807, -4.378751277923584, -3.8132214546203613, -3.2476913928985596, -2.682161569595337, -2.1166317462921143, -1.5511016845703125, -0.9855718612670898, -0.4200420379638672, 0.14548784494400024, 0.7110177278518677, 1.2765476703643799, 1.8420774936676025, 2.407607316970825, 2.973137378692627, 3.5386672019958496, 4.104197025299072, 4.669726848602295, 5.235256671905518, 5.800786972045898, 6.366316795349121, 6.931846618652344, 7.497376441955566, 8.062906265258789, 8.628436088562012, 9.193965911865234, 9.759495735168457, 10.32502555847168, 10.890555381774902, 11.456085205078125, 12.021615982055664, 12.58714485168457, 13.15267562866211, 13.718205451965332, 14.283735275268555, 14.849265098571777, 15.414794921875, 15.980324745178223, 16.545854568481445, 17.111385345458984, 17.67691421508789]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 4.0, 8.0, 15.0, 20.0, 36.0, 25.0, 51.0, 58.0, 79.0, 109.0, 158.0, 269.0, 363.0, 610.0, 1241.0, 2592.0, 5983.0, 16297.0, 59048.0, 281817.0, 1331996.0, 1869728.0, 490907.0, 93293.0, 24114.0, 8203.0, 3449.0, 1567.0, 832.0, 455.0, 289.0, 167.0, 143.0, 95.0, 60.0, 50.0, 30.0, 36.0, 12.0, 15.0, 13.0, 7.0, 7.0, 2.0, 4.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.2255859375, -1.1874847412109375, -1.149383544921875, -1.1112823486328125, -1.07318115234375, -1.0350799560546875, -0.996978759765625, -0.9588775634765625, -0.9207763671875, -0.8826751708984375, -0.844573974609375, -0.8064727783203125, -0.76837158203125, -0.7302703857421875, -0.692169189453125, -0.6540679931640625, -0.615966796875, -0.5778656005859375, -0.539764404296875, -0.5016632080078125, -0.46356201171875, -0.4254608154296875, -0.387359619140625, -0.3492584228515625, -0.3111572265625, -0.2730560302734375, -0.234954833984375, -0.1968536376953125, -0.15875244140625, -0.1206512451171875, -0.082550048828125, -0.0444488525390625, -0.00634765625, 0.0317535400390625, 0.069854736328125, 0.1079559326171875, 0.14605712890625, 0.1841583251953125, 0.222259521484375, 0.2603607177734375, 0.2984619140625, 0.3365631103515625, 0.374664306640625, 0.4127655029296875, 0.45086669921875, 0.4889678955078125, 0.527069091796875, 0.5651702880859375, 0.603271484375, 0.6413726806640625, 0.679473876953125, 0.7175750732421875, 0.75567626953125, 0.7937774658203125, 0.831878662109375, 0.8699798583984375, 0.9080810546875, 0.9461822509765625, 0.984283447265625, 1.0223846435546875, 1.06048583984375, 1.0985870361328125, 1.136688232421875, 1.1747894287109375, 1.212890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 6.0, 5.0, 9.0, 19.0, 16.0, 22.0, 29.0, 33.0, 37.0, 30.0, 41.0, 42.0, 46.0, 56.0, 48.0, 59.0, 56.0, 47.0, 54.0, 40.0, 39.0, 38.0, 33.0, 30.0, 31.0, 29.0, 21.0, 17.0, 16.0, 11.0, 10.0, 11.0, 3.0, 7.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.068084716796875, -1.03265380859375, -0.997222900390625, -0.9617919921875, -0.926361083984375, -0.89093017578125, -0.855499267578125, -0.820068359375, -0.784637451171875, -0.74920654296875, -0.713775634765625, -0.6783447265625, -0.642913818359375, -0.60748291015625, -0.572052001953125, -0.53662109375, -0.501190185546875, -0.46575927734375, -0.430328369140625, -0.3948974609375, -0.359466552734375, -0.32403564453125, -0.288604736328125, -0.253173828125, -0.217742919921875, -0.18231201171875, -0.146881103515625, -0.1114501953125, -0.076019287109375, -0.04058837890625, -0.005157470703125, 0.0302734375, 0.065704345703125, 0.10113525390625, 0.136566162109375, 0.1719970703125, 0.207427978515625, 0.24285888671875, 0.278289794921875, 0.313720703125, 0.349151611328125, 0.38458251953125, 0.420013427734375, 0.4554443359375, 0.490875244140625, 0.52630615234375, 0.561737060546875, 0.59716796875, 0.632598876953125, 0.66802978515625, 0.703460693359375, 0.7388916015625, 0.774322509765625, 0.80975341796875, 0.845184326171875, 0.880615234375, 0.916046142578125, 0.95147705078125, 0.986907958984375, 1.0223388671875, 1.057769775390625, 1.09320068359375, 1.128631591796875, 1.1640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 5.0, 6.0, 13.0, 20.0, 30.0, 38.0, 63.0, 98.0, 179.0, 365.0, 915.0, 2550.0, 11657.0, 127069.0, 3563651.0, 458596.0, 22868.0, 3929.0, 1195.0, 450.0, 244.0, 109.0, 76.0, 41.0, 34.0, 25.0, 11.0, 14.0, 6.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6328125, -3.521636962890625, -3.41046142578125, -3.299285888671875, -3.1881103515625, -3.076934814453125, -2.96575927734375, -2.854583740234375, -2.743408203125, -2.632232666015625, -2.52105712890625, -2.409881591796875, -2.2987060546875, -2.187530517578125, -2.07635498046875, -1.965179443359375, -1.85400390625, -1.742828369140625, -1.63165283203125, -1.520477294921875, -1.4093017578125, -1.298126220703125, -1.18695068359375, -1.075775146484375, -0.964599609375, -0.853424072265625, -0.74224853515625, -0.631072998046875, -0.5198974609375, -0.408721923828125, -0.29754638671875, -0.186370849609375, -0.0751953125, 0.035980224609375, 0.14715576171875, 0.258331298828125, 0.3695068359375, 0.480682373046875, 0.59185791015625, 0.703033447265625, 0.814208984375, 0.925384521484375, 1.03656005859375, 1.147735595703125, 1.2589111328125, 1.370086669921875, 1.48126220703125, 1.592437744140625, 1.70361328125, 1.814788818359375, 1.92596435546875, 2.037139892578125, 2.1483154296875, 2.259490966796875, 2.37066650390625, 2.481842041015625, 2.593017578125, 2.704193115234375, 2.81536865234375, 2.926544189453125, 3.0377197265625, 3.148895263671875, 3.26007080078125, 3.371246337890625, 3.482421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 9.0, 7.0, 15.0, 16.0, 26.0, 38.0, 38.0, 38.0, 67.0, 99.0, 129.0, 208.0, 270.0, 448.0, 493.0, 593.0, 482.0, 367.0, 228.0, 149.0, 103.0, 76.0, 35.0, 38.0, 24.0, 15.0, 18.0, 13.0, 5.0, 4.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.041015625, -1.973297119140625, -1.90557861328125, -1.837860107421875, -1.7701416015625, -1.702423095703125, -1.63470458984375, -1.566986083984375, -1.499267578125, -1.431549072265625, -1.36383056640625, -1.296112060546875, -1.2283935546875, -1.160675048828125, -1.09295654296875, -1.025238037109375, -0.95751953125, -0.889801025390625, -0.82208251953125, -0.754364013671875, -0.6866455078125, -0.618927001953125, -0.55120849609375, -0.483489990234375, -0.415771484375, -0.348052978515625, -0.28033447265625, -0.212615966796875, -0.1448974609375, -0.077178955078125, -0.00946044921875, 0.058258056640625, 0.1259765625, 0.193695068359375, 0.26141357421875, 0.329132080078125, 0.3968505859375, 0.464569091796875, 0.53228759765625, 0.600006103515625, 0.667724609375, 0.735443115234375, 0.80316162109375, 0.870880126953125, 0.9385986328125, 1.006317138671875, 1.07403564453125, 1.141754150390625, 1.20947265625, 1.277191162109375, 1.34490966796875, 1.412628173828125, 1.4803466796875, 1.548065185546875, 1.61578369140625, 1.683502197265625, 1.751220703125, 1.818939208984375, 1.88665771484375, 1.954376220703125, 2.0220947265625, 2.089813232421875, 2.15753173828125, 2.225250244140625, 2.29296875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 12.0, 22.0, 32.0, 57.0, 87.0, 153.0, 145.0, 165.0, 118.0, 93.0, 42.0, 33.0, 19.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.616308212280273, -24.925312042236328, -24.234315872192383, -23.543319702148438, -22.852325439453125, -22.16132926940918, -21.470333099365234, -20.77933692932129, -20.088340759277344, -19.3973445892334, -18.706348419189453, -18.01535415649414, -17.324357986450195, -16.63336181640625, -15.942365646362305, -15.25136947631836, -14.560375213623047, -13.869379043579102, -13.178383827209473, -12.487387657165527, -11.796392440795898, -11.105396270751953, -10.414400100708008, -9.723403930664062, -9.032408714294434, -8.341412544250488, -7.650417327880859, -6.959421157836914, -6.268425464630127, -5.57742977142334, -4.8864336013793945, -4.195437908172607, -3.504444122314453, -2.813448429107666, -2.1224524974823, -1.4314565658569336, -0.7404608726501465, -0.049465179443359375, 0.6415309906005859, 1.332526683807373, 2.02352237701416, 2.7145180702209473, 3.4055140018463135, 4.09650993347168, 4.787505626678467, 5.478501319885254, 6.169497489929199, 6.860493183135986, 7.551488876342773, 8.242485046386719, 8.933480262756348, 9.624476432800293, 10.315471649169922, 11.006467819213867, 11.697463989257812, 12.388460159301758, 13.079455375671387, 13.770451545715332, 14.461446762084961, 15.152442932128906, 15.843439102172852, 16.534435272216797, 17.22542953491211, 17.916425704956055, 18.607421875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 11.0, 9.0, 17.0, 11.0, 16.0, 16.0, 22.0, 30.0, 28.0, 27.0, 43.0, 44.0, 48.0, 39.0, 59.0, 40.0, 51.0, 59.0, 38.0, 49.0, 40.0, 37.0, 44.0, 27.0, 30.0, 32.0, 22.0, 22.0, 14.0, 16.0, 11.0, 5.0, 8.0, 5.0, 3.0, 8.0, 1.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.094172477722168, -9.75648021697998, -9.418787956237793, -9.081095695495605, -8.743402481079102, -8.405710220336914, -8.068017959594727, -7.730325698852539, -7.392633438110352, -7.054941177368164, -6.717248916625977, -6.379556179046631, -6.041863918304443, -5.704171657562256, -5.36647891998291, -5.028786659240723, -4.691094398498535, -4.353402137756348, -4.01570987701416, -3.6780171394348145, -3.340324878692627, -3.0026326179504395, -2.664940118789673, -2.3272476196289062, -1.9895553588867188, -1.6518629789352417, -1.3141705989837646, -0.9764782190322876, -0.6387858390808105, -0.3010934591293335, 0.036598920822143555, 0.37429141998291016, 0.7119836807250977, 1.0496760606765747, 1.3873684406280518, 1.7250608205795288, 2.062753200531006, 2.4004454612731934, 2.73813796043396, 3.0758304595947266, 3.413522720336914, 3.7512149810791016, 4.088907241821289, 4.426599979400635, 4.764292240142822, 5.10198450088501, 5.4396772384643555, 5.777369499206543, 6.1150617599487305, 6.452754020690918, 6.7904462814331055, 7.128139019012451, 7.465831279754639, 7.803523540496826, 8.141216278076172, 8.47890853881836, 8.816600799560547, 9.154293060302734, 9.491985321044922, 9.82967758178711, 10.167369842529297, 10.5050630569458, 10.842755317687988, 11.180447578430176, 11.518139839172363]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 5.0, 9.0, 9.0, 16.0, 31.0, 34.0, 45.0, 63.0, 96.0, 148.0, 257.0, 421.0, 681.0, 1236.0, 2188.0, 3830.0, 7380.0, 14065.0, 26180.0, 50202.0, 94722.0, 169900.0, 238702.0, 195963.0, 113703.0, 60517.0, 31773.0, 16495.0, 8736.0, 4844.0, 2580.0, 1449.0, 876.0, 536.0, 305.0, 182.0, 107.0, 78.0, 58.0, 41.0, 28.0, 13.0, 14.0, 7.0, 5.0, 6.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1259765625, -1.0879974365234375, -1.050018310546875, -1.0120391845703125, -0.97406005859375, -0.9360809326171875, -0.898101806640625, -0.8601226806640625, -0.8221435546875, -0.7841644287109375, -0.746185302734375, -0.7082061767578125, -0.67022705078125, -0.6322479248046875, -0.594268798828125, -0.5562896728515625, -0.518310546875, -0.4803314208984375, -0.442352294921875, -0.4043731689453125, -0.36639404296875, -0.3284149169921875, -0.290435791015625, -0.2524566650390625, -0.2144775390625, -0.1764984130859375, -0.138519287109375, -0.1005401611328125, -0.06256103515625, -0.0245819091796875, 0.013397216796875, 0.0513763427734375, 0.08935546875, 0.1273345947265625, 0.165313720703125, 0.2032928466796875, 0.24127197265625, 0.2792510986328125, 0.317230224609375, 0.3552093505859375, 0.3931884765625, 0.4311676025390625, 0.469146728515625, 0.5071258544921875, 0.54510498046875, 0.5830841064453125, 0.621063232421875, 0.6590423583984375, 0.697021484375, 0.7350006103515625, 0.772979736328125, 0.8109588623046875, 0.84893798828125, 0.8869171142578125, 0.924896240234375, 0.9628753662109375, 1.0008544921875, 1.0388336181640625, 1.076812744140625, 1.1147918701171875, 1.15277099609375, 1.1907501220703125, 1.228729248046875, 1.2667083740234375, 1.3046875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 6.0, 10.0, 10.0, 8.0, 16.0, 22.0, 24.0, 24.0, 37.0, 32.0, 36.0, 39.0, 37.0, 54.0, 64.0, 43.0, 62.0, 46.0, 43.0, 56.0, 44.0, 49.0, 34.0, 28.0, 23.0, 36.0, 26.0, 25.0, 10.0, 12.0, 8.0, 7.0, 5.0, 11.0, 5.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1533203125, -1.1158905029296875, -1.078460693359375, -1.0410308837890625, -1.00360107421875, -0.9661712646484375, -0.928741455078125, -0.8913116455078125, -0.8538818359375, -0.8164520263671875, -0.779022216796875, -0.7415924072265625, -0.70416259765625, -0.6667327880859375, -0.629302978515625, -0.5918731689453125, -0.554443359375, -0.5170135498046875, -0.479583740234375, -0.4421539306640625, -0.40472412109375, -0.3672943115234375, -0.329864501953125, -0.2924346923828125, -0.2550048828125, -0.2175750732421875, -0.180145263671875, -0.1427154541015625, -0.10528564453125, -0.0678558349609375, -0.030426025390625, 0.0070037841796875, 0.04443359375, 0.0818634033203125, 0.119293212890625, 0.1567230224609375, 0.19415283203125, 0.2315826416015625, 0.269012451171875, 0.3064422607421875, 0.3438720703125, 0.3813018798828125, 0.418731689453125, 0.4561614990234375, 0.49359130859375, 0.5310211181640625, 0.568450927734375, 0.6058807373046875, 0.643310546875, 0.6807403564453125, 0.718170166015625, 0.7555999755859375, 0.79302978515625, 0.8304595947265625, 0.867889404296875, 0.9053192138671875, 0.9427490234375, 0.9801788330078125, 1.017608642578125, 1.0550384521484375, 1.09246826171875, 1.1298980712890625, 1.167327880859375, 1.2047576904296875, 1.2421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 8.0, 8.0, 12.0, 10.0, 14.0, 22.0, 31.0, 34.0, 71.0, 71.0, 119.0, 159.0, 218.0, 304.0, 489.0, 853.0, 1670.0, 3677.0, 9822.0, 30534.0, 112140.0, 565215.0, 232194.0, 60923.0, 17930.0, 6252.0, 2570.0, 1227.0, 657.0, 377.0, 268.0, 185.0, 124.0, 75.0, 71.0, 42.0, 39.0, 37.0, 21.0, 21.0, 9.0, 11.0, 9.0, 9.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0], "bins": [-2.60546875, -2.525970458984375, -2.44647216796875, -2.366973876953125, -2.2874755859375, -2.207977294921875, -2.12847900390625, -2.048980712890625, -1.969482421875, -1.889984130859375, -1.81048583984375, -1.730987548828125, -1.6514892578125, -1.571990966796875, -1.49249267578125, -1.412994384765625, -1.33349609375, -1.253997802734375, -1.17449951171875, -1.095001220703125, -1.0155029296875, -0.936004638671875, -0.85650634765625, -0.777008056640625, -0.697509765625, -0.618011474609375, -0.53851318359375, -0.459014892578125, -0.3795166015625, -0.300018310546875, -0.22052001953125, -0.141021728515625, -0.0615234375, 0.017974853515625, 0.09747314453125, 0.176971435546875, 0.2564697265625, 0.335968017578125, 0.41546630859375, 0.494964599609375, 0.574462890625, 0.653961181640625, 0.73345947265625, 0.812957763671875, 0.8924560546875, 0.971954345703125, 1.05145263671875, 1.130950927734375, 1.21044921875, 1.289947509765625, 1.36944580078125, 1.448944091796875, 1.5284423828125, 1.607940673828125, 1.68743896484375, 1.766937255859375, 1.846435546875, 1.925933837890625, 2.00543212890625, 2.084930419921875, 2.1644287109375, 2.243927001953125, 2.32342529296875, 2.402923583984375, 2.482421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 7.0, 5.0, 7.0, 20.0, 12.0, 8.0, 18.0, 28.0, 27.0, 32.0, 32.0, 41.0, 55.0, 60.0, 59.0, 58.0, 54.0, 49.0, 57.0, 52.0, 44.0, 42.0, 39.0, 34.0, 28.0, 23.0, 31.0, 17.0, 12.0, 12.0, 11.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75390625, -4.60821533203125, -4.4625244140625, -4.31683349609375, -4.171142578125, -4.02545166015625, -3.8797607421875, -3.73406982421875, -3.58837890625, -3.44268798828125, -3.2969970703125, -3.15130615234375, -3.005615234375, -2.85992431640625, -2.7142333984375, -2.56854248046875, -2.4228515625, -2.27716064453125, -2.1314697265625, -1.98577880859375, -1.840087890625, -1.69439697265625, -1.5487060546875, -1.40301513671875, -1.25732421875, -1.11163330078125, -0.9659423828125, -0.82025146484375, -0.674560546875, -0.52886962890625, -0.3831787109375, -0.23748779296875, -0.091796875, 0.05389404296875, 0.1995849609375, 0.34527587890625, 0.490966796875, 0.63665771484375, 0.7823486328125, 0.92803955078125, 1.07373046875, 1.21942138671875, 1.3651123046875, 1.51080322265625, 1.656494140625, 1.80218505859375, 1.9478759765625, 2.09356689453125, 2.2392578125, 2.38494873046875, 2.5306396484375, 2.67633056640625, 2.822021484375, 2.96771240234375, 3.1134033203125, 3.25909423828125, 3.40478515625, 3.55047607421875, 3.6961669921875, 3.84185791015625, 3.987548828125, 4.13323974609375, 4.2789306640625, 4.42462158203125, 4.5703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 6.0, 1.0, 2.0, 6.0, 3.0, 10.0, 6.0, 16.0, 20.0, 17.0, 21.0, 49.0, 44.0, 70.0, 76.0, 132.0, 175.0, 310.0, 518.0, 996.0, 1900.0, 4213.0, 10508.0, 29379.0, 97141.0, 577568.0, 231069.0, 60680.0, 19753.0, 7206.0, 3063.0, 1476.0, 787.0, 439.0, 286.0, 177.0, 116.0, 91.0, 63.0, 40.0, 28.0, 22.0, 22.0, 5.0, 9.0, 10.0, 12.0, 4.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.765625, -0.74298095703125, -0.7203369140625, -0.69769287109375, -0.675048828125, -0.65240478515625, -0.6297607421875, -0.60711669921875, -0.58447265625, -0.56182861328125, -0.5391845703125, -0.51654052734375, -0.493896484375, -0.47125244140625, -0.4486083984375, -0.42596435546875, -0.4033203125, -0.38067626953125, -0.3580322265625, -0.33538818359375, -0.312744140625, -0.29010009765625, -0.2674560546875, -0.24481201171875, -0.22216796875, -0.19952392578125, -0.1768798828125, -0.15423583984375, -0.131591796875, -0.10894775390625, -0.0863037109375, -0.06365966796875, -0.041015625, -0.01837158203125, 0.0042724609375, 0.02691650390625, 0.049560546875, 0.07220458984375, 0.0948486328125, 0.11749267578125, 0.14013671875, 0.16278076171875, 0.1854248046875, 0.20806884765625, 0.230712890625, 0.25335693359375, 0.2760009765625, 0.29864501953125, 0.3212890625, 0.34393310546875, 0.3665771484375, 0.38922119140625, 0.411865234375, 0.43450927734375, 0.4571533203125, 0.47979736328125, 0.50244140625, 0.52508544921875, 0.5477294921875, 0.57037353515625, 0.593017578125, 0.61566162109375, 0.6383056640625, 0.66094970703125, 0.68359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 10.0, 7.0, 18.0, 24.0, 27.0, 28.0, 40.0, 64.0, 87.0, 124.0, 147.0, 103.0, 75.0, 63.0, 34.0, 30.0, 25.0, 23.0, 12.0, 12.0, 9.0, 8.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003604888916015625, -0.0003499835729598999, -0.0003394782543182373, -0.0003289729356765747, -0.0003184676170349121, -0.0003079622983932495, -0.0002974569797515869, -0.0002869516611099243, -0.0002764463424682617, -0.0002659410238265991, -0.0002554357051849365, -0.0002449303865432739, -0.00023442506790161133, -0.00022391974925994873, -0.00021341443061828613, -0.00020290911197662354, -0.00019240379333496094, -0.00018189847469329834, -0.00017139315605163574, -0.00016088783740997314, -0.00015038251876831055, -0.00013987720012664795, -0.00012937188148498535, -0.00011886656284332275, -0.00010836124420166016, -9.785592555999756e-05, -8.735060691833496e-05, -7.684528827667236e-05, -6.633996963500977e-05, -5.583465099334717e-05, -4.532933235168457e-05, -3.482401371002197e-05, -2.4318695068359375e-05, -1.3813376426696777e-05, -3.3080577850341797e-06, 7.197260856628418e-06, 1.7702579498291016e-05, 2.8207898139953613e-05, 3.871321678161621e-05, 4.921853542327881e-05, 5.9723854064941406e-05, 7.0229172706604e-05, 8.07344913482666e-05, 9.12398099899292e-05, 0.0001017451286315918, 0.0001122504472732544, 0.000122755765914917, 0.0001332610845565796, 0.0001437664031982422, 0.00015427172183990479, 0.00016477704048156738, 0.00017528235912322998, 0.00018578767776489258, 0.00019629299640655518, 0.00020679831504821777, 0.00021730363368988037, 0.00022780895233154297, 0.00023831427097320557, 0.00024881958961486816, 0.00025932490825653076, 0.00026983022689819336, 0.00028033554553985596, 0.00029084086418151855, 0.00030134618282318115, 0.00031185150146484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 2.0, 5.0, 6.0, 3.0, 6.0, 6.0, 6.0, 15.0, 13.0, 25.0, 34.0, 33.0, 74.0, 114.0, 156.0, 284.0, 445.0, 840.0, 1709.0, 3946.0, 10930.0, 35420.0, 148503.0, 652036.0, 141977.0, 34022.0, 10460.0, 3890.0, 1666.0, 766.0, 435.0, 217.0, 149.0, 114.0, 75.0, 58.0, 35.0, 15.0, 17.0, 16.0, 11.0, 4.0, 4.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.7783203125, -0.751922607421875, -0.72552490234375, -0.699127197265625, -0.6727294921875, -0.646331787109375, -0.61993408203125, -0.593536376953125, -0.567138671875, -0.540740966796875, -0.51434326171875, -0.487945556640625, -0.4615478515625, -0.435150146484375, -0.40875244140625, -0.382354736328125, -0.35595703125, -0.329559326171875, -0.30316162109375, -0.276763916015625, -0.2503662109375, -0.223968505859375, -0.19757080078125, -0.171173095703125, -0.144775390625, -0.118377685546875, -0.09197998046875, -0.065582275390625, -0.0391845703125, -0.012786865234375, 0.01361083984375, 0.040008544921875, 0.06640625, 0.092803955078125, 0.11920166015625, 0.145599365234375, 0.1719970703125, 0.198394775390625, 0.22479248046875, 0.251190185546875, 0.277587890625, 0.303985595703125, 0.33038330078125, 0.356781005859375, 0.3831787109375, 0.409576416015625, 0.43597412109375, 0.462371826171875, 0.48876953125, 0.515167236328125, 0.54156494140625, 0.567962646484375, 0.5943603515625, 0.620758056640625, 0.64715576171875, 0.673553466796875, 0.699951171875, 0.726348876953125, 0.75274658203125, 0.779144287109375, 0.8055419921875, 0.831939697265625, 0.85833740234375, 0.884735107421875, 0.9111328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 12.0, 13.0, 11.0, 15.0, 20.0, 25.0, 35.0, 46.0, 49.0, 64.0, 74.0, 85.0, 80.0, 83.0, 75.0, 57.0, 49.0, 39.0, 28.0, 25.0, 18.0, 15.0, 10.0, 19.0, 12.0, 3.0, 3.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1015625, -1.070709228515625, -1.03985595703125, -1.009002685546875, -0.9781494140625, -0.947296142578125, -0.91644287109375, -0.885589599609375, -0.854736328125, -0.823883056640625, -0.79302978515625, -0.762176513671875, -0.7313232421875, -0.700469970703125, -0.66961669921875, -0.638763427734375, -0.60791015625, -0.577056884765625, -0.54620361328125, -0.515350341796875, -0.4844970703125, -0.453643798828125, -0.42279052734375, -0.391937255859375, -0.361083984375, -0.330230712890625, -0.29937744140625, -0.268524169921875, -0.2376708984375, -0.206817626953125, -0.17596435546875, -0.145111083984375, -0.1142578125, -0.083404541015625, -0.05255126953125, -0.021697998046875, 0.0091552734375, 0.040008544921875, 0.07086181640625, 0.101715087890625, 0.132568359375, 0.163421630859375, 0.19427490234375, 0.225128173828125, 0.2559814453125, 0.286834716796875, 0.31768798828125, 0.348541259765625, 0.37939453125, 0.410247802734375, 0.44110107421875, 0.471954345703125, 0.5028076171875, 0.533660888671875, 0.56451416015625, 0.595367431640625, 0.626220703125, 0.657073974609375, 0.68792724609375, 0.718780517578125, 0.7496337890625, 0.780487060546875, 0.81134033203125, 0.842193603515625, 0.873046875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 13.0, 9.0, 12.0, 33.0, 24.0, 61.0, 96.0, 227.0, 209.0, 107.0, 80.0, 53.0, 23.0, 22.0, 10.0, 8.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.340713500976562, -19.66080093383789, -18.98088836669922, -18.300975799560547, -17.621063232421875, -16.941152572631836, -16.261240005493164, -15.581327438354492, -14.90141487121582, -14.221502304077148, -13.541589736938477, -12.861678123474121, -12.18176555633545, -11.501852989196777, -10.821941375732422, -10.14202880859375, -9.462116241455078, -8.782203674316406, -8.102291107177734, -7.422379493713379, -6.742466926574707, -6.062554359436035, -5.3826422691345215, -4.702730178833008, -4.022817611694336, -3.342905282974243, -2.6629929542541504, -1.9830806255340576, -1.3031682968139648, -0.6232559680938721, 0.0566563606262207, 0.7365684509277344, 1.4164810180664062, 2.096393346786499, 2.776305675506592, 3.4562180042266846, 4.136130332946777, 4.816042900085449, 5.495954990386963, 6.175867080688477, 6.855779647827148, 7.53569221496582, 8.215604782104492, 8.895516395568848, 9.57542896270752, 10.255341529846191, 10.935253143310547, 11.615165710449219, 12.29507827758789, 12.974990844726562, 13.654903411865234, 14.33481502532959, 15.014727592468262, 15.694640159606934, 16.37455177307129, 17.05446434020996, 17.734376907348633, 18.414289474487305, 19.094202041625977, 19.77411460876465, 20.454025268554688, 21.13393783569336, 21.81385040283203, 22.493762969970703, 23.173675537109375]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 7.0, 13.0, 13.0, 21.0, 16.0, 27.0, 21.0, 27.0, 31.0, 24.0, 32.0, 48.0, 62.0, 97.0, 138.0, 68.0, 46.0, 43.0, 33.0, 27.0, 36.0, 33.0, 28.0, 14.0, 12.0, 10.0, 12.0, 10.0, 11.0, 6.0, 3.0, 1.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.02457046508789, -19.438522338867188, -18.852474212646484, -18.26642417907715, -17.680376052856445, -17.094327926635742, -16.508277893066406, -15.922229766845703, -15.336181640625, -14.750133514404297, -14.164084434509277, -13.578035354614258, -12.991987228393555, -12.405939102172852, -11.819890022277832, -11.233840942382812, -10.64779281616211, -10.061744689941406, -9.475695610046387, -8.889646530151367, -8.303598403930664, -7.717549800872803, -7.131501197814941, -6.54545259475708, -5.959403991699219, -5.373355388641357, -4.787306785583496, -4.201258182525635, -3.6152095794677734, -3.029160976409912, -2.443112373352051, -1.8570637702941895, -1.2710151672363281, -0.6849665641784668, -0.09891796112060547, 0.48713064193725586, 1.0731792449951172, 1.6592278480529785, 2.24527645111084, 2.831325054168701, 3.4173736572265625, 4.003422260284424, 4.589470863342285, 5.1755194664001465, 5.761568069458008, 6.347616672515869, 6.9336652755737305, 7.519713878631592, 8.105762481689453, 8.691810607910156, 9.277859687805176, 9.863908767700195, 10.449956893920898, 11.036005020141602, 11.622054100036621, 12.20810317993164, 12.794151306152344, 13.380199432373047, 13.966248512268066, 14.552297592163086, 15.138345718383789, 15.724393844604492, 16.310443878173828, 16.89649200439453, 17.482540130615234]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 8.0, 14.0, 29.0, 41.0, 72.0, 111.0, 177.0, 295.0, 506.0, 936.0, 1792.0, 3727.0, 8277.0, 20201.0, 56956.0, 177781.0, 589893.0, 1491019.0, 1224795.0, 424058.0, 125614.0, 40095.0, 14944.0, 6407.0, 3021.0, 1540.0, 771.0, 464.0, 284.0, 177.0, 123.0, 53.0, 35.0, 26.0, 16.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0537109375, -1.024322509765625, -0.99493408203125, -0.965545654296875, -0.9361572265625, -0.906768798828125, -0.87738037109375, -0.847991943359375, -0.818603515625, -0.789215087890625, -0.75982666015625, -0.730438232421875, -0.7010498046875, -0.671661376953125, -0.64227294921875, -0.612884521484375, -0.58349609375, -0.554107666015625, -0.52471923828125, -0.495330810546875, -0.4659423828125, -0.436553955078125, -0.40716552734375, -0.377777099609375, -0.348388671875, -0.319000244140625, -0.28961181640625, -0.260223388671875, -0.2308349609375, -0.201446533203125, -0.17205810546875, -0.142669677734375, -0.11328125, -0.083892822265625, -0.05450439453125, -0.025115966796875, 0.0042724609375, 0.033660888671875, 0.06304931640625, 0.092437744140625, 0.121826171875, 0.151214599609375, 0.18060302734375, 0.209991455078125, 0.2393798828125, 0.268768310546875, 0.29815673828125, 0.327545166015625, 0.35693359375, 0.386322021484375, 0.41571044921875, 0.445098876953125, 0.4744873046875, 0.503875732421875, 0.53326416015625, 0.562652587890625, 0.592041015625, 0.621429443359375, 0.65081787109375, 0.680206298828125, 0.7095947265625, 0.738983154296875, 0.76837158203125, 0.797760009765625, 0.8271484375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 7.0, 0.0, 6.0, 8.0, 9.0, 7.0, 12.0, 17.0, 20.0, 16.0, 22.0, 32.0, 39.0, 34.0, 36.0, 45.0, 48.0, 48.0, 46.0, 53.0, 45.0, 52.0, 51.0, 46.0, 44.0, 46.0, 41.0, 30.0, 20.0, 17.0, 23.0, 14.0, 14.0, 10.0, 9.0, 9.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.015625, -0.9805145263671875, -0.945404052734375, -0.9102935791015625, -0.87518310546875, -0.8400726318359375, -0.804962158203125, -0.7698516845703125, -0.7347412109375, -0.6996307373046875, -0.664520263671875, -0.6294097900390625, -0.59429931640625, -0.5591888427734375, -0.524078369140625, -0.4889678955078125, -0.453857421875, -0.4187469482421875, -0.383636474609375, -0.3485260009765625, -0.31341552734375, -0.2783050537109375, -0.243194580078125, -0.2080841064453125, -0.1729736328125, -0.1378631591796875, -0.102752685546875, -0.0676422119140625, -0.03253173828125, 0.0025787353515625, 0.037689208984375, 0.0727996826171875, 0.10791015625, 0.1430206298828125, 0.178131103515625, 0.2132415771484375, 0.24835205078125, 0.2834625244140625, 0.318572998046875, 0.3536834716796875, 0.3887939453125, 0.4239044189453125, 0.459014892578125, 0.4941253662109375, 0.52923583984375, 0.5643463134765625, 0.599456787109375, 0.6345672607421875, 0.669677734375, 0.7047882080078125, 0.739898681640625, 0.7750091552734375, 0.81011962890625, 0.8452301025390625, 0.880340576171875, 0.9154510498046875, 0.9505615234375, 0.9856719970703125, 1.020782470703125, 1.0558929443359375, 1.09100341796875, 1.1261138916015625, 1.161224365234375, 1.1963348388671875, 1.2314453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 11.0, 13.0, 17.0, 31.0, 47.0, 68.0, 138.0, 272.0, 641.0, 2427.0, 16022.0, 292653.0, 3720221.0, 148473.0, 10315.0, 1837.0, 548.0, 233.0, 110.0, 70.0, 42.0, 27.0, 21.0, 14.0, 9.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.55078125, -3.4300537109375, -3.309326171875, -3.1885986328125, -3.06787109375, -2.9471435546875, -2.826416015625, -2.7056884765625, -2.5849609375, -2.4642333984375, -2.343505859375, -2.2227783203125, -2.10205078125, -1.9813232421875, -1.860595703125, -1.7398681640625, -1.619140625, -1.4984130859375, -1.377685546875, -1.2569580078125, -1.13623046875, -1.0155029296875, -0.894775390625, -0.7740478515625, -0.6533203125, -0.5325927734375, -0.411865234375, -0.2911376953125, -0.17041015625, -0.0496826171875, 0.071044921875, 0.1917724609375, 0.3125, 0.4332275390625, 0.553955078125, 0.6746826171875, 0.79541015625, 0.9161376953125, 1.036865234375, 1.1575927734375, 1.2783203125, 1.3990478515625, 1.519775390625, 1.6405029296875, 1.76123046875, 1.8819580078125, 2.002685546875, 2.1234130859375, 2.244140625, 2.3648681640625, 2.485595703125, 2.6063232421875, 2.72705078125, 2.8477783203125, 2.968505859375, 3.0892333984375, 3.2099609375, 3.3306884765625, 3.451416015625, 3.5721435546875, 3.69287109375, 3.8135986328125, 3.934326171875, 4.0550537109375, 4.17578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 9.0, 8.0, 16.0, 17.0, 27.0, 24.0, 44.0, 43.0, 71.0, 95.0, 155.0, 229.0, 326.0, 483.0, 537.0, 574.0, 442.0, 309.0, 211.0, 131.0, 95.0, 57.0, 43.0, 30.0, 24.0, 16.0, 17.0, 8.0, 10.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.26171875, -2.188629150390625, -2.11553955078125, -2.042449951171875, -1.9693603515625, -1.896270751953125, -1.82318115234375, -1.750091552734375, -1.677001953125, -1.603912353515625, -1.53082275390625, -1.457733154296875, -1.3846435546875, -1.311553955078125, -1.23846435546875, -1.165374755859375, -1.09228515625, -1.019195556640625, -0.94610595703125, -0.873016357421875, -0.7999267578125, -0.726837158203125, -0.65374755859375, -0.580657958984375, -0.507568359375, -0.434478759765625, -0.36138916015625, -0.288299560546875, -0.2152099609375, -0.142120361328125, -0.06903076171875, 0.004058837890625, 0.0771484375, 0.150238037109375, 0.22332763671875, 0.296417236328125, 0.3695068359375, 0.442596435546875, 0.51568603515625, 0.588775634765625, 0.661865234375, 0.734954833984375, 0.80804443359375, 0.881134033203125, 0.9542236328125, 1.027313232421875, 1.10040283203125, 1.173492431640625, 1.24658203125, 1.319671630859375, 1.39276123046875, 1.465850830078125, 1.5389404296875, 1.612030029296875, 1.68511962890625, 1.758209228515625, 1.831298828125, 1.904388427734375, 1.97747802734375, 2.050567626953125, 2.1236572265625, 2.196746826171875, 2.26983642578125, 2.342926025390625, 2.416015625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 1.0, 5.0, 6.0, 27.0, 58.0, 109.0, 195.0, 238.0, 182.0, 110.0, 37.0, 11.0, 11.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.34957504272461, -17.300260543823242, -16.250946044921875, -15.20163345336914, -14.152318954467773, -13.103004455566406, -12.053690910339355, -11.004377365112305, -9.955062866210938, -8.90574836730957, -7.8564348220825195, -6.8071208000183105, -5.757806777954102, -4.708492755889893, -3.6591787338256836, -2.6098647117614746, -1.5605506896972656, -0.5112366676330566, 0.5380773544311523, 1.5873913764953613, 2.6367053985595703, 3.6860194206237793, 4.735333442687988, 5.784647464752197, 6.833961486816406, 7.883275508880615, 8.932589530944824, 9.981903076171875, 11.031217575073242, 12.08053207397461, 13.12984561920166, 14.179159164428711, 15.228477478027344, 16.27779197692871, 17.327106475830078, 18.376419067382812, 19.42573356628418, 20.475048065185547, 21.52436065673828, 22.57367515563965, 23.622989654541016, 24.672304153442383, 25.72161865234375, 26.770931243896484, 27.82024574279785, 28.86956024169922, 29.918872833251953, 30.96818733215332, 32.01750183105469, 33.06681442260742, 34.11613082885742, 35.165443420410156, 36.214759826660156, 37.26407241821289, 38.313385009765625, 39.362701416015625, 40.41201400756836, 41.461326599121094, 42.510643005371094, 43.55995559692383, 44.60926818847656, 45.65858459472656, 46.7078971862793, 47.7572135925293, 48.80652618408203]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 11.0, 5.0, 11.0, 12.0, 17.0, 20.0, 28.0, 24.0, 29.0, 25.0, 30.0, 16.0, 39.0, 41.0, 48.0, 46.0, 35.0, 27.0, 53.0, 37.0, 34.0, 37.0, 49.0, 47.0, 37.0, 25.0, 42.0, 20.0, 34.0, 14.0, 20.0, 17.0, 20.0, 17.0, 11.0, 4.0, 8.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.1329345703125, -11.789010047912598, -11.445085525512695, -11.101161003112793, -10.75723648071289, -10.413312911987305, -10.069388389587402, -9.7254638671875, -9.381539344787598, -9.037614822387695, -8.693690299987793, -8.34976577758789, -8.005842208862305, -7.661917209625244, -7.3179931640625, -6.974068641662598, -6.630144119262695, -6.286219596862793, -5.942295074462891, -5.5983710289001465, -5.254446506500244, -4.910521984100342, -4.566597938537598, -4.222673416137695, -3.878748893737793, -3.5348243713378906, -3.1909000873565674, -2.846975803375244, -2.503051280975342, -2.1591267585754395, -1.8152024745941162, -1.471278190612793, -1.1273527145385742, -0.7834283113479614, -0.43950390815734863, -0.09557950496673584, 0.24834489822387695, 0.5922693014144897, 0.9361937046051025, 1.2801179885864258, 1.6240425109863281, 1.967966914176941, 2.3118913173675537, 2.655815601348877, 2.9997401237487793, 3.3436646461486816, 3.687588930130005, 4.031513214111328, 4.3754377365112305, 4.719362258911133, 5.063286781311035, 5.407210826873779, 5.751135349273682, 6.095059871673584, 6.438983917236328, 6.7829084396362305, 7.126832962036133, 7.470757484436035, 7.8146820068359375, 8.15860652923584, 8.502531051635742, 8.846454620361328, 9.19037914276123, 9.534303665161133, 9.878228187561035]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 11.0, 7.0, 12.0, 15.0, 13.0, 27.0, 50.0, 84.0, 135.0, 159.0, 288.0, 422.0, 610.0, 1056.0, 1584.0, 2684.0, 4443.0, 7769.0, 14268.0, 26968.0, 52934.0, 110498.0, 225874.0, 280177.0, 160509.0, 75955.0, 37132.0, 19454.0, 10408.0, 5796.0, 3587.0, 2031.0, 1258.0, 820.0, 517.0, 336.0, 204.0, 147.0, 104.0, 73.0, 57.0, 30.0, 20.0, 5.0, 5.0, 3.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0], "bins": [-1.8017578125, -1.750640869140625, -1.69952392578125, -1.648406982421875, -1.5972900390625, -1.546173095703125, -1.49505615234375, -1.443939208984375, -1.392822265625, -1.341705322265625, -1.29058837890625, -1.239471435546875, -1.1883544921875, -1.137237548828125, -1.08612060546875, -1.035003662109375, -0.98388671875, -0.932769775390625, -0.88165283203125, -0.830535888671875, -0.7794189453125, -0.728302001953125, -0.67718505859375, -0.626068115234375, -0.574951171875, -0.523834228515625, -0.47271728515625, -0.421600341796875, -0.3704833984375, -0.319366455078125, -0.26824951171875, -0.217132568359375, -0.166015625, -0.114898681640625, -0.06378173828125, -0.012664794921875, 0.0384521484375, 0.089569091796875, 0.14068603515625, 0.191802978515625, 0.242919921875, 0.294036865234375, 0.34515380859375, 0.396270751953125, 0.4473876953125, 0.498504638671875, 0.54962158203125, 0.600738525390625, 0.65185546875, 0.702972412109375, 0.75408935546875, 0.805206298828125, 0.8563232421875, 0.907440185546875, 0.95855712890625, 1.009674072265625, 1.060791015625, 1.111907958984375, 1.16302490234375, 1.214141845703125, 1.2652587890625, 1.316375732421875, 1.36749267578125, 1.418609619140625, 1.4697265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 4.0, 10.0, 3.0, 6.0, 7.0, 8.0, 8.0, 11.0, 21.0, 13.0, 30.0, 22.0, 26.0, 23.0, 33.0, 38.0, 22.0, 23.0, 42.0, 38.0, 46.0, 52.0, 50.0, 47.0, 36.0, 38.0, 27.0, 44.0, 30.0, 27.0, 22.0, 32.0, 20.0, 20.0, 19.0, 12.0, 12.0, 13.0, 10.0, 7.0, 9.0, 6.0, 4.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.93603515625, -0.9051132202148438, -0.8741912841796875, -0.8432693481445312, -0.812347412109375, -0.7814254760742188, -0.7505035400390625, -0.7195816040039062, -0.68865966796875, -0.6577377319335938, -0.6268157958984375, -0.5958938598632812, -0.564971923828125, -0.5340499877929688, -0.5031280517578125, -0.47220611572265625, -0.4412841796875, -0.41036224365234375, -0.3794403076171875, -0.34851837158203125, -0.317596435546875, -0.28667449951171875, -0.2557525634765625, -0.22483062744140625, -0.19390869140625, -0.16298675537109375, -0.1320648193359375, -0.10114288330078125, -0.070220947265625, -0.03929901123046875, -0.0083770751953125, 0.02254486083984375, 0.053466796875, 0.08438873291015625, 0.1153106689453125, 0.14623260498046875, 0.177154541015625, 0.20807647705078125, 0.2389984130859375, 0.26992034912109375, 0.30084228515625, 0.33176422119140625, 0.3626861572265625, 0.39360809326171875, 0.424530029296875, 0.45545196533203125, 0.4863739013671875, 0.5172958374023438, 0.5482177734375, 0.5791397094726562, 0.6100616455078125, 0.6409835815429688, 0.671905517578125, 0.7028274536132812, 0.7337493896484375, 0.7646713256835938, 0.79559326171875, 0.8265151977539062, 0.8574371337890625, 0.8883590698242188, 0.919281005859375, 0.9502029418945312, 0.9811248779296875, 1.0120468139648438, 1.04296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 4.0, 11.0, 12.0, 11.0, 13.0, 31.0, 33.0, 34.0, 63.0, 61.0, 108.0, 156.0, 212.0, 316.0, 490.0, 857.0, 1684.0, 4142.0, 13515.0, 68983.0, 684425.0, 224801.0, 34384.0, 8044.0, 2886.0, 1265.0, 688.0, 404.0, 271.0, 176.0, 119.0, 101.0, 66.0, 36.0, 46.0, 30.0, 15.0, 21.0, 4.0, 10.0, 6.0, 5.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0], "bins": [-4.1484375, -4.03570556640625, -3.9229736328125, -3.81024169921875, -3.697509765625, -3.58477783203125, -3.4720458984375, -3.35931396484375, -3.24658203125, -3.13385009765625, -3.0211181640625, -2.90838623046875, -2.795654296875, -2.68292236328125, -2.5701904296875, -2.45745849609375, -2.3447265625, -2.23199462890625, -2.1192626953125, -2.00653076171875, -1.893798828125, -1.78106689453125, -1.6683349609375, -1.55560302734375, -1.44287109375, -1.33013916015625, -1.2174072265625, -1.10467529296875, -0.991943359375, -0.87921142578125, -0.7664794921875, -0.65374755859375, -0.541015625, -0.42828369140625, -0.3155517578125, -0.20281982421875, -0.090087890625, 0.02264404296875, 0.1353759765625, 0.24810791015625, 0.36083984375, 0.47357177734375, 0.5863037109375, 0.69903564453125, 0.811767578125, 0.92449951171875, 1.0372314453125, 1.14996337890625, 1.2626953125, 1.37542724609375, 1.4881591796875, 1.60089111328125, 1.713623046875, 1.82635498046875, 1.9390869140625, 2.05181884765625, 2.16455078125, 2.27728271484375, 2.3900146484375, 2.50274658203125, 2.615478515625, 2.72821044921875, 2.8409423828125, 2.95367431640625, 3.06640625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 9.0, 13.0, 11.0, 13.0, 14.0, 23.0, 19.0, 36.0, 36.0, 38.0, 52.0, 60.0, 73.0, 77.0, 73.0, 61.0, 64.0, 66.0, 52.0, 36.0, 39.0, 32.0, 23.0, 21.0, 11.0, 15.0, 8.0, 7.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.95703125, -5.783447265625, -5.60986328125, -5.436279296875, -5.2626953125, -5.089111328125, -4.91552734375, -4.741943359375, -4.568359375, -4.394775390625, -4.22119140625, -4.047607421875, -3.8740234375, -3.700439453125, -3.52685546875, -3.353271484375, -3.1796875, -3.006103515625, -2.83251953125, -2.658935546875, -2.4853515625, -2.311767578125, -2.13818359375, -1.964599609375, -1.791015625, -1.617431640625, -1.44384765625, -1.270263671875, -1.0966796875, -0.923095703125, -0.74951171875, -0.575927734375, -0.40234375, -0.228759765625, -0.05517578125, 0.118408203125, 0.2919921875, 0.465576171875, 0.63916015625, 0.812744140625, 0.986328125, 1.159912109375, 1.33349609375, 1.507080078125, 1.6806640625, 1.854248046875, 2.02783203125, 2.201416015625, 2.375, 2.548583984375, 2.72216796875, 2.895751953125, 3.0693359375, 3.242919921875, 3.41650390625, 3.590087890625, 3.763671875, 3.937255859375, 4.11083984375, 4.284423828125, 4.4580078125, 4.631591796875, 4.80517578125, 4.978759765625, 5.15234375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 11.0, 14.0, 21.0, 32.0, 40.0, 43.0, 77.0, 114.0, 209.0, 293.0, 616.0, 1152.0, 2633.0, 7276.0, 24870.0, 100615.0, 666028.0, 183734.0, 42228.0, 11495.0, 3657.0, 1557.0, 752.0, 418.0, 222.0, 130.0, 109.0, 51.0, 44.0, 22.0, 19.0, 13.0, 12.0, 10.0, 7.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6064453125, -0.5845489501953125, -0.562652587890625, -0.5407562255859375, -0.51885986328125, -0.4969635009765625, -0.475067138671875, -0.4531707763671875, -0.4312744140625, -0.4093780517578125, -0.387481689453125, -0.3655853271484375, -0.34368896484375, -0.3217926025390625, -0.299896240234375, -0.2779998779296875, -0.256103515625, -0.2342071533203125, -0.212310791015625, -0.1904144287109375, -0.16851806640625, -0.1466217041015625, -0.124725341796875, -0.1028289794921875, -0.0809326171875, -0.0590362548828125, -0.037139892578125, -0.0152435302734375, 0.00665283203125, 0.0285491943359375, 0.050445556640625, 0.0723419189453125, 0.09423828125, 0.1161346435546875, 0.138031005859375, 0.1599273681640625, 0.18182373046875, 0.2037200927734375, 0.225616455078125, 0.2475128173828125, 0.2694091796875, 0.2913055419921875, 0.313201904296875, 0.3350982666015625, 0.35699462890625, 0.3788909912109375, 0.400787353515625, 0.4226837158203125, 0.444580078125, 0.4664764404296875, 0.488372802734375, 0.5102691650390625, 0.53216552734375, 0.5540618896484375, 0.575958251953125, 0.5978546142578125, 0.6197509765625, 0.6416473388671875, 0.663543701171875, 0.6854400634765625, 0.70733642578125, 0.7292327880859375, 0.751129150390625, 0.7730255126953125, 0.794921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 8.0, 13.0, 19.0, 28.0, 35.0, 39.0, 59.0, 72.0, 100.0, 129.0, 117.0, 108.0, 75.0, 50.0, 37.0, 33.0, 23.0, 15.0, 7.0, 6.0, 6.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027680397033691406, -0.0002661310136318207, -0.0002554580569267273, -0.0002447851002216339, -0.00023411214351654053, -0.00022343918681144714, -0.00021276623010635376, -0.00020209327340126038, -0.000191420316696167, -0.0001807473599910736, -0.00017007440328598022, -0.00015940144658088684, -0.00014872848987579346, -0.00013805553317070007, -0.0001273825764656067, -0.0001167096197605133, -0.00010603666305541992, -9.536370635032654e-05, -8.469074964523315e-05, -7.401779294013977e-05, -6.334483623504639e-05, -5.2671879529953e-05, -4.199892282485962e-05, -3.1325966119766235e-05, -2.065300941467285e-05, -9.980052709579468e-06, 6.92903995513916e-07, 1.13658607006073e-05, 2.2038817405700684e-05, 3.271177411079407e-05, 4.338473081588745e-05, 5.4057687520980835e-05, 6.473064422607422e-05, 7.54036009311676e-05, 8.607655763626099e-05, 9.674951434135437e-05, 0.00010742247104644775, 0.00011809542775154114, 0.00012876838445663452, 0.0001394413411617279, 0.0001501142978668213, 0.00016078725457191467, 0.00017146021127700806, 0.00018213316798210144, 0.00019280612468719482, 0.0002034790813922882, 0.0002141520380973816, 0.00022482499480247498, 0.00023549795150756836, 0.00024617090821266174, 0.0002568438649177551, 0.0002675168216228485, 0.0002781897783279419, 0.0002888627350330353, 0.00029953569173812866, 0.00031020864844322205, 0.00032088160514831543, 0.0003315545618534088, 0.0003422275185585022, 0.0003529004752635956, 0.00036357343196868896, 0.00037424638867378235, 0.00038491934537887573, 0.0003955923020839691, 0.0004062652587890625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 10.0, 15.0, 12.0, 29.0, 26.0, 43.0, 54.0, 99.0, 153.0, 256.0, 453.0, 944.0, 2116.0, 6334.0, 26309.0, 160875.0, 725179.0, 99818.0, 17563.0, 4734.0, 1693.0, 806.0, 391.0, 212.0, 133.0, 97.0, 45.0, 36.0, 26.0, 27.0, 11.0, 11.0, 8.0, 8.0, 6.0, 7.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.82080078125, -0.7946395874023438, -0.7684783935546875, -0.7423171997070312, -0.716156005859375, -0.6899948120117188, -0.6638336181640625, -0.6376724243164062, -0.61151123046875, -0.5853500366210938, -0.5591888427734375, -0.5330276489257812, -0.506866455078125, -0.48070526123046875, -0.4545440673828125, -0.42838287353515625, -0.4022216796875, -0.37606048583984375, -0.3498992919921875, -0.32373809814453125, -0.297576904296875, -0.27141571044921875, -0.2452545166015625, -0.21909332275390625, -0.19293212890625, -0.16677093505859375, -0.1406097412109375, -0.11444854736328125, -0.088287353515625, -0.06212615966796875, -0.0359649658203125, -0.00980377197265625, 0.016357421875, 0.04251861572265625, 0.0686798095703125, 0.09484100341796875, 0.121002197265625, 0.14716339111328125, 0.1733245849609375, 0.19948577880859375, 0.22564697265625, 0.25180816650390625, 0.2779693603515625, 0.30413055419921875, 0.330291748046875, 0.35645294189453125, 0.3826141357421875, 0.40877532958984375, 0.4349365234375, 0.46109771728515625, 0.4872589111328125, 0.5134201049804688, 0.539581298828125, 0.5657424926757812, 0.5919036865234375, 0.6180648803710938, 0.64422607421875, 0.6703872680664062, 0.6965484619140625, 0.7227096557617188, 0.748870849609375, 0.7750320434570312, 0.8011932373046875, 0.8273544311523438, 0.853515625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 6.0, 5.0, 8.0, 15.0, 7.0, 20.0, 19.0, 22.0, 16.0, 37.0, 55.0, 51.0, 60.0, 71.0, 54.0, 74.0, 59.0, 63.0, 74.0, 57.0, 42.0, 34.0, 36.0, 19.0, 21.0, 16.0, 9.0, 11.0, 10.0, 4.0, 7.0, 7.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59130859375, -0.5698623657226562, -0.5484161376953125, -0.5269699096679688, -0.505523681640625, -0.48407745361328125, -0.4626312255859375, -0.44118499755859375, -0.41973876953125, -0.39829254150390625, -0.3768463134765625, -0.35540008544921875, -0.333953857421875, -0.31250762939453125, -0.2910614013671875, -0.26961517333984375, -0.2481689453125, -0.22672271728515625, -0.2052764892578125, -0.18383026123046875, -0.162384033203125, -0.14093780517578125, -0.1194915771484375, -0.09804534912109375, -0.07659912109375, -0.05515289306640625, -0.0337066650390625, -0.01226043701171875, 0.009185791015625, 0.03063201904296875, 0.0520782470703125, 0.07352447509765625, 0.094970703125, 0.11641693115234375, 0.1378631591796875, 0.15930938720703125, 0.180755615234375, 0.20220184326171875, 0.2236480712890625, 0.24509429931640625, 0.26654052734375, 0.28798675537109375, 0.3094329833984375, 0.33087921142578125, 0.352325439453125, 0.37377166748046875, 0.3952178955078125, 0.41666412353515625, 0.4381103515625, 0.45955657958984375, 0.4810028076171875, 0.5024490356445312, 0.523895263671875, 0.5453414916992188, 0.5667877197265625, 0.5882339477539062, 0.60968017578125, 0.6311264038085938, 0.6525726318359375, 0.6740188598632812, 0.695465087890625, 0.7169113159179688, 0.7383575439453125, 0.7598037719726562, 0.78125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 16.0, 18.0, 56.0, 117.0, 362.0, 223.0, 101.0, 50.0, 19.0, 16.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.81583786010742, -43.74491882324219, -42.67399597167969, -41.60307693481445, -40.53215789794922, -39.46123504638672, -38.390316009521484, -37.31939697265625, -36.24847412109375, -35.177555084228516, -34.106632232666016, -33.03571319580078, -31.964794158935547, -30.89387321472168, -29.822952270507812, -28.752033233642578, -27.681114196777344, -26.610193252563477, -25.539274215698242, -24.468353271484375, -23.39743423461914, -22.326513290405273, -21.255592346191406, -20.184673309326172, -19.113752365112305, -18.042831420898438, -16.971912384033203, -15.900991439819336, -14.830071449279785, -13.759151458740234, -12.688230514526367, -11.617310523986816, -10.546388626098633, -9.475468635559082, -8.404548645019531, -7.333627700805664, -6.262707710266113, -5.1917877197265625, -4.1208672523498535, -3.0499467849731445, -1.9790267944335938, -0.9081065654754639, 0.16281366348266602, 1.233733892440796, 2.304654121398926, 3.3755741119384766, 4.4464945793151855, 5.5174150466918945, 6.588335037231445, 7.659255027770996, 8.730175018310547, 9.801095962524414, 10.872015953063965, 11.942935943603516, 13.013856887817383, 14.084776878356934, 15.155696868896484, 16.22661781311035, 17.297536849975586, 18.368457794189453, 19.439376831054688, 20.510297775268555, 21.581218719482422, 22.652137756347656, 23.723058700561523]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 5.0, 0.0, 6.0, 6.0, 6.0, 8.0, 7.0, 8.0, 10.0, 9.0, 16.0, 12.0, 26.0, 21.0, 29.0, 23.0, 27.0, 27.0, 36.0, 97.0, 178.0, 86.0, 44.0, 30.0, 36.0, 17.0, 38.0, 24.0, 19.0, 25.0, 21.0, 19.0, 13.0, 11.0, 10.0, 11.0, 9.0, 5.0, 10.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-18.386028289794922, -17.867717742919922, -17.349407196044922, -16.831098556518555, -16.312788009643555, -15.794477462768555, -15.276167869567871, -14.757858276367188, -14.239547729492188, -13.721237182617188, -13.202927589416504, -12.68461799621582, -12.16630744934082, -11.64799690246582, -11.129687309265137, -10.611377716064453, -10.093067169189453, -9.574756622314453, -9.05644702911377, -8.538137435913086, -8.019826889038086, -7.501516819000244, -6.983206748962402, -6.4648966789245605, -5.946586608886719, -5.428276538848877, -4.909966468811035, -4.391656398773193, -3.8733463287353516, -3.3550362586975098, -2.836726188659668, -2.318416118621826, -1.8001060485839844, -1.2817959785461426, -0.7634859085083008, -0.24517583847045898, 0.2731342315673828, 0.7914443016052246, 1.3097543716430664, 1.8280644416809082, 2.34637451171875, 2.864684581756592, 3.3829946517944336, 3.9013047218322754, 4.419614791870117, 4.937924861907959, 5.456234931945801, 5.974545001983643, 6.492855072021484, 7.011165142059326, 7.529475212097168, 8.047784805297852, 8.566095352172852, 9.084405899047852, 9.602715492248535, 10.121025085449219, 10.639335632324219, 11.157646179199219, 11.675955772399902, 12.194265365600586, 12.712575912475586, 13.230886459350586, 13.74919605255127, 14.267505645751953, 14.785816192626953]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 13.0, 16.0, 20.0, 25.0, 53.0, 55.0, 111.0, 176.0, 240.0, 347.0, 545.0, 890.0, 1519.0, 2787.0, 5194.0, 11384.0, 29011.0, 88355.0, 283939.0, 835597.0, 1530565.0, 927123.0, 321501.0, 97700.0, 32116.0, 12242.0, 5642.0, 2848.0, 1609.0, 939.0, 605.0, 379.0, 234.0, 145.0, 118.0, 75.0, 36.0, 42.0, 26.0, 15.0, 4.0, 9.0, 10.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1953125, -1.15618896484375, -1.1170654296875, -1.07794189453125, -1.038818359375, -0.99969482421875, -0.9605712890625, -0.92144775390625, -0.88232421875, -0.84320068359375, -0.8040771484375, -0.76495361328125, -0.725830078125, -0.68670654296875, -0.6475830078125, -0.60845947265625, -0.5693359375, -0.53021240234375, -0.4910888671875, -0.45196533203125, -0.412841796875, -0.37371826171875, -0.3345947265625, -0.29547119140625, -0.25634765625, -0.21722412109375, -0.1781005859375, -0.13897705078125, -0.099853515625, -0.06072998046875, -0.0216064453125, 0.01751708984375, 0.056640625, 0.09576416015625, 0.1348876953125, 0.17401123046875, 0.213134765625, 0.25225830078125, 0.2913818359375, 0.33050537109375, 0.36962890625, 0.40875244140625, 0.4478759765625, 0.48699951171875, 0.526123046875, 0.56524658203125, 0.6043701171875, 0.64349365234375, 0.6826171875, 0.72174072265625, 0.7608642578125, 0.79998779296875, 0.839111328125, 0.87823486328125, 0.9173583984375, 0.95648193359375, 0.99560546875, 1.03472900390625, 1.0738525390625, 1.11297607421875, 1.152099609375, 1.19122314453125, 1.2303466796875, 1.26947021484375, 1.30859375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 7.0, 6.0, 16.0, 11.0, 10.0, 13.0, 18.0, 21.0, 18.0, 21.0, 48.0, 37.0, 35.0, 46.0, 49.0, 60.0, 59.0, 43.0, 52.0, 44.0, 40.0, 30.0, 24.0, 34.0, 37.0, 36.0, 17.0, 31.0, 26.0, 12.0, 21.0, 15.0, 9.0, 11.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.0224609375, -0.9902801513671875, -0.958099365234375, -0.9259185791015625, -0.89373779296875, -0.8615570068359375, -0.829376220703125, -0.7971954345703125, -0.7650146484375, -0.7328338623046875, -0.700653076171875, -0.6684722900390625, -0.63629150390625, -0.6041107177734375, -0.571929931640625, -0.5397491455078125, -0.507568359375, -0.4753875732421875, -0.443206787109375, -0.4110260009765625, -0.37884521484375, -0.3466644287109375, -0.314483642578125, -0.2823028564453125, -0.2501220703125, -0.2179412841796875, -0.185760498046875, -0.1535797119140625, -0.12139892578125, -0.0892181396484375, -0.057037353515625, -0.0248565673828125, 0.00732421875, 0.0395050048828125, 0.071685791015625, 0.1038665771484375, 0.13604736328125, 0.1682281494140625, 0.200408935546875, 0.2325897216796875, 0.2647705078125, 0.2969512939453125, 0.329132080078125, 0.3613128662109375, 0.39349365234375, 0.4256744384765625, 0.457855224609375, 0.4900360107421875, 0.522216796875, 0.5543975830078125, 0.586578369140625, 0.6187591552734375, 0.65093994140625, 0.6831207275390625, 0.715301513671875, 0.7474822998046875, 0.7796630859375, 0.8118438720703125, 0.844024658203125, 0.8762054443359375, 0.90838623046875, 0.9405670166015625, 0.972747802734375, 1.0049285888671875, 1.037109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 4.0, 5.0, 6.0, 22.0, 24.0, 52.0, 67.0, 121.0, 256.0, 483.0, 1132.0, 3280.0, 23887.0, 3600322.0, 551327.0, 9640.0, 2082.0, 766.0, 367.0, 178.0, 96.0, 67.0, 34.0, 21.0, 13.0, 9.0, 10.0, 2.0, 9.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.3160400390625, -6.089111328125, -5.8621826171875, -5.63525390625, -5.4083251953125, -5.181396484375, -4.9544677734375, -4.7275390625, -4.5006103515625, -4.273681640625, -4.0467529296875, -3.81982421875, -3.5928955078125, -3.365966796875, -3.1390380859375, -2.912109375, -2.6851806640625, -2.458251953125, -2.2313232421875, -2.00439453125, -1.7774658203125, -1.550537109375, -1.3236083984375, -1.0966796875, -0.8697509765625, -0.642822265625, -0.4158935546875, -0.18896484375, 0.0379638671875, 0.264892578125, 0.4918212890625, 0.71875, 0.9456787109375, 1.172607421875, 1.3995361328125, 1.62646484375, 1.8533935546875, 2.080322265625, 2.3072509765625, 2.5341796875, 2.7611083984375, 2.988037109375, 3.2149658203125, 3.44189453125, 3.6688232421875, 3.895751953125, 4.1226806640625, 4.349609375, 4.5765380859375, 4.803466796875, 5.0303955078125, 5.25732421875, 5.4842529296875, 5.711181640625, 5.9381103515625, 6.1650390625, 6.3919677734375, 6.618896484375, 6.8458251953125, 7.07275390625, 7.2996826171875, 7.526611328125, 7.7535400390625, 7.98046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 6.0, 3.0, 10.0, 13.0, 19.0, 39.0, 42.0, 85.0, 122.0, 148.0, 242.0, 352.0, 501.0, 656.0, 622.0, 408.0, 310.0, 176.0, 117.0, 72.0, 50.0, 27.0, 16.0, 8.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.046875, -4.916473388671875, -4.78607177734375, -4.655670166015625, -4.5252685546875, -4.394866943359375, -4.26446533203125, -4.134063720703125, -4.003662109375, -3.873260498046875, -3.74285888671875, -3.612457275390625, -3.4820556640625, -3.351654052734375, -3.22125244140625, -3.090850830078125, -2.96044921875, -2.830047607421875, -2.69964599609375, -2.569244384765625, -2.4388427734375, -2.308441162109375, -2.17803955078125, -2.047637939453125, -1.917236328125, -1.786834716796875, -1.65643310546875, -1.526031494140625, -1.3956298828125, -1.265228271484375, -1.13482666015625, -1.004425048828125, -0.8740234375, -0.743621826171875, -0.61322021484375, -0.482818603515625, -0.3524169921875, -0.222015380859375, -0.09161376953125, 0.038787841796875, 0.169189453125, 0.299591064453125, 0.42999267578125, 0.560394287109375, 0.6907958984375, 0.821197509765625, 0.95159912109375, 1.082000732421875, 1.21240234375, 1.342803955078125, 1.47320556640625, 1.603607177734375, 1.7340087890625, 1.864410400390625, 1.99481201171875, 2.125213623046875, 2.255615234375, 2.386016845703125, 2.51641845703125, 2.646820068359375, 2.7772216796875, 2.907623291015625, 3.03802490234375, 3.168426513671875, 3.298828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 11.0, 13.0, 30.0, 66.0, 115.0, 216.0, 230.0, 144.0, 82.0, 39.0, 20.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-76.03483581542969, -74.31876373291016, -72.6026840209961, -70.88661193847656, -69.17053985595703, -67.45446014404297, -65.73838806152344, -64.0223159790039, -62.30624008178711, -60.59016418457031, -58.87409210205078, -57.158016204833984, -55.44194030761719, -53.725868225097656, -52.00979232788086, -50.29371643066406, -48.57764434814453, -46.861568450927734, -45.1454963684082, -43.429420471191406, -41.71334457397461, -39.99727249145508, -38.28119659423828, -36.56512451171875, -34.84904479980469, -33.13296890258789, -31.416894912719727, -29.700820922851562, -27.9847469329834, -26.268672943115234, -24.552597045898438, -22.836523056030273, -21.12044906616211, -19.404375076293945, -17.68829917907715, -15.972225189208984, -14.25615119934082, -12.54007625579834, -10.82400131225586, -9.107927322387695, -7.391852378845215, -5.675777912139893, -3.959703207015991, -2.24362850189209, -0.5275540351867676, 1.1885204315185547, 2.904595375061035, 4.620669364929199, 6.33674430847168, 8.05281925201416, 9.768893241882324, 11.484968185424805, 13.201042175292969, 14.91711711883545, 16.63319206237793, 18.349266052246094, 20.06534194946289, 21.781415939331055, 23.49749183654785, 25.213565826416016, 26.92963981628418, 28.645713806152344, 30.36178970336914, 32.07786560058594, 33.79393768310547]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 5.0, 2.0, 7.0, 3.0, 10.0, 7.0, 11.0, 10.0, 15.0, 16.0, 31.0, 33.0, 25.0, 35.0, 26.0, 38.0, 45.0, 63.0, 61.0, 59.0, 52.0, 54.0, 52.0, 52.0, 49.0, 36.0, 31.0, 42.0, 25.0, 20.0, 24.0, 14.0, 12.0, 10.0, 9.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.1195068359375, -21.467880249023438, -20.816253662109375, -20.164628982543945, -19.513002395629883, -18.86137580871582, -18.20975112915039, -17.558124542236328, -16.906497955322266, -16.254871368408203, -15.603245735168457, -14.951620101928711, -14.299993515014648, -13.648366928100586, -12.99674129486084, -12.345115661621094, -11.693489074707031, -11.041862487792969, -10.390236854553223, -9.738611221313477, -9.086984634399414, -8.435358047485352, -7.7837324142456055, -7.132106304168701, -6.480480194091797, -5.828854084014893, -5.177227973937988, -4.525601863861084, -3.8739757537841797, -3.2223496437072754, -2.570723533630371, -1.9190974235534668, -1.2674713134765625, -0.6158452033996582, 0.035780906677246094, 0.6874070167541504, 1.3390331268310547, 1.990659236907959, 2.6422853469848633, 3.2939114570617676, 3.945537567138672, 4.597163677215576, 5.2487897872924805, 5.900415897369385, 6.552042007446289, 7.203668117523193, 7.855294227600098, 8.506919860839844, 9.158546447753906, 9.810173034667969, 10.461798667907715, 11.113424301147461, 11.765050888061523, 12.416677474975586, 13.068303108215332, 13.719928741455078, 14.37155532836914, 15.023181915283203, 15.67480754852295, 16.326433181762695, 16.978059768676758, 17.62968635559082, 18.28131103515625, 18.932937622070312, 19.584564208984375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 9.0, 1.0, 7.0, 16.0, 30.0, 33.0, 49.0, 77.0, 111.0, 215.0, 340.0, 584.0, 970.0, 1694.0, 3114.0, 5913.0, 12459.0, 28790.0, 74236.0, 239478.0, 474323.0, 124469.0, 45085.0, 18604.0, 8444.0, 4085.0, 2311.0, 1235.0, 740.0, 429.0, 258.0, 153.0, 114.0, 66.0, 34.0, 28.0, 19.0, 17.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.22265625, -2.1595916748046875, -2.096527099609375, -2.0334625244140625, -1.97039794921875, -1.9073333740234375, -1.844268798828125, -1.7812042236328125, -1.7181396484375, -1.6550750732421875, -1.592010498046875, -1.5289459228515625, -1.46588134765625, -1.4028167724609375, -1.339752197265625, -1.2766876220703125, -1.213623046875, -1.1505584716796875, -1.087493896484375, -1.0244293212890625, -0.96136474609375, -0.8983001708984375, -0.835235595703125, -0.7721710205078125, -0.7091064453125, -0.6460418701171875, -0.582977294921875, -0.5199127197265625, -0.45684814453125, -0.3937835693359375, -0.330718994140625, -0.2676544189453125, -0.20458984375, -0.1415252685546875, -0.078460693359375, -0.0153961181640625, 0.04766845703125, 0.1107330322265625, 0.173797607421875, 0.2368621826171875, 0.2999267578125, 0.3629913330078125, 0.426055908203125, 0.4891204833984375, 0.55218505859375, 0.6152496337890625, 0.678314208984375, 0.7413787841796875, 0.804443359375, 0.8675079345703125, 0.930572509765625, 0.9936370849609375, 1.05670166015625, 1.1197662353515625, 1.182830810546875, 1.2458953857421875, 1.3089599609375, 1.3720245361328125, 1.435089111328125, 1.4981536865234375, 1.56121826171875, 1.6242828369140625, 1.687347412109375, 1.7504119873046875, 1.8134765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 11.0, 5.0, 6.0, 9.0, 15.0, 19.0, 5.0, 19.0, 21.0, 27.0, 23.0, 26.0, 31.0, 39.0, 38.0, 58.0, 38.0, 54.0, 51.0, 48.0, 50.0, 48.0, 45.0, 44.0, 37.0, 34.0, 33.0, 33.0, 27.0, 13.0, 17.0, 12.0, 8.0, 15.0, 10.0, 7.0, 5.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3623046875, -1.3222808837890625, -1.282257080078125, -1.2422332763671875, -1.20220947265625, -1.1621856689453125, -1.122161865234375, -1.0821380615234375, -1.0421142578125, -1.0020904541015625, -0.962066650390625, -0.9220428466796875, -0.88201904296875, -0.8419952392578125, -0.801971435546875, -0.7619476318359375, -0.721923828125, -0.6819000244140625, -0.641876220703125, -0.6018524169921875, -0.56182861328125, -0.5218048095703125, -0.481781005859375, -0.4417572021484375, -0.4017333984375, -0.3617095947265625, -0.321685791015625, -0.2816619873046875, -0.24163818359375, -0.2016143798828125, -0.161590576171875, -0.1215667724609375, -0.08154296875, -0.0415191650390625, -0.001495361328125, 0.0385284423828125, 0.07855224609375, 0.1185760498046875, 0.158599853515625, 0.1986236572265625, 0.2386474609375, 0.2786712646484375, 0.318695068359375, 0.3587188720703125, 0.39874267578125, 0.4387664794921875, 0.478790283203125, 0.5188140869140625, 0.558837890625, 0.5988616943359375, 0.638885498046875, 0.6789093017578125, 0.71893310546875, 0.7589569091796875, 0.798980712890625, 0.8390045166015625, 0.8790283203125, 0.9190521240234375, 0.959075927734375, 0.9990997314453125, 1.03912353515625, 1.0791473388671875, 1.119171142578125, 1.1591949462890625, 1.19921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 11.0, 23.0, 18.0, 12.0, 21.0, 45.0, 63.0, 94.0, 135.0, 253.0, 394.0, 774.0, 1854.0, 5520.0, 26653.0, 593985.0, 383695.0, 25842.0, 5566.0, 1860.0, 714.0, 374.0, 240.0, 119.0, 68.0, 57.0, 48.0, 31.0, 17.0, 18.0, 9.0, 6.0, 4.0, 2.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.884765625, -3.76702880859375, -3.6492919921875, -3.53155517578125, -3.413818359375, -3.29608154296875, -3.1783447265625, -3.06060791015625, -2.94287109375, -2.82513427734375, -2.7073974609375, -2.58966064453125, -2.471923828125, -2.35418701171875, -2.2364501953125, -2.11871337890625, -2.0009765625, -1.88323974609375, -1.7655029296875, -1.64776611328125, -1.530029296875, -1.41229248046875, -1.2945556640625, -1.17681884765625, -1.05908203125, -0.94134521484375, -0.8236083984375, -0.70587158203125, -0.588134765625, -0.47039794921875, -0.3526611328125, -0.23492431640625, -0.1171875, 0.00054931640625, 0.1182861328125, 0.23602294921875, 0.353759765625, 0.47149658203125, 0.5892333984375, 0.70697021484375, 0.82470703125, 0.94244384765625, 1.0601806640625, 1.17791748046875, 1.295654296875, 1.41339111328125, 1.5311279296875, 1.64886474609375, 1.7666015625, 1.88433837890625, 2.0020751953125, 2.11981201171875, 2.237548828125, 2.35528564453125, 2.4730224609375, 2.59075927734375, 2.70849609375, 2.82623291015625, 2.9439697265625, 3.06170654296875, 3.179443359375, 3.29718017578125, 3.4149169921875, 3.53265380859375, 3.650390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 4.0, 9.0, 8.0, 10.0, 10.0, 13.0, 19.0, 20.0, 26.0, 28.0, 37.0, 29.0, 58.0, 56.0, 74.0, 86.0, 77.0, 74.0, 68.0, 56.0, 37.0, 34.0, 22.0, 20.0, 25.0, 11.0, 11.0, 9.0, 17.0, 13.0, 6.0, 6.0, 9.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6796875, -5.5029296875, -5.326171875, -5.1494140625, -4.97265625, -4.7958984375, -4.619140625, -4.4423828125, -4.265625, -4.0888671875, -3.912109375, -3.7353515625, -3.55859375, -3.3818359375, -3.205078125, -3.0283203125, -2.8515625, -2.6748046875, -2.498046875, -2.3212890625, -2.14453125, -1.9677734375, -1.791015625, -1.6142578125, -1.4375, -1.2607421875, -1.083984375, -0.9072265625, -0.73046875, -0.5537109375, -0.376953125, -0.2001953125, -0.0234375, 0.1533203125, 0.330078125, 0.5068359375, 0.68359375, 0.8603515625, 1.037109375, 1.2138671875, 1.390625, 1.5673828125, 1.744140625, 1.9208984375, 2.09765625, 2.2744140625, 2.451171875, 2.6279296875, 2.8046875, 2.9814453125, 3.158203125, 3.3349609375, 3.51171875, 3.6884765625, 3.865234375, 4.0419921875, 4.21875, 4.3955078125, 4.572265625, 4.7490234375, 4.92578125, 5.1025390625, 5.279296875, 5.4560546875, 5.6328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 6.0, 6.0, 7.0, 11.0, 11.0, 12.0, 30.0, 29.0, 31.0, 58.0, 86.0, 128.0, 215.0, 428.0, 864.0, 1871.0, 4669.0, 13846.0, 59549.0, 841393.0, 96217.0, 18551.0, 5956.0, 2352.0, 1046.0, 508.0, 239.0, 139.0, 87.0, 51.0, 39.0, 32.0, 20.0, 14.0, 21.0, 18.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.79150390625, -0.7698898315429688, -0.7482757568359375, -0.7266616821289062, -0.705047607421875, -0.6834335327148438, -0.6618194580078125, -0.6402053833007812, -0.61859130859375, -0.5969772338867188, -0.5753631591796875, -0.5537490844726562, -0.532135009765625, -0.5105209350585938, -0.4889068603515625, -0.46729278564453125, -0.4456787109375, -0.42406463623046875, -0.4024505615234375, -0.38083648681640625, -0.359222412109375, -0.33760833740234375, -0.3159942626953125, -0.29438018798828125, -0.27276611328125, -0.25115203857421875, -0.2295379638671875, -0.20792388916015625, -0.186309814453125, -0.16469573974609375, -0.1430816650390625, -0.12146759033203125, -0.099853515625, -0.07823944091796875, -0.0566253662109375, -0.03501129150390625, -0.013397216796875, 0.00821685791015625, 0.0298309326171875, 0.05144500732421875, 0.07305908203125, 0.09467315673828125, 0.1162872314453125, 0.13790130615234375, 0.159515380859375, 0.18112945556640625, 0.2027435302734375, 0.22435760498046875, 0.2459716796875, 0.26758575439453125, 0.2891998291015625, 0.31081390380859375, 0.332427978515625, 0.35404205322265625, 0.3756561279296875, 0.39727020263671875, 0.41888427734375, 0.44049835205078125, 0.4621124267578125, 0.48372650146484375, 0.505340576171875, 0.5269546508789062, 0.5485687255859375, 0.5701828002929688, 0.591796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 3.0, 5.0, 11.0, 9.0, 18.0, 13.0, 15.0, 27.0, 31.0, 34.0, 47.0, 73.0, 120.0, 120.0, 110.0, 94.0, 69.0, 28.0, 43.0, 26.0, 27.0, 12.0, 7.0, 9.0, 11.0, 7.0, 11.0, 3.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002486705780029297, -0.00024131685495376587, -0.00023396313190460205, -0.00022660940885543823, -0.00021925568580627441, -0.0002119019627571106, -0.00020454823970794678, -0.00019719451665878296, -0.00018984079360961914, -0.00018248707056045532, -0.0001751333475112915, -0.00016777962446212769, -0.00016042590141296387, -0.00015307217836380005, -0.00014571845531463623, -0.0001383647322654724, -0.0001310110092163086, -0.00012365728616714478, -0.00011630356311798096, -0.00010894984006881714, -0.00010159611701965332, -9.42423939704895e-05, -8.688867092132568e-05, -7.953494787216187e-05, -7.218122482299805e-05, -6.482750177383423e-05, -5.747377872467041e-05, -5.012005567550659e-05, -4.2766332626342773e-05, -3.5412609577178955e-05, -2.8058886528015137e-05, -2.070516347885132e-05, -1.33514404296875e-05, -5.997717380523682e-06, 1.3560056686401367e-06, 8.709728717803955e-06, 1.6063451766967773e-05, 2.3417174816131592e-05, 3.077089786529541e-05, 3.812462091445923e-05, 4.547834396362305e-05, 5.2832067012786865e-05, 6.0185790061950684e-05, 6.75395131111145e-05, 7.489323616027832e-05, 8.224695920944214e-05, 8.960068225860596e-05, 9.695440530776978e-05, 0.0001043081283569336, 0.00011166185140609741, 0.00011901557445526123, 0.00012636929750442505, 0.00013372302055358887, 0.00014107674360275269, 0.0001484304666519165, 0.00015578418970108032, 0.00016313791275024414, 0.00017049163579940796, 0.00017784535884857178, 0.0001851990818977356, 0.00019255280494689941, 0.00019990652799606323, 0.00020726025104522705, 0.00021461397409439087, 0.0002219676971435547]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 6.0, 12.0, 11.0, 15.0, 35.0, 35.0, 67.0, 85.0, 131.0, 241.0, 420.0, 795.0, 1702.0, 3906.0, 10603.0, 36027.0, 242603.0, 692884.0, 39414.0, 11563.0, 4323.0, 1700.0, 887.0, 411.0, 240.0, 138.0, 97.0, 54.0, 42.0, 32.0, 16.0, 14.0, 8.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5478515625, -0.5322151184082031, -0.5165786743164062, -0.5009422302246094, -0.4853057861328125, -0.4696693420410156, -0.45403289794921875, -0.4383964538574219, -0.422760009765625, -0.4071235656738281, -0.39148712158203125, -0.3758506774902344, -0.3602142333984375, -0.3445777893066406, -0.32894134521484375, -0.3133049011230469, -0.29766845703125, -0.2820320129394531, -0.26639556884765625, -0.2507591247558594, -0.2351226806640625, -0.21948623657226562, -0.20384979248046875, -0.18821334838867188, -0.172576904296875, -0.15694046020507812, -0.14130401611328125, -0.12566757202148438, -0.1100311279296875, -0.09439468383789062, -0.07875823974609375, -0.06312179565429688, -0.0474853515625, -0.031848907470703125, -0.01621246337890625, -0.000576019287109375, 0.0150604248046875, 0.030696868896484375, 0.04633331298828125, 0.061969757080078125, 0.077606201171875, 0.09324264526367188, 0.10887908935546875, 0.12451553344726562, 0.1401519775390625, 0.15578842163085938, 0.17142486572265625, 0.18706130981445312, 0.20269775390625, 0.21833419799804688, 0.23397064208984375, 0.24960708618164062, 0.2652435302734375, 0.2808799743652344, 0.29651641845703125, 0.3121528625488281, 0.327789306640625, 0.3434257507324219, 0.35906219482421875, 0.3746986389160156, 0.3903350830078125, 0.4059715270996094, 0.42160797119140625, 0.4372444152832031, 0.452880859375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 3.0, 1.0, 10.0, 9.0, 16.0, 14.0, 17.0, 33.0, 30.0, 31.0, 56.0, 82.0, 97.0, 116.0, 100.0, 97.0, 71.0, 43.0, 39.0, 29.0, 15.0, 17.0, 17.0, 6.0, 8.0, 5.0, 9.0, 1.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.72705078125, -0.7056045532226562, -0.6841583251953125, -0.6627120971679688, -0.641265869140625, -0.6198196411132812, -0.5983734130859375, -0.5769271850585938, -0.55548095703125, -0.5340347290039062, -0.5125885009765625, -0.49114227294921875, -0.469696044921875, -0.44824981689453125, -0.4268035888671875, -0.40535736083984375, -0.3839111328125, -0.36246490478515625, -0.3410186767578125, -0.31957244873046875, -0.298126220703125, -0.27667999267578125, -0.2552337646484375, -0.23378753662109375, -0.21234130859375, -0.19089508056640625, -0.1694488525390625, -0.14800262451171875, -0.126556396484375, -0.10511016845703125, -0.0836639404296875, -0.06221771240234375, -0.040771484375, -0.01932525634765625, 0.0021209716796875, 0.02356719970703125, 0.045013427734375, 0.06645965576171875, 0.0879058837890625, 0.10935211181640625, 0.13079833984375, 0.15224456787109375, 0.1736907958984375, 0.19513702392578125, 0.216583251953125, 0.23802947998046875, 0.2594757080078125, 0.28092193603515625, 0.3023681640625, 0.32381439208984375, 0.3452606201171875, 0.36670684814453125, 0.388153076171875, 0.40959930419921875, 0.4310455322265625, 0.45249176025390625, 0.47393798828125, 0.49538421630859375, 0.5168304443359375, 0.5382766723632812, 0.559722900390625, 0.5811691284179688, 0.6026153564453125, 0.6240615844726562, 0.6455078125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 15.0, 32.0, 66.0, 87.0, 510.0, 127.0, 67.0, 42.0, 22.0, 11.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.34033966064453, -40.39403533935547, -39.44772720336914, -38.50142288208008, -37.555118560791016, -36.60881042480469, -35.662506103515625, -34.71620178222656, -33.769893646240234, -32.82358932495117, -31.877283096313477, -30.93097686767578, -29.984670639038086, -29.03836441040039, -28.092060089111328, -27.145753860473633, -26.19944953918457, -25.253143310546875, -24.306838989257812, -23.360532760620117, -22.414226531982422, -21.46792221069336, -20.521615982055664, -19.57530975341797, -18.629005432128906, -17.68269920349121, -16.73639488220215, -15.790088653564453, -14.843782424926758, -13.897477149963379, -12.951171875, -12.004865646362305, -11.05855941772461, -10.11225414276123, -9.165947914123535, -8.219642639160156, -7.273336887359619, -6.327031135559082, -5.380725860595703, -4.434420108795166, -3.488114356994629, -2.541808605194092, -1.5955030918121338, -0.6491975784301758, 0.29710817337036133, 1.2434139251708984, 2.1897192001342773, 3.1360249519348145, 4.082330703735352, 5.028636455535889, 5.974942207336426, 6.921247482299805, 7.867553234100342, 8.813858985900879, 9.760164260864258, 10.706470489501953, 11.652775764465332, 12.599081039428711, 13.545387268066406, 14.491692543029785, 15.437997817993164, 16.38430404663086, 17.330608367919922, 18.276914596557617, 19.223220825195312]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 6.0, 2.0, 3.0, 6.0, 5.0, 12.0, 15.0, 9.0, 18.0, 8.0, 18.0, 18.0, 27.0, 42.0, 28.0, 32.0, 94.0, 325.0, 100.0, 37.0, 29.0, 20.0, 17.0, 16.0, 20.0, 17.0, 10.0, 18.0, 11.0, 9.0, 10.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-18.823379516601562, -18.32134246826172, -17.819303512573242, -17.3172664642334, -16.815227508544922, -16.313190460205078, -15.811152458190918, -15.309114456176758, -14.807076454162598, -14.305038452148438, -13.803000450134277, -13.300962448120117, -12.798925399780273, -12.296886444091797, -11.794849395751953, -11.292811393737793, -10.790773391723633, -10.288735389709473, -9.786697387695312, -9.284659385681152, -8.782621383666992, -8.280584335327148, -7.778546333312988, -7.276508331298828, -6.774470329284668, -6.272432327270508, -5.770394325256348, -5.268356800079346, -4.7663187980651855, -4.264280796051025, -3.7622430324554443, -3.2602052688598633, -2.7581663131713867, -2.2561283111572266, -1.7540905475616455, -1.252052664756775, -0.7500147819519043, -0.24797677993774414, 0.2540609836578369, 0.756098747253418, 1.2581367492675781, 1.7601746320724487, 2.2622125148773193, 2.7642502784729004, 3.2662882804870605, 3.7683262825012207, 4.270363807678223, 4.772401809692383, 5.274439811706543, 5.776477813720703, 6.278515815734863, 6.780553340911865, 7.282591342926025, 7.7846293449401855, 8.286666870117188, 8.788704872131348, 9.290742874145508, 9.792780876159668, 10.294818878173828, 10.796856880187988, 11.298894882202148, 11.800931930541992, 12.302969932556152, 12.805007934570312, 13.307045936584473]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 8.0, 13.0, 7.0, 10.0, 7.0, 9.0, 6.0, 22.0, 12.0, 14.0, 15.0, 24.0, 20.0, 33.0, 41.0, 38.0, 82.0, 184.0, 108.0, 55.0, 28.0, 32.0, 40.0, 23.0, 24.0, 17.0, 14.0, 18.0, 15.0, 9.0, 10.0, 10.0, 10.0, 6.0, 4.0, 5.0, 7.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9736328125, -0.9417266845703125, -0.909820556640625, -0.8779144287109375, -0.84600830078125, -0.8141021728515625, -0.782196044921875, -0.7502899169921875, -0.7183837890625, -0.6864776611328125, -0.654571533203125, -0.6226654052734375, -0.59075927734375, -0.5588531494140625, -0.526947021484375, -0.4950408935546875, -0.463134765625, -0.4312286376953125, -0.399322509765625, -0.3674163818359375, -0.33551025390625, -0.3036041259765625, -0.271697998046875, -0.2397918701171875, -0.2078857421875, -0.1759796142578125, -0.144073486328125, -0.1121673583984375, -0.08026123046875, -0.0483551025390625, -0.016448974609375, 0.0154571533203125, 0.04736328125, 0.0792694091796875, 0.111175537109375, 0.1430816650390625, 0.17498779296875, 0.2068939208984375, 0.238800048828125, 0.2707061767578125, 0.3026123046875, 0.3345184326171875, 0.366424560546875, 0.3983306884765625, 0.43023681640625, 0.4621429443359375, 0.494049072265625, 0.5259552001953125, 0.557861328125, 0.5897674560546875, 0.621673583984375, 0.6535797119140625, 0.68548583984375, 0.7173919677734375, 0.749298095703125, 0.7812042236328125, 0.8131103515625, 0.8450164794921875, 0.876922607421875, 0.9088287353515625, 0.94073486328125, 0.9726409912109375, 1.004547119140625, 1.0364532470703125, 1.068359375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 5.0, 2.0, 0.0, 7.0, 0.0, 8.0, 4.0, 9.0, 6.0, 4.0, 15.0, 21.0, 23.0, 45.0, 90.0, 156.0, 321.0, 1052.0, 4136.0, 39021.0, 8331728.0, 8890.0, 1930.0, 564.0, 220.0, 108.0, 63.0, 23.0, 26.0, 22.0, 26.0, 2.0, 7.0, 9.0, 6.0, 4.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 5.0, 4.0], "bins": [-13.309447288513184, -12.883353233337402, -12.457258224487305, -12.031164169311523, -11.605069160461426, -11.178975105285645, -10.752880096435547, -10.326786041259766, -9.900691032409668, -9.474596977233887, -9.048501968383789, -8.622407913208008, -8.19631290435791, -7.770218849182129, -7.344123840332031, -6.91802978515625, -6.4919352531433105, -6.065840721130371, -5.639746189117432, -5.213651657104492, -4.787557125091553, -4.361462593078613, -3.935368299484253, -3.5092737674713135, -3.083179235458374, -2.6570847034454346, -2.230990171432495, -1.8048957586288452, -1.3788012266159058, -0.9527068138122559, -0.5266122817993164, -0.10051774978637695, 0.3255767822265625, 0.751671314239502, 1.1777658462524414, 1.6038602590560913, 2.0299549102783203, 2.4560492038726807, 2.88214373588562, 3.3082382678985596, 3.734332799911499, 4.160427093505859, 4.586521625518799, 5.012616157531738, 5.438710689544678, 5.864805221557617, 6.290899753570557, 6.716994285583496, 7.1430888175964355, 7.569183349609375, 7.9952778816223145, 8.421372413635254, 8.847466468811035, 9.273561477661133, 9.699655532836914, 10.125750541687012, 10.551844596862793, 10.977938652038574, 11.404033660888672, 11.830127716064453, 12.25622272491455, 12.682316780090332, 13.10841178894043, 13.534505844116211, 13.960600852966309]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 7.0, 5.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 1.0, 6.0, 4.0, 3.0, 6.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.521769523620605, -11.245092391967773, -10.968414306640625, -10.691737174987793, -10.415060043334961, -10.138382911682129, -9.86170482635498, -9.585027694702148, -9.308350563049316, -9.031673431396484, -8.754995346069336, -8.478318214416504, -8.201641082763672, -7.924963474273682, -7.648285865783691, -7.371608734130859, -7.094931125640869, -6.818253517150879, -6.541576385498047, -6.264898777008057, -5.988221645355225, -5.711544036865234, -5.434866905212402, -5.158189296722412, -4.881511688232422, -4.604834079742432, -4.3281569480896, -4.051479339599609, -3.7748022079467773, -3.498124599456787, -3.221447229385376, -2.944769859313965, -2.6680922508239746, -2.3914148807525635, -2.1147375106811523, -1.8380600214004517, -1.5613826513290405, -1.2847052812576294, -1.0080277919769287, -0.7313504219055176, -0.45467305183410645, -0.17799565196037292, 0.0986817479133606, 0.3753591775894165, 0.6520365476608276, 0.9287139177322388, 1.2053914070129395, 1.4820687770843506, 1.7587461471557617, 2.035423517227173, 2.312100887298584, 2.588778495788574, 2.8654556274414062, 3.1421332359313965, 3.4188106060028076, 3.6954879760742188, 3.97216534614563, 4.248842716217041, 4.525520324707031, 4.802197456359863, 5.0788750648498535, 5.3555521965026855, 5.632229804992676, 5.908906936645508, 6.185584545135498]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 1.0, 7.0, 12.0, 20.0, 20.0, 31.0, 46.0, 55.0, 91.0, 148.0, 253.0, 481.0, 949.0, 2207.0, 5936.0, 16898.0, 51651.0, 158694.0, 189592.0, 64860.0, 20375.0, 7079.0, 2688.0, 991.0, 487.0, 248.0, 144.0, 88.0, 62.0, 40.0, 30.0, 23.0, 10.0, 13.0, 11.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-12.6015625, -12.2525634765625, -11.903564453125, -11.5545654296875, -11.20556640625, -10.8565673828125, -10.507568359375, -10.1585693359375, -9.8095703125, -9.4605712890625, -9.111572265625, -8.7625732421875, -8.41357421875, -8.0645751953125, -7.715576171875, -7.3665771484375, -7.017578125, -6.6685791015625, -6.319580078125, -5.9705810546875, -5.62158203125, -5.2725830078125, -4.923583984375, -4.5745849609375, -4.2255859375, -3.8765869140625, -3.527587890625, -3.1785888671875, -2.82958984375, -2.4805908203125, -2.131591796875, -1.7825927734375, -1.43359375, -1.0845947265625, -0.735595703125, -0.3865966796875, -0.03759765625, 0.3114013671875, 0.660400390625, 1.0093994140625, 1.3583984375, 1.7073974609375, 2.056396484375, 2.4053955078125, 2.75439453125, 3.1033935546875, 3.452392578125, 3.8013916015625, 4.150390625, 4.4993896484375, 4.848388671875, 5.1973876953125, 5.54638671875, 5.8953857421875, 6.244384765625, 6.5933837890625, 6.9423828125, 7.2913818359375, 7.640380859375, 7.9893798828125, 8.33837890625, 8.6873779296875, 9.036376953125, 9.3853759765625, 9.734375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 7.0, 6.0, 10.0, 15.0, 12.0, 15.0, 18.0, 21.0, 33.0, 30.0, 48.0, 53.0, 68.0, 72.0, 71.0, 69.0, 60.0, 56.0, 54.0, 59.0, 32.0, 35.0, 33.0, 29.0, 9.0, 12.0, 17.0, 6.0, 8.0, 7.0, 9.0, 5.0, 1.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.818359375, -1.7715301513671875, -1.724700927734375, -1.6778717041015625, -1.63104248046875, -1.5842132568359375, -1.537384033203125, -1.4905548095703125, -1.4437255859375, -1.3968963623046875, -1.350067138671875, -1.3032379150390625, -1.25640869140625, -1.2095794677734375, -1.162750244140625, -1.1159210205078125, -1.069091796875, -1.0222625732421875, -0.975433349609375, -0.9286041259765625, -0.88177490234375, -0.8349456787109375, -0.788116455078125, -0.7412872314453125, -0.6944580078125, -0.6476287841796875, -0.600799560546875, -0.5539703369140625, -0.50714111328125, -0.4603118896484375, -0.413482666015625, -0.3666534423828125, -0.31982421875, -0.2729949951171875, -0.226165771484375, -0.1793365478515625, -0.13250732421875, -0.0856781005859375, -0.038848876953125, 0.0079803466796875, 0.0548095703125, 0.1016387939453125, 0.148468017578125, 0.1952972412109375, 0.24212646484375, 0.2889556884765625, 0.335784912109375, 0.3826141357421875, 0.429443359375, 0.4762725830078125, 0.523101806640625, 0.5699310302734375, 0.61676025390625, 0.6635894775390625, 0.710418701171875, 0.7572479248046875, 0.8040771484375, 0.8509063720703125, 0.897735595703125, 0.9445648193359375, 0.99139404296875, 1.0382232666015625, 1.085052490234375, 1.1318817138671875, 1.1787109375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 8.0, 2.0, 6.0, 11.0, 13.0, 29.0, 49.0, 83.0, 117.0, 75.0, 39.0, 18.0, 7.0, 6.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.193470001220703, -8.796862602233887, -8.400256156921387, -8.00364875793457, -7.607041835784912, -7.210434913635254, -6.813827991485596, -6.4172210693359375, -6.020613670349121, -5.624006748199463, -5.227399826049805, -4.830792427062988, -4.43418550491333, -4.037578582763672, -3.6409716606140137, -3.2443645000457764, -2.8477578163146973, -2.451150894165039, -2.0545437335968018, -1.6579368114471436, -1.2613297700881958, -0.864722728729248, -0.46811580657958984, -0.07150864601135254, 0.32509827613830566, 0.7217053174972534, 1.1183123588562012, 1.5149192810058594, 1.9115263223648071, 2.308133363723755, 2.704740285873413, 3.1013474464416504, 3.4979543685913086, 3.894561290740967, 4.291168212890625, 4.687775611877441, 5.0843825340271, 5.480989456176758, 5.877596378326416, 6.274203300476074, 6.670810699462891, 7.067417621612549, 7.464024543762207, 7.860631942749023, 8.257238388061523, 8.65384578704834, 9.050453186035156, 9.447059631347656, 9.843666076660156, 10.240273475646973, 10.636879920959473, 11.033487319946289, 11.430093765258789, 11.826701164245605, 12.223308563232422, 12.619915008544922, 13.016522407531738, 13.413129806518555, 13.809736251831055, 14.206343650817871, 14.602950096130371, 14.999557495117188, 15.396163940429688, 15.792771339416504, 16.18937873840332]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 2.0, 5.0, 11.0, 10.0, 23.0, 47.0, 64.0, 75.0, 73.0, 59.0, 33.0, 20.0, 9.0, 6.0, 7.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.668726921081543, -6.446429252624512, -6.224132061004639, -6.001834392547607, -5.779537200927734, -5.557239532470703, -5.334941864013672, -5.112644195556641, -4.890347003936768, -4.668049335479736, -4.445752143859863, -4.223454475402832, -4.001156806945801, -3.7788596153259277, -3.5565619468688965, -3.3342645168304443, -3.111967086791992, -2.88966965675354, -2.667372226715088, -2.4450745582580566, -2.2227771282196045, -2.0004796981811523, -1.7781821489334106, -1.555884599685669, -1.3335871696472168, -1.1112897396087646, -0.888992190361023, -0.666694700717926, -0.4443972110748291, -0.22209978103637695, 0.0001977682113647461, 0.22249531745910645, 0.4447932243347168, 0.6670907139778137, 0.8893882036209106, 1.1116857528686523, 1.3339831829071045, 1.5562806129455566, 1.7785781621932983, 2.00087571144104, 2.223173141479492, 2.4454705715179443, 2.6677680015563965, 2.8900656700134277, 3.11236310005188, 3.334660530090332, 3.5569581985473633, 3.7792556285858154, 4.001553058624268, 4.223850727081299, 4.446147918701172, 4.668445587158203, 4.890743255615234, 5.113040447235107, 5.335338115692139, 5.557635307312012, 5.779932975769043, 6.002230644226074, 6.224527835845947, 6.4468255043029785, 6.669122695922852, 6.891420364379883, 7.113718032836914, 7.336015701293945, 7.558312892913818]}, "eval/loss": 4.192998886108398, "eval/wer": 1.903669178897263, "eval/runtime": 786.9912, "eval/samples_per_second": 3.357, "eval/steps_per_second": 0.281, "train/train_runtime": 6714.5583, "train/train_samples_per_second": 4.25, "train/train_steps_per_second": 0.177, "train/total_flos": 0.0, "train/train_loss": 4.242165094268132} \ No newline at end of file +{"train/loss": 4.3516, "train/learning_rate": 1.741654571843251e-07, "train/epoch": 1.0, "train/global_step": 1189, "_runtime": 7937, "_timestamp": 1646130789, "_step": 1192, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 28.0, 680.0, 301.0, 7.0, 1.0], "bins": [-571.5680541992188, -562.168701171875, -552.7693481445312, -543.3699951171875, -533.9706420898438, -524.5712890625, -515.171875, -505.7725524902344, -496.3731689453125, -486.97381591796875, -477.574462890625, -468.1750793457031, -458.7757263183594, -449.3763732910156, -439.9770202636719, -430.5776672363281, -421.1783142089844, -411.7789611816406, -402.3796081542969, -392.980224609375, -383.58087158203125, -374.1815185546875, -364.78216552734375, -355.3828125, -345.98345947265625, -336.5841064453125, -327.18475341796875, -317.7853698730469, -308.3860168457031, -298.9866638183594, -289.5873107910156, -280.1879577636719, -270.78857421875, -261.38922119140625, -251.98985290527344, -242.5904998779297, -233.19113159179688, -223.79177856445312, -214.39242553710938, -204.99307250976562, -195.59368896484375, -186.1943359375, -176.7949676513672, -167.39561462402344, -157.99624633789062, -148.59689331054688, -139.19754028320312, -129.79818725585938, -120.3988265991211, -110.99946594238281, -101.60011291503906, -92.20075225830078, -82.8013916015625, -73.40203094482422, -64.00267028808594, -54.60331726074219, -45.203956604003906, -35.804595947265625, -26.40523910522461, -17.00588035583496, -7.6065216064453125, 1.7928390502929688, 11.192195892333984, 20.591552734375, 29.990915298461914]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 5.0, 3.0, 8.0, 7.0, 9.0, 13.0, 12.0, 15.0, 26.0, 23.0, 30.0, 20.0, 28.0, 43.0, 47.0, 31.0, 42.0, 57.0, 39.0, 53.0, 49.0, 51.0, 40.0, 54.0, 45.0, 24.0, 26.0, 34.0, 19.0, 30.0, 12.0, 17.0, 17.0, 10.0, 11.0, 16.0, 11.0, 7.0, 5.0, 4.0, 0.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.36842346191406, -51.56277847290039, -49.75713348388672, -47.95148849487305, -46.145843505859375, -44.3401985168457, -42.53455352783203, -40.728904724121094, -38.92326354980469, -37.117618560791016, -35.311973571777344, -33.50632858276367, -31.70068359375, -29.895038604736328, -28.089391708374023, -26.28374671936035, -24.478099822998047, -22.672454833984375, -20.866809844970703, -19.06116485595703, -17.25551986694336, -15.449873924255371, -13.644227981567383, -11.838582992553711, -10.032938003540039, -8.227293014526367, -6.421647548675537, -4.616002082824707, -2.810357093811035, -1.0047121047973633, 0.800933837890625, 2.606578826904297, 4.412223815917969, 6.217868804931641, 8.023513793945312, 9.8291597366333, 11.634804725646973, 13.440449714660645, 15.246095657348633, 17.051740646362305, 18.857385635375977, 20.66303062438965, 22.46867561340332, 24.274322509765625, 26.079967498779297, 27.88561248779297, 29.69125747680664, 31.496902465820312, 33.302547454833984, 35.108192443847656, 36.91383743286133, 38.719482421875, 40.52512741088867, 42.330772399902344, 44.13642120361328, 45.94206237792969, 47.747711181640625, 49.5533561706543, 51.35900115966797, 53.16464614868164, 54.97029113769531, 56.775936126708984, 58.581581115722656, 60.387229919433594, 62.19287109375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 10.0, 10.0, 15.0, 17.0, 27.0, 42.0, 51.0, 54.0, 68.0, 81.0, 76.0, 97.0, 91.0, 87.0, 69.0, 55.0, 35.0, 38.0, 23.0, 26.0, 15.0, 9.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.70703125, -7.525390625, -7.34375, -7.162109375, -6.98046875, -6.798828125, -6.6171875, -6.435546875, -6.25390625, -6.072265625, -5.890625, -5.708984375, -5.52734375, -5.345703125, -5.1640625, -4.982421875, -4.80078125, -4.619140625, -4.4375, -4.255859375, -4.07421875, -3.892578125, -3.7109375, -3.529296875, -3.34765625, -3.166015625, -2.984375, -2.802734375, -2.62109375, -2.439453125, -2.2578125, -2.076171875, -1.89453125, -1.712890625, -1.53125, -1.349609375, -1.16796875, -0.986328125, -0.8046875, -0.623046875, -0.44140625, -0.259765625, -0.078125, 0.103515625, 0.28515625, 0.466796875, 0.6484375, 0.830078125, 1.01171875, 1.193359375, 1.375, 1.556640625, 1.73828125, 1.919921875, 2.1015625, 2.283203125, 2.46484375, 2.646484375, 2.828125, 3.009765625, 3.19140625, 3.373046875, 3.5546875, 3.736328125, 3.91796875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 7.0, 11.0, 15.0, 14.0, 26.0, 39.0, 78.0, 114.0, 244.0, 480.0, 1043.0, 2971.0, 12037.0, 112525.0, 3599716.0, 434632.0, 22931.0, 4657.0, 1478.0, 619.0, 279.0, 145.0, 78.0, 56.0, 39.0, 21.0, 15.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.484375, -25.833251953125, -25.18212890625, -24.531005859375, -23.8798828125, -23.228759765625, -22.57763671875, -21.926513671875, -21.275390625, -20.624267578125, -19.97314453125, -19.322021484375, -18.6708984375, -18.019775390625, -17.36865234375, -16.717529296875, -16.06640625, -15.415283203125, -14.76416015625, -14.113037109375, -13.4619140625, -12.810791015625, -12.15966796875, -11.508544921875, -10.857421875, -10.206298828125, -9.55517578125, -8.904052734375, -8.2529296875, -7.601806640625, -6.95068359375, -6.299560546875, -5.6484375, -4.997314453125, -4.34619140625, -3.695068359375, -3.0439453125, -2.392822265625, -1.74169921875, -1.090576171875, -0.439453125, 0.211669921875, 0.86279296875, 1.513916015625, 2.1650390625, 2.816162109375, 3.46728515625, 4.118408203125, 4.76953125, 5.420654296875, 6.07177734375, 6.722900390625, 7.3740234375, 8.025146484375, 8.67626953125, 9.327392578125, 9.978515625, 10.629638671875, 11.28076171875, 11.931884765625, 12.5830078125, 13.234130859375, 13.88525390625, 14.536376953125, 15.1875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 11.0, 8.0, 15.0, 24.0, 39.0, 64.0, 102.0, 186.0, 303.0, 565.0, 924.0, 785.0, 450.0, 247.0, 140.0, 85.0, 46.0, 33.0, 16.0, 11.0, 6.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.0625, -25.4390869140625, -24.815673828125, -24.1922607421875, -23.56884765625, -22.9454345703125, -22.322021484375, -21.6986083984375, -21.0751953125, -20.4517822265625, -19.828369140625, -19.2049560546875, -18.58154296875, -17.9581298828125, -17.334716796875, -16.7113037109375, -16.087890625, -15.4644775390625, -14.841064453125, -14.2176513671875, -13.59423828125, -12.9708251953125, -12.347412109375, -11.7239990234375, -11.1005859375, -10.4771728515625, -9.853759765625, -9.2303466796875, -8.60693359375, -7.9835205078125, -7.360107421875, -6.7366943359375, -6.11328125, -5.4898681640625, -4.866455078125, -4.2430419921875, -3.61962890625, -2.9962158203125, -2.372802734375, -1.7493896484375, -1.1259765625, -0.5025634765625, 0.120849609375, 0.7442626953125, 1.36767578125, 1.9910888671875, 2.614501953125, 3.2379150390625, 3.861328125, 4.4847412109375, 5.108154296875, 5.7315673828125, 6.35498046875, 6.9783935546875, 7.601806640625, 8.2252197265625, 8.8486328125, 9.4720458984375, 10.095458984375, 10.7188720703125, 11.34228515625, 11.9656982421875, 12.589111328125, 13.2125244140625, 13.8359375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 6.0, 14.0, 17.0, 51.0, 73.0, 166.0, 392.0, 1072.0, 4721.0, 3545464.0, 637411.0, 3411.0, 864.0, 309.0, 133.0, 72.0, 33.0, 34.0, 13.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.4375, -78.71484375, -75.9921875, -73.26953125, -70.546875, -67.82421875, -65.1015625, -62.37890625, -59.65625, -56.93359375, -54.2109375, -51.48828125, -48.765625, -46.04296875, -43.3203125, -40.59765625, -37.875, -35.15234375, -32.4296875, -29.70703125, -26.984375, -24.26171875, -21.5390625, -18.81640625, -16.09375, -13.37109375, -10.6484375, -7.92578125, -5.203125, -2.48046875, 0.2421875, 2.96484375, 5.6875, 8.41015625, 11.1328125, 13.85546875, 16.578125, 19.30078125, 22.0234375, 24.74609375, 27.46875, 30.19140625, 32.9140625, 35.63671875, 38.359375, 41.08203125, 43.8046875, 46.52734375, 49.25, 51.97265625, 54.6953125, 57.41796875, 60.140625, 62.86328125, 65.5859375, 68.30859375, 71.03125, 73.75390625, 76.4765625, 79.19921875, 81.921875, 84.64453125, 87.3671875, 90.08984375, 92.8125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 18.0, 74.0, 299.0, 391.0, 176.0, 42.0, 8.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.13645553588867, -28.68865203857422, -25.240848541259766, -21.793045043945312, -18.34524154663086, -14.897438049316406, -11.449634552001953, -8.0018310546875, -4.554027557373047, -1.1062240600585938, 2.3415794372558594, 5.7893829345703125, 9.237186431884766, 12.684989929199219, 16.132793426513672, 19.580596923828125, 23.028400421142578, 26.47620391845703, 29.924007415771484, 33.37181091308594, 36.81961441040039, 40.267417907714844, 43.7152214050293, 47.16302490234375, 50.6108283996582, 54.058631896972656, 57.50643539428711, 60.95423889160156, 64.40203857421875, 67.84984588623047, 71.29765319824219, 74.74545288085938, 78.19325256347656, 81.64105224609375, 85.08885955810547, 88.53666687011719, 91.98446655273438, 95.43226623535156, 98.88007354736328, 102.327880859375, 105.77568054199219, 109.22348022460938, 112.6712875366211, 116.11909484863281, 119.56689453125, 123.01469421386719, 126.4625015258789, 129.91030883789062, 133.3581085205078, 136.805908203125, 140.25372314453125, 143.70152282714844, 147.14932250976562, 150.5971221923828, 154.044921875, 157.49273681640625, 160.94053649902344, 164.38833618164062, 167.83615112304688, 171.28395080566406, 174.73175048828125, 178.17955017089844, 181.62734985351562, 185.07516479492188, 188.52296447753906]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 11.0, 10.0, 13.0, 17.0, 15.0, 22.0, 38.0, 32.0, 40.0, 48.0, 52.0, 58.0, 50.0, 61.0, 57.0, 54.0, 68.0, 48.0, 61.0, 39.0, 43.0, 29.0, 28.0, 23.0, 23.0, 15.0, 10.0, 12.0, 8.0, 4.0, 4.0, 7.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.120880126953125, -53.443641662597656, -51.76640319824219, -50.08916473388672, -48.41192626953125, -46.73468780517578, -45.05744552612305, -43.38020706176758, -41.70296859741211, -40.02573013305664, -38.34849166870117, -36.6712532043457, -34.99401092529297, -33.3167724609375, -31.63953399658203, -29.962295532226562, -28.285057067871094, -26.607818603515625, -24.930580139160156, -23.253339767456055, -21.576101303100586, -19.898862838745117, -18.221622467041016, -16.544384002685547, -14.867145538330078, -13.18990707397461, -11.512667655944824, -9.835428237915039, -8.15818977355957, -6.480951309204102, -4.803711891174316, -3.1264724731445312, -1.4492340087890625, 0.22800493240356445, 1.9052438735961914, 3.5824828147888184, 5.259721755981445, 6.936960220336914, 8.6141996383667, 10.291439056396484, 11.968677520751953, 13.645915985107422, 15.323155403137207, 17.000394821166992, 18.67763328552246, 20.35487174987793, 22.03211212158203, 23.7093505859375, 25.38658905029297, 27.063827514648438, 28.741065979003906, 30.418306350708008, 32.095542907714844, 33.77278137207031, 35.45002365112305, 37.127262115478516, 38.804500579833984, 40.48173904418945, 42.15897750854492, 43.83621597290039, 45.513458251953125, 47.190696716308594, 48.86793518066406, 50.54517364501953, 52.222412109375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 3.0, 13.0, 15.0, 12.0, 16.0, 17.0, 25.0, 26.0, 26.0, 26.0, 43.0, 40.0, 40.0, 49.0, 63.0, 64.0, 65.0, 65.0, 60.0, 67.0, 38.0, 34.0, 34.0, 28.0, 26.0, 19.0, 19.0, 15.0, 17.0, 9.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.9921875, -4.8699951171875, -4.747802734375, -4.6256103515625, -4.50341796875, -4.3812255859375, -4.259033203125, -4.1368408203125, -4.0146484375, -3.8924560546875, -3.770263671875, -3.6480712890625, -3.52587890625, -3.4036865234375, -3.281494140625, -3.1593017578125, -3.037109375, -2.9149169921875, -2.792724609375, -2.6705322265625, -2.54833984375, -2.4261474609375, -2.303955078125, -2.1817626953125, -2.0595703125, -1.9373779296875, -1.815185546875, -1.6929931640625, -1.57080078125, -1.4486083984375, -1.326416015625, -1.2042236328125, -1.08203125, -0.9598388671875, -0.837646484375, -0.7154541015625, -0.59326171875, -0.4710693359375, -0.348876953125, -0.2266845703125, -0.1044921875, 0.0177001953125, 0.139892578125, 0.2620849609375, 0.38427734375, 0.5064697265625, 0.628662109375, 0.7508544921875, 0.873046875, 0.9952392578125, 1.117431640625, 1.2396240234375, 1.36181640625, 1.4840087890625, 1.606201171875, 1.7283935546875, 1.8505859375, 1.9727783203125, 2.094970703125, 2.2171630859375, 2.33935546875, 2.4615478515625, 2.583740234375, 2.7059326171875, 2.828125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 8.0, 19.0, 22.0, 29.0, 48.0, 63.0, 113.0, 149.0, 236.0, 394.0, 601.0, 959.0, 1544.0, 2700.0, 4523.0, 7869.0, 14193.0, 26898.0, 51923.0, 105188.0, 234836.0, 304580.0, 145208.0, 68993.0, 34600.0, 18535.0, 10306.0, 5606.0, 3285.0, 1886.0, 1227.0, 704.0, 442.0, 263.0, 201.0, 138.0, 85.0, 40.0, 33.0, 31.0, 16.0, 16.0, 8.0, 10.0, 7.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56298828125, -0.5443496704101562, -0.5257110595703125, -0.5070724487304688, -0.488433837890625, -0.46979522705078125, -0.4511566162109375, -0.43251800537109375, -0.41387939453125, -0.39524078369140625, -0.3766021728515625, -0.35796356201171875, -0.339324951171875, -0.32068634033203125, -0.3020477294921875, -0.28340911865234375, -0.2647705078125, -0.24613189697265625, -0.2274932861328125, -0.20885467529296875, -0.190216064453125, -0.17157745361328125, -0.1529388427734375, -0.13430023193359375, -0.11566162109375, -0.09702301025390625, -0.0783843994140625, -0.05974578857421875, -0.041107177734375, -0.02246856689453125, -0.0038299560546875, 0.01480865478515625, 0.033447265625, 0.05208587646484375, 0.0707244873046875, 0.08936309814453125, 0.108001708984375, 0.12664031982421875, 0.1452789306640625, 0.16391754150390625, 0.18255615234375, 0.20119476318359375, 0.2198333740234375, 0.23847198486328125, 0.257110595703125, 0.27574920654296875, 0.2943878173828125, 0.31302642822265625, 0.3316650390625, 0.35030364990234375, 0.3689422607421875, 0.38758087158203125, 0.406219482421875, 0.42485809326171875, 0.4434967041015625, 0.46213531494140625, 0.48077392578125, 0.49941253662109375, 0.5180511474609375, 0.5366897583007812, 0.555328369140625, 0.5739669799804688, 0.5926055908203125, 0.6112442016601562, 0.6298828125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 10.0, 9.0, 10.0, 9.0, 9.0, 7.0, 10.0, 19.0, 19.0, 20.0, 21.0, 23.0, 34.0, 25.0, 37.0, 31.0, 39.0, 38.0, 45.0, 36.0, 37.0, 1069.0, 44.0, 24.0, 42.0, 32.0, 37.0, 37.0, 31.0, 25.0, 21.0, 29.0, 24.0, 19.0, 17.0, 19.0, 16.0, 10.0, 10.0, 7.0, 5.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7822265625, -1.7237091064453125, -1.665191650390625, -1.6066741943359375, -1.54815673828125, -1.4896392822265625, -1.431121826171875, -1.3726043701171875, -1.3140869140625, -1.2555694580078125, -1.197052001953125, -1.1385345458984375, -1.08001708984375, -1.0214996337890625, -0.962982177734375, -0.9044647216796875, -0.845947265625, -0.7874298095703125, -0.728912353515625, -0.6703948974609375, -0.61187744140625, -0.5533599853515625, -0.494842529296875, -0.4363250732421875, -0.3778076171875, -0.3192901611328125, -0.260772705078125, -0.2022552490234375, -0.14373779296875, -0.0852203369140625, -0.026702880859375, 0.0318145751953125, 0.09033203125, 0.1488494873046875, 0.207366943359375, 0.2658843994140625, 0.32440185546875, 0.3829193115234375, 0.441436767578125, 0.4999542236328125, 0.5584716796875, 0.6169891357421875, 0.675506591796875, 0.7340240478515625, 0.79254150390625, 0.8510589599609375, 0.909576416015625, 0.9680938720703125, 1.026611328125, 1.0851287841796875, 1.143646240234375, 1.2021636962890625, 1.26068115234375, 1.3191986083984375, 1.377716064453125, 1.4362335205078125, 1.4947509765625, 1.5532684326171875, 1.611785888671875, 1.6703033447265625, 1.72882080078125, 1.7873382568359375, 1.845855712890625, 1.9043731689453125, 1.962890625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 0.0, 6.0, 6.0, 9.0, 21.0, 36.0, 37.0, 60.0, 110.0, 160.0, 235.0, 356.0, 604.0, 885.0, 1563.0, 2494.0, 3972.0, 6892.0, 11570.0, 20294.0, 36413.0, 68491.0, 131573.0, 265142.0, 1237728.0, 142367.0, 74084.0, 39603.0, 21445.0, 12427.0, 7248.0, 4395.0, 2585.0, 1608.0, 1009.0, 607.0, 377.0, 249.0, 179.0, 103.0, 66.0, 36.0, 28.0, 22.0, 18.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.361328125, -0.3503990173339844, -0.33946990966796875, -0.3285408020019531, -0.3176116943359375, -0.3066825866699219, -0.29575347900390625, -0.2848243713378906, -0.273895263671875, -0.2629661560058594, -0.25203704833984375, -0.24110794067382812, -0.2301788330078125, -0.21924972534179688, -0.20832061767578125, -0.19739151000976562, -0.18646240234375, -0.17553329467773438, -0.16460418701171875, -0.15367507934570312, -0.1427459716796875, -0.13181686401367188, -0.12088775634765625, -0.10995864868164062, -0.099029541015625, -0.08810043334960938, -0.07717132568359375, -0.06624221801757812, -0.0553131103515625, -0.044384002685546875, -0.03345489501953125, -0.022525787353515625, -0.0115966796875, -0.000667572021484375, 0.01026153564453125, 0.021190643310546875, 0.0321197509765625, 0.043048858642578125, 0.05397796630859375, 0.06490707397460938, 0.075836181640625, 0.08676528930664062, 0.09769439697265625, 0.10862350463867188, 0.1195526123046875, 0.13048171997070312, 0.14141082763671875, 0.15233993530273438, 0.16326904296875, 0.17419815063476562, 0.18512725830078125, 0.19605636596679688, 0.2069854736328125, 0.21791458129882812, 0.22884368896484375, 0.23977279663085938, 0.250701904296875, 0.2616310119628906, 0.27256011962890625, 0.2834892272949219, 0.2944183349609375, 0.3053474426269531, 0.31627655029296875, 0.3272056579589844, 0.338134765625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 5.0, 16.0, 11.0, 14.0, 10.0, 10.0, 24.0, 24.0, 29.0, 36.0, 39.0, 47.0, 55.0, 75.0, 72.0, 76.0, 80.0, 64.0, 59.0, 44.0, 42.0, 26.0, 27.0, 27.0, 11.0, 23.0, 10.0, 5.0, 7.0, 7.0, 1.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018644332885742188, -0.0018067359924316406, -0.0017490386962890625, -0.0016913414001464844, -0.0016336441040039062, -0.0015759468078613281, -0.00151824951171875, -0.0014605522155761719, -0.0014028549194335938, -0.0013451576232910156, -0.0012874603271484375, -0.0012297630310058594, -0.0011720657348632812, -0.0011143684387207031, -0.001056671142578125, -0.0009989738464355469, -0.0009412765502929688, -0.0008835792541503906, -0.0008258819580078125, -0.0007681846618652344, -0.0007104873657226562, -0.0006527900695800781, -0.0005950927734375, -0.0005373954772949219, -0.00047969818115234375, -0.0004220008850097656, -0.0003643035888671875, -0.0003066062927246094, -0.00024890899658203125, -0.00019121170043945312, -0.000133514404296875, -7.581710815429688e-05, -1.811981201171875e-05, 3.9577484130859375e-05, 9.72747802734375e-05, 0.00015497207641601562, 0.00021266937255859375, 0.0002703666687011719, 0.00032806396484375, 0.0003857612609863281, 0.00044345855712890625, 0.0005011558532714844, 0.0005588531494140625, 0.0006165504455566406, 0.0006742477416992188, 0.0007319450378417969, 0.000789642333984375, 0.0008473396301269531, 0.0009050369262695312, 0.0009627342224121094, 0.0010204315185546875, 0.0010781288146972656, 0.0011358261108398438, 0.0011935234069824219, 0.001251220703125, 0.0013089179992675781, 0.0013666152954101562, 0.0014243125915527344, 0.0014820098876953125, 0.0015397071838378906, 0.0015974044799804688, 0.0016551017761230469, 0.001712799072265625, 0.0017704963684082031, 0.0018281936645507812]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 5.0, 8.0, 6.0, 19.0, 23.0, 31.0, 34.0, 69.0, 99.0, 112.0, 163.0, 222.0, 325.0, 474.0, 1284.0, 1038664.0, 5160.0, 609.0, 354.0, 232.0, 151.0, 133.0, 103.0, 65.0, 69.0, 24.0, 26.0, 18.0, 28.0, 5.0, 8.0, 9.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.044189453125, -0.04287576675415039, -0.04156208038330078, -0.04024839401245117, -0.03893470764160156, -0.03762102127075195, -0.036307334899902344, -0.034993648529052734, -0.033679962158203125, -0.032366275787353516, -0.031052589416503906, -0.029738903045654297, -0.028425216674804688, -0.027111530303955078, -0.02579784393310547, -0.02448415756225586, -0.02317047119140625, -0.02185678482055664, -0.02054309844970703, -0.019229412078857422, -0.017915725708007812, -0.016602039337158203, -0.015288352966308594, -0.013974666595458984, -0.012660980224609375, -0.011347293853759766, -0.010033607482910156, -0.008719921112060547, -0.0074062347412109375, -0.006092548370361328, -0.004778861999511719, -0.0034651756286621094, -0.0021514892578125, -0.0008378028869628906, 0.00047588348388671875, 0.0017895698547363281, 0.0031032562255859375, 0.004416942596435547, 0.005730628967285156, 0.007044315338134766, 0.008358001708984375, 0.009671688079833984, 0.010985374450683594, 0.012299060821533203, 0.013612747192382812, 0.014926433563232422, 0.01624011993408203, 0.01755380630493164, 0.01886749267578125, 0.02018117904663086, 0.02149486541748047, 0.022808551788330078, 0.024122238159179688, 0.025435924530029297, 0.026749610900878906, 0.028063297271728516, 0.029376983642578125, 0.030690670013427734, 0.032004356384277344, 0.03331804275512695, 0.03463172912597656, 0.03594541549682617, 0.03725910186767578, 0.03857278823852539, 0.039886474609375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1008.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006473960820585489, 0.00025259109679609537, 0.0011525782756507397, 0.002052565338090062, 0.0029525526333600283, 0.0038525399286299944, 0.004752526991069317, 0.005652514286339283, 0.006552501581609249, 0.007452488876879215, 0.008352476172149181, 0.009252462536096573, 0.010152449831366539, 0.011052437126636505, 0.011952424421906471, 0.012852411717176437, 0.013752399012446404, 0.01465238630771637, 0.015552373602986336, 0.016452360898256302, 0.017352348193526268, 0.018252335488796234, 0.01915232092142105, 0.020052310079336166, 0.020952295511960983, 0.02185228280723095, 0.022752270102500916, 0.02365225739777088, 0.024552244693040848, 0.025452231988310814, 0.02635221928358078, 0.027252204716205597, 0.028152193874120712, 0.02905218116939068, 0.029952168464660645, 0.03085215575993061, 0.03175214305520058, 0.032652128487825394, 0.03355211764574051, 0.034452103078365326, 0.03535209223628044, 0.03625207766890526, 0.037152066826820374, 0.03805205225944519, 0.038952041417360306, 0.03985202684998512, 0.04075201600790024, 0.041652001440525055, 0.04255198687314987, 0.04345197230577469, 0.044351961463689804, 0.04525194689631462, 0.046151936054229736, 0.04705192148685455, 0.04795191064476967, 0.048851896077394485, 0.0497518852353096, 0.05065187066793442, 0.05155185982584953, 0.05245184525847435, 0.053351834416389465, 0.05425181984901428, 0.0551518090069294, 0.056051794439554214, 0.05695178359746933]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 22.0, 11.0, 31.0, 39.0, 40.0, 62.0, 70.0, 77.0, 54.0, 83.0, 75.0, 79.0, 50.0, 72.0, 75.0, 43.0, 39.0, 24.0, 24.0, 18.0, 10.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020893216133117676, -0.0020346548408269882, -0.001979988068342209, -0.0019253212958574295, -0.0018706545233726501, -0.0018159877508878708, -0.0017613209784030914, -0.001706654205918312, -0.0016519874334335327, -0.0015973206609487534, -0.001542653888463974, -0.0014879871159791946, -0.0014333203434944153, -0.001378653571009636, -0.0013239867985248566, -0.0012693200260400772, -0.0012146532535552979, -0.0011599864810705185, -0.0011053197085857391, -0.0010506529361009598, -0.0009959861636161804, -0.0009413193911314011, -0.0008866526186466217, -0.0008319858461618423, -0.000777319073677063, -0.0007226523011922836, -0.0006679855287075043, -0.0006133187562227249, -0.0005586519837379456, -0.0005039852112531662, -0.00044931843876838684, -0.0003946516662836075, -0.0003399848937988281, -0.00028531812131404877, -0.0002306513488292694, -0.00017598457634449005, -0.0001213178038597107, -6.665103137493134e-05, -1.1984258890151978e-05, 4.268251359462738e-05, 9.734928607940674e-05, 0.0001520160585641861, 0.00020668283104896545, 0.0002613496035337448, 0.00031601637601852417, 0.00037068314850330353, 0.0004253499209880829, 0.00048001669347286224, 0.0005346834659576416, 0.000589350238442421, 0.0006440170109272003, 0.0006986837834119797, 0.000753350555896759, 0.0008080173283815384, 0.0008626841008663177, 0.0009173508733510971, 0.0009720176458358765, 0.0010266844183206558, 0.0010813511908054352, 0.0011360179632902145, 0.001190684735774994, 0.0012453515082597733, 0.0013000182807445526, 0.001354685053229332, 0.0014093518257141113]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 3.0, 14.0, 14.0, 12.0, 16.0, 17.0, 25.0, 26.0, 26.0, 26.0, 43.0, 40.0, 40.0, 49.0, 63.0, 64.0, 65.0, 65.0, 60.0, 67.0, 38.0, 34.0, 34.0, 28.0, 26.0, 19.0, 19.0, 15.0, 17.0, 9.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.9921875, -4.8699951171875, -4.747802734375, -4.6256103515625, -4.50341796875, -4.3812255859375, -4.259033203125, -4.1368408203125, -4.0146484375, -3.8924560546875, -3.770263671875, -3.6480712890625, -3.52587890625, -3.4036865234375, -3.281494140625, -3.1593017578125, -3.037109375, -2.9149169921875, -2.792724609375, -2.6705322265625, -2.54833984375, -2.4261474609375, -2.303955078125, -2.1817626953125, -2.0595703125, -1.9373779296875, -1.815185546875, -1.6929931640625, -1.57080078125, -1.4486083984375, -1.326416015625, -1.2042236328125, -1.08203125, -0.9598388671875, -0.837646484375, -0.7154541015625, -0.59326171875, -0.4710693359375, -0.348876953125, -0.2266845703125, -0.1044921875, 0.0177001953125, 0.139892578125, 0.2620849609375, 0.38427734375, 0.5064697265625, 0.628662109375, 0.7508544921875, 0.873046875, 0.9952392578125, 1.117431640625, 1.2396240234375, 1.36181640625, 1.4840087890625, 1.606201171875, 1.7283935546875, 1.8505859375, 1.9727783203125, 2.094970703125, 2.2171630859375, 2.33935546875, 2.4615478515625, 2.583740234375, 2.7059326171875, 2.828125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 10.0, 6.0, 22.0, 20.0, 26.0, 41.0, 70.0, 77.0, 91.0, 142.0, 198.0, 248.0, 374.0, 517.0, 776.0, 1126.0, 1690.0, 2672.0, 4374.0, 7768.0, 14682.0, 44616.0, 646530.0, 264752.0, 28594.0, 11713.0, 6518.0, 3687.0, 2340.0, 1446.0, 1032.0, 686.0, 487.0, 334.0, 239.0, 177.0, 138.0, 81.0, 77.0, 41.0, 39.0, 24.0, 28.0, 10.0, 7.0, 7.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-16.65625, -16.149169921875, -15.64208984375, -15.135009765625, -14.6279296875, -14.120849609375, -13.61376953125, -13.106689453125, -12.599609375, -12.092529296875, -11.58544921875, -11.078369140625, -10.5712890625, -10.064208984375, -9.55712890625, -9.050048828125, -8.54296875, -8.035888671875, -7.52880859375, -7.021728515625, -6.5146484375, -6.007568359375, -5.50048828125, -4.993408203125, -4.486328125, -3.979248046875, -3.47216796875, -2.965087890625, -2.4580078125, -1.950927734375, -1.44384765625, -0.936767578125, -0.4296875, 0.077392578125, 0.58447265625, 1.091552734375, 1.5986328125, 2.105712890625, 2.61279296875, 3.119873046875, 3.626953125, 4.134033203125, 4.64111328125, 5.148193359375, 5.6552734375, 6.162353515625, 6.66943359375, 7.176513671875, 7.68359375, 8.190673828125, 8.69775390625, 9.204833984375, 9.7119140625, 10.218994140625, 10.72607421875, 11.233154296875, 11.740234375, 12.247314453125, 12.75439453125, 13.261474609375, 13.7685546875, 14.275634765625, 14.78271484375, 15.289794921875, 15.796875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 6.0, 5.0, 4.0, 10.0, 8.0, 7.0, 19.0, 17.0, 19.0, 15.0, 29.0, 27.0, 26.0, 24.0, 31.0, 43.0, 46.0, 45.0, 67.0, 139.0, 304.0, 1485.0, 185.0, 72.0, 64.0, 45.0, 43.0, 40.0, 29.0, 31.0, 30.0, 24.0, 18.0, 19.0, 21.0, 15.0, 11.0, 9.0, 5.0, 6.0, 4.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.421875, -9.138916015625, -8.85595703125, -8.572998046875, -8.2900390625, -8.007080078125, -7.72412109375, -7.441162109375, -7.158203125, -6.875244140625, -6.59228515625, -6.309326171875, -6.0263671875, -5.743408203125, -5.46044921875, -5.177490234375, -4.89453125, -4.611572265625, -4.32861328125, -4.045654296875, -3.7626953125, -3.479736328125, -3.19677734375, -2.913818359375, -2.630859375, -2.347900390625, -2.06494140625, -1.781982421875, -1.4990234375, -1.216064453125, -0.93310546875, -0.650146484375, -0.3671875, -0.084228515625, 0.19873046875, 0.481689453125, 0.7646484375, 1.047607421875, 1.33056640625, 1.613525390625, 1.896484375, 2.179443359375, 2.46240234375, 2.745361328125, 3.0283203125, 3.311279296875, 3.59423828125, 3.877197265625, 4.16015625, 4.443115234375, 4.72607421875, 5.009033203125, 5.2919921875, 5.574951171875, 5.85791015625, 6.140869140625, 6.423828125, 6.706787109375, 6.98974609375, 7.272705078125, 7.5556640625, 7.838623046875, 8.12158203125, 8.404541015625, 8.6875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 3.0, 9.0, 5.0, 15.0, 16.0, 15.0, 16.0, 28.0, 26.0, 31.0, 32.0, 37.0, 49.0, 70.0, 126.0, 359.0, 1690.0, 609565.0, 2530616.0, 1980.0, 440.0, 171.0, 77.0, 63.0, 40.0, 25.0, 27.0, 27.0, 17.0, 20.0, 23.0, 16.0, 15.0, 9.0, 13.0, 7.0, 3.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.0625, -36.7958984375, -35.529296875, -34.2626953125, -32.99609375, -31.7294921875, -30.462890625, -29.1962890625, -27.9296875, -26.6630859375, -25.396484375, -24.1298828125, -22.86328125, -21.5966796875, -20.330078125, -19.0634765625, -17.796875, -16.5302734375, -15.263671875, -13.9970703125, -12.73046875, -11.4638671875, -10.197265625, -8.9306640625, -7.6640625, -6.3974609375, -5.130859375, -3.8642578125, -2.59765625, -1.3310546875, -0.064453125, 1.2021484375, 2.46875, 3.7353515625, 5.001953125, 6.2685546875, 7.53515625, 8.8017578125, 10.068359375, 11.3349609375, 12.6015625, 13.8681640625, 15.134765625, 16.4013671875, 17.66796875, 18.9345703125, 20.201171875, 21.4677734375, 22.734375, 24.0009765625, 25.267578125, 26.5341796875, 27.80078125, 29.0673828125, 30.333984375, 31.6005859375, 32.8671875, 34.1337890625, 35.400390625, 36.6669921875, 37.93359375, 39.2001953125, 40.466796875, 41.7333984375, 43.0]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 530.0, 481.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.5656433105469, -267.69378662109375, -262.8218994140625, -257.9500427246094, -253.0781707763672, -248.206298828125, -243.3344268798828, -238.46255493164062, -233.59068298339844, -228.71881103515625, -223.84693908691406, -218.97506713867188, -214.10321044921875, -209.23133850097656, -204.35946655273438, -199.4875946044922, -194.61572265625, -189.7438507080078, -184.87197875976562, -180.0001220703125, -175.1282501220703, -170.25637817382812, -165.38450622558594, -160.51263427734375, -155.64077758789062, -150.76890563964844, -145.89703369140625, -141.02517700195312, -136.15330505371094, -131.28143310546875, -126.40956115722656, -121.53768920898438, -116.66583251953125, -111.79396057128906, -106.9220962524414, -102.05022430419922, -97.17835235595703, -92.30648803710938, -87.43461608886719, -82.562744140625, -77.69087219238281, -72.81900024414062, -67.94713592529297, -63.07526397705078, -58.203392028808594, -53.33152389526367, -48.45965576171875, -43.58778381347656, -38.71591567993164, -33.84404754638672, -28.97217559814453, -24.10030746459961, -19.228437423706055, -14.3565673828125, -9.484699249267578, -4.612827301025391, 0.25904083251953125, 5.130910396575928, 10.002779960632324, 14.874649047851562, 19.746519088745117, 24.618389129638672, 29.490257263183594, 34.36212921142578, 39.2339973449707]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 4.0, 4.0, 9.0, 11.0, 11.0, 8.0, 11.0, 14.0, 11.0, 24.0, 26.0, 32.0, 17.0, 33.0, 27.0, 24.0, 43.0, 32.0, 34.0, 43.0, 37.0, 39.0, 35.0, 32.0, 48.0, 43.0, 38.0, 31.0, 23.0, 32.0, 23.0, 32.0, 22.0, 16.0, 30.0, 15.0, 6.0, 14.0, 15.0, 11.0, 5.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.228797912597656, -27.306621551513672, -26.384445190429688, -25.462268829345703, -24.540090560913086, -23.6179141998291, -22.695737838745117, -21.773561477661133, -20.851383209228516, -19.92920684814453, -19.007030487060547, -18.084854125976562, -17.162675857543945, -16.24049949645996, -15.318323135375977, -14.396146774291992, -13.473970413208008, -12.551794052124023, -11.629616737365723, -10.707440376281738, -9.785263061523438, -8.863086700439453, -7.940910339355469, -7.018733501434326, -6.096556663513184, -5.174379825592041, -4.252202987670898, -3.330026626586914, -2.4078497886657715, -1.485672950744629, -0.5634965896606445, 0.35868024826049805, 1.2808570861816406, 2.203033924102783, 3.1252105236053467, 4.04738712310791, 4.969563961029053, 5.891740798950195, 6.81391716003418, 7.736093997955322, 8.658270835876465, 9.58044719696045, 10.50262451171875, 11.424800872802734, 12.346977233886719, 13.26915454864502, 14.191330909729004, 15.113508224487305, 16.03568458557129, 16.957860946655273, 17.880037307739258, 18.802215576171875, 19.72439193725586, 20.646568298339844, 21.568744659423828, 22.490921020507812, 23.413097381591797, 24.33527374267578, 25.257450103759766, 26.17962646484375, 27.101804733276367, 28.02398109436035, 28.946157455444336, 29.86833381652832, 30.790512084960938]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 6.0, 5.0, 4.0, 10.0, 13.0, 9.0, 12.0, 14.0, 26.0, 24.0, 26.0, 34.0, 34.0, 31.0, 29.0, 49.0, 47.0, 61.0, 67.0, 57.0, 71.0, 54.0, 61.0, 48.0, 34.0, 25.0, 33.0, 18.0, 23.0, 22.0, 12.0, 15.0, 12.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.90625, -4.779541015625, -4.65283203125, -4.526123046875, -4.3994140625, -4.272705078125, -4.14599609375, -4.019287109375, -3.892578125, -3.765869140625, -3.63916015625, -3.512451171875, -3.3857421875, -3.259033203125, -3.13232421875, -3.005615234375, -2.87890625, -2.752197265625, -2.62548828125, -2.498779296875, -2.3720703125, -2.245361328125, -2.11865234375, -1.991943359375, -1.865234375, -1.738525390625, -1.61181640625, -1.485107421875, -1.3583984375, -1.231689453125, -1.10498046875, -0.978271484375, -0.8515625, -0.724853515625, -0.59814453125, -0.471435546875, -0.3447265625, -0.218017578125, -0.09130859375, 0.035400390625, 0.162109375, 0.288818359375, 0.41552734375, 0.542236328125, 0.6689453125, 0.795654296875, 0.92236328125, 1.049072265625, 1.17578125, 1.302490234375, 1.42919921875, 1.555908203125, 1.6826171875, 1.809326171875, 1.93603515625, 2.062744140625, 2.189453125, 2.316162109375, 2.44287109375, 2.569580078125, 2.6962890625, 2.822998046875, 2.94970703125, 3.076416015625, 3.203125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 6.0, 6.0, 14.0, 24.0, 24.0, 30.0, 58.0, 77.0, 102.0, 154.0, 281.0, 514.0, 930.0, 1923.0, 4757.0, 13803.0, 60827.0, 1049947.0, 2901525.0, 125747.0, 21171.0, 6680.0, 2701.0, 1324.0, 650.0, 363.0, 218.0, 133.0, 88.0, 60.0, 38.0, 31.0, 20.0, 21.0, 11.0, 9.0, 3.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.25, -20.66259765625, -20.0751953125, -19.48779296875, -18.900390625, -18.31298828125, -17.7255859375, -17.13818359375, -16.55078125, -15.96337890625, -15.3759765625, -14.78857421875, -14.201171875, -13.61376953125, -13.0263671875, -12.43896484375, -11.8515625, -11.26416015625, -10.6767578125, -10.08935546875, -9.501953125, -8.91455078125, -8.3271484375, -7.73974609375, -7.15234375, -6.56494140625, -5.9775390625, -5.39013671875, -4.802734375, -4.21533203125, -3.6279296875, -3.04052734375, -2.453125, -1.86572265625, -1.2783203125, -0.69091796875, -0.103515625, 0.48388671875, 1.0712890625, 1.65869140625, 2.24609375, 2.83349609375, 3.4208984375, 4.00830078125, 4.595703125, 5.18310546875, 5.7705078125, 6.35791015625, 6.9453125, 7.53271484375, 8.1201171875, 8.70751953125, 9.294921875, 9.88232421875, 10.4697265625, 11.05712890625, 11.64453125, 12.23193359375, 12.8193359375, 13.40673828125, 13.994140625, 14.58154296875, 15.1689453125, 15.75634765625, 16.34375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 8.0, 16.0, 29.0, 31.0, 65.0, 61.0, 94.0, 152.0, 259.0, 369.0, 574.0, 680.0, 592.0, 363.0, 236.0, 161.0, 130.0, 77.0, 46.0, 35.0, 30.0, 20.0, 11.0, 10.0, 5.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.015625, -15.474853515625, -14.93408203125, -14.393310546875, -13.8525390625, -13.311767578125, -12.77099609375, -12.230224609375, -11.689453125, -11.148681640625, -10.60791015625, -10.067138671875, -9.5263671875, -8.985595703125, -8.44482421875, -7.904052734375, -7.36328125, -6.822509765625, -6.28173828125, -5.740966796875, -5.2001953125, -4.659423828125, -4.11865234375, -3.577880859375, -3.037109375, -2.496337890625, -1.95556640625, -1.414794921875, -0.8740234375, -0.333251953125, 0.20751953125, 0.748291015625, 1.2890625, 1.829833984375, 2.37060546875, 2.911376953125, 3.4521484375, 3.992919921875, 4.53369140625, 5.074462890625, 5.615234375, 6.156005859375, 6.69677734375, 7.237548828125, 7.7783203125, 8.319091796875, 8.85986328125, 9.400634765625, 9.94140625, 10.482177734375, 11.02294921875, 11.563720703125, 12.1044921875, 12.645263671875, 13.18603515625, 13.726806640625, 14.267578125, 14.808349609375, 15.34912109375, 15.889892578125, 16.4306640625, 16.971435546875, 17.51220703125, 18.052978515625, 18.59375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 6.0, 3.0, 8.0, 8.0, 16.0, 17.0, 16.0, 27.0, 43.0, 57.0, 75.0, 125.0, 230.0, 468.0, 1557.0, 26131.0, 4121096.0, 41456.0, 1770.0, 517.0, 242.0, 149.0, 88.0, 51.0, 43.0, 26.0, 16.0, 15.0, 13.0, 7.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.78125, -43.65576171875, -41.5302734375, -39.40478515625, -37.279296875, -35.15380859375, -33.0283203125, -30.90283203125, -28.77734375, -26.65185546875, -24.5263671875, -22.40087890625, -20.275390625, -18.14990234375, -16.0244140625, -13.89892578125, -11.7734375, -9.64794921875, -7.5224609375, -5.39697265625, -3.271484375, -1.14599609375, 0.9794921875, 3.10498046875, 5.23046875, 7.35595703125, 9.4814453125, 11.60693359375, 13.732421875, 15.85791015625, 17.9833984375, 20.10888671875, 22.234375, 24.35986328125, 26.4853515625, 28.61083984375, 30.736328125, 32.86181640625, 34.9873046875, 37.11279296875, 39.23828125, 41.36376953125, 43.4892578125, 45.61474609375, 47.740234375, 49.86572265625, 51.9912109375, 54.11669921875, 56.2421875, 58.36767578125, 60.4931640625, 62.61865234375, 64.744140625, 66.86962890625, 68.9951171875, 71.12060546875, 73.24609375, 75.37158203125, 77.4970703125, 79.62255859375, 81.748046875, 83.87353515625, 85.9990234375, 88.12451171875, 90.25]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [3.0, 6.0, 40.0, 255.0, 494.0, 200.0, 18.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.083255767822266, -16.30394744873047, -11.524641036987305, -6.745333671569824, -1.9660263061523438, 2.813282012939453, 7.592588424682617, 12.371894836425781, 17.151203155517578, 21.930511474609375, 26.70981788635254, 31.489124298095703, 36.2684326171875, 41.0477409362793, 45.827049255371094, 50.606353759765625, 55.38566207885742, 60.16497039794922, 64.94427490234375, 69.72358703613281, 74.50289154052734, 79.28219604492188, 84.06150817871094, 88.84081268310547, 93.6201171875, 98.39942169189453, 103.1787338256836, 107.95803833007812, 112.73735046386719, 117.51665496826172, 122.29595947265625, 127.07527160644531, 131.85458374023438, 136.63389587402344, 141.41319274902344, 146.1925048828125, 150.97181701660156, 155.75112915039062, 160.53042602539062, 165.3097381591797, 170.08905029296875, 174.8683624267578, 179.6476593017578, 184.42697143554688, 189.20628356933594, 193.985595703125, 198.764892578125, 203.54420471191406, 208.32350158691406, 213.10281372070312, 217.88211059570312, 222.6614227294922, 227.44073486328125, 232.22003173828125, 236.9993438720703, 241.77865600585938, 246.55795288085938, 251.33726501464844, 256.1165771484375, 260.8958740234375, 265.6751708984375, 270.4544982910156, 275.2337951660156, 280.0130920410156, 284.79241943359375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 9.0, 6.0, 5.0, 13.0, 8.0, 12.0, 29.0, 24.0, 19.0, 29.0, 32.0, 37.0, 27.0, 40.0, 28.0, 34.0, 42.0, 41.0, 45.0, 39.0, 49.0, 36.0, 42.0, 31.0, 31.0, 36.0, 26.0, 35.0, 29.0, 24.0, 25.0, 24.0, 21.0, 13.0, 10.0, 12.0, 8.0, 8.0, 1.0, 9.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-46.40675354003906, -45.116554260253906, -43.826358795166016, -42.53615951538086, -41.24596405029297, -39.95576477050781, -38.66556930541992, -37.375370025634766, -36.085174560546875, -34.79497528076172, -33.50477981567383, -32.21458053588867, -30.92438507080078, -29.634185791015625, -28.3439884185791, -27.053791046142578, -25.763591766357422, -24.4733943939209, -23.183197021484375, -21.89299964904785, -20.602802276611328, -19.312602996826172, -18.02240562438965, -16.732208251953125, -15.442010879516602, -14.151813507080078, -12.861616134643555, -11.571417808532715, -10.281220436096191, -8.991023063659668, -7.700825214385986, -6.410627365112305, -5.120429992675781, -3.8302323818206787, -2.540034770965576, -1.2498371601104736, 0.040360450744628906, 1.3305578231811523, 2.620755672454834, 3.9109535217285156, 5.201150894165039, 6.4913482666015625, 7.781546115875244, 9.071743965148926, 10.36194133758545, 11.652138710021973, 12.942337036132812, 14.232534408569336, 15.52273178100586, 16.812929153442383, 18.103126525878906, 19.39332389831543, 20.683521270751953, 21.97372055053711, 23.263917922973633, 24.554115295410156, 25.84431266784668, 27.134510040283203, 28.424707412719727, 29.71490478515625, 31.005104064941406, 32.2952995300293, 33.58549880981445, 34.875694274902344, 36.1658935546875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 1.0, 6.0, 3.0, 10.0, 11.0, 9.0, 14.0, 13.0, 14.0, 19.0, 28.0, 26.0, 30.0, 27.0, 32.0, 47.0, 42.0, 43.0, 51.0, 50.0, 67.0, 49.0, 50.0, 45.0, 53.0, 40.0, 35.0, 33.0, 28.0, 25.0, 22.0, 9.0, 22.0, 7.0, 6.0, 11.0, 8.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.49609375, -4.37762451171875, -4.2591552734375, -4.14068603515625, -4.022216796875, -3.90374755859375, -3.7852783203125, -3.66680908203125, -3.54833984375, -3.42987060546875, -3.3114013671875, -3.19293212890625, -3.074462890625, -2.95599365234375, -2.8375244140625, -2.71905517578125, -2.6005859375, -2.48211669921875, -2.3636474609375, -2.24517822265625, -2.126708984375, -2.00823974609375, -1.8897705078125, -1.77130126953125, -1.65283203125, -1.53436279296875, -1.4158935546875, -1.29742431640625, -1.178955078125, -1.06048583984375, -0.9420166015625, -0.82354736328125, -0.705078125, -0.58660888671875, -0.4681396484375, -0.34967041015625, -0.231201171875, -0.11273193359375, 0.0057373046875, 0.12420654296875, 0.24267578125, 0.36114501953125, 0.4796142578125, 0.59808349609375, 0.716552734375, 0.83502197265625, 0.9534912109375, 1.07196044921875, 1.1904296875, 1.30889892578125, 1.4273681640625, 1.54583740234375, 1.664306640625, 1.78277587890625, 1.9012451171875, 2.01971435546875, 2.13818359375, 2.25665283203125, 2.3751220703125, 2.49359130859375, 2.612060546875, 2.73052978515625, 2.8489990234375, 2.96746826171875, 3.0859375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 13.0, 6.0, 23.0, 19.0, 39.0, 53.0, 77.0, 116.0, 183.0, 284.0, 474.0, 747.0, 1227.0, 2047.0, 3547.0, 6184.0, 11355.0, 21021.0, 41068.0, 86923.0, 200200.0, 325293.0, 184761.0, 79960.0, 38326.0, 19745.0, 10609.0, 5810.0, 3377.0, 1961.0, 1163.0, 685.0, 451.0, 260.0, 190.0, 104.0, 77.0, 55.0, 29.0, 30.0, 15.0, 11.0, 13.0, 7.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.669921875, -0.6492767333984375, -0.628631591796875, -0.6079864501953125, -0.58734130859375, -0.5666961669921875, -0.546051025390625, -0.5254058837890625, -0.5047607421875, -0.4841156005859375, -0.463470458984375, -0.4428253173828125, -0.42218017578125, -0.4015350341796875, -0.380889892578125, -0.3602447509765625, -0.339599609375, -0.3189544677734375, -0.298309326171875, -0.2776641845703125, -0.25701904296875, -0.2363739013671875, -0.215728759765625, -0.1950836181640625, -0.1744384765625, -0.1537933349609375, -0.133148193359375, -0.1125030517578125, -0.09185791015625, -0.0712127685546875, -0.050567626953125, -0.0299224853515625, -0.00927734375, 0.0113677978515625, 0.032012939453125, 0.0526580810546875, 0.07330322265625, 0.0939483642578125, 0.114593505859375, 0.1352386474609375, 0.1558837890625, 0.1765289306640625, 0.197174072265625, 0.2178192138671875, 0.23846435546875, 0.2591094970703125, 0.279754638671875, 0.3003997802734375, 0.321044921875, 0.3416900634765625, 0.362335205078125, 0.3829803466796875, 0.40362548828125, 0.4242706298828125, 0.444915771484375, 0.4655609130859375, 0.4862060546875, 0.5068511962890625, 0.527496337890625, 0.5481414794921875, 0.56878662109375, 0.5894317626953125, 0.610076904296875, 0.6307220458984375, 0.6513671875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 7.0, 7.0, 8.0, 12.0, 8.0, 14.0, 22.0, 20.0, 25.0, 29.0, 26.0, 37.0, 41.0, 37.0, 42.0, 43.0, 32.0, 41.0, 1070.0, 48.0, 40.0, 47.0, 43.0, 51.0, 32.0, 26.0, 38.0, 34.0, 14.0, 26.0, 20.0, 12.0, 17.0, 16.0, 7.0, 10.0, 7.0, 6.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.646484375, -2.5726318359375, -2.498779296875, -2.4249267578125, -2.35107421875, -2.2772216796875, -2.203369140625, -2.1295166015625, -2.0556640625, -1.9818115234375, -1.907958984375, -1.8341064453125, -1.76025390625, -1.6864013671875, -1.612548828125, -1.5386962890625, -1.46484375, -1.3909912109375, -1.317138671875, -1.2432861328125, -1.16943359375, -1.0955810546875, -1.021728515625, -0.9478759765625, -0.8740234375, -0.8001708984375, -0.726318359375, -0.6524658203125, -0.57861328125, -0.5047607421875, -0.430908203125, -0.3570556640625, -0.283203125, -0.2093505859375, -0.135498046875, -0.0616455078125, 0.01220703125, 0.0860595703125, 0.159912109375, 0.2337646484375, 0.3076171875, 0.3814697265625, 0.455322265625, 0.5291748046875, 0.60302734375, 0.6768798828125, 0.750732421875, 0.8245849609375, 0.8984375, 0.9722900390625, 1.046142578125, 1.1199951171875, 1.19384765625, 1.2677001953125, 1.341552734375, 1.4154052734375, 1.4892578125, 1.5631103515625, 1.636962890625, 1.7108154296875, 1.78466796875, 1.8585205078125, 1.932373046875, 2.0062255859375, 2.080078125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 7.0, 11.0, 26.0, 23.0, 39.0, 70.0, 110.0, 160.0, 255.0, 354.0, 612.0, 1009.0, 1554.0, 2522.0, 4265.0, 7103.0, 11614.0, 20325.0, 36282.0, 65720.0, 121570.0, 211293.0, 1277478.0, 149742.0, 80383.0, 44400.0, 24601.0, 14130.0, 8389.0, 4950.0, 3010.0, 1829.0, 1257.0, 746.0, 461.0, 305.0, 176.0, 126.0, 77.0, 48.0, 36.0, 23.0, 12.0, 10.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.370361328125, -0.3584785461425781, -0.34659576416015625, -0.3347129821777344, -0.3228302001953125, -0.3109474182128906, -0.29906463623046875, -0.2871818542480469, -0.275299072265625, -0.2634162902832031, -0.25153350830078125, -0.23965072631835938, -0.2277679443359375, -0.21588516235351562, -0.20400238037109375, -0.19211959838867188, -0.18023681640625, -0.16835403442382812, -0.15647125244140625, -0.14458847045898438, -0.1327056884765625, -0.12082290649414062, -0.10894012451171875, -0.09705734252929688, -0.085174560546875, -0.07329177856445312, -0.06140899658203125, -0.049526214599609375, -0.0376434326171875, -0.025760650634765625, -0.01387786865234375, -0.001995086669921875, 0.0098876953125, 0.021770477294921875, 0.03365325927734375, 0.045536041259765625, 0.0574188232421875, 0.06930160522460938, 0.08118438720703125, 0.09306716918945312, 0.104949951171875, 0.11683273315429688, 0.12871551513671875, 0.14059829711914062, 0.1524810791015625, 0.16436386108398438, 0.17624664306640625, 0.18812942504882812, 0.20001220703125, 0.21189498901367188, 0.22377777099609375, 0.23566055297851562, 0.2475433349609375, 0.2594261169433594, 0.27130889892578125, 0.2831916809082031, 0.295074462890625, 0.3069572448730469, 0.31884002685546875, 0.3307228088378906, 0.3426055908203125, 0.3544883728027344, 0.36637115478515625, 0.3782539367675781, 0.39013671875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 8.0, 6.0, 8.0, 11.0, 8.0, 8.0, 14.0, 22.0, 31.0, 47.0, 64.0, 81.0, 91.0, 113.0, 88.0, 104.0, 78.0, 53.0, 48.0, 26.0, 15.0, 17.0, 13.0, 9.0, 5.0, 10.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002483367919921875, -0.0024057626724243164, -0.002328157424926758, -0.0022505521774291992, -0.0021729469299316406, -0.002095341682434082, -0.0020177364349365234, -0.0019401311874389648, -0.0018625259399414062, -0.0017849206924438477, -0.001707315444946289, -0.0016297101974487305, -0.0015521049499511719, -0.0014744997024536133, -0.0013968944549560547, -0.001319289207458496, -0.0012416839599609375, -0.001164078712463379, -0.0010864734649658203, -0.0010088682174682617, -0.0009312629699707031, -0.0008536577224731445, -0.0007760524749755859, -0.0006984472274780273, -0.0006208419799804688, -0.0005432367324829102, -0.00046563148498535156, -0.00038802623748779297, -0.0003104209899902344, -0.00023281574249267578, -0.0001552104949951172, -7.76052474975586e-05, 0.0, 7.76052474975586e-05, 0.0001552104949951172, 0.00023281574249267578, 0.0003104209899902344, 0.00038802623748779297, 0.00046563148498535156, 0.0005432367324829102, 0.0006208419799804688, 0.0006984472274780273, 0.0007760524749755859, 0.0008536577224731445, 0.0009312629699707031, 0.0010088682174682617, 0.0010864734649658203, 0.001164078712463379, 0.0012416839599609375, 0.001319289207458496, 0.0013968944549560547, 0.0014744997024536133, 0.0015521049499511719, 0.0016297101974487305, 0.001707315444946289, 0.0017849206924438477, 0.0018625259399414062, 0.0019401311874389648, 0.0020177364349365234, 0.002095341682434082, 0.0021729469299316406, 0.0022505521774291992, 0.002328157424926758, 0.0024057626724243164, 0.002483367919921875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 2.0, 2.0, 6.0, 10.0, 11.0, 18.0, 17.0, 21.0, 34.0, 25.0, 58.0, 99.0, 184.0, 357.0, 876.0, 1039773.0, 5860.0, 549.0, 222.0, 103.0, 81.0, 58.0, 40.0, 30.0, 17.0, 13.0, 22.0, 12.0, 10.0, 6.0, 5.0, 4.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.057647705078125, -0.0557103157043457, -0.053772926330566406, -0.05183553695678711, -0.04989814758300781, -0.047960758209228516, -0.04602336883544922, -0.04408597946166992, -0.042148590087890625, -0.04021120071411133, -0.03827381134033203, -0.036336421966552734, -0.03439903259277344, -0.03246164321899414, -0.030524253845214844, -0.028586864471435547, -0.02664947509765625, -0.024712085723876953, -0.022774696350097656, -0.02083730697631836, -0.018899917602539062, -0.016962528228759766, -0.015025138854980469, -0.013087749481201172, -0.011150360107421875, -0.009212970733642578, -0.007275581359863281, -0.005338191986083984, -0.0034008026123046875, -0.0014634132385253906, 0.00047397613525390625, 0.002411365509033203, 0.0043487548828125, 0.006286144256591797, 0.008223533630371094, 0.01016092300415039, 0.012098312377929688, 0.014035701751708984, 0.01597309112548828, 0.017910480499267578, 0.019847869873046875, 0.021785259246826172, 0.02372264862060547, 0.025660037994384766, 0.027597427368164062, 0.02953481674194336, 0.031472206115722656, 0.03340959548950195, 0.03534698486328125, 0.03728437423706055, 0.039221763610839844, 0.04115915298461914, 0.04309654235839844, 0.045033931732177734, 0.04697132110595703, 0.04890871047973633, 0.050846099853515625, 0.05278348922729492, 0.05472087860107422, 0.056658267974853516, 0.05859565734863281, 0.06053304672241211, 0.062470436096191406, 0.0644078254699707, 0.06634521484375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1020.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004157747142016888, -0.0025714323855936527, -0.0009851173963397741, 0.0006011975929141045, 0.0021875123493373394, 0.0037738271057605743, 0.005360142327845097, 0.006946456618607044, 0.008532771840691566, 0.010119087062776089, 0.011705401353538036, 0.013291716575622559, 0.014878030866384506, 0.016464345157146454, 0.01805066131055355, 0.0196369756013155, 0.021223291754722595, 0.022809606045484543, 0.02439592219889164, 0.025982236489653587, 0.027568550780415535, 0.029154866933822632, 0.03074118122458458, 0.03232749551534653, 0.033913809806108475, 0.03550012409687042, 0.03708643838763237, 0.03867275267839432, 0.040259070694446564, 0.04184538498520851, 0.04343169927597046, 0.04501801356673241, 0.04660433158278465, 0.0481906458735466, 0.04977696016430855, 0.051363274455070496, 0.05294959247112274, 0.05453590676188469, 0.05612222105264664, 0.057708535343408585, 0.05929484963417053, 0.06088116392493248, 0.06246747821569443, 0.06405379623174667, 0.06564010679721832, 0.06722642481327057, 0.06881274282932281, 0.07039905339479446, 0.07198537141084671, 0.07357168942689896, 0.0751579999923706, 0.07674431800842285, 0.0783306285738945, 0.07991694658994675, 0.0815032571554184, 0.08308957517147064, 0.08467588573694229, 0.08626220375299454, 0.08784851431846619, 0.08943483233451843, 0.09102114289999008, 0.09260746091604233, 0.09419377148151398, 0.09578008949756622, 0.09736640751361847]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 9.0, 13.0, 17.0, 17.0, 25.0, 32.0, 38.0, 59.0, 46.0, 69.0, 64.0, 81.0, 68.0, 65.0, 75.0, 67.0, 54.0, 42.0, 42.0, 28.0, 33.0, 18.0, 16.0, 12.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0023022890090942383, -0.0022492017596960068, -0.0021961145102977753, -0.0021430272608995438, -0.0020899400115013123, -0.0020368527621030807, -0.0019837655127048492, -0.0019306782633066177, -0.0018775910139083862, -0.0018245037645101547, -0.0017714165151119232, -0.0017183292657136917, -0.0016652420163154602, -0.0016121547669172287, -0.0015590675175189972, -0.0015059802681207657, -0.0014528930187225342, -0.0013998057693243027, -0.0013467185199260712, -0.0012936312705278397, -0.0012405440211296082, -0.0011874567717313766, -0.0011343695223331451, -0.0010812822729349136, -0.0010281950235366821, -0.0009751077741384506, -0.0009220205247402191, -0.0008689332753419876, -0.0008158460259437561, -0.0007627587765455246, -0.0007096715271472931, -0.0006565842777490616, -0.0006034970283508301, -0.0005504097789525986, -0.0004973225295543671, -0.00044423528015613556, -0.00039114803075790405, -0.00033806078135967255, -0.00028497353196144104, -0.00023188628256320953, -0.00017879903316497803, -0.00012571178376674652, -7.262453436851501e-05, -1.9537284970283508e-05, 3.3549964427948e-05, 8.66372138261795e-05, 0.000139724463224411, 0.00019281171262264252, 0.000245898962020874, 0.00029898621141910553, 0.00035207346081733704, 0.00040516071021556854, 0.00045824795961380005, 0.0005113352090120316, 0.0005644224584102631, 0.0006175097078084946, 0.0006705969572067261, 0.0007236842066049576, 0.0007767714560031891, 0.0008298587054014206, 0.0008829459547996521, 0.0009360332041978836, 0.0009891204535961151, 0.0010422077029943466, 0.0010952949523925781]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 1.0, 6.0, 3.0, 10.0, 11.0, 9.0, 14.0, 13.0, 14.0, 19.0, 28.0, 26.0, 30.0, 27.0, 32.0, 47.0, 42.0, 43.0, 51.0, 50.0, 67.0, 49.0, 50.0, 45.0, 53.0, 40.0, 35.0, 33.0, 28.0, 25.0, 22.0, 9.0, 22.0, 7.0, 6.0, 11.0, 8.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.49609375, -4.37762451171875, -4.2591552734375, -4.14068603515625, -4.022216796875, -3.90374755859375, -3.7852783203125, -3.66680908203125, -3.54833984375, -3.42987060546875, -3.3114013671875, -3.19293212890625, -3.074462890625, -2.95599365234375, -2.8375244140625, -2.71905517578125, -2.6005859375, -2.48211669921875, -2.3636474609375, -2.24517822265625, -2.126708984375, -2.00823974609375, -1.8897705078125, -1.77130126953125, -1.65283203125, -1.53436279296875, -1.4158935546875, -1.29742431640625, -1.178955078125, -1.06048583984375, -0.9420166015625, -0.82354736328125, -0.705078125, -0.58660888671875, -0.4681396484375, -0.34967041015625, -0.231201171875, -0.11273193359375, 0.0057373046875, 0.12420654296875, 0.24267578125, 0.36114501953125, 0.4796142578125, 0.59808349609375, 0.716552734375, 0.83502197265625, 0.9534912109375, 1.07196044921875, 1.1904296875, 1.30889892578125, 1.4273681640625, 1.54583740234375, 1.664306640625, 1.78277587890625, 1.9012451171875, 2.01971435546875, 2.13818359375, 2.25665283203125, 2.3751220703125, 2.49359130859375, 2.612060546875, 2.73052978515625, 2.8489990234375, 2.96746826171875, 3.0859375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 8.0, 8.0, 5.0, 16.0, 34.0, 34.0, 58.0, 69.0, 99.0, 139.0, 255.0, 349.0, 672.0, 1421.0, 3299.0, 9388.0, 31628.0, 124581.0, 467862.0, 304425.0, 73147.0, 19804.0, 6328.0, 2432.0, 1048.0, 542.0, 305.0, 187.0, 118.0, 79.0, 63.0, 52.0, 32.0, 21.0, 11.0, 14.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.59375, -4.4617919921875, -4.329833984375, -4.1978759765625, -4.06591796875, -3.9339599609375, -3.802001953125, -3.6700439453125, -3.5380859375, -3.4061279296875, -3.274169921875, -3.1422119140625, -3.01025390625, -2.8782958984375, -2.746337890625, -2.6143798828125, -2.482421875, -2.3504638671875, -2.218505859375, -2.0865478515625, -1.95458984375, -1.8226318359375, -1.690673828125, -1.5587158203125, -1.4267578125, -1.2947998046875, -1.162841796875, -1.0308837890625, -0.89892578125, -0.7669677734375, -0.635009765625, -0.5030517578125, -0.37109375, -0.2391357421875, -0.107177734375, 0.0247802734375, 0.15673828125, 0.2886962890625, 0.420654296875, 0.5526123046875, 0.6845703125, 0.8165283203125, 0.948486328125, 1.0804443359375, 1.21240234375, 1.3443603515625, 1.476318359375, 1.6082763671875, 1.740234375, 1.8721923828125, 2.004150390625, 2.1361083984375, 2.26806640625, 2.4000244140625, 2.531982421875, 2.6639404296875, 2.7958984375, 2.9278564453125, 3.059814453125, 3.1917724609375, 3.32373046875, 3.4556884765625, 3.587646484375, 3.7196044921875, 3.8515625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 4.0, 14.0, 6.0, 5.0, 8.0, 9.0, 20.0, 14.0, 14.0, 21.0, 27.0, 30.0, 24.0, 39.0, 33.0, 30.0, 48.0, 50.0, 76.0, 133.0, 1613.0, 322.0, 86.0, 37.0, 33.0, 41.0, 40.0, 30.0, 27.0, 24.0, 25.0, 23.0, 23.0, 19.0, 19.0, 19.0, 8.0, 13.0, 10.0, 5.0, 5.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-11.375, -11.0380859375, -10.701171875, -10.3642578125, -10.02734375, -9.6904296875, -9.353515625, -9.0166015625, -8.6796875, -8.3427734375, -8.005859375, -7.6689453125, -7.33203125, -6.9951171875, -6.658203125, -6.3212890625, -5.984375, -5.6474609375, -5.310546875, -4.9736328125, -4.63671875, -4.2998046875, -3.962890625, -3.6259765625, -3.2890625, -2.9521484375, -2.615234375, -2.2783203125, -1.94140625, -1.6044921875, -1.267578125, -0.9306640625, -0.59375, -0.2568359375, 0.080078125, 0.4169921875, 0.75390625, 1.0908203125, 1.427734375, 1.7646484375, 2.1015625, 2.4384765625, 2.775390625, 3.1123046875, 3.44921875, 3.7861328125, 4.123046875, 4.4599609375, 4.796875, 5.1337890625, 5.470703125, 5.8076171875, 6.14453125, 6.4814453125, 6.818359375, 7.1552734375, 7.4921875, 7.8291015625, 8.166015625, 8.5029296875, 8.83984375, 9.1767578125, 9.513671875, 9.8505859375, 10.1875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 10.0, 7.0, 13.0, 8.0, 18.0, 20.0, 24.0, 12.0, 27.0, 23.0, 34.0, 42.0, 49.0, 79.0, 109.0, 149.0, 359.0, 1111.0, 17289.0, 3096045.0, 27944.0, 1233.0, 394.0, 194.0, 111.0, 77.0, 51.0, 49.0, 27.0, 32.0, 24.0, 28.0, 12.0, 20.0, 10.0, 10.0, 8.0, 5.0, 8.0, 8.0, 7.0, 4.0, 2.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-21.890625, -21.149658203125, -20.40869140625, -19.667724609375, -18.9267578125, -18.185791015625, -17.44482421875, -16.703857421875, -15.962890625, -15.221923828125, -14.48095703125, -13.739990234375, -12.9990234375, -12.258056640625, -11.51708984375, -10.776123046875, -10.03515625, -9.294189453125, -8.55322265625, -7.812255859375, -7.0712890625, -6.330322265625, -5.58935546875, -4.848388671875, -4.107421875, -3.366455078125, -2.62548828125, -1.884521484375, -1.1435546875, -0.402587890625, 0.33837890625, 1.079345703125, 1.8203125, 2.561279296875, 3.30224609375, 4.043212890625, 4.7841796875, 5.525146484375, 6.26611328125, 7.007080078125, 7.748046875, 8.489013671875, 9.22998046875, 9.970947265625, 10.7119140625, 11.452880859375, 12.19384765625, 12.934814453125, 13.67578125, 14.416748046875, 15.15771484375, 15.898681640625, 16.6396484375, 17.380615234375, 18.12158203125, 18.862548828125, 19.603515625, 20.344482421875, 21.08544921875, 21.826416015625, 22.5673828125, 23.308349609375, 24.04931640625, 24.790283203125, 25.53125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 12.0, 286.0, 639.0, 77.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.906078338623047, -4.106780052185059, -2.307481288909912, -0.5081825256347656, 1.2911157608032227, 3.090414047241211, 4.889713287353516, 6.689011573791504, 8.488309860229492, 10.28760814666748, 12.086906433105469, 13.886205673217773, 15.685503959655762, 17.48480224609375, 19.284101486206055, 21.08340072631836, 22.88269805908203, 24.681997299194336, 26.481294631958008, 28.280593872070312, 30.079891204833984, 31.87919044494629, 33.678489685058594, 35.477787017822266, 37.27708435058594, 39.07638168334961, 40.87568283081055, 42.67498016357422, 44.47427749633789, 46.27357482910156, 48.0728759765625, 49.87217330932617, 51.671478271484375, 53.47077560424805, 55.270076751708984, 57.069374084472656, 58.86867141723633, 60.66796875, 62.46726989746094, 64.26657104492188, 66.06586456298828, 67.86516571044922, 69.66445922851562, 71.46376037597656, 73.2630615234375, 75.0623550415039, 76.86165618896484, 78.66095733642578, 80.46025085449219, 82.25955200195312, 84.05884552001953, 85.85814666748047, 87.6574478149414, 89.45674133300781, 91.25604248046875, 93.05534362792969, 94.85464477539062, 96.65394592285156, 98.45323944091797, 100.2525405883789, 102.05184173583984, 103.85113525390625, 105.65043640136719, 107.44973754882812, 109.24903106689453]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 9.0, 7.0, 10.0, 15.0, 14.0, 22.0, 24.0, 31.0, 33.0, 39.0, 34.0, 44.0, 25.0, 46.0, 41.0, 35.0, 50.0, 44.0, 45.0, 44.0, 45.0, 45.0, 33.0, 37.0, 31.0, 20.0, 25.0, 19.0, 23.0, 20.0, 23.0, 9.0, 10.0, 8.0, 8.0, 6.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.88740921020508, -36.67438507080078, -35.461360931396484, -34.24833679199219, -33.03531265258789, -31.822288513183594, -30.609264373779297, -29.396240234375, -28.183216094970703, -26.970191955566406, -25.75716781616211, -24.544143676757812, -23.331119537353516, -22.11809539794922, -20.905071258544922, -19.692047119140625, -18.479022979736328, -17.26599884033203, -16.052974700927734, -14.839950561523438, -13.62692642211914, -12.413902282714844, -11.200878143310547, -9.98785400390625, -8.774829864501953, -7.561805725097656, -6.348781585693359, -5.1357574462890625, -3.9227333068847656, -2.7097091674804688, -1.4966850280761719, -0.283660888671875, 0.9293594360351562, 2.142383575439453, 3.35540771484375, 4.568431854248047, 5.781455993652344, 6.994480133056641, 8.207504272460938, 9.420528411865234, 10.633552551269531, 11.846576690673828, 13.059600830078125, 14.272624969482422, 15.485649108886719, 16.698673248291016, 17.911697387695312, 19.12472152709961, 20.337745666503906, 21.550769805908203, 22.7637939453125, 23.976818084716797, 25.189842224121094, 26.40286636352539, 27.615890502929688, 28.828914642333984, 30.04193878173828, 31.254962921142578, 32.467987060546875, 33.68101119995117, 34.89403533935547, 36.107059478759766, 37.32008361816406, 38.53310775756836, 39.746131896972656]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 4.0, 8.0, 11.0, 7.0, 11.0, 17.0, 14.0, 16.0, 18.0, 32.0, 30.0, 33.0, 24.0, 45.0, 41.0, 48.0, 38.0, 53.0, 61.0, 53.0, 51.0, 50.0, 50.0, 37.0, 36.0, 37.0, 33.0, 31.0, 15.0, 17.0, 13.0, 16.0, 4.0, 11.0, 8.0, 9.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.5, -4.3792724609375, -4.258544921875, -4.1378173828125, -4.01708984375, -3.8963623046875, -3.775634765625, -3.6549072265625, -3.5341796875, -3.4134521484375, -3.292724609375, -3.1719970703125, -3.05126953125, -2.9305419921875, -2.809814453125, -2.6890869140625, -2.568359375, -2.4476318359375, -2.326904296875, -2.2061767578125, -2.08544921875, -1.9647216796875, -1.843994140625, -1.7232666015625, -1.6025390625, -1.4818115234375, -1.361083984375, -1.2403564453125, -1.11962890625, -0.9989013671875, -0.878173828125, -0.7574462890625, -0.63671875, -0.5159912109375, -0.395263671875, -0.2745361328125, -0.15380859375, -0.0330810546875, 0.087646484375, 0.2083740234375, 0.3291015625, 0.4498291015625, 0.570556640625, 0.6912841796875, 0.81201171875, 0.9327392578125, 1.053466796875, 1.1741943359375, 1.294921875, 1.4156494140625, 1.536376953125, 1.6571044921875, 1.77783203125, 1.8985595703125, 2.019287109375, 2.1400146484375, 2.2607421875, 2.3814697265625, 2.502197265625, 2.6229248046875, 2.74365234375, 2.8643798828125, 2.985107421875, 3.1058349609375, 3.2265625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 1.0, 5.0, 9.0, 11.0, 16.0, 10.0, 13.0, 17.0, 20.0, 35.0, 54.0, 70.0, 94.0, 135.0, 255.0, 438.0, 1143.0, 4768.0, 33193.0, 520498.0, 3229445.0, 371754.0, 26251.0, 3902.0, 1009.0, 466.0, 229.0, 133.0, 87.0, 61.0, 41.0, 29.0, 15.0, 20.0, 18.0, 14.0, 7.0, 5.0, 6.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-15.2734375, -14.8543701171875, -14.435302734375, -14.0162353515625, -13.59716796875, -13.1781005859375, -12.759033203125, -12.3399658203125, -11.9208984375, -11.5018310546875, -11.082763671875, -10.6636962890625, -10.24462890625, -9.8255615234375, -9.406494140625, -8.9874267578125, -8.568359375, -8.1492919921875, -7.730224609375, -7.3111572265625, -6.89208984375, -6.4730224609375, -6.053955078125, -5.6348876953125, -5.2158203125, -4.7967529296875, -4.377685546875, -3.9586181640625, -3.53955078125, -3.1204833984375, -2.701416015625, -2.2823486328125, -1.86328125, -1.4442138671875, -1.025146484375, -0.6060791015625, -0.18701171875, 0.2320556640625, 0.651123046875, 1.0701904296875, 1.4892578125, 1.9083251953125, 2.327392578125, 2.7464599609375, 3.16552734375, 3.5845947265625, 4.003662109375, 4.4227294921875, 4.841796875, 5.2608642578125, 5.679931640625, 6.0989990234375, 6.51806640625, 6.9371337890625, 7.356201171875, 7.7752685546875, 8.1943359375, 8.6134033203125, 9.032470703125, 9.4515380859375, 9.87060546875, 10.2896728515625, 10.708740234375, 11.1278076171875, 11.546875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 4.0, 7.0, 19.0, 20.0, 35.0, 39.0, 83.0, 124.0, 179.0, 270.0, 474.0, 672.0, 685.0, 511.0, 330.0, 219.0, 139.0, 88.0, 76.0, 39.0, 20.0, 20.0, 12.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.78125, -18.231201171875, -17.68115234375, -17.131103515625, -16.5810546875, -16.031005859375, -15.48095703125, -14.930908203125, -14.380859375, -13.830810546875, -13.28076171875, -12.730712890625, -12.1806640625, -11.630615234375, -11.08056640625, -10.530517578125, -9.98046875, -9.430419921875, -8.88037109375, -8.330322265625, -7.7802734375, -7.230224609375, -6.68017578125, -6.130126953125, -5.580078125, -5.030029296875, -4.47998046875, -3.929931640625, -3.3798828125, -2.829833984375, -2.27978515625, -1.729736328125, -1.1796875, -0.629638671875, -0.07958984375, 0.470458984375, 1.0205078125, 1.570556640625, 2.12060546875, 2.670654296875, 3.220703125, 3.770751953125, 4.32080078125, 4.870849609375, 5.4208984375, 5.970947265625, 6.52099609375, 7.071044921875, 7.62109375, 8.171142578125, 8.72119140625, 9.271240234375, 9.8212890625, 10.371337890625, 10.92138671875, 11.471435546875, 12.021484375, 12.571533203125, 13.12158203125, 13.671630859375, 14.2216796875, 14.771728515625, 15.32177734375, 15.871826171875, 16.421875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 11.0, 15.0, 18.0, 31.0, 38.0, 63.0, 100.0, 157.0, 279.0, 422.0, 982.0, 4997.0, 154571.0, 3914460.0, 111998.0, 4081.0, 984.0, 412.0, 219.0, 138.0, 98.0, 64.0, 43.0, 24.0, 24.0, 12.0, 10.0, 5.0, 11.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.53125, -27.26123046875, -25.9912109375, -24.72119140625, -23.451171875, -22.18115234375, -20.9111328125, -19.64111328125, -18.37109375, -17.10107421875, -15.8310546875, -14.56103515625, -13.291015625, -12.02099609375, -10.7509765625, -9.48095703125, -8.2109375, -6.94091796875, -5.6708984375, -4.40087890625, -3.130859375, -1.86083984375, -0.5908203125, 0.67919921875, 1.94921875, 3.21923828125, 4.4892578125, 5.75927734375, 7.029296875, 8.29931640625, 9.5693359375, 10.83935546875, 12.109375, 13.37939453125, 14.6494140625, 15.91943359375, 17.189453125, 18.45947265625, 19.7294921875, 20.99951171875, 22.26953125, 23.53955078125, 24.8095703125, 26.07958984375, 27.349609375, 28.61962890625, 29.8896484375, 31.15966796875, 32.4296875, 33.69970703125, 34.9697265625, 36.23974609375, 37.509765625, 38.77978515625, 40.0498046875, 41.31982421875, 42.58984375, 43.85986328125, 45.1298828125, 46.39990234375, 47.669921875, 48.93994140625, 50.2099609375, 51.47998046875, 52.75]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 78.0, 507.0, 393.0, 35.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-412.53875732421875, -405.15386962890625, -397.7689514160156, -390.3840637207031, -382.9991760253906, -375.6142578125, -368.2293701171875, -360.844482421875, -353.4595947265625, -346.07470703125, -338.6897888183594, -331.3049011230469, -323.9200134277344, -316.53509521484375, -309.15020751953125, -301.76531982421875, -294.3804016113281, -286.9955139160156, -279.610595703125, -272.2257080078125, -264.8408203125, -257.4559326171875, -250.07101440429688, -242.68612670898438, -235.30123901367188, -227.9163360595703, -220.5314483642578, -213.14654541015625, -205.76165771484375, -198.3767547607422, -190.99185180664062, -183.60696411132812, -176.22206115722656, -168.837158203125, -161.4522705078125, -154.06736755371094, -146.68247985839844, -139.29757690429688, -131.91268920898438, -124.52778625488281, -117.14288330078125, -109.75798797607422, -102.37309265136719, -94.98818969726562, -87.6032943725586, -80.21839904785156, -72.83350372314453, -65.4486083984375, -58.0637092590332, -50.67881393432617, -43.293914794921875, -35.909019470214844, -28.52412223815918, -21.139225006103516, -13.754329681396484, -6.3694305419921875, 1.0154647827148438, 8.400362014770508, 15.785258293151855, 23.170154571533203, 30.555051803588867, 37.93994903564453, 45.32484436035156, 52.70974349975586, 60.09463882446289]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 7.0, 9.0, 9.0, 8.0, 12.0, 10.0, 21.0, 19.0, 21.0, 21.0, 25.0, 29.0, 21.0, 32.0, 23.0, 30.0, 26.0, 32.0, 34.0, 30.0, 38.0, 40.0, 45.0, 22.0, 43.0, 25.0, 26.0, 39.0, 34.0, 36.0, 27.0, 23.0, 19.0, 20.0, 18.0, 25.0, 20.0, 10.0, 11.0, 12.0, 15.0, 9.0, 5.0, 10.0, 6.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-36.43756103515625, -35.34339904785156, -34.249237060546875, -33.15507507324219, -32.0609130859375, -30.96674919128418, -29.87258529663086, -28.778423309326172, -27.684261322021484, -26.590099334716797, -25.49593734741211, -24.40177345275879, -23.3076114654541, -22.213449478149414, -21.119285583496094, -20.025123596191406, -18.93096160888672, -17.83679962158203, -16.742637634277344, -15.648473739624023, -14.554311752319336, -13.460149765014648, -12.365986824035645, -11.27182388305664, -10.177661895751953, -9.083499908447266, -7.989336967468262, -6.895174503326416, -5.80101203918457, -4.706849575042725, -3.612687110900879, -2.518524646759033, -1.4243621826171875, -0.3301997184753418, 0.7639627456665039, 1.8581252098083496, 2.9522876739501953, 4.046450138092041, 5.140612602233887, 6.234775066375732, 7.328937530517578, 8.423099517822266, 9.51726245880127, 10.611425399780273, 11.705587387084961, 12.799749374389648, 13.893912315368652, 14.988075256347656, 16.082237243652344, 17.17639923095703, 18.27056121826172, 19.36472511291504, 20.458887100219727, 21.553049087524414, 22.647212982177734, 23.741374969482422, 24.83553695678711, 25.929698944091797, 27.023860931396484, 28.118024826049805, 29.212186813354492, 30.30634880065918, 31.4005126953125, 32.49467468261719, 33.588836669921875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 7.0, 6.0, 6.0, 15.0, 15.0, 10.0, 22.0, 25.0, 17.0, 36.0, 39.0, 36.0, 26.0, 42.0, 44.0, 50.0, 46.0, 54.0, 47.0, 55.0, 52.0, 44.0, 60.0, 34.0, 35.0, 22.0, 29.0, 21.0, 23.0, 13.0, 14.0, 12.0, 5.0, 7.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1640625, -4.0396728515625, -3.915283203125, -3.7908935546875, -3.66650390625, -3.5421142578125, -3.417724609375, -3.2933349609375, -3.1689453125, -3.0445556640625, -2.920166015625, -2.7957763671875, -2.67138671875, -2.5469970703125, -2.422607421875, -2.2982177734375, -2.173828125, -2.0494384765625, -1.925048828125, -1.8006591796875, -1.67626953125, -1.5518798828125, -1.427490234375, -1.3031005859375, -1.1787109375, -1.0543212890625, -0.929931640625, -0.8055419921875, -0.68115234375, -0.5567626953125, -0.432373046875, -0.3079833984375, -0.18359375, -0.0592041015625, 0.065185546875, 0.1895751953125, 0.31396484375, 0.4383544921875, 0.562744140625, 0.6871337890625, 0.8115234375, 0.9359130859375, 1.060302734375, 1.1846923828125, 1.30908203125, 1.4334716796875, 1.557861328125, 1.6822509765625, 1.806640625, 1.9310302734375, 2.055419921875, 2.1798095703125, 2.30419921875, 2.4285888671875, 2.552978515625, 2.6773681640625, 2.8017578125, 2.9261474609375, 3.050537109375, 3.1749267578125, 3.29931640625, 3.4237060546875, 3.548095703125, 3.6724853515625, 3.796875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 11.0, 14.0, 30.0, 34.0, 63.0, 97.0, 141.0, 241.0, 382.0, 612.0, 990.0, 1695.0, 3017.0, 5315.0, 9535.0, 17028.0, 30665.0, 56246.0, 111574.0, 234081.0, 281938.0, 141184.0, 69616.0, 36973.0, 20440.0, 11320.0, 6560.0, 3609.0, 2145.0, 1162.0, 664.0, 464.0, 251.0, 163.0, 94.0, 56.0, 45.0, 36.0, 22.0, 14.0, 10.0, 6.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.68408203125, -0.6634521484375, -0.642822265625, -0.6221923828125, -0.6015625, -0.5809326171875, -0.560302734375, -0.5396728515625, -0.51904296875, -0.4984130859375, -0.477783203125, -0.4571533203125, -0.4365234375, -0.4158935546875, -0.395263671875, -0.3746337890625, -0.35400390625, -0.3333740234375, -0.312744140625, -0.2921142578125, -0.271484375, -0.2508544921875, -0.230224609375, -0.2095947265625, -0.18896484375, -0.1683349609375, -0.147705078125, -0.1270751953125, -0.1064453125, -0.0858154296875, -0.065185546875, -0.0445556640625, -0.02392578125, -0.0032958984375, 0.017333984375, 0.0379638671875, 0.05859375, 0.0792236328125, 0.099853515625, 0.1204833984375, 0.14111328125, 0.1617431640625, 0.182373046875, 0.2030029296875, 0.2236328125, 0.2442626953125, 0.264892578125, 0.2855224609375, 0.30615234375, 0.3267822265625, 0.347412109375, 0.3680419921875, 0.388671875, 0.4093017578125, 0.429931640625, 0.4505615234375, 0.47119140625, 0.4918212890625, 0.512451171875, 0.5330810546875, 0.5537109375, 0.5743408203125, 0.594970703125, 0.6156005859375, 0.63623046875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 9.0, 11.0, 9.0, 14.0, 18.0, 15.0, 17.0, 22.0, 19.0, 25.0, 39.0, 42.0, 35.0, 41.0, 31.0, 41.0, 33.0, 31.0, 1063.0, 39.0, 41.0, 45.0, 35.0, 40.0, 41.0, 27.0, 32.0, 24.0, 30.0, 17.0, 19.0, 15.0, 17.0, 18.0, 12.0, 10.0, 13.0, 10.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.140625, -2.070465087890625, -2.00030517578125, -1.930145263671875, -1.8599853515625, -1.789825439453125, -1.71966552734375, -1.649505615234375, -1.579345703125, -1.509185791015625, -1.43902587890625, -1.368865966796875, -1.2987060546875, -1.228546142578125, -1.15838623046875, -1.088226318359375, -1.01806640625, -0.947906494140625, -0.87774658203125, -0.807586669921875, -0.7374267578125, -0.667266845703125, -0.59710693359375, -0.526947021484375, -0.456787109375, -0.386627197265625, -0.31646728515625, -0.246307373046875, -0.1761474609375, -0.105987548828125, -0.03582763671875, 0.034332275390625, 0.1044921875, 0.174652099609375, 0.24481201171875, 0.314971923828125, 0.3851318359375, 0.455291748046875, 0.52545166015625, 0.595611572265625, 0.665771484375, 0.735931396484375, 0.80609130859375, 0.876251220703125, 0.9464111328125, 1.016571044921875, 1.08673095703125, 1.156890869140625, 1.22705078125, 1.297210693359375, 1.36737060546875, 1.437530517578125, 1.5076904296875, 1.577850341796875, 1.64801025390625, 1.718170166015625, 1.788330078125, 1.858489990234375, 1.92864990234375, 1.998809814453125, 2.0689697265625, 2.139129638671875, 2.20928955078125, 2.279449462890625, 2.349609375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 5.0, 5.0, 10.0, 22.0, 18.0, 41.0, 60.0, 101.0, 125.0, 209.0, 337.0, 533.0, 921.0, 1533.0, 2631.0, 4345.0, 7707.0, 13837.0, 24416.0, 45091.0, 85555.0, 166151.0, 1307196.0, 203635.0, 107578.0, 55908.0, 29741.0, 16629.0, 9448.0, 5511.0, 3094.0, 1856.0, 1139.0, 646.0, 405.0, 255.0, 151.0, 95.0, 68.0, 43.0, 21.0, 22.0, 16.0, 9.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.462890625, -0.4491424560546875, -0.435394287109375, -0.4216461181640625, -0.40789794921875, -0.3941497802734375, -0.380401611328125, -0.3666534423828125, -0.3529052734375, -0.3391571044921875, -0.325408935546875, -0.3116607666015625, -0.29791259765625, -0.2841644287109375, -0.270416259765625, -0.2566680908203125, -0.242919921875, -0.2291717529296875, -0.215423583984375, -0.2016754150390625, -0.18792724609375, -0.1741790771484375, -0.160430908203125, -0.1466827392578125, -0.1329345703125, -0.1191864013671875, -0.105438232421875, -0.0916900634765625, -0.07794189453125, -0.0641937255859375, -0.050445556640625, -0.0366973876953125, -0.02294921875, -0.0092010498046875, 0.004547119140625, 0.0182952880859375, 0.03204345703125, 0.0457916259765625, 0.059539794921875, 0.0732879638671875, 0.0870361328125, 0.1007843017578125, 0.114532470703125, 0.1282806396484375, 0.14202880859375, 0.1557769775390625, 0.169525146484375, 0.1832733154296875, 0.197021484375, 0.2107696533203125, 0.224517822265625, 0.2382659912109375, 0.25201416015625, 0.2657623291015625, 0.279510498046875, 0.2932586669921875, 0.3070068359375, 0.3207550048828125, 0.334503173828125, 0.3482513427734375, 0.36199951171875, 0.3757476806640625, 0.389495849609375, 0.4032440185546875, 0.4169921875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 14.0, 10.0, 17.0, 13.0, 24.0, 20.0, 42.0, 35.0, 49.0, 58.0, 101.0, 94.0, 98.0, 93.0, 76.0, 62.0, 41.0, 21.0, 22.0, 19.0, 18.0, 11.0, 8.0, 12.0, 3.0, 5.0, 4.0, 8.0, 0.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0033397674560546875, -0.0032536983489990234, -0.0031676292419433594, -0.0030815601348876953, -0.0029954910278320312, -0.002909421920776367, -0.002823352813720703, -0.002737283706665039, -0.002651214599609375, -0.002565145492553711, -0.002479076385498047, -0.002393007278442383, -0.0023069381713867188, -0.0022208690643310547, -0.0021347999572753906, -0.0020487308502197266, -0.0019626617431640625, -0.0018765926361083984, -0.0017905235290527344, -0.0017044544219970703, -0.0016183853149414062, -0.0015323162078857422, -0.0014462471008300781, -0.001360177993774414, -0.00127410888671875, -0.001188039779663086, -0.0011019706726074219, -0.0010159015655517578, -0.0009298324584960938, -0.0008437633514404297, -0.0007576942443847656, -0.0006716251373291016, -0.0005855560302734375, -0.0004994869232177734, -0.0004134178161621094, -0.0003273487091064453, -0.00024127960205078125, -0.0001552104949951172, -6.914138793945312e-05, 1.6927719116210938e-05, 0.000102996826171875, 0.00018906593322753906, 0.0002751350402832031, 0.0003612041473388672, 0.00044727325439453125, 0.0005333423614501953, 0.0006194114685058594, 0.0007054805755615234, 0.0007915496826171875, 0.0008776187896728516, 0.0009636878967285156, 0.0010497570037841797, 0.0011358261108398438, 0.0012218952178955078, 0.0013079643249511719, 0.001394033432006836, 0.0014801025390625, 0.001566171646118164, 0.0016522407531738281, 0.0017383098602294922, 0.0018243789672851562, 0.0019104480743408203, 0.0019965171813964844, 0.0020825862884521484, 0.0021686553955078125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 9.0, 11.0, 9.0, 20.0, 15.0, 21.0, 27.0, 35.0, 67.0, 104.0, 215.0, 367.0, 1204.0, 1042886.0, 2535.0, 474.0, 175.0, 102.0, 67.0, 46.0, 30.0, 28.0, 13.0, 15.0, 18.0, 10.0, 8.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05743408203125, -0.05527687072753906, -0.053119659423828125, -0.05096244812011719, -0.04880523681640625, -0.04664802551269531, -0.044490814208984375, -0.04233360290527344, -0.0401763916015625, -0.03801918029785156, -0.035861968994140625, -0.03370475769042969, -0.03154754638671875, -0.029390335083007812, -0.027233123779296875, -0.025075912475585938, -0.022918701171875, -0.020761489868164062, -0.018604278564453125, -0.016447067260742188, -0.01428985595703125, -0.012132644653320312, -0.009975433349609375, -0.007818222045898438, -0.0056610107421875, -0.0035037994384765625, -0.001346588134765625, 0.0008106231689453125, 0.00296783447265625, 0.0051250457763671875, 0.007282257080078125, 0.009439468383789062, 0.0115966796875, 0.013753890991210938, 0.015911102294921875, 0.018068313598632812, 0.02022552490234375, 0.022382736206054688, 0.024539947509765625, 0.026697158813476562, 0.0288543701171875, 0.031011581420898438, 0.033168792724609375, 0.03532600402832031, 0.03748321533203125, 0.03964042663574219, 0.041797637939453125, 0.04395484924316406, 0.046112060546875, 0.04826927185058594, 0.050426483154296875, 0.05258369445800781, 0.05474090576171875, 0.05689811706542969, 0.059055328369140625, 0.06121253967285156, 0.0633697509765625, 0.06552696228027344, 0.06768417358398438, 0.06984138488769531, 0.07199859619140625, 0.07415580749511719, 0.07631301879882812, 0.07847023010253906, 0.08062744140625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1018.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006074903532862663, -0.0038381684571504593, -0.0016014333814382553, 0.0006353016942739487, 0.0028720367699861526, 0.005108771845698357, 0.007345506921410561, 0.009582241997122765, 0.011818977072834969, 0.014055712148547173, 0.016292447224259377, 0.01852918229997158, 0.020765917375683784, 0.02300265245139599, 0.025239387527108192, 0.027476122602820396, 0.0297128576785326, 0.031949594616889954, 0.03418632596731186, 0.03642306476831436, 0.03865979611873627, 0.04089653491973877, 0.043133266270160675, 0.04537000507116318, 0.04760673642158508, 0.04984347149729729, 0.05208020657300949, 0.054316941648721695, 0.0565536767244339, 0.0587904118001461, 0.06102714687585831, 0.06326387822628021, 0.06550061702728271, 0.06773735582828522, 0.06997408717870712, 0.07221081852912903, 0.07444755733013153, 0.07668429613113403, 0.07892102748155594, 0.08115775883197784, 0.08339449763298035, 0.08563123643398285, 0.08786796778440475, 0.09010469913482666, 0.09234143793582916, 0.09457817673683167, 0.09681490808725357, 0.09905163943767548, 0.10128837823867798, 0.10352511703968048, 0.10576184839010239, 0.10799857974052429, 0.1102353185415268, 0.1124720573425293, 0.1147087886929512, 0.11694552004337311, 0.11918225884437561, 0.12141899764537811, 0.12365572899580002, 0.12589246034622192, 0.12812919914722443, 0.13036593794822693, 0.13260266184806824, 0.13483940064907074, 0.13707613945007324]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 18.0, 24.0, 39.0, 46.0, 55.0, 53.0, 75.0, 91.0, 92.0, 85.0, 77.0, 86.0, 82.0, 57.0, 41.0, 39.0, 18.0, 13.0, 7.0, 6.0, 2.0, 2.0], "bins": [-0.0042359232902526855, -0.0041525838896632195, -0.004069244489073753, -0.003985905088484287, -0.003902565687894821, -0.003819226287305355, -0.003735886886715889, -0.003652547486126423, -0.003569208085536957, -0.0034858686849474907, -0.0034025292843580246, -0.0033191898837685585, -0.0032358504831790924, -0.0031525110825896263, -0.0030691716820001602, -0.002985832281410694, -0.002902492880821228, -0.002819153480231762, -0.002735814079642296, -0.0026524746790528297, -0.0025691352784633636, -0.0024857958778738976, -0.0024024564772844315, -0.0023191170766949654, -0.0022357776761054993, -0.002152438275516033, -0.002069098874926567, -0.001985759474337101, -0.0019024200737476349, -0.0018190806731581688, -0.0017357412725687027, -0.0016524018719792366, -0.0015690624713897705, -0.0014857230708003044, -0.0014023836702108383, -0.0013190442696213722, -0.0012357048690319061, -0.00115236546844244, -0.001069026067852974, -0.0009856866672635078, -0.0009023472666740417, -0.0008190078660845757, -0.0007356684654951096, -0.0006523290649056435, -0.0005689896643161774, -0.0004856502637267113, -0.0004023108631372452, -0.0003189714625477791, -0.000235632061958313, -0.0001522926613688469, -6.89532607793808e-05, 1.4386139810085297e-05, 9.772554039955139e-05, 0.0001810649409890175, 0.0002644043415784836, 0.0003477437421679497, 0.00043108314275741577, 0.0005144225433468819, 0.000597761943936348, 0.0006811013445258141, 0.0007644407451152802, 0.0008477801457047462, 0.0009311195462942123, 0.0010144589468836784, 0.0010977983474731445]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 7.0, 6.0, 6.0, 15.0, 15.0, 10.0, 22.0, 25.0, 17.0, 36.0, 39.0, 36.0, 26.0, 42.0, 44.0, 50.0, 46.0, 54.0, 47.0, 55.0, 52.0, 44.0, 60.0, 34.0, 35.0, 22.0, 29.0, 21.0, 23.0, 13.0, 14.0, 12.0, 5.0, 7.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1640625, -4.0396728515625, -3.915283203125, -3.7908935546875, -3.66650390625, -3.5421142578125, -3.417724609375, -3.2933349609375, -3.1689453125, -3.0445556640625, -2.920166015625, -2.7957763671875, -2.67138671875, -2.5469970703125, -2.422607421875, -2.2982177734375, -2.173828125, -2.0494384765625, -1.925048828125, -1.8006591796875, -1.67626953125, -1.5518798828125, -1.427490234375, -1.3031005859375, -1.1787109375, -1.0543212890625, -0.929931640625, -0.8055419921875, -0.68115234375, -0.5567626953125, -0.432373046875, -0.3079833984375, -0.18359375, -0.0592041015625, 0.065185546875, 0.1895751953125, 0.31396484375, 0.4383544921875, 0.562744140625, 0.6871337890625, 0.8115234375, 0.9359130859375, 1.060302734375, 1.1846923828125, 1.30908203125, 1.4334716796875, 1.557861328125, 1.6822509765625, 1.806640625, 1.9310302734375, 2.055419921875, 2.1798095703125, 2.30419921875, 2.4285888671875, 2.552978515625, 2.6773681640625, 2.8017578125, 2.9261474609375, 3.050537109375, 3.1749267578125, 3.29931640625, 3.4237060546875, 3.548095703125, 3.6724853515625, 3.796875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 12.0, 11.0, 11.0, 28.0, 33.0, 42.0, 60.0, 86.0, 133.0, 215.0, 288.0, 488.0, 705.0, 1101.0, 1927.0, 3386.0, 6268.0, 12189.0, 25005.0, 59744.0, 172050.0, 439991.0, 199976.0, 67673.0, 27935.0, 13191.0, 6851.0, 3643.0, 2068.0, 1201.0, 792.0, 476.0, 313.0, 194.0, 147.0, 78.0, 76.0, 58.0, 32.0, 25.0, 16.0, 12.0, 1.0, 3.0, 1.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.830078125, -2.74041748046875, -2.6507568359375, -2.56109619140625, -2.471435546875, -2.38177490234375, -2.2921142578125, -2.20245361328125, -2.11279296875, -2.02313232421875, -1.9334716796875, -1.84381103515625, -1.754150390625, -1.66448974609375, -1.5748291015625, -1.48516845703125, -1.3955078125, -1.30584716796875, -1.2161865234375, -1.12652587890625, -1.036865234375, -0.94720458984375, -0.8575439453125, -0.76788330078125, -0.67822265625, -0.58856201171875, -0.4989013671875, -0.40924072265625, -0.319580078125, -0.22991943359375, -0.1402587890625, -0.05059814453125, 0.0390625, 0.12872314453125, 0.2183837890625, 0.30804443359375, 0.397705078125, 0.48736572265625, 0.5770263671875, 0.66668701171875, 0.75634765625, 0.84600830078125, 0.9356689453125, 1.02532958984375, 1.114990234375, 1.20465087890625, 1.2943115234375, 1.38397216796875, 1.4736328125, 1.56329345703125, 1.6529541015625, 1.74261474609375, 1.832275390625, 1.92193603515625, 2.0115966796875, 2.10125732421875, 2.19091796875, 2.28057861328125, 2.3702392578125, 2.45989990234375, 2.549560546875, 2.63922119140625, 2.7288818359375, 2.81854248046875, 2.908203125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 5.0, 2.0, 10.0, 6.0, 17.0, 6.0, 7.0, 13.0, 24.0, 24.0, 22.0, 25.0, 36.0, 33.0, 34.0, 43.0, 47.0, 61.0, 64.0, 137.0, 1769.0, 167.0, 68.0, 59.0, 44.0, 43.0, 46.0, 40.0, 31.0, 25.0, 25.0, 25.0, 20.0, 23.0, 12.0, 6.0, 9.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.9193115234375, -11.502685546875, -11.0860595703125, -10.66943359375, -10.2528076171875, -9.836181640625, -9.4195556640625, -9.0029296875, -8.5863037109375, -8.169677734375, -7.7530517578125, -7.33642578125, -6.9197998046875, -6.503173828125, -6.0865478515625, -5.669921875, -5.2532958984375, -4.836669921875, -4.4200439453125, -4.00341796875, -3.5867919921875, -3.170166015625, -2.7535400390625, -2.3369140625, -1.9202880859375, -1.503662109375, -1.0870361328125, -0.67041015625, -0.2537841796875, 0.162841796875, 0.5794677734375, 0.99609375, 1.4127197265625, 1.829345703125, 2.2459716796875, 2.66259765625, 3.0792236328125, 3.495849609375, 3.9124755859375, 4.3291015625, 4.7457275390625, 5.162353515625, 5.5789794921875, 5.99560546875, 6.4122314453125, 6.828857421875, 7.2454833984375, 7.662109375, 8.0787353515625, 8.495361328125, 8.9119873046875, 9.32861328125, 9.7452392578125, 10.161865234375, 10.5784912109375, 10.9951171875, 11.4117431640625, 11.828369140625, 12.2449951171875, 12.66162109375, 13.0782470703125, 13.494873046875, 13.9114990234375, 14.328125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 7.0, 8.0, 5.0, 7.0, 9.0, 14.0, 24.0, 29.0, 40.0, 32.0, 41.0, 60.0, 78.0, 94.0, 199.0, 380.0, 1075.0, 7280.0, 840275.0, 2284413.0, 9270.0, 1228.0, 424.0, 197.0, 118.0, 91.0, 62.0, 47.0, 41.0, 33.0, 21.0, 22.0, 13.0, 13.0, 12.0, 13.0, 7.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-24.28125, -23.58837890625, -22.8955078125, -22.20263671875, -21.509765625, -20.81689453125, -20.1240234375, -19.43115234375, -18.73828125, -18.04541015625, -17.3525390625, -16.65966796875, -15.966796875, -15.27392578125, -14.5810546875, -13.88818359375, -13.1953125, -12.50244140625, -11.8095703125, -11.11669921875, -10.423828125, -9.73095703125, -9.0380859375, -8.34521484375, -7.65234375, -6.95947265625, -6.2666015625, -5.57373046875, -4.880859375, -4.18798828125, -3.4951171875, -2.80224609375, -2.109375, -1.41650390625, -0.7236328125, -0.03076171875, 0.662109375, 1.35498046875, 2.0478515625, 2.74072265625, 3.43359375, 4.12646484375, 4.8193359375, 5.51220703125, 6.205078125, 6.89794921875, 7.5908203125, 8.28369140625, 8.9765625, 9.66943359375, 10.3623046875, 11.05517578125, 11.748046875, 12.44091796875, 13.1337890625, 13.82666015625, 14.51953125, 15.21240234375, 15.9052734375, 16.59814453125, 17.291015625, 17.98388671875, 18.6767578125, 19.36962890625, 20.0625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 12.0, 37.0, 132.0, 280.0, 288.0, 177.0, 58.0, 23.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.660255432128906, -35.67465591430664, -34.68905258178711, -33.703453063964844, -32.71785354614258, -31.73225212097168, -30.74665069580078, -29.761051177978516, -28.775449752807617, -27.78984832763672, -26.804248809814453, -25.818647384643555, -24.833045959472656, -23.84744644165039, -22.861845016479492, -21.876243591308594, -20.890644073486328, -19.90504264831543, -18.919443130493164, -17.933841705322266, -16.948240280151367, -15.962640762329102, -14.977039337158203, -13.991438865661621, -13.005836486816406, -12.020236015319824, -11.034634590148926, -10.049034118652344, -9.063433647155762, -8.07783317565918, -7.092231750488281, -6.106631278991699, -5.121030807495117, -4.135429859161377, -3.149829387664795, -2.1642284393310547, -1.1786277294158936, -0.19302701950073242, 0.7925739288330078, 1.7781744003295898, 2.76377534866333, 3.749376058578491, 4.734976768493652, 5.720577716827393, 6.706178665161133, 7.691779136657715, 8.677379608154297, 9.662981033325195, 10.648581504821777, 11.63418197631836, 12.619783401489258, 13.60538387298584, 14.590984344482422, 15.57658576965332, 16.56218719482422, 17.547786712646484, 18.533388137817383, 19.51898956298828, 20.504589080810547, 21.490190505981445, 22.475791931152344, 23.46139144897461, 24.446992874145508, 25.432594299316406, 26.418193817138672]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 7.0, 3.0, 4.0, 7.0, 11.0, 17.0, 14.0, 18.0, 28.0, 38.0, 42.0, 36.0, 39.0, 46.0, 52.0, 47.0, 51.0, 49.0, 40.0, 44.0, 41.0, 39.0, 36.0, 41.0, 32.0, 33.0, 22.0, 24.0, 30.0, 17.0, 24.0, 8.0, 12.0, 9.0, 10.0, 11.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.41718673706055, -43.99454879760742, -42.5719108581543, -41.14927291870117, -39.72663116455078, -38.303993225097656, -36.88135528564453, -35.458717346191406, -34.03607940673828, -32.613441467285156, -31.19080352783203, -29.768163681030273, -28.34552574157715, -26.922887802124023, -25.500247955322266, -24.07761001586914, -22.654972076416016, -21.23233413696289, -19.809696197509766, -18.387056350708008, -16.964418411254883, -15.541780471801758, -14.119141578674316, -12.696502685546875, -11.27386474609375, -9.851226806640625, -8.428587913513184, -7.0059494972229, -5.583311080932617, -4.160672664642334, -2.738034248352051, -1.3153953552246094, 0.10724639892578125, 1.5298848152160645, 2.9525232315063477, 4.375161647796631, 5.797800064086914, 7.220438480377197, 8.64307689666748, 10.065715789794922, 11.488353729248047, 12.910991668701172, 14.333630561828613, 15.756269454956055, 17.17890739440918, 18.601545333862305, 20.024185180664062, 21.446823120117188, 22.869461059570312, 24.292098999023438, 25.714736938476562, 27.13737678527832, 28.560014724731445, 29.98265266418457, 31.405292510986328, 32.82793045043945, 34.25056838989258, 35.6732063293457, 37.09584426879883, 38.51848220825195, 39.941123962402344, 41.36376190185547, 42.786399841308594, 44.20903778076172, 45.631675720214844]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 2.0, 8.0, 4.0, 6.0, 6.0, 10.0, 10.0, 11.0, 20.0, 20.0, 20.0, 19.0, 32.0, 35.0, 35.0, 31.0, 41.0, 45.0, 52.0, 44.0, 58.0, 45.0, 55.0, 61.0, 40.0, 42.0, 49.0, 37.0, 22.0, 26.0, 20.0, 20.0, 14.0, 24.0, 7.0, 7.0, 5.0, 7.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.0550537109375, -3.926513671875, -3.7979736328125, -3.66943359375, -3.5408935546875, -3.412353515625, -3.2838134765625, -3.1552734375, -3.0267333984375, -2.898193359375, -2.7696533203125, -2.64111328125, -2.5125732421875, -2.384033203125, -2.2554931640625, -2.126953125, -1.9984130859375, -1.869873046875, -1.7413330078125, -1.61279296875, -1.4842529296875, -1.355712890625, -1.2271728515625, -1.0986328125, -0.9700927734375, -0.841552734375, -0.7130126953125, -0.58447265625, -0.4559326171875, -0.327392578125, -0.1988525390625, -0.0703125, 0.0582275390625, 0.186767578125, 0.3153076171875, 0.44384765625, 0.5723876953125, 0.700927734375, 0.8294677734375, 0.9580078125, 1.0865478515625, 1.215087890625, 1.3436279296875, 1.47216796875, 1.6007080078125, 1.729248046875, 1.8577880859375, 1.986328125, 2.1148681640625, 2.243408203125, 2.3719482421875, 2.50048828125, 2.6290283203125, 2.757568359375, 2.8861083984375, 3.0146484375, 3.1431884765625, 3.271728515625, 3.4002685546875, 3.52880859375, 3.6573486328125, 3.785888671875, 3.9144287109375, 4.04296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 5.0, 6.0, 6.0, 9.0, 14.0, 16.0, 19.0, 20.0, 14.0, 31.0, 27.0, 23.0, 28.0, 43.0, 54.0, 162.0, 665.0, 4494.0, 87891.0, 3497458.0, 587731.0, 13508.0, 1348.0, 298.0, 102.0, 46.0, 46.0, 22.0, 21.0, 27.0, 27.0, 20.0, 21.0, 13.0, 11.0, 11.0, 10.0, 7.0, 9.0, 1.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.359375, -17.719970703125, -17.08056640625, -16.441162109375, -15.8017578125, -15.162353515625, -14.52294921875, -13.883544921875, -13.244140625, -12.604736328125, -11.96533203125, -11.325927734375, -10.6865234375, -10.047119140625, -9.40771484375, -8.768310546875, -8.12890625, -7.489501953125, -6.85009765625, -6.210693359375, -5.5712890625, -4.931884765625, -4.29248046875, -3.653076171875, -3.013671875, -2.374267578125, -1.73486328125, -1.095458984375, -0.4560546875, 0.183349609375, 0.82275390625, 1.462158203125, 2.1015625, 2.740966796875, 3.38037109375, 4.019775390625, 4.6591796875, 5.298583984375, 5.93798828125, 6.577392578125, 7.216796875, 7.856201171875, 8.49560546875, 9.135009765625, 9.7744140625, 10.413818359375, 11.05322265625, 11.692626953125, 12.33203125, 12.971435546875, 13.61083984375, 14.250244140625, 14.8896484375, 15.529052734375, 16.16845703125, 16.807861328125, 17.447265625, 18.086669921875, 18.72607421875, 19.365478515625, 20.0048828125, 20.644287109375, 21.28369140625, 21.923095703125, 22.5625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 7.0, 11.0, 15.0, 15.0, 25.0, 39.0, 37.0, 70.0, 99.0, 163.0, 211.0, 302.0, 452.0, 590.0, 595.0, 467.0, 306.0, 216.0, 138.0, 103.0, 75.0, 46.0, 28.0, 23.0, 13.0, 9.0, 9.0, 5.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-18.890625, -18.4508056640625, -18.010986328125, -17.5711669921875, -17.13134765625, -16.6915283203125, -16.251708984375, -15.8118896484375, -15.3720703125, -14.9322509765625, -14.492431640625, -14.0526123046875, -13.61279296875, -13.1729736328125, -12.733154296875, -12.2933349609375, -11.853515625, -11.4136962890625, -10.973876953125, -10.5340576171875, -10.09423828125, -9.6544189453125, -9.214599609375, -8.7747802734375, -8.3349609375, -7.8951416015625, -7.455322265625, -7.0155029296875, -6.57568359375, -6.1358642578125, -5.696044921875, -5.2562255859375, -4.81640625, -4.3765869140625, -3.936767578125, -3.4969482421875, -3.05712890625, -2.6173095703125, -2.177490234375, -1.7376708984375, -1.2978515625, -0.8580322265625, -0.418212890625, 0.0216064453125, 0.46142578125, 0.9012451171875, 1.341064453125, 1.7808837890625, 2.220703125, 2.6605224609375, 3.100341796875, 3.5401611328125, 3.97998046875, 4.4197998046875, 4.859619140625, 5.2994384765625, 5.7392578125, 6.1790771484375, 6.618896484375, 7.0587158203125, 7.49853515625, 7.9383544921875, 8.378173828125, 8.8179931640625, 9.2578125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 18.0, 26.0, 44.0, 59.0, 105.0, 175.0, 312.0, 570.0, 2230.0, 105036.0, 4047379.0, 35649.0, 1552.0, 472.0, 259.0, 134.0, 105.0, 58.0, 34.0, 12.0, 13.0, 12.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.71875, -37.94580078125, -36.1728515625, -34.39990234375, -32.626953125, -30.85400390625, -29.0810546875, -27.30810546875, -25.53515625, -23.76220703125, -21.9892578125, -20.21630859375, -18.443359375, -16.67041015625, -14.8974609375, -13.12451171875, -11.3515625, -9.57861328125, -7.8056640625, -6.03271484375, -4.259765625, -2.48681640625, -0.7138671875, 1.05908203125, 2.83203125, 4.60498046875, 6.3779296875, 8.15087890625, 9.923828125, 11.69677734375, 13.4697265625, 15.24267578125, 17.015625, 18.78857421875, 20.5615234375, 22.33447265625, 24.107421875, 25.88037109375, 27.6533203125, 29.42626953125, 31.19921875, 32.97216796875, 34.7451171875, 36.51806640625, 38.291015625, 40.06396484375, 41.8369140625, 43.60986328125, 45.3828125, 47.15576171875, 48.9287109375, 50.70166015625, 52.474609375, 54.24755859375, 56.0205078125, 57.79345703125, 59.56640625, 61.33935546875, 63.1123046875, 64.88525390625, 66.658203125, 68.43115234375, 70.2041015625, 71.97705078125, 73.75]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 38.0, 120.0, 311.0, 316.0, 167.0, 49.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-227.37490844726562, -223.09507751464844, -218.81524658203125, -214.53543090820312, -210.25559997558594, -205.97576904296875, -201.69595336914062, -197.41612243652344, -193.13629150390625, -188.85646057128906, -184.57662963867188, -180.29681396484375, -176.01698303222656, -171.73715209960938, -167.45733642578125, -163.17750549316406, -158.89767456054688, -154.6178436279297, -150.3380126953125, -146.05819702148438, -141.7783660888672, -137.49853515625, -133.21871948242188, -128.9388885498047, -124.6590576171875, -120.37922668457031, -116.09940338134766, -111.819580078125, -107.53974914550781, -103.25991821289062, -98.98009490966797, -94.70027160644531, -90.42044067382812, -86.14060974121094, -81.86078643798828, -77.58096313476562, -73.30113220214844, -69.02130126953125, -64.7414779663086, -60.46165084838867, -56.18182373046875, -51.90199661254883, -47.622169494628906, -43.342342376708984, -39.06251525878906, -34.78268814086914, -30.50286102294922, -26.223033905029297, -21.943206787109375, -17.663379669189453, -13.383552551269531, -9.10372543334961, -4.8238983154296875, -0.5440711975097656, 3.7357559204101562, 8.015583038330078, 12.29541015625, 16.575237274169922, 20.855064392089844, 25.134891510009766, 29.414718627929688, 33.69454574584961, 37.97437286376953, 42.25419998168945, 46.534027099609375]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 3.0, 7.0, 6.0, 6.0, 8.0, 10.0, 10.0, 14.0, 19.0, 12.0, 23.0, 30.0, 26.0, 27.0, 42.0, 25.0, 39.0, 41.0, 42.0, 43.0, 47.0, 49.0, 36.0, 46.0, 41.0, 37.0, 42.0, 26.0, 31.0, 28.0, 35.0, 33.0, 10.0, 18.0, 19.0, 15.0, 14.0, 7.0, 9.0, 7.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.37052917480469, -35.0737419128418, -33.77695083618164, -32.48016357421875, -31.183374404907227, -29.886585235595703, -28.589797973632812, -27.29300880432129, -25.996219635009766, -24.699430465698242, -23.40264129638672, -22.105854034423828, -20.809064865112305, -19.51227569580078, -18.21548843383789, -16.918699264526367, -15.621910095214844, -14.32512092590332, -13.028332710266113, -11.731544494628906, -10.434755325317383, -9.13796615600586, -7.841177940368652, -6.544389724731445, -5.247600555419922, -3.9508118629455566, -2.6540231704711914, -1.3572344779968262, -0.06044578552246094, 1.2363429069519043, 2.5331315994262695, 3.8299198150634766, 5.126708984375, 6.423497676849365, 7.7202863693237305, 9.017074584960938, 10.313863754272461, 11.610652923583984, 12.907441139221191, 14.204229354858398, 15.501018524169922, 16.797807693481445, 18.09459686279297, 19.39138412475586, 20.688173294067383, 21.984962463378906, 23.281749725341797, 24.57853889465332, 25.875328063964844, 27.172117233276367, 28.46890640258789, 29.76569366455078, 31.062482833862305, 32.35927200317383, 33.65605926513672, 34.952850341796875, 36.249637603759766, 37.546424865722656, 38.84321594238281, 40.1400032043457, 41.436790466308594, 42.73358154296875, 44.03036880493164, 45.32715606689453, 46.62394714355469]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 6.0, 8.0, 11.0, 16.0, 18.0, 19.0, 15.0, 22.0, 23.0, 29.0, 34.0, 28.0, 28.0, 33.0, 54.0, 56.0, 47.0, 55.0, 50.0, 47.0, 44.0, 46.0, 51.0, 35.0, 32.0, 29.0, 27.0, 23.0, 25.0, 11.0, 13.0, 12.0, 14.0, 7.0, 9.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.0997314453125, -3.968994140625, -3.8382568359375, -3.70751953125, -3.5767822265625, -3.446044921875, -3.3153076171875, -3.1845703125, -3.0538330078125, -2.923095703125, -2.7923583984375, -2.66162109375, -2.5308837890625, -2.400146484375, -2.2694091796875, -2.138671875, -2.0079345703125, -1.877197265625, -1.7464599609375, -1.61572265625, -1.4849853515625, -1.354248046875, -1.2235107421875, -1.0927734375, -0.9620361328125, -0.831298828125, -0.7005615234375, -0.56982421875, -0.4390869140625, -0.308349609375, -0.1776123046875, -0.046875, 0.0838623046875, 0.214599609375, 0.3453369140625, 0.47607421875, 0.6068115234375, 0.737548828125, 0.8682861328125, 0.9990234375, 1.1297607421875, 1.260498046875, 1.3912353515625, 1.52197265625, 1.6527099609375, 1.783447265625, 1.9141845703125, 2.044921875, 2.1756591796875, 2.306396484375, 2.4371337890625, 2.56787109375, 2.6986083984375, 2.829345703125, 2.9600830078125, 3.0908203125, 3.2215576171875, 3.352294921875, 3.4830322265625, 3.61376953125, 3.7445068359375, 3.875244140625, 4.0059814453125, 4.13671875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 10.0, 20.0, 16.0, 24.0, 42.0, 58.0, 80.0, 117.0, 157.0, 241.0, 380.0, 570.0, 886.0, 1497.0, 2306.0, 3804.0, 6510.0, 11031.0, 18570.0, 32690.0, 59946.0, 117934.0, 232594.0, 260700.0, 139127.0, 69405.0, 37405.0, 21189.0, 12323.0, 7416.0, 4449.0, 2522.0, 1635.0, 1036.0, 680.0, 384.0, 258.0, 170.0, 117.0, 70.0, 54.0, 36.0, 28.0, 16.0, 9.0, 9.0, 5.0, 7.0, 6.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.626953125, -0.6068038940429688, -0.5866546630859375, -0.5665054321289062, -0.546356201171875, -0.5262069702148438, -0.5060577392578125, -0.48590850830078125, -0.46575927734375, -0.44561004638671875, -0.4254608154296875, -0.40531158447265625, -0.385162353515625, -0.36501312255859375, -0.3448638916015625, -0.32471466064453125, -0.3045654296875, -0.28441619873046875, -0.2642669677734375, -0.24411773681640625, -0.223968505859375, -0.20381927490234375, -0.1836700439453125, -0.16352081298828125, -0.14337158203125, -0.12322235107421875, -0.1030731201171875, -0.08292388916015625, -0.062774658203125, -0.04262542724609375, -0.0224761962890625, -0.00232696533203125, 0.017822265625, 0.03797149658203125, 0.0581207275390625, 0.07826995849609375, 0.098419189453125, 0.11856842041015625, 0.1387176513671875, 0.15886688232421875, 0.17901611328125, 0.19916534423828125, 0.2193145751953125, 0.23946380615234375, 0.259613037109375, 0.27976226806640625, 0.2999114990234375, 0.32006072998046875, 0.3402099609375, 0.36035919189453125, 0.3805084228515625, 0.40065765380859375, 0.420806884765625, 0.44095611572265625, 0.4611053466796875, 0.48125457763671875, 0.50140380859375, 0.5215530395507812, 0.5417022705078125, 0.5618515014648438, 0.582000732421875, 0.6021499633789062, 0.6222991943359375, 0.6424484252929688, 0.66259765625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 1.0, 3.0, 6.0, 7.0, 11.0, 7.0, 10.0, 11.0, 16.0, 21.0, 17.0, 30.0, 31.0, 29.0, 36.0, 38.0, 30.0, 32.0, 44.0, 49.0, 32.0, 40.0, 1054.0, 45.0, 39.0, 37.0, 32.0, 36.0, 26.0, 34.0, 22.0, 24.0, 27.0, 23.0, 20.0, 13.0, 13.0, 20.0, 15.0, 8.0, 6.0, 5.0, 2.0, 6.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.205078125, -2.135955810546875, -2.06683349609375, -1.997711181640625, -1.9285888671875, -1.859466552734375, -1.79034423828125, -1.721221923828125, -1.652099609375, -1.582977294921875, -1.51385498046875, -1.444732666015625, -1.3756103515625, -1.306488037109375, -1.23736572265625, -1.168243408203125, -1.09912109375, -1.029998779296875, -0.96087646484375, -0.891754150390625, -0.8226318359375, -0.753509521484375, -0.68438720703125, -0.615264892578125, -0.546142578125, -0.477020263671875, -0.40789794921875, -0.338775634765625, -0.2696533203125, -0.200531005859375, -0.13140869140625, -0.062286376953125, 0.0068359375, 0.075958251953125, 0.14508056640625, 0.214202880859375, 0.2833251953125, 0.352447509765625, 0.42156982421875, 0.490692138671875, 0.559814453125, 0.628936767578125, 0.69805908203125, 0.767181396484375, 0.8363037109375, 0.905426025390625, 0.97454833984375, 1.043670654296875, 1.11279296875, 1.181915283203125, 1.25103759765625, 1.320159912109375, 1.3892822265625, 1.458404541015625, 1.52752685546875, 1.596649169921875, 1.665771484375, 1.734893798828125, 1.80401611328125, 1.873138427734375, 1.9422607421875, 2.011383056640625, 2.08050537109375, 2.149627685546875, 2.21875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 10.0, 7.0, 14.0, 20.0, 41.0, 42.0, 63.0, 117.0, 156.0, 262.0, 413.0, 754.0, 1091.0, 1867.0, 2972.0, 4949.0, 8411.0, 14433.0, 25282.0, 44767.0, 83069.0, 152201.0, 1284045.0, 206615.0, 118675.0, 63547.0, 34871.0, 19980.0, 11375.0, 6682.0, 3941.0, 2445.0, 1468.0, 913.0, 627.0, 349.0, 224.0, 138.0, 106.0, 62.0, 53.0, 19.0, 20.0, 16.0, 12.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.4443359375, -0.4307861328125, -0.417236328125, -0.4036865234375, -0.39013671875, -0.3765869140625, -0.363037109375, -0.3494873046875, -0.3359375, -0.3223876953125, -0.308837890625, -0.2952880859375, -0.28173828125, -0.2681884765625, -0.254638671875, -0.2410888671875, -0.2275390625, -0.2139892578125, -0.200439453125, -0.1868896484375, -0.17333984375, -0.1597900390625, -0.146240234375, -0.1326904296875, -0.119140625, -0.1055908203125, -0.092041015625, -0.0784912109375, -0.06494140625, -0.0513916015625, -0.037841796875, -0.0242919921875, -0.0107421875, 0.0028076171875, 0.016357421875, 0.0299072265625, 0.04345703125, 0.0570068359375, 0.070556640625, 0.0841064453125, 0.09765625, 0.1112060546875, 0.124755859375, 0.1383056640625, 0.15185546875, 0.1654052734375, 0.178955078125, 0.1925048828125, 0.2060546875, 0.2196044921875, 0.233154296875, 0.2467041015625, 0.26025390625, 0.2738037109375, 0.287353515625, 0.3009033203125, 0.314453125, 0.3280029296875, 0.341552734375, 0.3551025390625, 0.36865234375, 0.3822021484375, 0.395751953125, 0.4093017578125, 0.4228515625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 4.0, 5.0, 7.0, 13.0, 14.0, 7.0, 26.0, 29.0, 25.0, 43.0, 41.0, 51.0, 74.0, 64.0, 71.0, 62.0, 61.0, 69.0, 52.0, 51.0, 46.0, 34.0, 35.0, 19.0, 17.0, 11.0, 17.0, 8.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0017118453979492188, -0.0016632080078125, -0.0016145706176757812, -0.0015659332275390625, -0.0015172958374023438, -0.001468658447265625, -0.0014200210571289062, -0.0013713836669921875, -0.0013227462768554688, -0.00127410888671875, -0.0012254714965820312, -0.0011768341064453125, -0.0011281967163085938, -0.001079559326171875, -0.0010309219360351562, -0.0009822845458984375, -0.0009336471557617188, -0.000885009765625, -0.0008363723754882812, -0.0007877349853515625, -0.0007390975952148438, -0.000690460205078125, -0.0006418228149414062, -0.0005931854248046875, -0.0005445480346679688, -0.00049591064453125, -0.00044727325439453125, -0.0003986358642578125, -0.00034999847412109375, -0.000301361083984375, -0.00025272369384765625, -0.0002040863037109375, -0.00015544891357421875, -0.0001068115234375, -5.817413330078125e-05, -9.5367431640625e-06, 3.910064697265625e-05, 8.7738037109375e-05, 0.00013637542724609375, 0.0001850128173828125, 0.00023365020751953125, 0.00028228759765625, 0.00033092498779296875, 0.0003795623779296875, 0.00042819976806640625, 0.000476837158203125, 0.0005254745483398438, 0.0005741119384765625, 0.0006227493286132812, 0.00067138671875, 0.0007200241088867188, 0.0007686614990234375, 0.0008172988891601562, 0.000865936279296875, 0.0009145736694335938, 0.0009632110595703125, 0.0010118484497070312, 0.00106048583984375, 0.0011091232299804688, 0.0011577606201171875, 0.0012063980102539062, 0.001255035400390625, 0.0013036727905273438, 0.0013523101806640625, 0.0014009475708007812]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 4.0, 6.0, 11.0, 13.0, 12.0, 17.0, 27.0, 24.0, 37.0, 64.0, 67.0, 114.0, 161.0, 369.0, 909.0, 533945.0, 510902.0, 898.0, 395.0, 163.0, 97.0, 74.0, 43.0, 41.0, 36.0, 21.0, 8.0, 10.0, 12.0, 18.0, 9.0, 9.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.04388427734375, -0.04246854782104492, -0.041052818298339844, -0.039637088775634766, -0.03822135925292969, -0.03680562973022461, -0.03538990020751953, -0.03397417068481445, -0.032558441162109375, -0.031142711639404297, -0.02972698211669922, -0.02831125259399414, -0.026895523071289062, -0.025479793548583984, -0.024064064025878906, -0.022648334503173828, -0.02123260498046875, -0.019816875457763672, -0.018401145935058594, -0.016985416412353516, -0.015569686889648438, -0.01415395736694336, -0.012738227844238281, -0.011322498321533203, -0.009906768798828125, -0.008491039276123047, -0.007075309753417969, -0.005659580230712891, -0.0042438507080078125, -0.0028281211853027344, -0.0014123916625976562, 3.337860107421875e-06, 0.0014190673828125, 0.002834796905517578, 0.004250526428222656, 0.005666255950927734, 0.0070819854736328125, 0.00849771499633789, 0.009913444519042969, 0.011329174041748047, 0.012744903564453125, 0.014160633087158203, 0.015576362609863281, 0.01699209213256836, 0.018407821655273438, 0.019823551177978516, 0.021239280700683594, 0.022655010223388672, 0.02407073974609375, 0.025486469268798828, 0.026902198791503906, 0.028317928314208984, 0.029733657836914062, 0.03114938735961914, 0.03256511688232422, 0.0339808464050293, 0.035396575927734375, 0.03681230545043945, 0.03822803497314453, 0.03964376449584961, 0.04105949401855469, 0.042475223541259766, 0.043890953063964844, 0.04530668258666992, 0.046722412109375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1018.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007014077622443438, -0.00571267819032073, -0.0044112782925367355, -0.003109878860414028, -0.0018084794282913208, -0.0005070799961686134, 0.0007943199016153812, 0.0020957193337380886, 0.003397118765860796, 0.004698518197983503, 0.005999918095767498, 0.007301317527890205, 0.008602716960012913, 0.00990411639213562, 0.011205516755580902, 0.012506915256381035, 0.013808315619826317, 0.015109715051949024, 0.01641111448407173, 0.017712514847517014, 0.019013913348317146, 0.02031531371176243, 0.02161671221256256, 0.022918112576007843, 0.024219511076807976, 0.025520911440253258, 0.02682230994105339, 0.028123710304498672, 0.029425108805298805, 0.030726509168744087, 0.03202790766954422, 0.0333293080329895, 0.034630704671144485, 0.03593210503458977, 0.03723350539803505, 0.03853490203619003, 0.039836302399635315, 0.0411377027630806, 0.04243910312652588, 0.04374050348997116, 0.045041900128126144, 0.046343300491571426, 0.04764470085501671, 0.04894609749317169, 0.050247497856616974, 0.051548898220062256, 0.05285029858350754, 0.05415169894695282, 0.0554530993103981, 0.056754499673843384, 0.058055900037288666, 0.05935729667544365, 0.06065869703888893, 0.06196009740233421, 0.0632614940404892, 0.06456289440393448, 0.06586429476737976, 0.06716569513082504, 0.06846709549427032, 0.0697684958577156, 0.07106989622116089, 0.07237128913402557, 0.07367268949747086, 0.07497408986091614, 0.07627549022436142]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 9.0, 7.0, 9.0, 15.0, 15.0, 22.0, 24.0, 19.0, 29.0, 45.0, 45.0, 47.0, 67.0, 62.0, 70.0, 53.0, 61.0, 47.0, 60.0, 52.0, 42.0, 45.0, 29.0, 27.0, 34.0, 19.0, 16.0, 13.0, 13.0, 12.0, 5.0, 2.0, 3.0], "bins": [-0.0016615986824035645, -0.0016258619725704193, -0.0015901252627372742, -0.001554388552904129, -0.0015186518430709839, -0.0014829151332378387, -0.0014471784234046936, -0.0014114417135715485, -0.0013757050037384033, -0.0013399682939052582, -0.001304231584072113, -0.001268494874238968, -0.0012327581644058228, -0.0011970214545726776, -0.0011612847447395325, -0.0011255480349063873, -0.0010898113250732422, -0.001054074615240097, -0.001018337905406952, -0.0009826011955738068, -0.0009468644857406616, -0.0009111277759075165, -0.0008753910660743713, -0.0008396543562412262, -0.0008039176464080811, -0.0007681809365749359, -0.0007324442267417908, -0.0006967075169086456, -0.0006609708070755005, -0.0006252340972423553, -0.0005894973874092102, -0.0005537606775760651, -0.0005180239677429199, -0.0004822872579097748, -0.00044655054807662964, -0.0004108138382434845, -0.00037507712841033936, -0.0003393404185771942, -0.00030360370874404907, -0.00026786699891090393, -0.0002321302890777588, -0.00019639357924461365, -0.0001606568694114685, -0.00012492015957832336, -8.918344974517822e-05, -5.344673991203308e-05, -1.771003007888794e-05, 1.8026679754257202e-05, 5.3763389587402344e-05, 8.950009942054749e-05, 0.00012523680925369263, 0.00016097351908683777, 0.0001967102289199829, 0.00023244693875312805, 0.0002681836485862732, 0.00030392035841941833, 0.0003396570682525635, 0.0003753937780857086, 0.00041113048791885376, 0.0004468671977519989, 0.00048260390758514404, 0.0005183406174182892, 0.0005540773272514343, 0.0005898140370845795, 0.0006255507469177246]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 6.0, 8.0, 11.0, 16.0, 18.0, 19.0, 15.0, 22.0, 23.0, 29.0, 34.0, 28.0, 28.0, 33.0, 54.0, 56.0, 47.0, 55.0, 50.0, 47.0, 44.0, 46.0, 51.0, 35.0, 32.0, 29.0, 27.0, 23.0, 25.0, 11.0, 13.0, 12.0, 14.0, 7.0, 9.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.0997314453125, -3.968994140625, -3.8382568359375, -3.70751953125, -3.5767822265625, -3.446044921875, -3.3153076171875, -3.1845703125, -3.0538330078125, -2.923095703125, -2.7923583984375, -2.66162109375, -2.5308837890625, -2.400146484375, -2.2694091796875, -2.138671875, -2.0079345703125, -1.877197265625, -1.7464599609375, -1.61572265625, -1.4849853515625, -1.354248046875, -1.2235107421875, -1.0927734375, -0.9620361328125, -0.831298828125, -0.7005615234375, -0.56982421875, -0.4390869140625, -0.308349609375, -0.1776123046875, -0.046875, 0.0838623046875, 0.214599609375, 0.3453369140625, 0.47607421875, 0.6068115234375, 0.737548828125, 0.8682861328125, 0.9990234375, 1.1297607421875, 1.260498046875, 1.3912353515625, 1.52197265625, 1.6527099609375, 1.783447265625, 1.9141845703125, 2.044921875, 2.1756591796875, 2.306396484375, 2.4371337890625, 2.56787109375, 2.6986083984375, 2.829345703125, 2.9600830078125, 3.0908203125, 3.2215576171875, 3.352294921875, 3.4830322265625, 3.61376953125, 3.7445068359375, 3.875244140625, 4.0059814453125, 4.13671875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 14.0, 10.0, 13.0, 19.0, 24.0, 35.0, 57.0, 65.0, 110.0, 160.0, 246.0, 429.0, 722.0, 1277.0, 2468.0, 5173.0, 12257.0, 35204.0, 122409.0, 521154.0, 251345.0, 60355.0, 19652.0, 7634.0, 3519.0, 1754.0, 950.0, 529.0, 338.0, 213.0, 109.0, 93.0, 53.0, 39.0, 33.0, 27.0, 17.0, 14.0, 5.0, 3.0, 3.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.59375, -3.487213134765625, -3.38067626953125, -3.274139404296875, -3.1676025390625, -3.061065673828125, -2.95452880859375, -2.847991943359375, -2.741455078125, -2.634918212890625, -2.52838134765625, -2.421844482421875, -2.3153076171875, -2.208770751953125, -2.10223388671875, -1.995697021484375, -1.88916015625, -1.782623291015625, -1.67608642578125, -1.569549560546875, -1.4630126953125, -1.356475830078125, -1.24993896484375, -1.143402099609375, -1.036865234375, -0.930328369140625, -0.82379150390625, -0.717254638671875, -0.6107177734375, -0.504180908203125, -0.39764404296875, -0.291107177734375, -0.1845703125, -0.078033447265625, 0.02850341796875, 0.135040283203125, 0.2415771484375, 0.348114013671875, 0.45465087890625, 0.561187744140625, 0.667724609375, 0.774261474609375, 0.88079833984375, 0.987335205078125, 1.0938720703125, 1.200408935546875, 1.30694580078125, 1.413482666015625, 1.52001953125, 1.626556396484375, 1.73309326171875, 1.839630126953125, 1.9461669921875, 2.052703857421875, 2.15924072265625, 2.265777587890625, 2.372314453125, 2.478851318359375, 2.58538818359375, 2.691925048828125, 2.7984619140625, 2.904998779296875, 3.01153564453125, 3.118072509765625, 3.224609375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 8.0, 6.0, 11.0, 7.0, 17.0, 17.0, 24.0, 27.0, 35.0, 43.0, 39.0, 41.0, 44.0, 73.0, 95.0, 1734.0, 322.0, 84.0, 66.0, 43.0, 51.0, 40.0, 44.0, 30.0, 30.0, 17.0, 23.0, 15.0, 8.0, 13.0, 8.0, 3.0, 10.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-18.53125, -18.028076171875, -17.52490234375, -17.021728515625, -16.5185546875, -16.015380859375, -15.51220703125, -15.009033203125, -14.505859375, -14.002685546875, -13.49951171875, -12.996337890625, -12.4931640625, -11.989990234375, -11.48681640625, -10.983642578125, -10.48046875, -9.977294921875, -9.47412109375, -8.970947265625, -8.4677734375, -7.964599609375, -7.46142578125, -6.958251953125, -6.455078125, -5.951904296875, -5.44873046875, -4.945556640625, -4.4423828125, -3.939208984375, -3.43603515625, -2.932861328125, -2.4296875, -1.926513671875, -1.42333984375, -0.920166015625, -0.4169921875, 0.086181640625, 0.58935546875, 1.092529296875, 1.595703125, 2.098876953125, 2.60205078125, 3.105224609375, 3.6083984375, 4.111572265625, 4.61474609375, 5.117919921875, 5.62109375, 6.124267578125, 6.62744140625, 7.130615234375, 7.6337890625, 8.136962890625, 8.64013671875, 9.143310546875, 9.646484375, 10.149658203125, 10.65283203125, 11.156005859375, 11.6591796875, 12.162353515625, 12.66552734375, 13.168701171875, 13.671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 3.0, 6.0, 7.0, 3.0, 13.0, 13.0, 19.0, 24.0, 15.0, 33.0, 45.0, 55.0, 81.0, 108.0, 180.0, 342.0, 883.0, 8215.0, 3018011.0, 114333.0, 2089.0, 519.0, 228.0, 124.0, 95.0, 66.0, 48.0, 23.0, 21.0, 28.0, 16.0, 10.0, 12.0, 6.0, 7.0, 6.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.3125, -20.544921875, -19.77734375, -19.009765625, -18.2421875, -17.474609375, -16.70703125, -15.939453125, -15.171875, -14.404296875, -13.63671875, -12.869140625, -12.1015625, -11.333984375, -10.56640625, -9.798828125, -9.03125, -8.263671875, -7.49609375, -6.728515625, -5.9609375, -5.193359375, -4.42578125, -3.658203125, -2.890625, -2.123046875, -1.35546875, -0.587890625, 0.1796875, 0.947265625, 1.71484375, 2.482421875, 3.25, 4.017578125, 4.78515625, 5.552734375, 6.3203125, 7.087890625, 7.85546875, 8.623046875, 9.390625, 10.158203125, 10.92578125, 11.693359375, 12.4609375, 13.228515625, 13.99609375, 14.763671875, 15.53125, 16.298828125, 17.06640625, 17.833984375, 18.6015625, 19.369140625, 20.13671875, 20.904296875, 21.671875, 22.439453125, 23.20703125, 23.974609375, 24.7421875, 25.509765625, 26.27734375, 27.044921875, 27.8125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 47.0, 233.0, 381.0, 273.0, 60.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.573726654052734, -48.43610382080078, -47.29848098754883, -46.16085433959961, -45.023231506347656, -43.8856086730957, -42.74798583984375, -41.61035919189453, -40.47273635864258, -39.335113525390625, -38.19749069213867, -37.05986404418945, -35.9222412109375, -34.78461837768555, -33.646995544433594, -32.509368896484375, -31.371747970581055, -30.2341251373291, -29.096500396728516, -27.958877563476562, -26.821252822875977, -25.683629989624023, -24.546005249023438, -23.408382415771484, -22.27075958251953, -21.133136749267578, -19.995512008666992, -18.85788917541504, -17.720264434814453, -16.5826416015625, -15.44501781463623, -14.307394027709961, -13.169767379760742, -12.032143592834473, -10.894519805908203, -9.75689697265625, -8.619272232055664, -7.481648921966553, -6.344025611877441, -5.206401824951172, -4.068778038024902, -2.931154251098633, -1.7935307025909424, -0.655907154083252, 0.4817166328430176, 1.619340419769287, 2.7569637298583984, 3.894587516784668, 5.0322113037109375, 6.169835090637207, 7.307458877563477, 8.44508171081543, 9.582706451416016, 10.720329284667969, 11.857953071594238, 12.995576858520508, 14.133200645446777, 15.270824432373047, 16.408447265625, 17.546072006225586, 18.68369483947754, 19.821319580078125, 20.958942413330078, 22.09656524658203, 23.234189987182617]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 9.0, 6.0, 15.0, 11.0, 15.0, 14.0, 24.0, 27.0, 34.0, 29.0, 37.0, 31.0, 32.0, 34.0, 33.0, 44.0, 41.0, 27.0, 33.0, 46.0, 26.0, 43.0, 36.0, 31.0, 44.0, 38.0, 22.0, 22.0, 18.0, 19.0, 12.0, 21.0, 21.0, 19.0, 13.0, 8.0, 6.0, 13.0, 9.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.89753723144531, -34.700870513916016, -33.50420379638672, -32.30754089355469, -31.11087417602539, -29.914207458496094, -28.717540740966797, -27.520875930786133, -26.32421112060547, -25.127544403076172, -23.930879592895508, -22.73421287536621, -21.537548065185547, -20.34088134765625, -19.144214630126953, -17.94754981994629, -16.750883102416992, -15.554217338562012, -14.357551574707031, -13.160884857177734, -11.96422004699707, -10.767553329467773, -9.570887565612793, -8.374221801757812, -7.177556037902832, -5.980890274047852, -4.784224510192871, -3.5875582695007324, -2.390892505645752, -1.1942267417907715, 0.0024394989013671875, 1.1991052627563477, 2.395771026611328, 3.5924367904663086, 4.789102554321289, 5.985768795013428, 7.182434558868408, 8.379100799560547, 9.575766563415527, 10.772432327270508, 11.969098091125488, 13.165763854980469, 14.36242961883545, 15.55909538269043, 16.755762100219727, 17.95242691040039, 19.149093627929688, 20.345760345458984, 21.54242515563965, 22.739091873168945, 23.93575668334961, 25.132423400878906, 26.32908821105957, 27.525754928588867, 28.72241973876953, 29.919086456298828, 31.115753173828125, 32.31241989135742, 33.50908660888672, 34.70574951171875, 35.90241622924805, 37.099082946777344, 38.29574966430664, 39.49241638183594, 40.68907928466797]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 5.0, 7.0, 7.0, 8.0, 11.0, 12.0, 19.0, 14.0, 19.0, 22.0, 25.0, 23.0, 30.0, 31.0, 33.0, 37.0, 49.0, 52.0, 40.0, 66.0, 51.0, 42.0, 37.0, 50.0, 52.0, 45.0, 28.0, 27.0, 33.0, 30.0, 21.0, 10.0, 15.0, 10.0, 13.0, 8.0, 8.0, 5.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.38671875, -4.25201416015625, -4.1173095703125, -3.98260498046875, -3.847900390625, -3.71319580078125, -3.5784912109375, -3.44378662109375, -3.30908203125, -3.17437744140625, -3.0396728515625, -2.90496826171875, -2.770263671875, -2.63555908203125, -2.5008544921875, -2.36614990234375, -2.2314453125, -2.09674072265625, -1.9620361328125, -1.82733154296875, -1.692626953125, -1.55792236328125, -1.4232177734375, -1.28851318359375, -1.15380859375, -1.01910400390625, -0.8843994140625, -0.74969482421875, -0.614990234375, -0.48028564453125, -0.3455810546875, -0.21087646484375, -0.076171875, 0.05853271484375, 0.1932373046875, 0.32794189453125, 0.462646484375, 0.59735107421875, 0.7320556640625, 0.86676025390625, 1.00146484375, 1.13616943359375, 1.2708740234375, 1.40557861328125, 1.540283203125, 1.67498779296875, 1.8096923828125, 1.94439697265625, 2.0791015625, 2.21380615234375, 2.3485107421875, 2.48321533203125, 2.617919921875, 2.75262451171875, 2.8873291015625, 3.02203369140625, 3.15673828125, 3.29144287109375, 3.4261474609375, 3.56085205078125, 3.695556640625, 3.83026123046875, 3.9649658203125, 4.09967041015625, 4.234375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 8.0, 7.0, 12.0, 11.0, 13.0, 11.0, 19.0, 32.0, 27.0, 70.0, 87.0, 168.0, 344.0, 946.0, 2709.0, 9599.0, 39473.0, 248779.0, 1945804.0, 1687099.0, 211583.0, 34633.0, 8597.0, 2537.0, 862.0, 372.0, 170.0, 89.0, 62.0, 44.0, 25.0, 11.0, 16.0, 15.0, 5.0, 10.0, 9.0, 8.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-9.9765625, -9.691162109375, -9.40576171875, -9.120361328125, -8.8349609375, -8.549560546875, -8.26416015625, -7.978759765625, -7.693359375, -7.407958984375, -7.12255859375, -6.837158203125, -6.5517578125, -6.266357421875, -5.98095703125, -5.695556640625, -5.41015625, -5.124755859375, -4.83935546875, -4.553955078125, -4.2685546875, -3.983154296875, -3.69775390625, -3.412353515625, -3.126953125, -2.841552734375, -2.55615234375, -2.270751953125, -1.9853515625, -1.699951171875, -1.41455078125, -1.129150390625, -0.84375, -0.558349609375, -0.27294921875, 0.012451171875, 0.2978515625, 0.583251953125, 0.86865234375, 1.154052734375, 1.439453125, 1.724853515625, 2.01025390625, 2.295654296875, 2.5810546875, 2.866455078125, 3.15185546875, 3.437255859375, 3.72265625, 4.008056640625, 4.29345703125, 4.578857421875, 4.8642578125, 5.149658203125, 5.43505859375, 5.720458984375, 6.005859375, 6.291259765625, 6.57666015625, 6.862060546875, 7.1474609375, 7.432861328125, 7.71826171875, 8.003662109375, 8.2890625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 8.0, 5.0, 6.0, 23.0, 30.0, 32.0, 81.0, 96.0, 130.0, 257.0, 360.0, 543.0, 687.0, 599.0, 424.0, 291.0, 194.0, 100.0, 72.0, 50.0, 34.0, 19.0, 15.0, 3.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.796875, -18.2841796875, -17.771484375, -17.2587890625, -16.74609375, -16.2333984375, -15.720703125, -15.2080078125, -14.6953125, -14.1826171875, -13.669921875, -13.1572265625, -12.64453125, -12.1318359375, -11.619140625, -11.1064453125, -10.59375, -10.0810546875, -9.568359375, -9.0556640625, -8.54296875, -8.0302734375, -7.517578125, -7.0048828125, -6.4921875, -5.9794921875, -5.466796875, -4.9541015625, -4.44140625, -3.9287109375, -3.416015625, -2.9033203125, -2.390625, -1.8779296875, -1.365234375, -0.8525390625, -0.33984375, 0.1728515625, 0.685546875, 1.1982421875, 1.7109375, 2.2236328125, 2.736328125, 3.2490234375, 3.76171875, 4.2744140625, 4.787109375, 5.2998046875, 5.8125, 6.3251953125, 6.837890625, 7.3505859375, 7.86328125, 8.3759765625, 8.888671875, 9.4013671875, 9.9140625, 10.4267578125, 10.939453125, 11.4521484375, 11.96484375, 12.4775390625, 12.990234375, 13.5029296875, 14.015625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 12.0, 12.0, 18.0, 28.0, 42.0, 65.0, 99.0, 177.0, 398.0, 1761.0, 64863.0, 4070773.0, 53575.0, 1639.0, 336.0, 189.0, 103.0, 57.0, 41.0, 29.0, 24.0, 15.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.375, -51.6240234375, -49.873046875, -48.1220703125, -46.37109375, -44.6201171875, -42.869140625, -41.1181640625, -39.3671875, -37.6162109375, -35.865234375, -34.1142578125, -32.36328125, -30.6123046875, -28.861328125, -27.1103515625, -25.359375, -23.6083984375, -21.857421875, -20.1064453125, -18.35546875, -16.6044921875, -14.853515625, -13.1025390625, -11.3515625, -9.6005859375, -7.849609375, -6.0986328125, -4.34765625, -2.5966796875, -0.845703125, 0.9052734375, 2.65625, 4.4072265625, 6.158203125, 7.9091796875, 9.66015625, 11.4111328125, 13.162109375, 14.9130859375, 16.6640625, 18.4150390625, 20.166015625, 21.9169921875, 23.66796875, 25.4189453125, 27.169921875, 28.9208984375, 30.671875, 32.4228515625, 34.173828125, 35.9248046875, 37.67578125, 39.4267578125, 41.177734375, 42.9287109375, 44.6796875, 46.4306640625, 48.181640625, 49.9326171875, 51.68359375, 53.4345703125, 55.185546875, 56.9365234375, 58.6875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 9.0, 27.0, 66.0, 154.0, 232.0, 251.0, 140.0, 102.0, 24.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.12625122070312, -67.08890533447266, -64.05156707763672, -61.01422119140625, -57.97688293457031, -54.939537048339844, -51.90219497680664, -48.86485290527344, -45.827510833740234, -42.79016876220703, -39.75282669067383, -36.715484619140625, -33.678138732910156, -30.640798568725586, -27.60345458984375, -24.566112518310547, -21.528770446777344, -18.49142837524414, -15.454085350036621, -12.416742324829102, -9.379400253295898, -6.342058181762695, -3.3047142028808594, -0.26737213134765625, 2.769969940185547, 5.807312488555908, 8.84465503692627, 11.881998062133789, 14.919340133666992, 17.956682205200195, 20.99402618408203, 24.031368255615234, 27.068702697753906, 30.10604476928711, 33.14338684082031, 36.18073272705078, 39.21807098388672, 42.25541687011719, 45.29275894165039, 48.330101013183594, 51.3674430847168, 54.40478515625, 57.4421272277832, 60.479469299316406, 63.516815185546875, 66.55415344238281, 69.59149932861328, 72.62884521484375, 75.66618347167969, 78.70352935791016, 81.7408676147461, 84.77821350097656, 87.8155517578125, 90.85289764404297, 93.89024353027344, 96.92758178710938, 99.96492004394531, 103.00226593017578, 106.03960418701172, 109.07695007324219, 112.11428833007812, 115.1516342163086, 118.18898010253906, 121.226318359375, 124.26366424560547]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 6.0, 5.0, 5.0, 7.0, 9.0, 5.0, 14.0, 13.0, 18.0, 25.0, 33.0, 24.0, 24.0, 41.0, 28.0, 39.0, 32.0, 40.0, 42.0, 38.0, 34.0, 37.0, 43.0, 42.0, 35.0, 32.0, 32.0, 35.0, 34.0, 26.0, 28.0, 27.0, 24.0, 17.0, 13.0, 9.0, 15.0, 18.0, 16.0, 7.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-40.74736022949219, -39.589813232421875, -38.4322624206543, -37.27471160888672, -36.117164611816406, -34.959617614746094, -33.802066802978516, -32.64451599121094, -31.486968994140625, -30.32942008972168, -29.171871185302734, -28.01432228088379, -26.856773376464844, -25.6992244720459, -24.541675567626953, -23.384126663208008, -22.226577758789062, -21.069028854370117, -19.911479949951172, -18.753931045532227, -17.59638214111328, -16.438833236694336, -15.28128433227539, -14.123735427856445, -12.9661865234375, -11.808637619018555, -10.65108871459961, -9.493539810180664, -8.335990905761719, -7.178442001342773, -6.020893096923828, -4.863344192504883, -3.705791473388672, -2.5482425689697266, -1.3906936645507812, -0.23314476013183594, 0.9244041442871094, 2.0819530487060547, 3.239501953125, 4.397050857543945, 5.554599761962891, 6.712148666381836, 7.869697570800781, 9.027246475219727, 10.184795379638672, 11.342344284057617, 12.499893188476562, 13.657442092895508, 14.814990997314453, 15.972539901733398, 17.130088806152344, 18.28763771057129, 19.445186614990234, 20.60273551940918, 21.760284423828125, 22.91783332824707, 24.075382232666016, 25.23293113708496, 26.390480041503906, 27.54802894592285, 28.705577850341797, 29.863126754760742, 31.020675659179688, 32.17822265625, 33.33577346801758]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 2.0, 6.0, 5.0, 5.0, 6.0, 8.0, 13.0, 14.0, 18.0, 19.0, 13.0, 17.0, 27.0, 23.0, 40.0, 31.0, 29.0, 32.0, 52.0, 44.0, 49.0, 49.0, 38.0, 49.0, 50.0, 41.0, 38.0, 40.0, 31.0, 34.0, 29.0, 33.0, 17.0, 22.0, 6.0, 18.0, 8.0, 14.0, 13.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.0625, -3.93463134765625, -3.8067626953125, -3.67889404296875, -3.551025390625, -3.42315673828125, -3.2952880859375, -3.16741943359375, -3.03955078125, -2.91168212890625, -2.7838134765625, -2.65594482421875, -2.528076171875, -2.40020751953125, -2.2723388671875, -2.14447021484375, -2.0166015625, -1.88873291015625, -1.7608642578125, -1.63299560546875, -1.505126953125, -1.37725830078125, -1.2493896484375, -1.12152099609375, -0.99365234375, -0.86578369140625, -0.7379150390625, -0.61004638671875, -0.482177734375, -0.35430908203125, -0.2264404296875, -0.09857177734375, 0.029296875, 0.15716552734375, 0.2850341796875, 0.41290283203125, 0.540771484375, 0.66864013671875, 0.7965087890625, 0.92437744140625, 1.05224609375, 1.18011474609375, 1.3079833984375, 1.43585205078125, 1.563720703125, 1.69158935546875, 1.8194580078125, 1.94732666015625, 2.0751953125, 2.20306396484375, 2.3309326171875, 2.45880126953125, 2.586669921875, 2.71453857421875, 2.8424072265625, 2.97027587890625, 3.09814453125, 3.22601318359375, 3.3538818359375, 3.48175048828125, 3.609619140625, 3.73748779296875, 3.8653564453125, 3.99322509765625, 4.12109375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 9.0, 11.0, 24.0, 19.0, 43.0, 54.0, 95.0, 123.0, 180.0, 267.0, 423.0, 668.0, 1121.0, 1766.0, 3096.0, 5136.0, 8884.0, 15481.0, 27102.0, 50508.0, 98507.0, 201509.0, 283850.0, 168604.0, 82436.0, 43016.0, 23261.0, 13201.0, 7738.0, 4427.0, 2608.0, 1640.0, 1004.0, 643.0, 386.0, 234.0, 170.0, 95.0, 69.0, 43.0, 32.0, 26.0, 9.0, 9.0, 9.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.68115234375, -0.6594390869140625, -0.637725830078125, -0.6160125732421875, -0.59429931640625, -0.5725860595703125, -0.550872802734375, -0.5291595458984375, -0.5074462890625, -0.4857330322265625, -0.464019775390625, -0.4423065185546875, -0.42059326171875, -0.3988800048828125, -0.377166748046875, -0.3554534912109375, -0.333740234375, -0.3120269775390625, -0.290313720703125, -0.2686004638671875, -0.24688720703125, -0.2251739501953125, -0.203460693359375, -0.1817474365234375, -0.1600341796875, -0.1383209228515625, -0.116607666015625, -0.0948944091796875, -0.07318115234375, -0.0514678955078125, -0.029754638671875, -0.0080413818359375, 0.013671875, 0.0353851318359375, 0.057098388671875, 0.0788116455078125, 0.10052490234375, 0.1222381591796875, 0.143951416015625, 0.1656646728515625, 0.1873779296875, 0.2090911865234375, 0.230804443359375, 0.2525177001953125, 0.27423095703125, 0.2959442138671875, 0.317657470703125, 0.3393707275390625, 0.361083984375, 0.3827972412109375, 0.404510498046875, 0.4262237548828125, 0.44793701171875, 0.4696502685546875, 0.491363525390625, 0.5130767822265625, 0.5347900390625, 0.5565032958984375, 0.578216552734375, 0.5999298095703125, 0.62164306640625, 0.6433563232421875, 0.665069580078125, 0.6867828369140625, 0.70849609375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 8.0, 5.0, 6.0, 8.0, 7.0, 20.0, 15.0, 15.0, 16.0, 20.0, 26.0, 28.0, 28.0, 38.0, 25.0, 30.0, 37.0, 50.0, 42.0, 40.0, 34.0, 1046.0, 31.0, 33.0, 35.0, 37.0, 43.0, 31.0, 45.0, 33.0, 26.0, 25.0, 15.0, 17.0, 17.0, 17.0, 15.0, 12.0, 10.0, 10.0, 6.0, 8.0, 6.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0], "bins": [-2.57421875, -2.503326416015625, -2.43243408203125, -2.361541748046875, -2.2906494140625, -2.219757080078125, -2.14886474609375, -2.077972412109375, -2.007080078125, -1.936187744140625, -1.86529541015625, -1.794403076171875, -1.7235107421875, -1.652618408203125, -1.58172607421875, -1.510833740234375, -1.43994140625, -1.369049072265625, -1.29815673828125, -1.227264404296875, -1.1563720703125, -1.085479736328125, -1.01458740234375, -0.943695068359375, -0.872802734375, -0.801910400390625, -0.73101806640625, -0.660125732421875, -0.5892333984375, -0.518341064453125, -0.44744873046875, -0.376556396484375, -0.3056640625, -0.234771728515625, -0.16387939453125, -0.092987060546875, -0.0220947265625, 0.048797607421875, 0.11968994140625, 0.190582275390625, 0.261474609375, 0.332366943359375, 0.40325927734375, 0.474151611328125, 0.5450439453125, 0.615936279296875, 0.68682861328125, 0.757720947265625, 0.82861328125, 0.899505615234375, 0.97039794921875, 1.041290283203125, 1.1121826171875, 1.183074951171875, 1.25396728515625, 1.324859619140625, 1.395751953125, 1.466644287109375, 1.53753662109375, 1.608428955078125, 1.6793212890625, 1.750213623046875, 1.82110595703125, 1.891998291015625, 1.962890625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 5.0, 5.0, 8.0, 12.0, 21.0, 35.0, 55.0, 77.0, 107.0, 175.0, 326.0, 504.0, 779.0, 1194.0, 2080.0, 3282.0, 5545.0, 9419.0, 16180.0, 28295.0, 50109.0, 91348.0, 169611.0, 1292761.0, 188776.0, 103721.0, 56629.0, 31849.0, 17954.0, 10456.0, 6228.0, 3785.0, 2150.0, 1350.0, 824.0, 509.0, 350.0, 216.0, 138.0, 81.0, 69.0, 41.0, 28.0, 14.0, 12.0, 7.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.471923828125, -0.45787811279296875, -0.4438323974609375, -0.42978668212890625, -0.415740966796875, -0.40169525146484375, -0.3876495361328125, -0.37360382080078125, -0.35955810546875, -0.34551239013671875, -0.3314666748046875, -0.31742095947265625, -0.303375244140625, -0.28932952880859375, -0.2752838134765625, -0.26123809814453125, -0.2471923828125, -0.23314666748046875, -0.2191009521484375, -0.20505523681640625, -0.191009521484375, -0.17696380615234375, -0.1629180908203125, -0.14887237548828125, -0.13482666015625, -0.12078094482421875, -0.1067352294921875, -0.09268951416015625, -0.078643798828125, -0.06459808349609375, -0.0505523681640625, -0.03650665283203125, -0.0224609375, -0.00841522216796875, 0.0056304931640625, 0.01967620849609375, 0.033721923828125, 0.04776763916015625, 0.0618133544921875, 0.07585906982421875, 0.08990478515625, 0.10395050048828125, 0.1179962158203125, 0.13204193115234375, 0.146087646484375, 0.16013336181640625, 0.1741790771484375, 0.18822479248046875, 0.2022705078125, 0.21631622314453125, 0.2303619384765625, 0.24440765380859375, 0.258453369140625, 0.27249908447265625, 0.2865447998046875, 0.30059051513671875, 0.31463623046875, 0.32868194580078125, 0.3427276611328125, 0.35677337646484375, 0.370819091796875, 0.38486480712890625, 0.3989105224609375, 0.41295623779296875, 0.427001953125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 7.0, 4.0, 6.0, 9.0, 14.0, 9.0, 12.0, 18.0, 12.0, 25.0, 31.0, 37.0, 45.0, 55.0, 70.0, 69.0, 78.0, 79.0, 77.0, 64.0, 57.0, 39.0, 38.0, 35.0, 20.0, 18.0, 17.0, 10.0, 4.0, 5.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021152496337890625, -0.002048969268798828, -0.0019826889038085938, -0.0019164085388183594, -0.001850128173828125, -0.0017838478088378906, -0.0017175674438476562, -0.0016512870788574219, -0.0015850067138671875, -0.0015187263488769531, -0.0014524459838867188, -0.0013861656188964844, -0.00131988525390625, -0.0012536048889160156, -0.0011873245239257812, -0.0011210441589355469, -0.0010547637939453125, -0.0009884834289550781, -0.0009222030639648438, -0.0008559226989746094, -0.000789642333984375, -0.0007233619689941406, -0.0006570816040039062, -0.0005908012390136719, -0.0005245208740234375, -0.0004582405090332031, -0.00039196014404296875, -0.0003256797790527344, -0.0002593994140625, -0.00019311904907226562, -0.00012683868408203125, -6.0558319091796875e-05, 5.7220458984375e-06, 7.200241088867188e-05, 0.00013828277587890625, 0.00020456314086914062, 0.000270843505859375, 0.0003371238708496094, 0.00040340423583984375, 0.0004696846008300781, 0.0005359649658203125, 0.0006022453308105469, 0.0006685256958007812, 0.0007348060607910156, 0.00080108642578125, 0.0008673667907714844, 0.0009336471557617188, 0.0009999275207519531, 0.0010662078857421875, 0.0011324882507324219, 0.0011987686157226562, 0.0012650489807128906, 0.001331329345703125, 0.0013976097106933594, 0.0014638900756835938, 0.0015301704406738281, 0.0015964508056640625, 0.0016627311706542969, 0.0017290115356445312, 0.0017952919006347656, 0.001861572265625, 0.0019278526306152344, 0.0019941329956054688, 0.002060413360595703, 0.0021266937255859375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 7.0, 10.0, 10.0, 13.0, 17.0, 16.0, 27.0, 49.0, 84.0, 125.0, 227.0, 542.0, 3579.0, 1039957.0, 2735.0, 486.0, 257.0, 133.0, 73.0, 41.0, 28.0, 27.0, 16.0, 8.0, 13.0, 11.0, 14.0, 3.0, 12.0, 5.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059326171875, -0.05749940872192383, -0.055672645568847656, -0.053845882415771484, -0.05201911926269531, -0.05019235610961914, -0.04836559295654297, -0.0465388298034668, -0.044712066650390625, -0.04288530349731445, -0.04105854034423828, -0.03923177719116211, -0.03740501403808594, -0.035578250885009766, -0.033751487731933594, -0.03192472457885742, -0.03009796142578125, -0.028271198272705078, -0.026444435119628906, -0.024617671966552734, -0.022790908813476562, -0.02096414566040039, -0.01913738250732422, -0.017310619354248047, -0.015483856201171875, -0.013657093048095703, -0.011830329895019531, -0.01000356674194336, -0.008176803588867188, -0.006350040435791016, -0.004523277282714844, -0.002696514129638672, -0.0008697509765625, 0.0009570121765136719, 0.0027837753295898438, 0.004610538482666016, 0.0064373016357421875, 0.00826406478881836, 0.010090827941894531, 0.011917591094970703, 0.013744354248046875, 0.015571117401123047, 0.01739788055419922, 0.01922464370727539, 0.021051406860351562, 0.022878170013427734, 0.024704933166503906, 0.026531696319580078, 0.02835845947265625, 0.030185222625732422, 0.032011985778808594, 0.033838748931884766, 0.03566551208496094, 0.03749227523803711, 0.03931903839111328, 0.04114580154418945, 0.042972564697265625, 0.0447993278503418, 0.04662609100341797, 0.04845285415649414, 0.05027961730957031, 0.052106380462646484, 0.053933143615722656, 0.05575990676879883, 0.057586669921875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 80.0, 939.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005784960929304361, -0.004382389597594738, -0.002979818033054471, -0.001577246468514204, -0.0001746751368045807, 0.0012278961949050426, 0.0026304679922759533, 0.004033038858324289, 0.0054356106556952, 0.006838181987404823, 0.008240753784775734, 0.009643325582146645, 0.01104589644819498, 0.012448467314243317, 0.013851039111614227, 0.015253610908985138, 0.01665618270635605, 0.01805875450372696, 0.01946132630109787, 0.02086389809846878, 0.022266468033194542, 0.023669039830565453, 0.025071611627936363, 0.026474181562662125, 0.027876753360033035, 0.029279325157403946, 0.030681896954774857, 0.03208446875214577, 0.03348704054951668, 0.03488960862159729, 0.0362921804189682, 0.03769475221633911, 0.03909732773900032, 0.04049989953637123, 0.04190247133374214, 0.04330504313111305, 0.04470761492848396, 0.046110183000564575, 0.047512754797935486, 0.048915326595306396, 0.05031789839267731, 0.05172047019004822, 0.05312304198741913, 0.05452561378479004, 0.05592818558216095, 0.05733075737953186, 0.05873332917690277, 0.06013589724898338, 0.06153847277164459, 0.0629410445690155, 0.06434361636638641, 0.06574618816375732, 0.06714875996112823, 0.06855133175849915, 0.06995390355587006, 0.07135647535324097, 0.07275903970003128, 0.07416161149740219, 0.0755641832947731, 0.07696675509214401, 0.07836932688951492, 0.07977189868688583, 0.08117447048425674, 0.08257704228162766, 0.08397961407899857]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 11.0, 9.0, 11.0, 13.0, 26.0, 32.0, 42.0, 39.0, 47.0, 48.0, 55.0, 65.0, 66.0, 67.0, 72.0, 77.0, 62.0, 63.0, 42.0, 26.0, 27.0, 31.0, 19.0, 17.0, 9.0, 14.0, 7.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0022071003913879395, -0.0021561840549111366, -0.002105267718434334, -0.002054351381957531, -0.002003435045480728, -0.0019525187090039253, -0.0019016023725271225, -0.0018506860360503197, -0.0017997696995735168, -0.001748853363096714, -0.0016979370266199112, -0.0016470206901431084, -0.0015961043536663055, -0.0015451880171895027, -0.0014942716807126999, -0.001443355344235897, -0.0013924390077590942, -0.0013415226712822914, -0.0012906063348054886, -0.0012396899983286858, -0.001188773661851883, -0.0011378573253750801, -0.0010869409888982773, -0.0010360246524214745, -0.0009851083159446716, -0.0009341919794678688, -0.000883275642991066, -0.0008323593065142632, -0.0007814429700374603, -0.0007305266335606575, -0.0006796102970838547, -0.0006286939606070518, -0.000577777624130249, -0.0005268612876534462, -0.00047594495117664337, -0.00042502861469984055, -0.0003741122782230377, -0.0003231959417462349, -0.00027227960526943207, -0.00022136326879262924, -0.00017044693231582642, -0.00011953059583902359, -6.861425936222076e-05, -1.7697922885417938e-05, 3.321841359138489e-05, 8.413475006818771e-05, 0.00013505108654499054, 0.00018596742302179337, 0.0002368837594985962, 0.000287800095975399, 0.00033871643245220184, 0.00038963276892900467, 0.0004405491054058075, 0.0004914654418826103, 0.0005423817783594131, 0.000593298114836216, 0.0006442144513130188, 0.0006951307877898216, 0.0007460471242666245, 0.0007969634607434273, 0.0008478797972202301, 0.0008987961336970329, 0.0009497124701738358, 0.0010006288066506386, 0.0010515451431274414]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 2.0, 6.0, 5.0, 5.0, 6.0, 8.0, 13.0, 14.0, 18.0, 19.0, 13.0, 17.0, 27.0, 23.0, 40.0, 31.0, 29.0, 32.0, 52.0, 44.0, 49.0, 49.0, 38.0, 49.0, 50.0, 41.0, 38.0, 40.0, 31.0, 34.0, 29.0, 33.0, 17.0, 22.0, 6.0, 18.0, 8.0, 14.0, 13.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.0625, -3.93463134765625, -3.8067626953125, -3.67889404296875, -3.551025390625, -3.42315673828125, -3.2952880859375, -3.16741943359375, -3.03955078125, -2.91168212890625, -2.7838134765625, -2.65594482421875, -2.528076171875, -2.40020751953125, -2.2723388671875, -2.14447021484375, -2.0166015625, -1.88873291015625, -1.7608642578125, -1.63299560546875, -1.505126953125, -1.37725830078125, -1.2493896484375, -1.12152099609375, -0.99365234375, -0.86578369140625, -0.7379150390625, -0.61004638671875, -0.482177734375, -0.35430908203125, -0.2264404296875, -0.09857177734375, 0.029296875, 0.15716552734375, 0.2850341796875, 0.41290283203125, 0.540771484375, 0.66864013671875, 0.7965087890625, 0.92437744140625, 1.05224609375, 1.18011474609375, 1.3079833984375, 1.43585205078125, 1.563720703125, 1.69158935546875, 1.8194580078125, 1.94732666015625, 2.0751953125, 2.20306396484375, 2.3309326171875, 2.45880126953125, 2.586669921875, 2.71453857421875, 2.8424072265625, 2.97027587890625, 3.09814453125, 3.22601318359375, 3.3538818359375, 3.48175048828125, 3.609619140625, 3.73748779296875, 3.8653564453125, 3.99322509765625, 4.12109375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 9.0, 2.0, 12.0, 7.0, 15.0, 18.0, 35.0, 24.0, 54.0, 78.0, 135.0, 183.0, 356.0, 539.0, 909.0, 1592.0, 2904.0, 5377.0, 9890.0, 21155.0, 47447.0, 122927.0, 320665.0, 309943.0, 116403.0, 45790.0, 20528.0, 9983.0, 4999.0, 2728.0, 1513.0, 920.0, 508.0, 303.0, 198.0, 140.0, 76.0, 61.0, 37.0, 34.0, 15.0, 14.0, 6.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.5546875, -2.47479248046875, -2.3948974609375, -2.31500244140625, -2.235107421875, -2.15521240234375, -2.0753173828125, -1.99542236328125, -1.91552734375, -1.83563232421875, -1.7557373046875, -1.67584228515625, -1.595947265625, -1.51605224609375, -1.4361572265625, -1.35626220703125, -1.2763671875, -1.19647216796875, -1.1165771484375, -1.03668212890625, -0.956787109375, -0.87689208984375, -0.7969970703125, -0.71710205078125, -0.63720703125, -0.55731201171875, -0.4774169921875, -0.39752197265625, -0.317626953125, -0.23773193359375, -0.1578369140625, -0.07794189453125, 0.001953125, 0.08184814453125, 0.1617431640625, 0.24163818359375, 0.321533203125, 0.40142822265625, 0.4813232421875, 0.56121826171875, 0.64111328125, 0.72100830078125, 0.8009033203125, 0.88079833984375, 0.960693359375, 1.04058837890625, 1.1204833984375, 1.20037841796875, 1.2802734375, 1.36016845703125, 1.4400634765625, 1.51995849609375, 1.599853515625, 1.67974853515625, 1.7596435546875, 1.83953857421875, 1.91943359375, 1.99932861328125, 2.0792236328125, 2.15911865234375, 2.239013671875, 2.31890869140625, 2.3988037109375, 2.47869873046875, 2.55859375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 1.0, 5.0, 5.0, 9.0, 19.0, 12.0, 18.0, 22.0, 30.0, 27.0, 28.0, 37.0, 39.0, 44.0, 37.0, 44.0, 53.0, 73.0, 236.0, 1699.0, 140.0, 63.0, 60.0, 54.0, 41.0, 36.0, 32.0, 22.0, 24.0, 21.0, 20.0, 25.0, 16.0, 14.0, 6.0, 6.0, 10.0, 10.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.421875, -13.9615478515625, -13.501220703125, -13.0408935546875, -12.58056640625, -12.1202392578125, -11.659912109375, -11.1995849609375, -10.7392578125, -10.2789306640625, -9.818603515625, -9.3582763671875, -8.89794921875, -8.4376220703125, -7.977294921875, -7.5169677734375, -7.056640625, -6.5963134765625, -6.135986328125, -5.6756591796875, -5.21533203125, -4.7550048828125, -4.294677734375, -3.8343505859375, -3.3740234375, -2.9136962890625, -2.453369140625, -1.9930419921875, -1.53271484375, -1.0723876953125, -0.612060546875, -0.1517333984375, 0.30859375, 0.7689208984375, 1.229248046875, 1.6895751953125, 2.14990234375, 2.6102294921875, 3.070556640625, 3.5308837890625, 3.9912109375, 4.4515380859375, 4.911865234375, 5.3721923828125, 5.83251953125, 6.2928466796875, 6.753173828125, 7.2135009765625, 7.673828125, 8.1341552734375, 8.594482421875, 9.0548095703125, 9.51513671875, 9.9754638671875, 10.435791015625, 10.8961181640625, 11.3564453125, 11.8167724609375, 12.277099609375, 12.7374267578125, 13.19775390625, 13.6580810546875, 14.118408203125, 14.5787353515625, 15.0390625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 11.0, 5.0, 12.0, 13.0, 24.0, 25.0, 21.0, 34.0, 31.0, 50.0, 83.0, 132.0, 185.0, 299.0, 672.0, 3459.0, 207884.0, 2920189.0, 10299.0, 1104.0, 402.0, 210.0, 151.0, 87.0, 62.0, 53.0, 27.0, 47.0, 23.0, 25.0, 17.0, 17.0, 12.0, 11.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.65625, -23.890380859375, -23.12451171875, -22.358642578125, -21.5927734375, -20.826904296875, -20.06103515625, -19.295166015625, -18.529296875, -17.763427734375, -16.99755859375, -16.231689453125, -15.4658203125, -14.699951171875, -13.93408203125, -13.168212890625, -12.40234375, -11.636474609375, -10.87060546875, -10.104736328125, -9.3388671875, -8.572998046875, -7.80712890625, -7.041259765625, -6.275390625, -5.509521484375, -4.74365234375, -3.977783203125, -3.2119140625, -2.446044921875, -1.68017578125, -0.914306640625, -0.1484375, 0.617431640625, 1.38330078125, 2.149169921875, 2.9150390625, 3.680908203125, 4.44677734375, 5.212646484375, 5.978515625, 6.744384765625, 7.51025390625, 8.276123046875, 9.0419921875, 9.807861328125, 10.57373046875, 11.339599609375, 12.10546875, 12.871337890625, 13.63720703125, 14.403076171875, 15.1689453125, 15.934814453125, 16.70068359375, 17.466552734375, 18.232421875, 18.998291015625, 19.76416015625, 20.530029296875, 21.2958984375, 22.061767578125, 22.82763671875, 23.593505859375, 24.359375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 7.0, 330.0, 642.0, 35.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.857102394104004, -7.4332780838012695, -4.009453773498535, -0.5856294631958008, 2.8381948471069336, 6.262019157409668, 9.685843467712402, 13.109667778015137, 16.533493041992188, 19.957317352294922, 23.381141662597656, 26.80496597290039, 30.228790283203125, 33.65261459350586, 37.076438903808594, 40.50026321411133, 43.92408752441406, 47.3479118347168, 50.77173614501953, 54.195560455322266, 57.619384765625, 61.043209075927734, 64.46703338623047, 67.89085388183594, 71.31468200683594, 74.73851013183594, 78.1623306274414, 81.58615112304688, 85.00997924804688, 88.43380737304688, 91.85762786865234, 95.28144836425781, 98.70527648925781, 102.12910461425781, 105.55292510986328, 108.97674560546875, 112.40057373046875, 115.82440185546875, 119.24822235107422, 122.67204284667969, 126.09587097167969, 129.5196990966797, 132.94351196289062, 136.36734008789062, 139.79116821289062, 143.21499633789062, 146.63882446289062, 150.06263732910156, 153.48646545410156, 156.91029357910156, 160.3341064453125, 163.7579345703125, 167.1817626953125, 170.6055908203125, 174.0294189453125, 177.45323181152344, 180.87705993652344, 184.30088806152344, 187.72470092773438, 191.14852905273438, 194.57235717773438, 197.99618530273438, 201.42001342773438, 204.8438262939453, 208.2676544189453]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 10.0, 7.0, 11.0, 13.0, 11.0, 12.0, 17.0, 23.0, 14.0, 27.0, 22.0, 21.0, 41.0, 27.0, 36.0, 39.0, 43.0, 42.0, 41.0, 45.0, 35.0, 48.0, 33.0, 42.0, 31.0, 36.0, 26.0, 34.0, 26.0, 29.0, 29.0, 15.0, 14.0, 12.0, 14.0, 15.0, 12.0, 7.0, 10.0, 6.0, 9.0, 5.0, 3.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.402992248535156, -45.00642395019531, -43.6098518371582, -42.21328353881836, -40.816715240478516, -39.420143127441406, -38.02357482910156, -36.62700653076172, -35.230438232421875, -33.83386993408203, -32.43729782104492, -31.040729522705078, -29.644161224365234, -28.247591018676758, -26.85102081298828, -25.454452514648438, -24.057880401611328, -22.66131019592285, -21.264741897583008, -19.86817169189453, -18.471603393554688, -17.07503318786621, -15.678462982177734, -14.281893730163574, -12.885324478149414, -11.488755226135254, -10.092185974121094, -8.695615768432617, -7.299046516418457, -5.902477264404297, -4.50590705871582, -3.10933780670166, -1.7127685546875, -0.31619906425476074, 1.0803704261779785, 2.476940155029297, 3.873509407043457, 5.270078659057617, 6.666648864746094, 8.063218116760254, 9.459787368774414, 10.856356620788574, 12.252925872802734, 13.649496078491211, 15.046065330505371, 16.44263458251953, 17.839204788208008, 19.235774993896484, 20.632343292236328, 22.028913497924805, 23.42548179626465, 24.822052001953125, 26.21862030029297, 27.615190505981445, 29.011760711669922, 30.408329010009766, 31.804899215698242, 33.20146942138672, 34.59803771972656, 35.994606018066406, 37.391178131103516, 38.78774642944336, 40.18431854248047, 41.58088684082031, 42.977455139160156]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 6.0, 5.0, 7.0, 6.0, 10.0, 7.0, 12.0, 21.0, 14.0, 23.0, 22.0, 21.0, 24.0, 26.0, 31.0, 43.0, 40.0, 34.0, 38.0, 47.0, 42.0, 49.0, 42.0, 48.0, 35.0, 39.0, 44.0, 29.0, 40.0, 36.0, 29.0, 18.0, 19.0, 15.0, 17.0, 11.0, 9.0, 15.0, 5.0, 6.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.984375, -3.8560791015625, -3.727783203125, -3.5994873046875, -3.47119140625, -3.3428955078125, -3.214599609375, -3.0863037109375, -2.9580078125, -2.8297119140625, -2.701416015625, -2.5731201171875, -2.44482421875, -2.3165283203125, -2.188232421875, -2.0599365234375, -1.931640625, -1.8033447265625, -1.675048828125, -1.5467529296875, -1.41845703125, -1.2901611328125, -1.161865234375, -1.0335693359375, -0.9052734375, -0.7769775390625, -0.648681640625, -0.5203857421875, -0.39208984375, -0.2637939453125, -0.135498046875, -0.0072021484375, 0.12109375, 0.2493896484375, 0.377685546875, 0.5059814453125, 0.63427734375, 0.7625732421875, 0.890869140625, 1.0191650390625, 1.1474609375, 1.2757568359375, 1.404052734375, 1.5323486328125, 1.66064453125, 1.7889404296875, 1.917236328125, 2.0455322265625, 2.173828125, 2.3021240234375, 2.430419921875, 2.5587158203125, 2.68701171875, 2.8153076171875, 2.943603515625, 3.0718994140625, 3.2001953125, 3.3284912109375, 3.456787109375, 3.5850830078125, 3.71337890625, 3.8416748046875, 3.969970703125, 4.0982666015625, 4.2265625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 9.0, 7.0, 8.0, 6.0, 11.0, 12.0, 20.0, 18.0, 28.0, 36.0, 42.0, 48.0, 96.0, 196.0, 458.0, 1461.0, 6701.0, 40312.0, 499362.0, 3050256.0, 543206.0, 42409.0, 6941.0, 1546.0, 508.0, 205.0, 96.0, 74.0, 38.0, 35.0, 34.0, 28.0, 17.0, 13.0, 7.0, 8.0, 8.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.890625, -12.494140625, -12.09765625, -11.701171875, -11.3046875, -10.908203125, -10.51171875, -10.115234375, -9.71875, -9.322265625, -8.92578125, -8.529296875, -8.1328125, -7.736328125, -7.33984375, -6.943359375, -6.546875, -6.150390625, -5.75390625, -5.357421875, -4.9609375, -4.564453125, -4.16796875, -3.771484375, -3.375, -2.978515625, -2.58203125, -2.185546875, -1.7890625, -1.392578125, -0.99609375, -0.599609375, -0.203125, 0.193359375, 0.58984375, 0.986328125, 1.3828125, 1.779296875, 2.17578125, 2.572265625, 2.96875, 3.365234375, 3.76171875, 4.158203125, 4.5546875, 4.951171875, 5.34765625, 5.744140625, 6.140625, 6.537109375, 6.93359375, 7.330078125, 7.7265625, 8.123046875, 8.51953125, 8.916015625, 9.3125, 9.708984375, 10.10546875, 10.501953125, 10.8984375, 11.294921875, 11.69140625, 12.087890625, 12.484375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 3.0, 10.0, 16.0, 15.0, 41.0, 54.0, 85.0, 121.0, 185.0, 301.0, 388.0, 592.0, 662.0, 529.0, 366.0, 248.0, 166.0, 110.0, 55.0, 47.0, 28.0, 15.0, 14.0, 9.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.46875, -13.974365234375, -13.47998046875, -12.985595703125, -12.4912109375, -11.996826171875, -11.50244140625, -11.008056640625, -10.513671875, -10.019287109375, -9.52490234375, -9.030517578125, -8.5361328125, -8.041748046875, -7.54736328125, -7.052978515625, -6.55859375, -6.064208984375, -5.56982421875, -5.075439453125, -4.5810546875, -4.086669921875, -3.59228515625, -3.097900390625, -2.603515625, -2.109130859375, -1.61474609375, -1.120361328125, -0.6259765625, -0.131591796875, 0.36279296875, 0.857177734375, 1.3515625, 1.845947265625, 2.34033203125, 2.834716796875, 3.3291015625, 3.823486328125, 4.31787109375, 4.812255859375, 5.306640625, 5.801025390625, 6.29541015625, 6.789794921875, 7.2841796875, 7.778564453125, 8.27294921875, 8.767333984375, 9.26171875, 9.756103515625, 10.25048828125, 10.744873046875, 11.2392578125, 11.733642578125, 12.22802734375, 12.722412109375, 13.216796875, 13.711181640625, 14.20556640625, 14.699951171875, 15.1943359375, 15.688720703125, 16.18310546875, 16.677490234375, 17.171875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 4.0, 14.0, 11.0, 18.0, 25.0, 31.0, 40.0, 65.0, 81.0, 109.0, 152.0, 281.0, 484.0, 1401.0, 9460.0, 355110.0, 3735260.0, 85421.0, 4204.0, 959.0, 402.0, 204.0, 145.0, 100.0, 86.0, 49.0, 40.0, 30.0, 20.0, 15.0, 10.0, 10.0, 10.0, 10.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.03125, -31.9052734375, -30.779296875, -29.6533203125, -28.52734375, -27.4013671875, -26.275390625, -25.1494140625, -24.0234375, -22.8974609375, -21.771484375, -20.6455078125, -19.51953125, -18.3935546875, -17.267578125, -16.1416015625, -15.015625, -13.8896484375, -12.763671875, -11.6376953125, -10.51171875, -9.3857421875, -8.259765625, -7.1337890625, -6.0078125, -4.8818359375, -3.755859375, -2.6298828125, -1.50390625, -0.3779296875, 0.748046875, 1.8740234375, 3.0, 4.1259765625, 5.251953125, 6.3779296875, 7.50390625, 8.6298828125, 9.755859375, 10.8818359375, 12.0078125, 13.1337890625, 14.259765625, 15.3857421875, 16.51171875, 17.6376953125, 18.763671875, 19.8896484375, 21.015625, 22.1416015625, 23.267578125, 24.3935546875, 25.51953125, 26.6455078125, 27.771484375, 28.8974609375, 30.0234375, 31.1494140625, 32.275390625, 33.4013671875, 34.52734375, 35.6533203125, 36.779296875, 37.9052734375, 39.03125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 15.0, 21.0, 48.0, 80.0, 110.0, 127.0, 148.0, 139.0, 104.0, 91.0, 49.0, 32.0, 22.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.87782287597656, -66.0169448852539, -64.15605926513672, -62.29518127441406, -60.43429946899414, -58.57341766357422, -56.71253967285156, -54.85165786743164, -52.99077606201172, -51.1298942565918, -49.269012451171875, -47.40813446044922, -45.5472526550293, -43.686370849609375, -41.82549285888672, -39.9646110534668, -38.103729248046875, -36.24284744262695, -34.38196563720703, -32.521087646484375, -30.660205841064453, -28.79932403564453, -26.938444137573242, -25.077564239501953, -23.21668243408203, -21.35580062866211, -19.49492073059082, -17.63404083251953, -15.77315902709961, -13.912278175354004, -12.051397323608398, -10.190516471862793, -8.329639434814453, -6.468758583068848, -4.607877731323242, -2.7469968795776367, -0.8861160278320312, 0.9747648239135742, 2.8356456756591797, 4.696526527404785, 6.557407379150391, 8.418288230895996, 10.279169082641602, 12.140049934387207, 14.000930786132812, 15.861811637878418, 17.722692489624023, 19.583572387695312, 21.444454193115234, 23.305335998535156, 25.166215896606445, 27.027095794677734, 28.887977600097656, 30.748859405517578, 32.6097412109375, 34.470619201660156, 36.33150100708008, 38.1923828125, 40.053260803222656, 41.91414260864258, 43.7750244140625, 45.63590621948242, 47.496788024902344, 49.357666015625, 51.21854782104492]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 11.0, 2.0, 9.0, 5.0, 7.0, 7.0, 10.0, 13.0, 13.0, 25.0, 20.0, 24.0, 18.0, 26.0, 34.0, 35.0, 34.0, 32.0, 34.0, 45.0, 45.0, 42.0, 36.0, 32.0, 37.0, 37.0, 40.0, 45.0, 38.0, 34.0, 26.0, 28.0, 25.0, 24.0, 19.0, 10.0, 14.0, 12.0, 6.0, 12.0, 6.0, 9.0, 4.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-37.75487518310547, -36.618038177490234, -35.481201171875, -34.344364166259766, -33.20752716064453, -32.07068634033203, -30.933849334716797, -29.797012329101562, -28.660175323486328, -27.523338317871094, -26.38650131225586, -25.249662399291992, -24.112825393676758, -22.975988388061523, -21.839149475097656, -20.702312469482422, -19.565475463867188, -18.428638458251953, -17.29180145263672, -16.15496253967285, -15.018125534057617, -13.881288528442383, -12.744450569152832, -11.607612609863281, -10.470775604248047, -9.333938598632812, -8.197100639343262, -7.060263156890869, -5.923425674438477, -4.786588191986084, -3.6497507095336914, -2.512913227081299, -1.3760719299316406, -0.23923444747924805, 0.8976030349731445, 2.034440517425537, 3.1712779998779297, 4.308115482330322, 5.444952964782715, 6.581790447235107, 7.7186279296875, 8.855464935302734, 9.992302894592285, 11.129140853881836, 12.26597785949707, 13.402814865112305, 14.539652824401855, 15.676490783691406, 16.81332778930664, 17.950164794921875, 19.08700180053711, 20.223840713500977, 21.36067771911621, 22.497514724731445, 23.634353637695312, 24.771190643310547, 25.90802764892578, 27.044864654541016, 28.18170166015625, 29.318540573120117, 30.45537757873535, 31.592214584350586, 32.72905349731445, 33.86589050292969, 35.00272750854492]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 2.0, 3.0, 9.0, 7.0, 3.0, 14.0, 12.0, 13.0, 15.0, 16.0, 27.0, 30.0, 37.0, 18.0, 31.0, 31.0, 38.0, 36.0, 49.0, 32.0, 24.0, 44.0, 39.0, 41.0, 44.0, 39.0, 42.0, 35.0, 35.0, 25.0, 27.0, 32.0, 14.0, 18.0, 21.0, 15.0, 17.0, 14.0, 9.0, 7.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-3.7734375, -3.6500244140625, -3.526611328125, -3.4031982421875, -3.27978515625, -3.1563720703125, -3.032958984375, -2.9095458984375, -2.7861328125, -2.6627197265625, -2.539306640625, -2.4158935546875, -2.29248046875, -2.1690673828125, -2.045654296875, -1.9222412109375, -1.798828125, -1.6754150390625, -1.552001953125, -1.4285888671875, -1.30517578125, -1.1817626953125, -1.058349609375, -0.9349365234375, -0.8115234375, -0.6881103515625, -0.564697265625, -0.4412841796875, -0.31787109375, -0.1944580078125, -0.071044921875, 0.0523681640625, 0.17578125, 0.2991943359375, 0.422607421875, 0.5460205078125, 0.66943359375, 0.7928466796875, 0.916259765625, 1.0396728515625, 1.1630859375, 1.2864990234375, 1.409912109375, 1.5333251953125, 1.65673828125, 1.7801513671875, 1.903564453125, 2.0269775390625, 2.150390625, 2.2738037109375, 2.397216796875, 2.5206298828125, 2.64404296875, 2.7674560546875, 2.890869140625, 3.0142822265625, 3.1376953125, 3.2611083984375, 3.384521484375, 3.5079345703125, 3.63134765625, 3.7547607421875, 3.878173828125, 4.0015869140625, 4.125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 7.0, 9.0, 7.0, 17.0, 18.0, 32.0, 50.0, 61.0, 95.0, 157.0, 211.0, 340.0, 504.0, 783.0, 1251.0, 2034.0, 3090.0, 4983.0, 8004.0, 12731.0, 20690.0, 34590.0, 60725.0, 116437.0, 220953.0, 247929.0, 138780.0, 71922.0, 39796.0, 23511.0, 14461.0, 9010.0, 5564.0, 3608.0, 2277.0, 1375.0, 909.0, 558.0, 351.0, 243.0, 155.0, 102.0, 66.0, 62.0, 35.0, 17.0, 16.0, 11.0, 9.0, 9.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0], "bins": [-0.6591796875, -0.6386642456054688, -0.6181488037109375, -0.5976333618164062, -0.577117919921875, -0.5566024780273438, -0.5360870361328125, -0.5155715942382812, -0.49505615234375, -0.47454071044921875, -0.4540252685546875, -0.43350982666015625, -0.412994384765625, -0.39247894287109375, -0.3719635009765625, -0.35144805908203125, -0.3309326171875, -0.31041717529296875, -0.2899017333984375, -0.26938629150390625, -0.248870849609375, -0.22835540771484375, -0.2078399658203125, -0.18732452392578125, -0.16680908203125, -0.14629364013671875, -0.1257781982421875, -0.10526275634765625, -0.084747314453125, -0.06423187255859375, -0.0437164306640625, -0.02320098876953125, -0.002685546875, 0.01782989501953125, 0.0383453369140625, 0.05886077880859375, 0.079376220703125, 0.09989166259765625, 0.1204071044921875, 0.14092254638671875, 0.16143798828125, 0.18195343017578125, 0.2024688720703125, 0.22298431396484375, 0.243499755859375, 0.26401519775390625, 0.2845306396484375, 0.30504608154296875, 0.3255615234375, 0.34607696533203125, 0.3665924072265625, 0.38710784912109375, 0.407623291015625, 0.42813873291015625, 0.4486541748046875, 0.46916961669921875, 0.48968505859375, 0.5102005004882812, 0.5307159423828125, 0.5512313842773438, 0.571746826171875, 0.5922622680664062, 0.6127777099609375, 0.6332931518554688, 0.65380859375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 12.0, 10.0, 14.0, 15.0, 22.0, 20.0, 27.0, 35.0, 29.0, 25.0, 36.0, 35.0, 32.0, 47.0, 38.0, 46.0, 44.0, 1074.0, 51.0, 40.0, 38.0, 30.0, 32.0, 39.0, 24.0, 24.0, 24.0, 23.0, 22.0, 17.0, 21.0, 18.0, 12.0, 7.0, 14.0, 10.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.703125, -2.61761474609375, -2.5321044921875, -2.44659423828125, -2.361083984375, -2.27557373046875, -2.1900634765625, -2.10455322265625, -2.01904296875, -1.93353271484375, -1.8480224609375, -1.76251220703125, -1.677001953125, -1.59149169921875, -1.5059814453125, -1.42047119140625, -1.3349609375, -1.24945068359375, -1.1639404296875, -1.07843017578125, -0.992919921875, -0.90740966796875, -0.8218994140625, -0.73638916015625, -0.65087890625, -0.56536865234375, -0.4798583984375, -0.39434814453125, -0.308837890625, -0.22332763671875, -0.1378173828125, -0.05230712890625, 0.033203125, 0.11871337890625, 0.2042236328125, 0.28973388671875, 0.375244140625, 0.46075439453125, 0.5462646484375, 0.63177490234375, 0.71728515625, 0.80279541015625, 0.8883056640625, 0.97381591796875, 1.059326171875, 1.14483642578125, 1.2303466796875, 1.31585693359375, 1.4013671875, 1.48687744140625, 1.5723876953125, 1.65789794921875, 1.743408203125, 1.82891845703125, 1.9144287109375, 1.99993896484375, 2.08544921875, 2.17095947265625, 2.2564697265625, 2.34197998046875, 2.427490234375, 2.51300048828125, 2.5985107421875, 2.68402099609375, 2.76953125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 14.0, 17.0, 15.0, 23.0, 50.0, 88.0, 123.0, 186.0, 260.0, 460.0, 639.0, 1136.0, 1865.0, 2957.0, 4740.0, 8229.0, 14020.0, 24567.0, 44494.0, 82109.0, 150275.0, 1280807.0, 208124.0, 120739.0, 66204.0, 36189.0, 20022.0, 11507.0, 6784.0, 3896.0, 2558.0, 1496.0, 970.0, 566.0, 355.0, 241.0, 150.0, 86.0, 49.0, 47.0, 31.0, 18.0, 6.0, 7.0, 6.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.47607421875, -0.46111297607421875, -0.4461517333984375, -0.43119049072265625, -0.416229248046875, -0.40126800537109375, -0.3863067626953125, -0.37134552001953125, -0.35638427734375, -0.34142303466796875, -0.3264617919921875, -0.31150054931640625, -0.296539306640625, -0.28157806396484375, -0.2666168212890625, -0.25165557861328125, -0.2366943359375, -0.22173309326171875, -0.2067718505859375, -0.19181060791015625, -0.176849365234375, -0.16188812255859375, -0.1469268798828125, -0.13196563720703125, -0.11700439453125, -0.10204315185546875, -0.0870819091796875, -0.07212066650390625, -0.057159423828125, -0.04219818115234375, -0.0272369384765625, -0.01227569580078125, 0.002685546875, 0.01764678955078125, 0.0326080322265625, 0.04756927490234375, 0.062530517578125, 0.07749176025390625, 0.0924530029296875, 0.10741424560546875, 0.12237548828125, 0.13733673095703125, 0.1522979736328125, 0.16725921630859375, 0.182220458984375, 0.19718170166015625, 0.2121429443359375, 0.22710418701171875, 0.2420654296875, 0.25702667236328125, 0.2719879150390625, 0.28694915771484375, 0.301910400390625, 0.31687164306640625, 0.3318328857421875, 0.34679412841796875, 0.36175537109375, 0.37671661376953125, 0.3916778564453125, 0.40663909912109375, 0.421600341796875, 0.43656158447265625, 0.4515228271484375, 0.46648406982421875, 0.4814453125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 2.0, 6.0, 11.0, 13.0, 10.0, 10.0, 19.0, 19.0, 19.0, 26.0, 27.0, 27.0, 35.0, 26.0, 52.0, 49.0, 46.0, 57.0, 48.0, 59.0, 50.0, 57.0, 37.0, 48.0, 47.0, 29.0, 32.0, 23.0, 23.0, 22.0, 14.0, 12.0, 9.0, 7.0, 5.0, 11.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001453399658203125, -0.0014071613550186157, -0.0013609230518341064, -0.0013146847486495972, -0.0012684464454650879, -0.0012222081422805786, -0.0011759698390960693, -0.00112973153591156, -0.0010834932327270508, -0.0010372549295425415, -0.0009910166263580322, -0.000944778323173523, -0.0008985400199890137, -0.0008523017168045044, -0.0008060634136199951, -0.0007598251104354858, -0.0007135868072509766, -0.0006673485040664673, -0.000621110200881958, -0.0005748718976974487, -0.0005286335945129395, -0.0004823952913284302, -0.0004361569881439209, -0.0003899186849594116, -0.00034368038177490234, -0.00029744207859039307, -0.0002512037754058838, -0.0002049654722213745, -0.00015872716903686523, -0.00011248886585235596, -6.625056266784668e-05, -2.0012259483337402e-05, 2.6226043701171875e-05, 7.246434688568115e-05, 0.00011870265007019043, 0.0001649409532546997, 0.00021117925643920898, 0.00025741755962371826, 0.00030365586280822754, 0.0003498941659927368, 0.0003961324691772461, 0.00044237077236175537, 0.0004886090755462646, 0.0005348473787307739, 0.0005810856819152832, 0.0006273239850997925, 0.0006735622882843018, 0.000719800591468811, 0.0007660388946533203, 0.0008122771978378296, 0.0008585155010223389, 0.0009047538042068481, 0.0009509921073913574, 0.0009972304105758667, 0.001043468713760376, 0.0010897070169448853, 0.0011359453201293945, 0.0011821836233139038, 0.001228421926498413, 0.0012746602296829224, 0.0013208985328674316, 0.001367136836051941, 0.0014133751392364502, 0.0014596134424209595, 0.0015058517456054688]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 1.0, 7.0, 9.0, 14.0, 18.0, 17.0, 21.0, 40.0, 53.0, 75.0, 121.0, 251.0, 613.0, 7625.0, 1035418.0, 3174.0, 521.0, 217.0, 105.0, 62.0, 50.0, 36.0, 18.0, 15.0, 20.0, 11.0, 10.0, 12.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05255126953125, -0.05087900161743164, -0.04920673370361328, -0.04753446578979492, -0.04586219787597656, -0.0441899299621582, -0.042517662048339844, -0.040845394134521484, -0.039173126220703125, -0.037500858306884766, -0.035828590393066406, -0.03415632247924805, -0.03248405456542969, -0.030811786651611328, -0.02913951873779297, -0.02746725082397461, -0.02579498291015625, -0.02412271499633789, -0.02245044708251953, -0.020778179168701172, -0.019105911254882812, -0.017433643341064453, -0.015761375427246094, -0.014089107513427734, -0.012416839599609375, -0.010744571685791016, -0.009072303771972656, -0.007400035858154297, -0.0057277679443359375, -0.004055500030517578, -0.0023832321166992188, -0.0007109642028808594, 0.0009613037109375, 0.0026335716247558594, 0.004305839538574219, 0.005978107452392578, 0.0076503753662109375, 0.009322643280029297, 0.010994911193847656, 0.012667179107666016, 0.014339447021484375, 0.016011714935302734, 0.017683982849121094, 0.019356250762939453, 0.021028518676757812, 0.022700786590576172, 0.02437305450439453, 0.02604532241821289, 0.02771759033203125, 0.02938985824584961, 0.03106212615966797, 0.03273439407348633, 0.03440666198730469, 0.03607892990112305, 0.037751197814941406, 0.039423465728759766, 0.041095733642578125, 0.042768001556396484, 0.044440269470214844, 0.0461125373840332, 0.04778480529785156, 0.04945707321166992, 0.05112934112548828, 0.05280160903930664, 0.054473876953125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1017.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0044039469212293625, -0.003146381815895438, -0.001888816710561514, -0.0006312516052275896, 0.0006263135001063347, 0.0018838783726096153, 0.0031414437107741833, 0.004399009048938751, 0.005656573921442032, 0.0069141387939453125, 0.008171703666448593, 0.009429269470274448, 0.010686834342777729, 0.01194439921528101, 0.013201965019106865, 0.014459529891610146, 0.015717094764113426, 0.016974659636616707, 0.018232224509119987, 0.019489789381623268, 0.020747356116771698, 0.02200492098927498, 0.02326248586177826, 0.02452005073428154, 0.02577761560678482, 0.0270351804792881, 0.028292745351791382, 0.029550310224294662, 0.030807875096797943, 0.032065439969301224, 0.033323004841804504, 0.034580573439598083, 0.035838134586811066, 0.037095699459314346, 0.03835326433181763, 0.03961082920432091, 0.04086839407682419, 0.04212595894932747, 0.04338352382183075, 0.04464109241962433, 0.04589865356683731, 0.04715621843934059, 0.04841378331184387, 0.04967134818434715, 0.05092891305685043, 0.052186477929353714, 0.053444042801856995, 0.054701611399650574, 0.055959176272153854, 0.057216741144657135, 0.058474306017160416, 0.059731870889663696, 0.06098943576216698, 0.06224700063467026, 0.06350456923246384, 0.06476213037967682, 0.0660196989774704, 0.06727726757526398, 0.06853482872247696, 0.06979239732027054, 0.07104995846748352, 0.0723075270652771, 0.07356508821249008, 0.07482265681028366, 0.07608021795749664]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 20.0, 24.0, 28.0, 35.0, 44.0, 62.0, 61.0, 63.0, 74.0, 73.0, 73.0, 78.0, 61.0, 64.0, 58.0, 43.0, 40.0, 22.0, 25.0, 21.0, 9.0, 3.0, 11.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019169449806213379, -0.0018700174987316132, -0.0018230900168418884, -0.0017761625349521637, -0.001729235053062439, -0.0016823075711727142, -0.0016353800892829895, -0.0015884526073932648, -0.00154152512550354, -0.0014945976436138153, -0.0014476701617240906, -0.0014007426798343658, -0.0013538151979446411, -0.0013068877160549164, -0.0012599602341651917, -0.001213032752275467, -0.0011661052703857422, -0.0011191777884960175, -0.0010722503066062927, -0.001025322824716568, -0.0009783953428268433, -0.0009314678609371185, -0.0008845403790473938, -0.0008376128971576691, -0.0007906854152679443, -0.0007437579333782196, -0.0006968304514884949, -0.0006499029695987701, -0.0006029754877090454, -0.0005560480058193207, -0.000509120523929596, -0.0004621930420398712, -0.0004152655601501465, -0.00036833807826042175, -0.000321410596370697, -0.0002744831144809723, -0.00022755563259124756, -0.00018062815070152283, -0.0001337006688117981, -8.677318692207336e-05, -3.984570503234863e-05, 7.081776857376099e-06, 5.400925874710083e-05, 0.00010093674063682556, 0.0001478642225265503, 0.00019479170441627502, 0.00024171918630599976, 0.0002886466681957245, 0.0003355741500854492, 0.00038250163197517395, 0.0004294291138648987, 0.0004763565957546234, 0.0005232840776443481, 0.0005702115595340729, 0.0006171390414237976, 0.0006640665233135223, 0.0007109940052032471, 0.0007579214870929718, 0.0008048489689826965, 0.0008517764508724213, 0.000898703932762146, 0.0009456314146518707, 0.0009925588965415955, 0.0010394863784313202, 0.001086413860321045]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 2.0, 3.0, 9.0, 7.0, 3.0, 14.0, 12.0, 13.0, 15.0, 16.0, 27.0, 30.0, 37.0, 18.0, 31.0, 31.0, 38.0, 36.0, 49.0, 32.0, 24.0, 44.0, 39.0, 41.0, 44.0, 39.0, 42.0, 35.0, 35.0, 25.0, 27.0, 32.0, 14.0, 17.0, 22.0, 15.0, 17.0, 14.0, 9.0, 7.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-3.7734375, -3.6500244140625, -3.526611328125, -3.4031982421875, -3.27978515625, -3.1563720703125, -3.032958984375, -2.9095458984375, -2.7861328125, -2.6627197265625, -2.539306640625, -2.4158935546875, -2.29248046875, -2.1690673828125, -2.045654296875, -1.9222412109375, -1.798828125, -1.6754150390625, -1.552001953125, -1.4285888671875, -1.30517578125, -1.1817626953125, -1.058349609375, -0.9349365234375, -0.8115234375, -0.6881103515625, -0.564697265625, -0.4412841796875, -0.31787109375, -0.1944580078125, -0.071044921875, 0.0523681640625, 0.17578125, 0.2991943359375, 0.422607421875, 0.5460205078125, 0.66943359375, 0.7928466796875, 0.916259765625, 1.0396728515625, 1.1630859375, 1.2864990234375, 1.409912109375, 1.5333251953125, 1.65673828125, 1.7801513671875, 1.903564453125, 2.0269775390625, 2.150390625, 2.2738037109375, 2.397216796875, 2.5206298828125, 2.64404296875, 2.7674560546875, 2.890869140625, 3.0142822265625, 3.1376953125, 3.2611083984375, 3.384521484375, 3.5079345703125, 3.63134765625, 3.7547607421875, 3.878173828125, 4.0015869140625, 4.125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 6.0, 16.0, 21.0, 23.0, 43.0, 55.0, 91.0, 141.0, 214.0, 255.0, 449.0, 705.0, 1098.0, 1946.0, 3126.0, 5928.0, 11776.0, 26368.0, 71488.0, 283443.0, 472455.0, 102319.0, 34697.0, 14904.0, 7298.0, 3746.0, 2153.0, 1305.0, 834.0, 558.0, 362.0, 214.0, 167.0, 94.0, 75.0, 58.0, 27.0, 22.0, 24.0, 9.0, 13.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.6015625, -4.4627685546875, -4.323974609375, -4.1851806640625, -4.04638671875, -3.9075927734375, -3.768798828125, -3.6300048828125, -3.4912109375, -3.3524169921875, -3.213623046875, -3.0748291015625, -2.93603515625, -2.7972412109375, -2.658447265625, -2.5196533203125, -2.380859375, -2.2420654296875, -2.103271484375, -1.9644775390625, -1.82568359375, -1.6868896484375, -1.548095703125, -1.4093017578125, -1.2705078125, -1.1317138671875, -0.992919921875, -0.8541259765625, -0.71533203125, -0.5765380859375, -0.437744140625, -0.2989501953125, -0.16015625, -0.0213623046875, 0.117431640625, 0.2562255859375, 0.39501953125, 0.5338134765625, 0.672607421875, 0.8114013671875, 0.9501953125, 1.0889892578125, 1.227783203125, 1.3665771484375, 1.50537109375, 1.6441650390625, 1.782958984375, 1.9217529296875, 2.060546875, 2.1993408203125, 2.338134765625, 2.4769287109375, 2.61572265625, 2.7545166015625, 2.893310546875, 3.0321044921875, 3.1708984375, 3.3096923828125, 3.448486328125, 3.5872802734375, 3.72607421875, 3.8648681640625, 4.003662109375, 4.1424560546875, 4.28125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 3.0, 7.0, 9.0, 10.0, 8.0, 14.0, 10.0, 18.0, 21.0, 24.0, 30.0, 36.0, 38.0, 43.0, 42.0, 43.0, 66.0, 106.0, 426.0, 1516.0, 112.0, 65.0, 51.0, 41.0, 40.0, 38.0, 38.0, 28.0, 22.0, 20.0, 15.0, 21.0, 16.0, 17.0, 8.0, 11.0, 8.0, 7.0, 8.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4375, -14.9842529296875, -14.531005859375, -14.0777587890625, -13.62451171875, -13.1712646484375, -12.718017578125, -12.2647705078125, -11.8115234375, -11.3582763671875, -10.905029296875, -10.4517822265625, -9.99853515625, -9.5452880859375, -9.092041015625, -8.6387939453125, -8.185546875, -7.7322998046875, -7.279052734375, -6.8258056640625, -6.37255859375, -5.9193115234375, -5.466064453125, -5.0128173828125, -4.5595703125, -4.1063232421875, -3.653076171875, -3.1998291015625, -2.74658203125, -2.2933349609375, -1.840087890625, -1.3868408203125, -0.93359375, -0.4803466796875, -0.027099609375, 0.4261474609375, 0.87939453125, 1.3326416015625, 1.785888671875, 2.2391357421875, 2.6923828125, 3.1456298828125, 3.598876953125, 4.0521240234375, 4.50537109375, 4.9586181640625, 5.411865234375, 5.8651123046875, 6.318359375, 6.7716064453125, 7.224853515625, 7.6781005859375, 8.13134765625, 8.5845947265625, 9.037841796875, 9.4910888671875, 9.9443359375, 10.3975830078125, 10.850830078125, 11.3040771484375, 11.75732421875, 12.2105712890625, 12.663818359375, 13.1170654296875, 13.5703125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 6.0, 13.0, 15.0, 18.0, 18.0, 34.0, 35.0, 34.0, 60.0, 106.0, 183.0, 296.0, 663.0, 5228.0, 2771982.0, 362797.0, 2875.0, 590.0, 282.0, 140.0, 112.0, 62.0, 42.0, 22.0, 28.0, 17.0, 13.0, 10.0, 9.0, 3.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.1875, -31.998046875, -30.80859375, -29.619140625, -28.4296875, -27.240234375, -26.05078125, -24.861328125, -23.671875, -22.482421875, -21.29296875, -20.103515625, -18.9140625, -17.724609375, -16.53515625, -15.345703125, -14.15625, -12.966796875, -11.77734375, -10.587890625, -9.3984375, -8.208984375, -7.01953125, -5.830078125, -4.640625, -3.451171875, -2.26171875, -1.072265625, 0.1171875, 1.306640625, 2.49609375, 3.685546875, 4.875, 6.064453125, 7.25390625, 8.443359375, 9.6328125, 10.822265625, 12.01171875, 13.201171875, 14.390625, 15.580078125, 16.76953125, 17.958984375, 19.1484375, 20.337890625, 21.52734375, 22.716796875, 23.90625, 25.095703125, 26.28515625, 27.474609375, 28.6640625, 29.853515625, 31.04296875, 32.232421875, 33.421875, 34.611328125, 35.80078125, 36.990234375, 38.1796875, 39.369140625, 40.55859375, 41.748046875, 42.9375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 11.0, 108.0, 326.0, 384.0, 154.0, 25.0, 6.0], "bins": [-116.4489974975586, -114.5123062133789, -112.57561492919922, -110.63893127441406, -108.70223999023438, -106.76554870605469, -104.828857421875, -102.89217376708984, -100.95548248291016, -99.01879119873047, -97.08209991455078, -95.14541625976562, -93.20872497558594, -91.27203369140625, -89.33534240722656, -87.3986587524414, -85.46196746826172, -83.52527618408203, -81.58858489990234, -79.65190124511719, -77.7152099609375, -75.77851867675781, -73.84182739257812, -71.90514373779297, -69.96845245361328, -68.0317611694336, -66.0950698852539, -64.15838623046875, -62.22169494628906, -60.285003662109375, -58.34831619262695, -56.411624908447266, -54.474937438964844, -52.538246154785156, -50.601558685302734, -48.66486740112305, -46.728179931640625, -44.79148864746094, -42.854801177978516, -40.91810989379883, -38.98141860961914, -37.04472732543945, -35.10803985595703, -33.171348571777344, -31.234661102294922, -29.297969818115234, -27.361282348632812, -25.424591064453125, -23.487903594970703, -21.55121421813965, -19.614524841308594, -17.67783546447754, -15.741146087646484, -13.804455757141113, -11.867766380310059, -9.931077003479004, -7.994387626647949, -6.0576982498168945, -4.12100887298584, -2.184319019317627, -0.24762964248657227, 1.6890602111816406, 3.6257495880126953, 5.56243896484375, 7.499128341674805]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 3.0, 10.0, 8.0, 12.0, 14.0, 13.0, 14.0, 21.0, 23.0, 18.0, 24.0, 19.0, 28.0, 34.0, 38.0, 39.0, 31.0, 27.0, 44.0, 30.0, 42.0, 47.0, 37.0, 41.0, 26.0, 36.0, 42.0, 27.0, 25.0, 27.0, 26.0, 19.0, 17.0, 18.0, 21.0, 13.0, 14.0, 13.0, 10.0, 10.0, 11.0, 7.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-38.564788818359375, -37.33913040161133, -36.113468170166016, -34.88780975341797, -33.66215133666992, -32.436492919921875, -31.210830688476562, -29.985172271728516, -28.759511947631836, -27.533851623535156, -26.30819320678711, -25.08253288269043, -23.85687255859375, -22.631214141845703, -21.405553817749023, -20.179893493652344, -18.954235076904297, -17.728574752807617, -16.50291633605957, -15.27725601196289, -14.051596641540527, -12.825937271118164, -11.600276947021484, -10.374617576599121, -9.148958206176758, -7.9232988357543945, -6.697638988494873, -5.471979141235352, -4.246319770812988, -3.020660400390625, -1.7950005531311035, -0.569340705871582, 0.6563224792480469, 1.8819820880889893, 3.1076416969299316, 4.333301544189453, 5.558960914611816, 6.78462028503418, 8.01028060913086, 9.235939979553223, 10.461599349975586, 11.68725872039795, 12.912918090820312, 14.138578414916992, 15.364237785339355, 16.58989715576172, 17.8155574798584, 19.041217803955078, 20.266876220703125, 21.492536544799805, 22.71819496154785, 23.94385528564453, 25.169513702392578, 26.395174026489258, 27.620834350585938, 28.846492767333984, 30.072153091430664, 31.297813415527344, 32.52347183227539, 33.74913024902344, 34.97479248046875, 36.2004508972168, 37.426109313964844, 38.651771545410156, 39.8774299621582]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 9.0, 5.0, 10.0, 16.0, 19.0, 15.0, 26.0, 23.0, 29.0, 31.0, 30.0, 30.0, 26.0, 44.0, 40.0, 47.0, 32.0, 31.0, 39.0, 34.0, 48.0, 45.0, 41.0, 34.0, 30.0, 32.0, 27.0, 30.0, 27.0, 16.0, 15.0, 18.0, 18.0, 9.0, 11.0, 9.0, 8.0, 5.0, 8.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.828125, -3.7001953125, -3.572265625, -3.4443359375, -3.31640625, -3.1884765625, -3.060546875, -2.9326171875, -2.8046875, -2.6767578125, -2.548828125, -2.4208984375, -2.29296875, -2.1650390625, -2.037109375, -1.9091796875, -1.78125, -1.6533203125, -1.525390625, -1.3974609375, -1.26953125, -1.1416015625, -1.013671875, -0.8857421875, -0.7578125, -0.6298828125, -0.501953125, -0.3740234375, -0.24609375, -0.1181640625, 0.009765625, 0.1376953125, 0.265625, 0.3935546875, 0.521484375, 0.6494140625, 0.77734375, 0.9052734375, 1.033203125, 1.1611328125, 1.2890625, 1.4169921875, 1.544921875, 1.6728515625, 1.80078125, 1.9287109375, 2.056640625, 2.1845703125, 2.3125, 2.4404296875, 2.568359375, 2.6962890625, 2.82421875, 2.9521484375, 3.080078125, 3.2080078125, 3.3359375, 3.4638671875, 3.591796875, 3.7197265625, 3.84765625, 3.9755859375, 4.103515625, 4.2314453125, 4.359375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 5.0, 14.0, 12.0, 22.0, 33.0, 36.0, 60.0, 94.0, 122.0, 233.0, 357.0, 623.0, 1166.0, 2037.0, 3913.0, 7713.0, 16157.0, 38373.0, 105833.0, 350384.0, 1036272.0, 1471909.0, 778856.0, 246066.0, 77810.0, 29637.0, 13104.0, 6232.0, 3157.0, 1617.0, 977.0, 513.0, 364.0, 188.0, 119.0, 82.0, 54.0, 45.0, 29.0, 21.0, 8.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4921875, -4.333740234375, -4.17529296875, -4.016845703125, -3.8583984375, -3.699951171875, -3.54150390625, -3.383056640625, -3.224609375, -3.066162109375, -2.90771484375, -2.749267578125, -2.5908203125, -2.432373046875, -2.27392578125, -2.115478515625, -1.95703125, -1.798583984375, -1.64013671875, -1.481689453125, -1.3232421875, -1.164794921875, -1.00634765625, -0.847900390625, -0.689453125, -0.531005859375, -0.37255859375, -0.214111328125, -0.0556640625, 0.102783203125, 0.26123046875, 0.419677734375, 0.578125, 0.736572265625, 0.89501953125, 1.053466796875, 1.2119140625, 1.370361328125, 1.52880859375, 1.687255859375, 1.845703125, 2.004150390625, 2.16259765625, 2.321044921875, 2.4794921875, 2.637939453125, 2.79638671875, 2.954833984375, 3.11328125, 3.271728515625, 3.43017578125, 3.588623046875, 3.7470703125, 3.905517578125, 4.06396484375, 4.222412109375, 4.380859375, 4.539306640625, 4.69775390625, 4.856201171875, 5.0146484375, 5.173095703125, 5.33154296875, 5.489990234375, 5.6484375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 6.0, 4.0, 11.0, 19.0, 7.0, 22.0, 32.0, 32.0, 49.0, 82.0, 86.0, 111.0, 180.0, 217.0, 270.0, 346.0, 433.0, 439.0, 428.0, 327.0, 231.0, 196.0, 133.0, 104.0, 102.0, 64.0, 29.0, 38.0, 19.0, 19.0, 11.0, 10.0, 7.0, 7.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-14.53125, -14.1788330078125, -13.826416015625, -13.4739990234375, -13.12158203125, -12.7691650390625, -12.416748046875, -12.0643310546875, -11.7119140625, -11.3594970703125, -11.007080078125, -10.6546630859375, -10.30224609375, -9.9498291015625, -9.597412109375, -9.2449951171875, -8.892578125, -8.5401611328125, -8.187744140625, -7.8353271484375, -7.48291015625, -7.1304931640625, -6.778076171875, -6.4256591796875, -6.0732421875, -5.7208251953125, -5.368408203125, -5.0159912109375, -4.66357421875, -4.3111572265625, -3.958740234375, -3.6063232421875, -3.25390625, -2.9014892578125, -2.549072265625, -2.1966552734375, -1.84423828125, -1.4918212890625, -1.139404296875, -0.7869873046875, -0.4345703125, -0.0821533203125, 0.270263671875, 0.6226806640625, 0.97509765625, 1.3275146484375, 1.679931640625, 2.0323486328125, 2.384765625, 2.7371826171875, 3.089599609375, 3.4420166015625, 3.79443359375, 4.1468505859375, 4.499267578125, 4.8516845703125, 5.2041015625, 5.5565185546875, 5.908935546875, 6.2613525390625, 6.61376953125, 6.9661865234375, 7.318603515625, 7.6710205078125, 8.0234375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 6.0, 15.0, 8.0, 15.0, 30.0, 36.0, 56.0, 53.0, 92.0, 132.0, 179.0, 394.0, 1002.0, 7275.0, 362465.0, 3756325.0, 61857.0, 2802.0, 673.0, 287.0, 157.0, 95.0, 88.0, 50.0, 42.0, 31.0, 26.0, 16.0, 18.0, 15.0, 10.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.5, -29.294921875, -28.08984375, -26.884765625, -25.6796875, -24.474609375, -23.26953125, -22.064453125, -20.859375, -19.654296875, -18.44921875, -17.244140625, -16.0390625, -14.833984375, -13.62890625, -12.423828125, -11.21875, -10.013671875, -8.80859375, -7.603515625, -6.3984375, -5.193359375, -3.98828125, -2.783203125, -1.578125, -0.373046875, 0.83203125, 2.037109375, 3.2421875, 4.447265625, 5.65234375, 6.857421875, 8.0625, 9.267578125, 10.47265625, 11.677734375, 12.8828125, 14.087890625, 15.29296875, 16.498046875, 17.703125, 18.908203125, 20.11328125, 21.318359375, 22.5234375, 23.728515625, 24.93359375, 26.138671875, 27.34375, 28.548828125, 29.75390625, 30.958984375, 32.1640625, 33.369140625, 34.57421875, 35.779296875, 36.984375, 38.189453125, 39.39453125, 40.599609375, 41.8046875, 43.009765625, 44.21484375, 45.419921875, 46.625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 14.0, 43.0, 101.0, 140.0, 186.0, 222.0, 157.0, 86.0, 32.0, 18.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.33330535888672, -121.43858337402344, -118.54386901855469, -115.6491470336914, -112.75443267822266, -109.85971069335938, -106.96499633789062, -104.07027435302734, -101.17555236816406, -98.28083038330078, -95.38611602783203, -92.49139404296875, -89.5966796875, -86.70195770263672, -83.80723571777344, -80.91252136230469, -78.01780700683594, -75.12308502197266, -72.2283706665039, -69.33364868164062, -66.43893432617188, -63.544212341308594, -60.64949417114258, -57.75477600097656, -54.86005783081055, -51.96533966064453, -49.070621490478516, -46.1759033203125, -43.28118133544922, -40.38646697998047, -37.49174499511719, -34.59702682495117, -31.702301025390625, -28.80758285522461, -25.912864685058594, -23.018144607543945, -20.12342643737793, -17.228708267211914, -14.333988189697266, -11.43927001953125, -8.544551849365234, -5.6498332023620605, -2.7551145553588867, 0.1396045684814453, 3.034322738647461, 5.929040908813477, 8.823760986328125, 11.71847915649414, 14.613197326660156, 17.507915496826172, 20.402633666992188, 23.297353744506836, 26.19207191467285, 29.086790084838867, 31.981510162353516, 34.87622833251953, 37.77094650268555, 40.66566467285156, 43.56038284301758, 46.455101013183594, 49.349822998046875, 52.244537353515625, 55.139259338378906, 58.03397750854492, 60.92869567871094]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 3.0, 6.0, 7.0, 3.0, 7.0, 9.0, 21.0, 13.0, 25.0, 21.0, 19.0, 28.0, 27.0, 27.0, 34.0, 28.0, 52.0, 51.0, 43.0, 34.0, 45.0, 36.0, 39.0, 52.0, 43.0, 29.0, 31.0, 23.0, 28.0, 27.0, 23.0, 23.0, 21.0, 20.0, 19.0, 13.0, 12.0, 10.0, 9.0, 14.0, 9.0, 2.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-40.26957702636719, -39.09467315673828, -37.91977310180664, -36.744869232177734, -35.56996536254883, -34.39506530761719, -33.22016143798828, -32.045257568359375, -30.870357513427734, -29.69545555114746, -28.520551681518555, -27.34564971923828, -26.170747756958008, -24.995845794677734, -23.820941925048828, -22.646039962768555, -21.47113609313965, -20.296234130859375, -19.12133026123047, -17.946428298950195, -16.771526336669922, -15.596623420715332, -14.421720504760742, -13.246818542480469, -12.071915626525879, -10.897012710571289, -9.722110748291016, -8.547207832336426, -7.372305393218994, -6.1974029541015625, -5.022500038146973, -3.847598075866699, -2.6726951599121094, -1.4977926015853882, -0.322890043258667, 0.8520126342773438, 2.0269150733947754, 3.201817512512207, 4.376720428466797, 5.55162239074707, 6.72652530670166, 7.901427745819092, 9.076330184936523, 10.251233100891113, 11.426136016845703, 12.601037979125977, 13.775940895080566, 14.95084285736084, 16.12574577331543, 17.300647735595703, 18.47555160522461, 19.650453567504883, 20.825355529785156, 22.000259399414062, 23.175161361694336, 24.35006332397461, 25.524967193603516, 26.69986915588379, 27.874773025512695, 29.04967498779297, 30.224576950073242, 31.399478912353516, 32.57438278198242, 33.74928283691406, 34.92418670654297]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 6.0, 6.0, 8.0, 10.0, 13.0, 13.0, 23.0, 21.0, 16.0, 32.0, 31.0, 39.0, 37.0, 32.0, 41.0, 41.0, 36.0, 41.0, 36.0, 40.0, 53.0, 48.0, 46.0, 35.0, 39.0, 26.0, 29.0, 28.0, 25.0, 27.0, 23.0, 12.0, 18.0, 13.0, 13.0, 9.0, 7.0, 3.0, 1.0, 5.0, 4.0, 8.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.6328125, -4.49237060546875, -4.3519287109375, -4.21148681640625, -4.071044921875, -3.93060302734375, -3.7901611328125, -3.64971923828125, -3.50927734375, -3.36883544921875, -3.2283935546875, -3.08795166015625, -2.947509765625, -2.80706787109375, -2.6666259765625, -2.52618408203125, -2.3857421875, -2.24530029296875, -2.1048583984375, -1.96441650390625, -1.823974609375, -1.68353271484375, -1.5430908203125, -1.40264892578125, -1.26220703125, -1.12176513671875, -0.9813232421875, -0.84088134765625, -0.700439453125, -0.55999755859375, -0.4195556640625, -0.27911376953125, -0.138671875, 0.00177001953125, 0.1422119140625, 0.28265380859375, 0.423095703125, 0.56353759765625, 0.7039794921875, 0.84442138671875, 0.98486328125, 1.12530517578125, 1.2657470703125, 1.40618896484375, 1.546630859375, 1.68707275390625, 1.8275146484375, 1.96795654296875, 2.1083984375, 2.24884033203125, 2.3892822265625, 2.52972412109375, 2.670166015625, 2.81060791015625, 2.9510498046875, 3.09149169921875, 3.23193359375, 3.37237548828125, 3.5128173828125, 3.65325927734375, 3.793701171875, 3.93414306640625, 4.0745849609375, 4.21502685546875, 4.35546875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 9.0, 19.0, 18.0, 26.0, 55.0, 57.0, 90.0, 145.0, 196.0, 284.0, 420.0, 642.0, 963.0, 1486.0, 2241.0, 3466.0, 5306.0, 8558.0, 13740.0, 22919.0, 39726.0, 73817.0, 147739.0, 262486.0, 217486.0, 109624.0, 56075.0, 31518.0, 18610.0, 10879.0, 7126.0, 4385.0, 2860.0, 1918.0, 1204.0, 795.0, 536.0, 344.0, 246.0, 174.0, 126.0, 62.0, 62.0, 35.0, 25.0, 19.0, 9.0, 9.0, 5.0, 5.0, 5.0, 3.0, 0.0, 3.0], "bins": [-0.77490234375, -0.7519683837890625, -0.729034423828125, -0.7061004638671875, -0.68316650390625, -0.6602325439453125, -0.637298583984375, -0.6143646240234375, -0.5914306640625, -0.5684967041015625, -0.545562744140625, -0.5226287841796875, -0.49969482421875, -0.4767608642578125, -0.453826904296875, -0.4308929443359375, -0.407958984375, -0.3850250244140625, -0.362091064453125, -0.3391571044921875, -0.31622314453125, -0.2932891845703125, -0.270355224609375, -0.2474212646484375, -0.2244873046875, -0.2015533447265625, -0.178619384765625, -0.1556854248046875, -0.13275146484375, -0.1098175048828125, -0.086883544921875, -0.0639495849609375, -0.041015625, -0.0180816650390625, 0.004852294921875, 0.0277862548828125, 0.05072021484375, 0.0736541748046875, 0.096588134765625, 0.1195220947265625, 0.1424560546875, 0.1653900146484375, 0.188323974609375, 0.2112579345703125, 0.23419189453125, 0.2571258544921875, 0.280059814453125, 0.3029937744140625, 0.325927734375, 0.3488616943359375, 0.371795654296875, 0.3947296142578125, 0.41766357421875, 0.4405975341796875, 0.463531494140625, 0.4864654541015625, 0.5093994140625, 0.5323333740234375, 0.555267333984375, 0.5782012939453125, 0.60113525390625, 0.6240692138671875, 0.647003173828125, 0.6699371337890625, 0.69287109375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 11.0, 11.0, 7.0, 10.0, 13.0, 16.0, 15.0, 18.0, 22.0, 30.0, 35.0, 29.0, 36.0, 34.0, 36.0, 49.0, 41.0, 45.0, 1080.0, 40.0, 38.0, 47.0, 27.0, 30.0, 46.0, 33.0, 25.0, 37.0, 34.0, 17.0, 15.0, 21.0, 8.0, 19.0, 10.0, 8.0, 7.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.982421875, -2.89306640625, -2.8037109375, -2.71435546875, -2.625, -2.53564453125, -2.4462890625, -2.35693359375, -2.267578125, -2.17822265625, -2.0888671875, -1.99951171875, -1.91015625, -1.82080078125, -1.7314453125, -1.64208984375, -1.552734375, -1.46337890625, -1.3740234375, -1.28466796875, -1.1953125, -1.10595703125, -1.0166015625, -0.92724609375, -0.837890625, -0.74853515625, -0.6591796875, -0.56982421875, -0.48046875, -0.39111328125, -0.3017578125, -0.21240234375, -0.123046875, -0.03369140625, 0.0556640625, 0.14501953125, 0.234375, 0.32373046875, 0.4130859375, 0.50244140625, 0.591796875, 0.68115234375, 0.7705078125, 0.85986328125, 0.94921875, 1.03857421875, 1.1279296875, 1.21728515625, 1.306640625, 1.39599609375, 1.4853515625, 1.57470703125, 1.6640625, 1.75341796875, 1.8427734375, 1.93212890625, 2.021484375, 2.11083984375, 2.2001953125, 2.28955078125, 2.37890625, 2.46826171875, 2.5576171875, 2.64697265625, 2.736328125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 6.0, 5.0, 8.0, 13.0, 19.0, 52.0, 65.0, 92.0, 154.0, 238.0, 422.0, 658.0, 1061.0, 1618.0, 2671.0, 4369.0, 7124.0, 11835.0, 20940.0, 36303.0, 65758.0, 124433.0, 218374.0, 1279643.0, 144616.0, 76684.0, 41656.0, 23772.0, 13642.0, 8091.0, 4941.0, 2977.0, 1839.0, 1120.0, 732.0, 443.0, 272.0, 172.0, 117.0, 70.0, 60.0, 19.0, 20.0, 10.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5224609375, -0.506195068359375, -0.48992919921875, -0.473663330078125, -0.4573974609375, -0.441131591796875, -0.42486572265625, -0.408599853515625, -0.392333984375, -0.376068115234375, -0.35980224609375, -0.343536376953125, -0.3272705078125, -0.311004638671875, -0.29473876953125, -0.278472900390625, -0.26220703125, -0.245941162109375, -0.22967529296875, -0.213409423828125, -0.1971435546875, -0.180877685546875, -0.16461181640625, -0.148345947265625, -0.132080078125, -0.115814208984375, -0.09954833984375, -0.083282470703125, -0.0670166015625, -0.050750732421875, -0.03448486328125, -0.018218994140625, -0.001953125, 0.014312744140625, 0.03057861328125, 0.046844482421875, 0.0631103515625, 0.079376220703125, 0.09564208984375, 0.111907958984375, 0.128173828125, 0.144439697265625, 0.16070556640625, 0.176971435546875, 0.1932373046875, 0.209503173828125, 0.22576904296875, 0.242034912109375, 0.25830078125, 0.274566650390625, 0.29083251953125, 0.307098388671875, 0.3233642578125, 0.339630126953125, 0.35589599609375, 0.372161865234375, 0.388427734375, 0.404693603515625, 0.42095947265625, 0.437225341796875, 0.4534912109375, 0.469757080078125, 0.48602294921875, 0.502288818359375, 0.5185546875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 8.0, 2.0, 7.0, 10.0, 15.0, 15.0, 23.0, 27.0, 38.0, 46.0, 50.0, 77.0, 76.0, 73.0, 71.0, 82.0, 65.0, 71.0, 52.0, 32.0, 38.0, 24.0, 30.0, 15.0, 14.0, 10.0, 2.0, 8.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00278472900390625, -0.002713307738304138, -0.0026418864727020264, -0.0025704652070999146, -0.0024990439414978027, -0.002427622675895691, -0.002356201410293579, -0.0022847801446914673, -0.0022133588790893555, -0.0021419376134872437, -0.002070516347885132, -0.00199909508228302, -0.0019276738166809082, -0.0018562525510787964, -0.0017848312854766846, -0.0017134100198745728, -0.001641988754272461, -0.0015705674886703491, -0.0014991462230682373, -0.0014277249574661255, -0.0013563036918640137, -0.0012848824262619019, -0.00121346116065979, -0.0011420398950576782, -0.0010706186294555664, -0.0009991973638534546, -0.0009277760982513428, -0.000856354832649231, -0.0007849335670471191, -0.0007135123014450073, -0.0006420910358428955, -0.0005706697702407837, -0.0004992485046386719, -0.00042782723903656006, -0.00035640597343444824, -0.0002849847078323364, -0.0002135634422302246, -0.0001421421766281128, -7.072091102600098e-05, 7.003545761108398e-07, 7.212162017822266e-05, 0.00014354288578033447, 0.0002149641513824463, 0.0002863854169845581, 0.0003578066825866699, 0.00042922794818878174, 0.0005006492137908936, 0.0005720704793930054, 0.0006434917449951172, 0.000714913010597229, 0.0007863342761993408, 0.0008577555418014526, 0.0009291768074035645, 0.0010005980730056763, 0.001072019338607788, 0.0011434406042099, 0.0012148618698120117, 0.0012862831354141235, 0.0013577044010162354, 0.0014291256666183472, 0.001500546932220459, 0.0015719681978225708, 0.0016433894634246826, 0.0017148107290267944, 0.0017862319946289062]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 8.0, 6.0, 1.0, 16.0, 16.0, 27.0, 39.0, 56.0, 65.0, 135.0, 298.0, 935.0, 413221.0, 632027.0, 1023.0, 316.0, 133.0, 79.0, 46.0, 28.0, 22.0, 18.0, 8.0, 6.0, 6.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055633544921875, -0.05341005325317383, -0.051186561584472656, -0.048963069915771484, -0.04673957824707031, -0.04451608657836914, -0.04229259490966797, -0.0400691032409668, -0.037845611572265625, -0.03562211990356445, -0.03339862823486328, -0.03117513656616211, -0.028951644897460938, -0.026728153228759766, -0.024504661560058594, -0.022281169891357422, -0.02005767822265625, -0.017834186553955078, -0.015610694885253906, -0.013387203216552734, -0.011163711547851562, -0.00894021987915039, -0.006716728210449219, -0.004493236541748047, -0.002269744873046875, -4.6253204345703125e-05, 0.0021772384643554688, 0.004400730133056641, 0.0066242218017578125, 0.008847713470458984, 0.011071205139160156, 0.013294696807861328, 0.0155181884765625, 0.017741680145263672, 0.019965171813964844, 0.022188663482666016, 0.024412155151367188, 0.02663564682006836, 0.02885913848876953, 0.031082630157470703, 0.033306121826171875, 0.03552961349487305, 0.03775310516357422, 0.03997659683227539, 0.04220008850097656, 0.044423580169677734, 0.046647071838378906, 0.04887056350708008, 0.05109405517578125, 0.05331754684448242, 0.055541038513183594, 0.057764530181884766, 0.05998802185058594, 0.06221151351928711, 0.06443500518798828, 0.06665849685668945, 0.06888198852539062, 0.0711054801940918, 0.07332897186279297, 0.07555246353149414, 0.07777595520019531, 0.07999944686889648, 0.08222293853759766, 0.08444643020629883, 0.086669921875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 12.0, 1007.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009045690298080444, -0.007335582748055458, -0.005625475198030472, -0.0039153676480054855, -0.0022052600979804993, -0.000495152547955513, 0.0012149550020694733, 0.0029250625520944595, 0.004635170102119446, 0.006345277652144432, 0.008055385202169418, 0.009765492752194405, 0.011475600302219391, 0.013185707852244377, 0.014895815402269363, 0.01660592295229435, 0.018316030502319336, 0.020026138052344322, 0.02173624560236931, 0.023446353152394295, 0.02515646070241928, 0.026866568252444267, 0.028576675802469254, 0.03028678335249424, 0.031996890902519226, 0.03370700031518936, 0.0354171060025692, 0.037127211689949036, 0.03883732110261917, 0.04054743051528931, 0.042257536202669144, 0.04396764189004898, 0.045677751302719116, 0.04738786071538925, 0.04909796640276909, 0.050808072090148926, 0.05251818150281906, 0.0542282909154892, 0.055938396602869034, 0.05764850229024887, 0.059358611702919006, 0.06106872111558914, 0.06277883052825928, 0.06448893249034882, 0.06619904190301895, 0.06790915131568909, 0.06961925327777863, 0.07132936269044876, 0.0730394721031189, 0.07474958151578903, 0.07645969092845917, 0.0781697928905487, 0.07987990230321884, 0.08159001171588898, 0.08330011367797852, 0.08501022309064865, 0.08672033250331879, 0.08843044191598892, 0.09014055132865906, 0.0918506532907486, 0.09356076270341873, 0.09527087211608887, 0.0969809740781784, 0.09869108349084854, 0.10040119290351868]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 8.0, 4.0, 9.0, 14.0, 21.0, 39.0, 34.0, 55.0, 72.0, 63.0, 80.0, 76.0, 71.0, 87.0, 80.0, 68.0, 58.0, 43.0, 45.0, 19.0, 19.0, 23.0, 8.0, 8.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0025292038917541504, -0.0024705110117793083, -0.0024118181318044662, -0.002353125251829624, -0.002294432371854782, -0.00223573949187994, -0.002177046611905098, -0.002118353731930256, -0.002059660851955414, -0.0020009679719805717, -0.0019422750920057297, -0.0018835822120308876, -0.0018248893320560455, -0.0017661964520812035, -0.0017075035721063614, -0.0016488106921315193, -0.0015901178121566772, -0.0015314249321818352, -0.001472732052206993, -0.001414039172232151, -0.001355346292257309, -0.0012966534122824669, -0.0012379605323076248, -0.0011792676523327827, -0.0011205747723579407, -0.0010618818923830986, -0.0010031890124082565, -0.0009444961324334145, -0.0008858032524585724, -0.0008271103724837303, -0.0007684174925088882, -0.0007097246125340462, -0.0006510317325592041, -0.000592338852584362, -0.00053364597260952, -0.0004749530926346779, -0.0004162602126598358, -0.00035756733268499374, -0.00029887445271015167, -0.0002401815727353096, -0.00018148869276046753, -0.00012279581278562546, -6.410293281078339e-05, -5.410052835941315e-06, 5.328282713890076e-05, 0.00011197570711374283, 0.0001706685870885849, 0.00022936146706342697, 0.00028805434703826904, 0.0003467472270131111, 0.0004054401069879532, 0.00046413298696279526, 0.0005228258669376373, 0.0005815187469124794, 0.0006402116268873215, 0.0006989045068621635, 0.0007575973868370056, 0.0008162902668118477, 0.0008749831467866898, 0.0009336760267615318, 0.000992368906736374, 0.001051061786711216, 0.001109754666686058, 0.0011684475466609001, 0.0012271404266357422]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 6.0, 6.0, 8.0, 10.0, 13.0, 13.0, 23.0, 21.0, 16.0, 32.0, 31.0, 39.0, 37.0, 32.0, 41.0, 41.0, 36.0, 41.0, 36.0, 40.0, 53.0, 48.0, 46.0, 35.0, 39.0, 26.0, 29.0, 28.0, 25.0, 27.0, 23.0, 12.0, 18.0, 13.0, 13.0, 9.0, 7.0, 3.0, 1.0, 5.0, 4.0, 8.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.6328125, -4.49237060546875, -4.3519287109375, -4.21148681640625, -4.071044921875, -3.93060302734375, -3.7901611328125, -3.64971923828125, -3.50927734375, -3.36883544921875, -3.2283935546875, -3.08795166015625, -2.947509765625, -2.80706787109375, -2.6666259765625, -2.52618408203125, -2.3857421875, -2.24530029296875, -2.1048583984375, -1.96441650390625, -1.823974609375, -1.68353271484375, -1.5430908203125, -1.40264892578125, -1.26220703125, -1.12176513671875, -0.9813232421875, -0.84088134765625, -0.700439453125, -0.55999755859375, -0.4195556640625, -0.27911376953125, -0.138671875, 0.00177001953125, 0.1422119140625, 0.28265380859375, 0.423095703125, 0.56353759765625, 0.7039794921875, 0.84442138671875, 0.98486328125, 1.12530517578125, 1.2657470703125, 1.40618896484375, 1.546630859375, 1.68707275390625, 1.8275146484375, 1.96795654296875, 2.1083984375, 2.24884033203125, 2.3892822265625, 2.52972412109375, 2.670166015625, 2.81060791015625, 2.9510498046875, 3.09149169921875, 3.23193359375, 3.37237548828125, 3.5128173828125, 3.65325927734375, 3.793701171875, 3.93414306640625, 4.0745849609375, 4.21502685546875, 4.35546875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 8.0, 6.0, 17.0, 22.0, 34.0, 39.0, 77.0, 92.0, 137.0, 245.0, 358.0, 546.0, 913.0, 1488.0, 2511.0, 4113.0, 7532.0, 15574.0, 37017.0, 110044.0, 404714.0, 317147.0, 86416.0, 30234.0, 13097.0, 6696.0, 3677.0, 2143.0, 1346.0, 807.0, 522.0, 310.0, 210.0, 172.0, 92.0, 79.0, 30.0, 18.0, 22.0, 7.0, 12.0, 10.0, 10.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.884765625, -3.762969970703125, -3.64117431640625, -3.519378662109375, -3.3975830078125, -3.275787353515625, -3.15399169921875, -3.032196044921875, -2.910400390625, -2.788604736328125, -2.66680908203125, -2.545013427734375, -2.4232177734375, -2.301422119140625, -2.17962646484375, -2.057830810546875, -1.93603515625, -1.814239501953125, -1.69244384765625, -1.570648193359375, -1.4488525390625, -1.327056884765625, -1.20526123046875, -1.083465576171875, -0.961669921875, -0.839874267578125, -0.71807861328125, -0.596282958984375, -0.4744873046875, -0.352691650390625, -0.23089599609375, -0.109100341796875, 0.0126953125, 0.134490966796875, 0.25628662109375, 0.378082275390625, 0.4998779296875, 0.621673583984375, 0.74346923828125, 0.865264892578125, 0.987060546875, 1.108856201171875, 1.23065185546875, 1.352447509765625, 1.4742431640625, 1.596038818359375, 1.71783447265625, 1.839630126953125, 1.96142578125, 2.083221435546875, 2.20501708984375, 2.326812744140625, 2.4486083984375, 2.570404052734375, 2.69219970703125, 2.813995361328125, 2.935791015625, 3.057586669921875, 3.17938232421875, 3.301177978515625, 3.4229736328125, 3.544769287109375, 3.66656494140625, 3.788360595703125, 3.91015625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 7.0, 9.0, 13.0, 15.0, 11.0, 22.0, 23.0, 23.0, 31.0, 40.0, 34.0, 33.0, 47.0, 43.0, 66.0, 83.0, 275.0, 1651.0, 167.0, 60.0, 68.0, 41.0, 37.0, 28.0, 28.0, 32.0, 27.0, 22.0, 23.0, 16.0, 15.0, 12.0, 12.0, 3.0, 0.0, 7.0, 5.0, 6.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.40625, -17.88525390625, -17.3642578125, -16.84326171875, -16.322265625, -15.80126953125, -15.2802734375, -14.75927734375, -14.23828125, -13.71728515625, -13.1962890625, -12.67529296875, -12.154296875, -11.63330078125, -11.1123046875, -10.59130859375, -10.0703125, -9.54931640625, -9.0283203125, -8.50732421875, -7.986328125, -7.46533203125, -6.9443359375, -6.42333984375, -5.90234375, -5.38134765625, -4.8603515625, -4.33935546875, -3.818359375, -3.29736328125, -2.7763671875, -2.25537109375, -1.734375, -1.21337890625, -0.6923828125, -0.17138671875, 0.349609375, 0.87060546875, 1.3916015625, 1.91259765625, 2.43359375, 2.95458984375, 3.4755859375, 3.99658203125, 4.517578125, 5.03857421875, 5.5595703125, 6.08056640625, 6.6015625, 7.12255859375, 7.6435546875, 8.16455078125, 8.685546875, 9.20654296875, 9.7275390625, 10.24853515625, 10.76953125, 11.29052734375, 11.8115234375, 12.33251953125, 12.853515625, 13.37451171875, 13.8955078125, 14.41650390625, 14.9375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 4.0, 12.0, 14.0, 15.0, 25.0, 30.0, 25.0, 30.0, 64.0, 49.0, 103.0, 123.0, 175.0, 291.0, 501.0, 2820.0, 341875.0, 2792083.0, 5631.0, 688.0, 333.0, 185.0, 149.0, 115.0, 81.0, 52.0, 46.0, 33.0, 32.0, 18.0, 21.0, 21.0, 9.0, 11.0, 9.0, 4.0, 4.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.5, -28.45068359375, -27.4013671875, -26.35205078125, -25.302734375, -24.25341796875, -23.2041015625, -22.15478515625, -21.10546875, -20.05615234375, -19.0068359375, -17.95751953125, -16.908203125, -15.85888671875, -14.8095703125, -13.76025390625, -12.7109375, -11.66162109375, -10.6123046875, -9.56298828125, -8.513671875, -7.46435546875, -6.4150390625, -5.36572265625, -4.31640625, -3.26708984375, -2.2177734375, -1.16845703125, -0.119140625, 0.93017578125, 1.9794921875, 3.02880859375, 4.078125, 5.12744140625, 6.1767578125, 7.22607421875, 8.275390625, 9.32470703125, 10.3740234375, 11.42333984375, 12.47265625, 13.52197265625, 14.5712890625, 15.62060546875, 16.669921875, 17.71923828125, 18.7685546875, 19.81787109375, 20.8671875, 21.91650390625, 22.9658203125, 24.01513671875, 25.064453125, 26.11376953125, 27.1630859375, 28.21240234375, 29.26171875, 30.31103515625, 31.3603515625, 32.40966796875, 33.458984375, 34.50830078125, 35.5576171875, 36.60693359375, 37.65625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 13.0, 26.0, 100.0, 220.0, 286.0, 234.0, 99.0, 20.0, 7.0, 3.0, 2.0, 1.0], "bins": [-62.753448486328125, -61.642967224121094, -60.5324821472168, -59.422000885009766, -58.31151580810547, -57.20103454589844, -56.090553283691406, -54.98006820678711, -53.86958694458008, -52.75910568237305, -51.64862060546875, -50.53813934326172, -49.42765808105469, -48.31717300415039, -47.20669174194336, -46.09620666503906, -44.98572540283203, -43.875244140625, -42.7647590637207, -41.65427780151367, -40.543792724609375, -39.433311462402344, -38.32283020019531, -37.212345123291016, -36.101863861083984, -34.99138259887695, -33.880897521972656, -32.770416259765625, -31.65993309020996, -30.549449920654297, -29.438968658447266, -28.3284854888916, -27.218006134033203, -26.10752296447754, -24.997039794921875, -23.886558532714844, -22.77607536315918, -21.665592193603516, -20.555110931396484, -19.44462776184082, -18.334144592285156, -17.223661422729492, -16.113178253173828, -15.002696990966797, -13.892213821411133, -12.781730651855469, -11.671248435974121, -10.560766220092773, -9.450282096862793, -8.339799880981445, -7.229316711425781, -6.118834018707275, -5.0083513259887695, -3.8978686332702637, -2.787385940551758, -1.676903247833252, -0.5664205551147461, 0.5440621376037598, 1.6545448303222656, 2.7650275230407715, 3.8755102157592773, 4.985992908477783, 6.096475601196289, 7.206958293914795, 8.3174409866333]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 2.0, 9.0, 14.0, 5.0, 14.0, 20.0, 20.0, 24.0, 18.0, 26.0, 25.0, 29.0, 42.0, 50.0, 53.0, 60.0, 47.0, 46.0, 48.0, 55.0, 48.0, 50.0, 40.0, 33.0, 40.0, 37.0, 24.0, 23.0, 19.0, 21.0, 20.0, 10.0, 7.0, 10.0, 3.0, 2.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.25403594970703, -49.77967834472656, -48.305320739746094, -46.830963134765625, -45.356605529785156, -43.88224792480469, -42.40789031982422, -40.93353271484375, -39.45917510986328, -37.98481750488281, -36.510459899902344, -35.036102294921875, -33.561744689941406, -32.08738708496094, -30.6130313873291, -29.138673782348633, -27.664318084716797, -26.189960479736328, -24.71560287475586, -23.24124526977539, -21.766887664794922, -20.292530059814453, -18.818174362182617, -17.34381675720215, -15.86945915222168, -14.395101547241211, -12.920743942260742, -11.44638729095459, -9.972029685974121, -8.497672080993652, -7.0233154296875, -5.548957824707031, -4.074604034423828, -2.6002466678619385, -1.1258893013000488, 0.3484678268432617, 1.8228254318237305, 3.297183036804199, 4.771539688110352, 6.24589729309082, 7.720254898071289, 9.194612503051758, 10.668970108032227, 12.143326759338379, 13.617684364318848, 15.092041969299316, 16.56639862060547, 18.040756225585938, 19.515113830566406, 20.989471435546875, 22.463829040527344, 23.938186645507812, 25.41254425048828, 26.88690185546875, 28.361257553100586, 29.835615158081055, 31.309972763061523, 32.78432846069336, 34.25868606567383, 35.7330436706543, 37.207401275634766, 38.681758880615234, 40.1561164855957, 41.63047409057617, 43.10483169555664]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 5.0, 5.0, 7.0, 8.0, 11.0, 12.0, 19.0, 13.0, 18.0, 21.0, 30.0, 40.0, 29.0, 44.0, 35.0, 27.0, 38.0, 28.0, 44.0, 46.0, 40.0, 37.0, 49.0, 48.0, 43.0, 30.0, 25.0, 36.0, 28.0, 24.0, 20.0, 22.0, 24.0, 13.0, 14.0, 15.0, 13.0, 12.0, 4.0, 2.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.6484375, -4.50909423828125, -4.3697509765625, -4.23040771484375, -4.091064453125, -3.95172119140625, -3.8123779296875, -3.67303466796875, -3.53369140625, -3.39434814453125, -3.2550048828125, -3.11566162109375, -2.976318359375, -2.83697509765625, -2.6976318359375, -2.55828857421875, -2.4189453125, -2.27960205078125, -2.1402587890625, -2.00091552734375, -1.861572265625, -1.72222900390625, -1.5828857421875, -1.44354248046875, -1.30419921875, -1.16485595703125, -1.0255126953125, -0.88616943359375, -0.746826171875, -0.60748291015625, -0.4681396484375, -0.32879638671875, -0.189453125, -0.05010986328125, 0.0892333984375, 0.22857666015625, 0.367919921875, 0.50726318359375, 0.6466064453125, 0.78594970703125, 0.92529296875, 1.06463623046875, 1.2039794921875, 1.34332275390625, 1.482666015625, 1.62200927734375, 1.7613525390625, 1.90069580078125, 2.0400390625, 2.17938232421875, 2.3187255859375, 2.45806884765625, 2.597412109375, 2.73675537109375, 2.8760986328125, 3.01544189453125, 3.15478515625, 3.29412841796875, 3.4334716796875, 3.57281494140625, 3.712158203125, 3.85150146484375, 3.9908447265625, 4.13018798828125, 4.26953125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 4.0, 7.0, 14.0, 14.0, 16.0, 21.0, 21.0, 27.0, 31.0, 52.0, 54.0, 75.0, 84.0, 116.0, 278.0, 1116.0, 12152.0, 774895.0, 3346999.0, 54178.0, 2957.0, 511.0, 177.0, 97.0, 69.0, 56.0, 39.0, 36.0, 38.0, 27.0, 23.0, 18.0, 11.0, 15.0, 11.0, 6.0, 8.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-25.875, -25.118896484375, -24.36279296875, -23.606689453125, -22.8505859375, -22.094482421875, -21.33837890625, -20.582275390625, -19.826171875, -19.070068359375, -18.31396484375, -17.557861328125, -16.8017578125, -16.045654296875, -15.28955078125, -14.533447265625, -13.77734375, -13.021240234375, -12.26513671875, -11.509033203125, -10.7529296875, -9.996826171875, -9.24072265625, -8.484619140625, -7.728515625, -6.972412109375, -6.21630859375, -5.460205078125, -4.7041015625, -3.947998046875, -3.19189453125, -2.435791015625, -1.6796875, -0.923583984375, -0.16748046875, 0.588623046875, 1.3447265625, 2.100830078125, 2.85693359375, 3.613037109375, 4.369140625, 5.125244140625, 5.88134765625, 6.637451171875, 7.3935546875, 8.149658203125, 8.90576171875, 9.661865234375, 10.41796875, 11.174072265625, 11.93017578125, 12.686279296875, 13.4423828125, 14.198486328125, 14.95458984375, 15.710693359375, 16.466796875, 17.222900390625, 17.97900390625, 18.735107421875, 19.4912109375, 20.247314453125, 21.00341796875, 21.759521484375, 22.515625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 5.0, 15.0, 19.0, 7.0, 24.0, 33.0, 43.0, 40.0, 57.0, 76.0, 121.0, 140.0, 156.0, 217.0, 297.0, 347.0, 423.0, 375.0, 365.0, 303.0, 204.0, 193.0, 141.0, 99.0, 80.0, 73.0, 49.0, 39.0, 29.0, 24.0, 17.0, 17.0, 10.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.9442138671875, -8.646240234375, -8.3482666015625, -8.05029296875, -7.7523193359375, -7.454345703125, -7.1563720703125, -6.8583984375, -6.5604248046875, -6.262451171875, -5.9644775390625, -5.66650390625, -5.3685302734375, -5.070556640625, -4.7725830078125, -4.474609375, -4.1766357421875, -3.878662109375, -3.5806884765625, -3.28271484375, -2.9847412109375, -2.686767578125, -2.3887939453125, -2.0908203125, -1.7928466796875, -1.494873046875, -1.1968994140625, -0.89892578125, -0.6009521484375, -0.302978515625, -0.0050048828125, 0.29296875, 0.5909423828125, 0.888916015625, 1.1868896484375, 1.48486328125, 1.7828369140625, 2.080810546875, 2.3787841796875, 2.6767578125, 2.9747314453125, 3.272705078125, 3.5706787109375, 3.86865234375, 4.1666259765625, 4.464599609375, 4.7625732421875, 5.060546875, 5.3585205078125, 5.656494140625, 5.9544677734375, 6.25244140625, 6.5504150390625, 6.848388671875, 7.1463623046875, 7.4443359375, 7.7423095703125, 8.040283203125, 8.3382568359375, 8.63623046875, 8.9342041015625, 9.232177734375, 9.5301513671875, 9.828125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 10.0, 9.0, 4.0, 13.0, 15.0, 29.0, 25.0, 48.0, 52.0, 64.0, 71.0, 95.0, 116.0, 143.0, 194.0, 283.0, 493.0, 1464.0, 13647.0, 749132.0, 3371453.0, 52091.0, 2865.0, 674.0, 340.0, 239.0, 157.0, 111.0, 101.0, 76.0, 59.0, 52.0, 45.0, 14.0, 24.0, 20.0, 13.0, 18.0, 7.0, 6.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.90625, -27.84326171875, -26.7802734375, -25.71728515625, -24.654296875, -23.59130859375, -22.5283203125, -21.46533203125, -20.40234375, -19.33935546875, -18.2763671875, -17.21337890625, -16.150390625, -15.08740234375, -14.0244140625, -12.96142578125, -11.8984375, -10.83544921875, -9.7724609375, -8.70947265625, -7.646484375, -6.58349609375, -5.5205078125, -4.45751953125, -3.39453125, -2.33154296875, -1.2685546875, -0.20556640625, 0.857421875, 1.92041015625, 2.9833984375, 4.04638671875, 5.109375, 6.17236328125, 7.2353515625, 8.29833984375, 9.361328125, 10.42431640625, 11.4873046875, 12.55029296875, 13.61328125, 14.67626953125, 15.7392578125, 16.80224609375, 17.865234375, 18.92822265625, 19.9912109375, 21.05419921875, 22.1171875, 23.18017578125, 24.2431640625, 25.30615234375, 26.369140625, 27.43212890625, 28.4951171875, 29.55810546875, 30.62109375, 31.68408203125, 32.7470703125, 33.81005859375, 34.873046875, 35.93603515625, 36.9990234375, 38.06201171875, 39.125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 6.0, 13.0, 40.0, 76.0, 140.0, 218.0, 217.0, 154.0, 83.0, 44.0, 12.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.778566360473633, -25.900775909423828, -23.022987365722656, -20.145198822021484, -17.26740837097168, -14.389618873596191, -11.511829376220703, -8.634038925170898, -5.756250381469727, -2.8784608840942383, -0.00067138671875, 2.8771181106567383, 5.754907608032227, 8.632697105407715, 11.510486602783203, 14.388277053833008, 17.26606559753418, 20.143856048583984, 23.021644592285156, 25.899433135986328, 28.777223587036133, 31.655014038085938, 34.53280258178711, 37.41059112548828, 40.28838348388672, 43.16617202758789, 46.04396057128906, 48.9217529296875, 51.79954147338867, 54.677330017089844, 57.55512237548828, 60.43291091918945, 63.310699462890625, 66.18849182128906, 69.06627655029297, 71.9440689086914, 74.82185363769531, 77.69964599609375, 80.57743835449219, 83.45523071289062, 86.33301544189453, 89.21080780029297, 92.08859252929688, 94.96638488769531, 97.84417724609375, 100.72196197509766, 103.5997543334961, 106.4775390625, 109.35533142089844, 112.23312377929688, 115.11090850830078, 117.98870086669922, 120.86648559570312, 123.74427795410156, 126.6220703125, 129.49986267089844, 132.37765502929688, 135.2554473876953, 138.13323974609375, 141.01101684570312, 143.88880920410156, 146.7666015625, 149.64439392089844, 152.52218627929688, 155.39996337890625]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 11.0, 6.0, 9.0, 12.0, 14.0, 16.0, 15.0, 14.0, 14.0, 17.0, 16.0, 30.0, 23.0, 29.0, 27.0, 33.0, 43.0, 40.0, 42.0, 34.0, 39.0, 48.0, 35.0, 28.0, 45.0, 35.0, 30.0, 33.0, 26.0, 25.0, 20.0, 25.0, 21.0, 17.0, 22.0, 13.0, 14.0, 13.0, 11.0, 6.0, 10.0, 8.0, 6.0, 5.0, 2.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.614334106445312, -28.640439987182617, -27.666547775268555, -26.69265365600586, -25.718761444091797, -24.7448673248291, -23.770973205566406, -22.797080993652344, -21.82318687438965, -20.849292755126953, -19.87540054321289, -18.901506423950195, -17.9276123046875, -16.953720092773438, -15.979825973510742, -15.005932807922363, -14.032039642333984, -13.058146476745605, -12.084253311157227, -11.110359191894531, -10.136466026306152, -9.162572860717773, -8.188678741455078, -7.214785575866699, -6.24089241027832, -5.266999244689941, -4.293105602264404, -3.3192121982574463, -2.3453187942504883, -1.3714256286621094, -0.39753198623657227, 0.5763616561889648, 1.5502548217773438, 2.5241482257843018, 3.4980416297912598, 4.471935272216797, 5.445828437805176, 6.419721603393555, 7.393615245819092, 8.367508888244629, 9.341402053833008, 10.315295219421387, 11.289188385009766, 12.263082504272461, 13.23697566986084, 14.210868835449219, 15.184762954711914, 16.15865707397461, 17.132549285888672, 18.106443405151367, 19.08033561706543, 20.054229736328125, 21.028121948242188, 22.002016067504883, 22.975910186767578, 23.94980239868164, 24.923696517944336, 25.89759063720703, 26.871482849121094, 27.84537696838379, 28.819271087646484, 29.793163299560547, 30.767057418823242, 31.740951538085938, 32.71484375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 5.0, 6.0, 14.0, 18.0, 13.0, 19.0, 30.0, 20.0, 26.0, 36.0, 31.0, 34.0, 44.0, 34.0, 42.0, 36.0, 28.0, 32.0, 37.0, 44.0, 36.0, 40.0, 34.0, 35.0, 33.0, 29.0, 29.0, 27.0, 26.0, 14.0, 23.0, 17.0, 26.0, 10.0, 12.0, 6.0, 5.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-4.5234375, -4.3868408203125, -4.250244140625, -4.1136474609375, -3.97705078125, -3.8404541015625, -3.703857421875, -3.5672607421875, -3.4306640625, -3.2940673828125, -3.157470703125, -3.0208740234375, -2.88427734375, -2.7476806640625, -2.611083984375, -2.4744873046875, -2.337890625, -2.2012939453125, -2.064697265625, -1.9281005859375, -1.79150390625, -1.6549072265625, -1.518310546875, -1.3817138671875, -1.2451171875, -1.1085205078125, -0.971923828125, -0.8353271484375, -0.69873046875, -0.5621337890625, -0.425537109375, -0.2889404296875, -0.15234375, -0.0157470703125, 0.120849609375, 0.2574462890625, 0.39404296875, 0.5306396484375, 0.667236328125, 0.8038330078125, 0.9404296875, 1.0770263671875, 1.213623046875, 1.3502197265625, 1.48681640625, 1.6234130859375, 1.760009765625, 1.8966064453125, 2.033203125, 2.1697998046875, 2.306396484375, 2.4429931640625, 2.57958984375, 2.7161865234375, 2.852783203125, 2.9893798828125, 3.1259765625, 3.2625732421875, 3.399169921875, 3.5357666015625, 3.67236328125, 3.8089599609375, 3.945556640625, 4.0821533203125, 4.21875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 9.0, 10.0, 16.0, 25.0, 20.0, 49.0, 77.0, 112.0, 158.0, 262.0, 393.0, 610.0, 898.0, 1466.0, 2260.0, 3491.0, 5534.0, 8680.0, 13908.0, 23463.0, 40485.0, 75046.0, 147212.0, 256414.0, 215325.0, 111782.0, 57901.0, 32297.0, 18997.0, 11660.0, 7238.0, 4590.0, 2811.0, 1815.0, 1235.0, 781.0, 517.0, 342.0, 224.0, 148.0, 112.0, 60.0, 43.0, 34.0, 20.0, 7.0, 8.0, 3.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7509765625, -0.726593017578125, -0.70220947265625, -0.677825927734375, -0.6534423828125, -0.629058837890625, -0.60467529296875, -0.580291748046875, -0.555908203125, -0.531524658203125, -0.50714111328125, -0.482757568359375, -0.4583740234375, -0.433990478515625, -0.40960693359375, -0.385223388671875, -0.36083984375, -0.336456298828125, -0.31207275390625, -0.287689208984375, -0.2633056640625, -0.238922119140625, -0.21453857421875, -0.190155029296875, -0.165771484375, -0.141387939453125, -0.11700439453125, -0.092620849609375, -0.0682373046875, -0.043853759765625, -0.01947021484375, 0.004913330078125, 0.029296875, 0.053680419921875, 0.07806396484375, 0.102447509765625, 0.1268310546875, 0.151214599609375, 0.17559814453125, 0.199981689453125, 0.224365234375, 0.248748779296875, 0.27313232421875, 0.297515869140625, 0.3218994140625, 0.346282958984375, 0.37066650390625, 0.395050048828125, 0.41943359375, 0.443817138671875, 0.46820068359375, 0.492584228515625, 0.5169677734375, 0.541351318359375, 0.56573486328125, 0.590118408203125, 0.614501953125, 0.638885498046875, 0.66326904296875, 0.687652587890625, 0.7120361328125, 0.736419677734375, 0.76080322265625, 0.785186767578125, 0.8095703125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 5.0, 3.0, 7.0, 9.0, 11.0, 16.0, 14.0, 17.0, 14.0, 17.0, 32.0, 20.0, 28.0, 33.0, 35.0, 40.0, 38.0, 38.0, 47.0, 50.0, 1069.0, 52.0, 34.0, 31.0, 37.0, 36.0, 37.0, 35.0, 27.0, 26.0, 29.0, 18.0, 11.0, 16.0, 11.0, 13.0, 7.0, 17.0, 9.0, 5.0, 4.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0], "bins": [-3.076171875, -2.988128662109375, -2.90008544921875, -2.812042236328125, -2.7239990234375, -2.635955810546875, -2.54791259765625, -2.459869384765625, -2.371826171875, -2.283782958984375, -2.19573974609375, -2.107696533203125, -2.0196533203125, -1.931610107421875, -1.84356689453125, -1.755523681640625, -1.66748046875, -1.579437255859375, -1.49139404296875, -1.403350830078125, -1.3153076171875, -1.227264404296875, -1.13922119140625, -1.051177978515625, -0.963134765625, -0.875091552734375, -0.78704833984375, -0.699005126953125, -0.6109619140625, -0.522918701171875, -0.43487548828125, -0.346832275390625, -0.2587890625, -0.170745849609375, -0.08270263671875, 0.005340576171875, 0.0933837890625, 0.181427001953125, 0.26947021484375, 0.357513427734375, 0.445556640625, 0.533599853515625, 0.62164306640625, 0.709686279296875, 0.7977294921875, 0.885772705078125, 0.97381591796875, 1.061859130859375, 1.14990234375, 1.237945556640625, 1.32598876953125, 1.414031982421875, 1.5020751953125, 1.590118408203125, 1.67816162109375, 1.766204833984375, 1.854248046875, 1.942291259765625, 2.03033447265625, 2.118377685546875, 2.2064208984375, 2.294464111328125, 2.38250732421875, 2.470550537109375, 2.55859375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 9.0, 18.0, 23.0, 45.0, 52.0, 77.0, 130.0, 165.0, 260.0, 439.0, 595.0, 1008.0, 1606.0, 2525.0, 4139.0, 6757.0, 11422.0, 19449.0, 34005.0, 61358.0, 112590.0, 195856.0, 1282080.0, 159925.0, 87398.0, 48065.0, 27553.0, 15593.0, 9251.0, 5595.0, 3432.0, 2061.0, 1257.0, 836.0, 539.0, 358.0, 214.0, 140.0, 97.0, 64.0, 39.0, 32.0, 13.0, 23.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.53076171875, -0.5143280029296875, -0.497894287109375, -0.4814605712890625, -0.46502685546875, -0.4485931396484375, -0.432159423828125, -0.4157257080078125, -0.3992919921875, -0.3828582763671875, -0.366424560546875, -0.3499908447265625, -0.33355712890625, -0.3171234130859375, -0.300689697265625, -0.2842559814453125, -0.267822265625, -0.2513885498046875, -0.234954833984375, -0.2185211181640625, -0.20208740234375, -0.1856536865234375, -0.169219970703125, -0.1527862548828125, -0.1363525390625, -0.1199188232421875, -0.103485107421875, -0.0870513916015625, -0.07061767578125, -0.0541839599609375, -0.037750244140625, -0.0213165283203125, -0.0048828125, 0.0115509033203125, 0.027984619140625, 0.0444183349609375, 0.06085205078125, 0.0772857666015625, 0.093719482421875, 0.1101531982421875, 0.1265869140625, 0.1430206298828125, 0.159454345703125, 0.1758880615234375, 0.19232177734375, 0.2087554931640625, 0.225189208984375, 0.2416229248046875, 0.258056640625, 0.2744903564453125, 0.290924072265625, 0.3073577880859375, 0.32379150390625, 0.3402252197265625, 0.356658935546875, 0.3730926513671875, 0.3895263671875, 0.4059600830078125, 0.422393798828125, 0.4388275146484375, 0.45526123046875, 0.4716949462890625, 0.488128662109375, 0.5045623779296875, 0.52099609375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 5.0, 6.0, 7.0, 12.0, 20.0, 14.0, 18.0, 19.0, 18.0, 18.0, 25.0, 25.0, 32.0, 50.0, 34.0, 45.0, 47.0, 43.0, 57.0, 51.0, 41.0, 46.0, 33.0, 36.0, 39.0, 36.0, 34.0, 22.0, 30.0, 21.0, 19.0, 18.0, 16.0, 11.0, 4.0, 7.0, 8.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.00141143798828125, -0.0013677775859832764, -0.0013241171836853027, -0.001280456781387329, -0.0012367963790893555, -0.0011931359767913818, -0.0011494755744934082, -0.0011058151721954346, -0.001062154769897461, -0.0010184943675994873, -0.0009748339653015137, -0.00093117356300354, -0.0008875131607055664, -0.0008438527584075928, -0.0008001923561096191, -0.0007565319538116455, -0.0007128715515136719, -0.0006692111492156982, -0.0006255507469177246, -0.000581890344619751, -0.0005382299423217773, -0.0004945695400238037, -0.0004509091377258301, -0.00040724873542785645, -0.0003635883331298828, -0.0003199279308319092, -0.00027626752853393555, -0.00023260712623596191, -0.00018894672393798828, -0.00014528632164001465, -0.00010162591934204102, -5.796551704406738e-05, -1.430511474609375e-05, 2.9355287551879883e-05, 7.301568984985352e-05, 0.00011667609214782715, 0.00016033649444580078, 0.00020399689674377441, 0.00024765729904174805, 0.0002913177013397217, 0.0003349781036376953, 0.00037863850593566895, 0.0004222989082336426, 0.0004659593105316162, 0.0005096197128295898, 0.0005532801151275635, 0.0005969405174255371, 0.0006406009197235107, 0.0006842613220214844, 0.000727921724319458, 0.0007715821266174316, 0.0008152425289154053, 0.0008589029312133789, 0.0009025633335113525, 0.0009462237358093262, 0.0009898841381072998, 0.0010335445404052734, 0.001077204942703247, 0.0011208653450012207, 0.0011645257472991943, 0.001208186149597168, 0.0012518465518951416, 0.0012955069541931152, 0.0013391673564910889, 0.0013828277587890625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 6.0, 5.0, 8.0, 8.0, 11.0, 27.0, 23.0, 24.0, 37.0, 52.0, 72.0, 104.0, 134.0, 231.0, 401.0, 772.0, 7304.0, 932237.0, 103894.0, 1785.0, 534.0, 283.0, 176.0, 129.0, 66.0, 53.0, 33.0, 36.0, 25.0, 14.0, 18.0, 9.0, 10.0, 8.0, 8.0, 5.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0401611328125, -0.03889656066894531, -0.037631988525390625, -0.03636741638183594, -0.03510284423828125, -0.03383827209472656, -0.032573699951171875, -0.03130912780761719, -0.0300445556640625, -0.028779983520507812, -0.027515411376953125, -0.026250839233398438, -0.02498626708984375, -0.023721694946289062, -0.022457122802734375, -0.021192550659179688, -0.019927978515625, -0.018663406372070312, -0.017398834228515625, -0.016134262084960938, -0.01486968994140625, -0.013605117797851562, -0.012340545654296875, -0.011075973510742188, -0.0098114013671875, -0.008546829223632812, -0.007282257080078125, -0.0060176849365234375, -0.00475311279296875, -0.0034885406494140625, -0.002223968505859375, -0.0009593963623046875, 0.00030517578125, 0.0015697479248046875, 0.002834320068359375, 0.0040988922119140625, 0.00536346435546875, 0.0066280364990234375, 0.007892608642578125, 0.009157180786132812, 0.0104217529296875, 0.011686325073242188, 0.012950897216796875, 0.014215469360351562, 0.01548004150390625, 0.016744613647460938, 0.018009185791015625, 0.019273757934570312, 0.020538330078125, 0.021802902221679688, 0.023067474365234375, 0.024332046508789062, 0.02559661865234375, 0.026861190795898438, 0.028125762939453125, 0.029390335083007812, 0.0306549072265625, 0.03191947937011719, 0.033184051513671875, 0.03444862365722656, 0.03571319580078125, 0.03697776794433594, 0.038242340087890625, 0.03950691223144531, 0.040771484375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 364.0, 642.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007213766220957041, -0.006619041319936514, -0.006024316884577274, -0.0054295919835567474, -0.0048348670825362206, -0.004240142181515694, -0.0036454175133258104, -0.003050692845135927, -0.0024559679441154003, -0.0018612431595101953, -0.0012665183749049902, -0.0006717935902997851, -7.706880569458008e-05, 0.0005176560953259468, 0.00111238076351583, 0.0017071054317057133, 0.00230183033272624, 0.002896555233746767, 0.0034912799019366503, 0.0040860045701265335, 0.00468072947114706, 0.005275454372167587, 0.005870179273188114, 0.006464903708547354, 0.007059628609567881, 0.0076543535105884075, 0.008249077945947647, 0.008843802846968174, 0.0094385277479887, 0.010033252649009228, 0.010627977550029755, 0.011222701519727707, 0.011817427352070808, 0.012412152253091335, 0.013006877154111862, 0.013601602055132389, 0.014196326956152916, 0.014791050925850868, 0.015385775826871395, 0.015980500727891922, 0.016575224697589874, 0.017169948667287827, 0.017764674499630928, 0.01835939846932888, 0.018954124301671982, 0.019548848271369934, 0.020143574103713036, 0.020738298073410988, 0.02133302390575409, 0.02192774787545204, 0.022522473707795143, 0.023117197677493095, 0.023711923509836197, 0.02430664747953415, 0.02490137331187725, 0.025496097281575203, 0.026090823113918304, 0.026685547083616257, 0.027280272915959358, 0.02787499688565731, 0.028469722718000412, 0.029064446687698364, 0.029659172520041466, 0.030253896489739418, 0.03084862045943737]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 8.0, 6.0, 3.0, 8.0, 7.0, 14.0, 12.0, 17.0, 15.0, 25.0, 29.0, 20.0, 32.0, 28.0, 38.0, 41.0, 40.0, 46.0, 48.0, 52.0, 56.0, 48.0, 48.0, 47.0, 49.0, 37.0, 40.0, 35.0, 18.0, 21.0, 19.0, 16.0, 15.0, 15.0, 16.0, 3.0, 3.0, 11.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0009328126907348633, -0.0009030187502503395, -0.0008732248097658157, -0.000843430869281292, -0.0008136369287967682, -0.0007838429883122444, -0.0007540490478277206, -0.0007242551073431969, -0.0006944611668586731, -0.0006646672263741493, -0.0006348732858896255, -0.0006050793454051018, -0.000575285404920578, -0.0005454914644360542, -0.0005156975239515305, -0.0004859035834670067, -0.0004561096429824829, -0.00042631570249795914, -0.00039652176201343536, -0.0003667278215289116, -0.0003369338810443878, -0.00030713994055986404, -0.00027734600007534027, -0.0002475520595908165, -0.00021775811910629272, -0.00018796417862176895, -0.00015817023813724518, -0.0001283762976527214, -9.858235716819763e-05, -6.878841668367386e-05, -3.8994476199150085e-05, -9.200535714626312e-06, 2.059340476989746e-05, 5.0387345254421234e-05, 8.018128573894501e-05, 0.00010997522622346878, 0.00013976916670799255, 0.00016956310719251633, 0.0001993570476770401, 0.00022915098816156387, 0.00025894492864608765, 0.0002887388691306114, 0.0003185328096151352, 0.00034832675009965897, 0.00037812069058418274, 0.0004079146310687065, 0.0004377085715532303, 0.00046750251203775406, 0.0004972964525222778, 0.0005270903930068016, 0.0005568843334913254, 0.0005866782739758492, 0.0006164722144603729, 0.0006462661549448967, 0.0006760600954294205, 0.0007058540359139442, 0.000735647976398468, 0.0007654419168829918, 0.0007952358573675156, 0.0008250297978520393, 0.0008548237383365631, 0.0008846176788210869, 0.0009144116193056107, 0.0009442055597901344, 0.0009739995002746582]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 5.0, 6.0, 14.0, 18.0, 13.0, 19.0, 30.0, 20.0, 26.0, 36.0, 31.0, 34.0, 44.0, 34.0, 42.0, 36.0, 28.0, 32.0, 37.0, 44.0, 36.0, 40.0, 34.0, 35.0, 33.0, 29.0, 29.0, 27.0, 26.0, 14.0, 23.0, 17.0, 26.0, 10.0, 12.0, 6.0, 5.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-4.5234375, -4.3868408203125, -4.250244140625, -4.1136474609375, -3.97705078125, -3.8404541015625, -3.703857421875, -3.5672607421875, -3.4306640625, -3.2940673828125, -3.157470703125, -3.0208740234375, -2.88427734375, -2.7476806640625, -2.611083984375, -2.4744873046875, -2.337890625, -2.2012939453125, -2.064697265625, -1.9281005859375, -1.79150390625, -1.6549072265625, -1.518310546875, -1.3817138671875, -1.2451171875, -1.1085205078125, -0.971923828125, -0.8353271484375, -0.69873046875, -0.5621337890625, -0.425537109375, -0.2889404296875, -0.15234375, -0.0157470703125, 0.120849609375, 0.2574462890625, 0.39404296875, 0.5306396484375, 0.667236328125, 0.8038330078125, 0.9404296875, 1.0770263671875, 1.213623046875, 1.3502197265625, 1.48681640625, 1.6234130859375, 1.760009765625, 1.8966064453125, 2.033203125, 2.1697998046875, 2.306396484375, 2.4429931640625, 2.57958984375, 2.7161865234375, 2.852783203125, 2.9893798828125, 3.1259765625, 3.2625732421875, 3.399169921875, 3.5357666015625, 3.67236328125, 3.8089599609375, 3.945556640625, 4.0821533203125, 4.21875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 10.0, 13.0, 9.0, 26.0, 27.0, 34.0, 52.0, 64.0, 125.0, 164.0, 269.0, 419.0, 715.0, 1185.0, 2142.0, 3516.0, 6099.0, 10663.0, 19423.0, 38587.0, 86865.0, 270870.0, 384790.0, 119545.0, 48566.0, 23858.0, 12763.0, 7380.0, 4211.0, 2430.0, 1497.0, 858.0, 493.0, 284.0, 190.0, 139.0, 76.0, 58.0, 43.0, 31.0, 19.0, 11.0, 13.0, 14.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.1875, -3.09136962890625, -2.9952392578125, -2.89910888671875, -2.802978515625, -2.70684814453125, -2.6107177734375, -2.51458740234375, -2.41845703125, -2.32232666015625, -2.2261962890625, -2.13006591796875, -2.033935546875, -1.93780517578125, -1.8416748046875, -1.74554443359375, -1.6494140625, -1.55328369140625, -1.4571533203125, -1.36102294921875, -1.264892578125, -1.16876220703125, -1.0726318359375, -0.97650146484375, -0.88037109375, -0.78424072265625, -0.6881103515625, -0.59197998046875, -0.495849609375, -0.39971923828125, -0.3035888671875, -0.20745849609375, -0.111328125, -0.01519775390625, 0.0809326171875, 0.17706298828125, 0.273193359375, 0.36932373046875, 0.4654541015625, 0.56158447265625, 0.65771484375, 0.75384521484375, 0.8499755859375, 0.94610595703125, 1.042236328125, 1.13836669921875, 1.2344970703125, 1.33062744140625, 1.4267578125, 1.52288818359375, 1.6190185546875, 1.71514892578125, 1.811279296875, 1.90740966796875, 2.0035400390625, 2.09967041015625, 2.19580078125, 2.29193115234375, 2.3880615234375, 2.48419189453125, 2.580322265625, 2.67645263671875, 2.7725830078125, 2.86871337890625, 2.96484375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 5.0, 10.0, 11.0, 7.0, 11.0, 23.0, 18.0, 20.0, 22.0, 22.0, 29.0, 35.0, 43.0, 38.0, 37.0, 72.0, 179.0, 1693.0, 225.0, 81.0, 65.0, 44.0, 45.0, 40.0, 32.0, 33.0, 28.0, 24.0, 20.0, 31.0, 22.0, 13.0, 12.0, 10.0, 7.0, 9.0, 3.0, 4.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.8046875, -13.2845458984375, -12.764404296875, -12.2442626953125, -11.72412109375, -11.2039794921875, -10.683837890625, -10.1636962890625, -9.6435546875, -9.1234130859375, -8.603271484375, -8.0831298828125, -7.56298828125, -7.0428466796875, -6.522705078125, -6.0025634765625, -5.482421875, -4.9622802734375, -4.442138671875, -3.9219970703125, -3.40185546875, -2.8817138671875, -2.361572265625, -1.8414306640625, -1.3212890625, -0.8011474609375, -0.281005859375, 0.2391357421875, 0.75927734375, 1.2794189453125, 1.799560546875, 2.3197021484375, 2.83984375, 3.3599853515625, 3.880126953125, 4.4002685546875, 4.92041015625, 5.4405517578125, 5.960693359375, 6.4808349609375, 7.0009765625, 7.5211181640625, 8.041259765625, 8.5614013671875, 9.08154296875, 9.6016845703125, 10.121826171875, 10.6419677734375, 11.162109375, 11.6822509765625, 12.202392578125, 12.7225341796875, 13.24267578125, 13.7628173828125, 14.282958984375, 14.8031005859375, 15.3232421875, 15.8433837890625, 16.363525390625, 16.8836669921875, 17.40380859375, 17.9239501953125, 18.444091796875, 18.9642333984375, 19.484375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 13.0, 13.0, 10.0, 21.0, 32.0, 40.0, 56.0, 72.0, 97.0, 179.0, 279.0, 556.0, 2920.0, 2910897.0, 227915.0, 1542.0, 423.0, 230.0, 128.0, 76.0, 61.0, 38.0, 19.0, 26.0, 14.0, 12.0, 5.0, 7.0, 9.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.09375, -46.53662109375, -44.9794921875, -43.42236328125, -41.865234375, -40.30810546875, -38.7509765625, -37.19384765625, -35.63671875, -34.07958984375, -32.5224609375, -30.96533203125, -29.408203125, -27.85107421875, -26.2939453125, -24.73681640625, -23.1796875, -21.62255859375, -20.0654296875, -18.50830078125, -16.951171875, -15.39404296875, -13.8369140625, -12.27978515625, -10.72265625, -9.16552734375, -7.6083984375, -6.05126953125, -4.494140625, -2.93701171875, -1.3798828125, 0.17724609375, 1.734375, 3.29150390625, 4.8486328125, 6.40576171875, 7.962890625, 9.52001953125, 11.0771484375, 12.63427734375, 14.19140625, 15.74853515625, 17.3056640625, 18.86279296875, 20.419921875, 21.97705078125, 23.5341796875, 25.09130859375, 26.6484375, 28.20556640625, 29.7626953125, 31.31982421875, 32.876953125, 34.43408203125, 35.9912109375, 37.54833984375, 39.10546875, 40.66259765625, 42.2197265625, 43.77685546875, 45.333984375, 46.89111328125, 48.4482421875, 50.00537109375, 51.5625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 187.0, 759.0, 69.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.774166107177734, -20.15549087524414, -15.53681468963623, -10.91813850402832, -6.299463272094727, -1.6807880401611328, 2.9378890991210938, 7.5565643310546875, 12.175239562988281, 16.793914794921875, 21.41259002685547, 26.031267166137695, 30.64994239807129, 35.26861572265625, 39.88729476928711, 44.5059700012207, 49.1246452331543, 53.74332046508789, 58.361995697021484, 62.980674743652344, 67.59934997558594, 72.21802520751953, 76.83670043945312, 81.45537567138672, 86.07405090332031, 90.6927261352539, 95.3114013671875, 99.9300765991211, 104.54875183105469, 109.16742706298828, 113.78610229492188, 118.40478515625, 123.02345275878906, 127.64212799072266, 132.26080322265625, 136.87948608398438, 141.49815368652344, 146.11683654785156, 150.73550415039062, 155.35418701171875, 159.9728546142578, 164.59153747558594, 169.210205078125, 173.82888793945312, 178.4475555419922, 183.0662384033203, 187.68490600585938, 192.3035888671875, 196.92227172851562, 201.54095458984375, 206.1596221923828, 210.77830505371094, 215.39697265625, 220.01565551757812, 224.6343231201172, 229.2530059814453, 233.87167358398438, 238.4903564453125, 243.10902404785156, 247.7277069091797, 252.34637451171875, 256.9650573730469, 261.583740234375, 266.202392578125, 270.8210754394531]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 8.0, 5.0, 14.0, 5.0, 5.0, 19.0, 18.0, 16.0, 18.0, 19.0, 26.0, 24.0, 27.0, 31.0, 37.0, 37.0, 40.0, 46.0, 35.0, 36.0, 40.0, 42.0, 44.0, 34.0, 37.0, 39.0, 30.0, 31.0, 33.0, 33.0, 37.0, 22.0, 19.0, 18.0, 18.0, 15.0, 6.0, 1.0, 13.0, 6.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.74343490600586, -43.338130950927734, -41.932823181152344, -40.52751922607422, -39.12221145629883, -37.7169075012207, -36.31159973144531, -34.90629577636719, -33.5009880065918, -32.09568405151367, -30.69037628173828, -29.285070419311523, -27.879764556884766, -26.474458694458008, -25.06915283203125, -23.663848876953125, -22.258543014526367, -20.85323715209961, -19.44793128967285, -18.042625427246094, -16.637319564819336, -15.232013702392578, -13.826708793640137, -12.421402931213379, -11.016097068786621, -9.610791206359863, -8.205485343933105, -6.800179958343506, -5.394874095916748, -3.9895682334899902, -2.5842628479003906, -1.1789569854736328, 0.226348876953125, 1.6316546201705933, 3.0369603633880615, 4.44226598739624, 5.847571849822998, 7.252877712249756, 8.658183097839355, 10.063488960266113, 11.468794822692871, 12.874100685119629, 14.279406547546387, 15.684711456298828, 17.090017318725586, 18.495323181152344, 19.9006290435791, 21.30593490600586, 22.711240768432617, 24.116546630859375, 25.521852493286133, 26.92715835571289, 28.33246421813965, 29.737770080566406, 31.14307403564453, 32.54838180541992, 33.95368576049805, 35.35898971557617, 36.76429748535156, 38.16960144042969, 39.57490921020508, 40.9802131652832, 42.385520935058594, 43.79082489013672, 45.19613265991211]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 2.0, 4.0, 1.0, 5.0, 10.0, 10.0, 11.0, 9.0, 17.0, 18.0, 14.0, 30.0, 30.0, 32.0, 30.0, 34.0, 38.0, 38.0, 29.0, 43.0, 39.0, 39.0, 32.0, 34.0, 48.0, 50.0, 35.0, 27.0, 30.0, 23.0, 30.0, 30.0, 26.0, 25.0, 21.0, 22.0, 16.0, 14.0, 13.0, 5.0, 10.0, 5.0, 6.0, 6.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.69921875, -4.55474853515625, -4.4102783203125, -4.26580810546875, -4.121337890625, -3.97686767578125, -3.8323974609375, -3.68792724609375, -3.54345703125, -3.39898681640625, -3.2545166015625, -3.11004638671875, -2.965576171875, -2.82110595703125, -2.6766357421875, -2.53216552734375, -2.3876953125, -2.24322509765625, -2.0987548828125, -1.95428466796875, -1.809814453125, -1.66534423828125, -1.5208740234375, -1.37640380859375, -1.23193359375, -1.08746337890625, -0.9429931640625, -0.79852294921875, -0.654052734375, -0.50958251953125, -0.3651123046875, -0.22064208984375, -0.076171875, 0.06829833984375, 0.2127685546875, 0.35723876953125, 0.501708984375, 0.64617919921875, 0.7906494140625, 0.93511962890625, 1.07958984375, 1.22406005859375, 1.3685302734375, 1.51300048828125, 1.657470703125, 1.80194091796875, 1.9464111328125, 2.09088134765625, 2.2353515625, 2.37982177734375, 2.5242919921875, 2.66876220703125, 2.813232421875, 2.95770263671875, 3.1021728515625, 3.24664306640625, 3.39111328125, 3.53558349609375, 3.6800537109375, 3.82452392578125, 3.968994140625, 4.11346435546875, 4.2579345703125, 4.40240478515625, 4.546875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 10.0, 14.0, 22.0, 20.0, 26.0, 45.0, 59.0, 72.0, 102.0, 149.0, 222.0, 322.0, 541.0, 1027.0, 1993.0, 4663.0, 13065.0, 48782.0, 262994.0, 1251775.0, 1857373.0, 607925.0, 104905.0, 23947.0, 7720.0, 2978.0, 1409.0, 725.0, 432.0, 266.0, 192.0, 146.0, 94.0, 64.0, 37.0, 49.0, 21.0, 18.0, 12.0, 14.0, 12.0, 5.0, 10.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.56640625, -6.32537841796875, -6.0843505859375, -5.84332275390625, -5.602294921875, -5.36126708984375, -5.1202392578125, -4.87921142578125, -4.63818359375, -4.39715576171875, -4.1561279296875, -3.91510009765625, -3.674072265625, -3.43304443359375, -3.1920166015625, -2.95098876953125, -2.7099609375, -2.46893310546875, -2.2279052734375, -1.98687744140625, -1.745849609375, -1.50482177734375, -1.2637939453125, -1.02276611328125, -0.78173828125, -0.54071044921875, -0.2996826171875, -0.05865478515625, 0.182373046875, 0.42340087890625, 0.6644287109375, 0.90545654296875, 1.146484375, 1.38751220703125, 1.6285400390625, 1.86956787109375, 2.110595703125, 2.35162353515625, 2.5926513671875, 2.83367919921875, 3.07470703125, 3.31573486328125, 3.5567626953125, 3.79779052734375, 4.038818359375, 4.27984619140625, 4.5208740234375, 4.76190185546875, 5.0029296875, 5.24395751953125, 5.4849853515625, 5.72601318359375, 5.967041015625, 6.20806884765625, 6.4490966796875, 6.69012451171875, 6.93115234375, 7.17218017578125, 7.4132080078125, 7.65423583984375, 7.895263671875, 8.13629150390625, 8.3773193359375, 8.61834716796875, 8.859375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 5.0, 8.0, 9.0, 7.0, 15.0, 25.0, 36.0, 52.0, 84.0, 98.0, 145.0, 191.0, 235.0, 361.0, 412.0, 448.0, 507.0, 375.0, 301.0, 218.0, 154.0, 112.0, 74.0, 58.0, 40.0, 33.0, 24.0, 18.0, 10.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3359375, -10.96728515625, -10.5986328125, -10.22998046875, -9.861328125, -9.49267578125, -9.1240234375, -8.75537109375, -8.38671875, -8.01806640625, -7.6494140625, -7.28076171875, -6.912109375, -6.54345703125, -6.1748046875, -5.80615234375, -5.4375, -5.06884765625, -4.7001953125, -4.33154296875, -3.962890625, -3.59423828125, -3.2255859375, -2.85693359375, -2.48828125, -2.11962890625, -1.7509765625, -1.38232421875, -1.013671875, -0.64501953125, -0.2763671875, 0.09228515625, 0.4609375, 0.82958984375, 1.1982421875, 1.56689453125, 1.935546875, 2.30419921875, 2.6728515625, 3.04150390625, 3.41015625, 3.77880859375, 4.1474609375, 4.51611328125, 4.884765625, 5.25341796875, 5.6220703125, 5.99072265625, 6.359375, 6.72802734375, 7.0966796875, 7.46533203125, 7.833984375, 8.20263671875, 8.5712890625, 8.93994140625, 9.30859375, 9.67724609375, 10.0458984375, 10.41455078125, 10.783203125, 11.15185546875, 11.5205078125, 11.88916015625, 12.2578125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 5.0, 7.0, 6.0, 12.0, 9.0, 21.0, 24.0, 41.0, 42.0, 52.0, 97.0, 112.0, 169.0, 223.0, 550.0, 1685.0, 37444.0, 3770563.0, 376571.0, 4780.0, 796.0, 347.0, 216.0, 150.0, 95.0, 68.0, 47.0, 39.0, 33.0, 25.0, 11.0, 11.0, 16.0, 3.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.875, -32.607421875, -31.33984375, -30.072265625, -28.8046875, -27.537109375, -26.26953125, -25.001953125, -23.734375, -22.466796875, -21.19921875, -19.931640625, -18.6640625, -17.396484375, -16.12890625, -14.861328125, -13.59375, -12.326171875, -11.05859375, -9.791015625, -8.5234375, -7.255859375, -5.98828125, -4.720703125, -3.453125, -2.185546875, -0.91796875, 0.349609375, 1.6171875, 2.884765625, 4.15234375, 5.419921875, 6.6875, 7.955078125, 9.22265625, 10.490234375, 11.7578125, 13.025390625, 14.29296875, 15.560546875, 16.828125, 18.095703125, 19.36328125, 20.630859375, 21.8984375, 23.166015625, 24.43359375, 25.701171875, 26.96875, 28.236328125, 29.50390625, 30.771484375, 32.0390625, 33.306640625, 34.57421875, 35.841796875, 37.109375, 38.376953125, 39.64453125, 40.912109375, 42.1796875, 43.447265625, 44.71484375, 45.982421875, 47.25]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 8.0, 74.0, 270.0, 376.0, 226.0, 44.0, 11.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.75665283203125, -65.4729232788086, -60.18919372558594, -54.905460357666016, -49.62173080444336, -44.3380012512207, -39.05426788330078, -33.770538330078125, -28.48680877685547, -23.203079223632812, -17.919347763061523, -12.63561725616455, -7.351886749267578, -2.068157196044922, 3.215574264526367, 8.499305725097656, 13.783035278320312, 19.06676483154297, 24.350496292114258, 29.634227752685547, 34.9179573059082, 40.20168685913086, 45.48542022705078, 50.76914978027344, 56.052879333496094, 61.33660888671875, 66.6203384399414, 71.90406799316406, 77.18780517578125, 82.47152709960938, 87.75526428222656, 93.03899383544922, 98.32272338867188, 103.60645294189453, 108.89018249511719, 114.17391204833984, 119.4576416015625, 124.74137878417969, 130.0251007080078, 135.308837890625, 140.59255981445312, 145.8762969970703, 151.16001892089844, 156.44375610351562, 161.72747802734375, 167.01121520996094, 172.29493713378906, 177.57867431640625, 182.86241149902344, 188.14614868164062, 193.42987060546875, 198.71360778808594, 203.99732971191406, 209.28106689453125, 214.56478881835938, 219.84852600097656, 225.13226318359375, 230.41600036621094, 235.69972229003906, 240.98345947265625, 246.26718139648438, 251.55091857910156, 256.83465576171875, 262.1183776855469, 267.402099609375]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 6.0, 5.0, 11.0, 9.0, 18.0, 9.0, 20.0, 15.0, 19.0, 19.0, 22.0, 24.0, 28.0, 26.0, 46.0, 31.0, 45.0, 38.0, 41.0, 32.0, 43.0, 48.0, 37.0, 34.0, 38.0, 36.0, 26.0, 29.0, 34.0, 17.0, 24.0, 22.0, 23.0, 23.0, 18.0, 14.0, 20.0, 6.0, 12.0, 6.0, 5.0, 6.0, 0.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.296630859375, -32.26353454589844, -31.23044204711914, -30.19734764099121, -29.16425323486328, -28.13115882873535, -27.098064422607422, -26.064970016479492, -25.031875610351562, -23.998781204223633, -22.965686798095703, -21.932592391967773, -20.899497985839844, -19.866403579711914, -18.833309173583984, -17.800214767456055, -16.767120361328125, -15.734025955200195, -14.700931549072266, -13.667837142944336, -12.634742736816406, -11.601648330688477, -10.568553924560547, -9.535459518432617, -8.502365112304688, -7.469270706176758, -6.436176300048828, -5.403081893920898, -4.369987487792969, -3.336893081665039, -2.3037986755371094, -1.2707042694091797, -0.23760986328125, 0.7954845428466797, 1.8285789489746094, 2.861673355102539, 3.8947677612304688, 4.927862167358398, 5.960956573486328, 6.994050979614258, 8.027145385742188, 9.060239791870117, 10.093334197998047, 11.126428604125977, 12.159523010253906, 13.192617416381836, 14.225711822509766, 15.258806228637695, 16.291900634765625, 17.324995040893555, 18.358089447021484, 19.391183853149414, 20.424278259277344, 21.457372665405273, 22.490467071533203, 23.523561477661133, 24.556655883789062, 25.589750289916992, 26.622844696044922, 27.65593910217285, 28.68903350830078, 29.72212791442871, 30.75522232055664, 31.78831672668457, 32.8214111328125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 7.0, 10.0, 15.0, 17.0, 17.0, 21.0, 29.0, 33.0, 32.0, 32.0, 40.0, 38.0, 46.0, 44.0, 42.0, 42.0, 51.0, 42.0, 46.0, 40.0, 44.0, 40.0, 35.0, 38.0, 38.0, 26.0, 26.0, 19.0, 15.0, 17.0, 15.0, 13.0, 10.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.99505615234375, -4.8260498046875, -4.65704345703125, -4.488037109375, -4.31903076171875, -4.1500244140625, -3.98101806640625, -3.81201171875, -3.64300537109375, -3.4739990234375, -3.30499267578125, -3.135986328125, -2.96697998046875, -2.7979736328125, -2.62896728515625, -2.4599609375, -2.29095458984375, -2.1219482421875, -1.95294189453125, -1.783935546875, -1.61492919921875, -1.4459228515625, -1.27691650390625, -1.10791015625, -0.93890380859375, -0.7698974609375, -0.60089111328125, -0.431884765625, -0.26287841796875, -0.0938720703125, 0.07513427734375, 0.244140625, 0.41314697265625, 0.5821533203125, 0.75115966796875, 0.920166015625, 1.08917236328125, 1.2581787109375, 1.42718505859375, 1.59619140625, 1.76519775390625, 1.9342041015625, 2.10321044921875, 2.272216796875, 2.44122314453125, 2.6102294921875, 2.77923583984375, 2.9482421875, 3.11724853515625, 3.2862548828125, 3.45526123046875, 3.624267578125, 3.79327392578125, 3.9622802734375, 4.13128662109375, 4.30029296875, 4.46929931640625, 4.6383056640625, 4.80731201171875, 4.976318359375, 5.14532470703125, 5.3143310546875, 5.48333740234375, 5.65234375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 11.0, 13.0, 21.0, 34.0, 49.0, 56.0, 79.0, 107.0, 136.0, 200.0, 303.0, 424.0, 646.0, 907.0, 1370.0, 2016.0, 2831.0, 4187.0, 6236.0, 9394.0, 14321.0, 22065.0, 34259.0, 55022.0, 89569.0, 148893.0, 207474.0, 168601.0, 103533.0, 63244.0, 39051.0, 24920.0, 15895.0, 10536.0, 7142.0, 4708.0, 3257.0, 2242.0, 1520.0, 1053.0, 676.0, 495.0, 341.0, 210.0, 149.0, 115.0, 71.0, 53.0, 38.0, 32.0, 23.0, 8.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 3.0, 3.0], "bins": [-0.572265625, -0.5535888671875, -0.534912109375, -0.5162353515625, -0.49755859375, -0.4788818359375, -0.460205078125, -0.4415283203125, -0.4228515625, -0.4041748046875, -0.385498046875, -0.3668212890625, -0.34814453125, -0.3294677734375, -0.310791015625, -0.2921142578125, -0.2734375, -0.2547607421875, -0.236083984375, -0.2174072265625, -0.19873046875, -0.1800537109375, -0.161376953125, -0.1427001953125, -0.1240234375, -0.1053466796875, -0.086669921875, -0.0679931640625, -0.04931640625, -0.0306396484375, -0.011962890625, 0.0067138671875, 0.025390625, 0.0440673828125, 0.062744140625, 0.0814208984375, 0.10009765625, 0.1187744140625, 0.137451171875, 0.1561279296875, 0.1748046875, 0.1934814453125, 0.212158203125, 0.2308349609375, 0.24951171875, 0.2681884765625, 0.286865234375, 0.3055419921875, 0.32421875, 0.3428955078125, 0.361572265625, 0.3802490234375, 0.39892578125, 0.4176025390625, 0.436279296875, 0.4549560546875, 0.4736328125, 0.4923095703125, 0.510986328125, 0.5296630859375, 0.54833984375, 0.5670166015625, 0.585693359375, 0.6043701171875, 0.623046875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 12.0, 7.0, 11.0, 11.0, 12.0, 17.0, 31.0, 36.0, 40.0, 31.0, 39.0, 51.0, 43.0, 37.0, 58.0, 1092.0, 59.0, 54.0, 48.0, 43.0, 44.0, 28.0, 42.0, 21.0, 34.0, 16.0, 28.0, 21.0, 14.0, 12.0, 8.0, 1.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.16015625, -3.04095458984375, -2.9217529296875, -2.80255126953125, -2.683349609375, -2.56414794921875, -2.4449462890625, -2.32574462890625, -2.20654296875, -2.08734130859375, -1.9681396484375, -1.84893798828125, -1.729736328125, -1.61053466796875, -1.4913330078125, -1.37213134765625, -1.2529296875, -1.13372802734375, -1.0145263671875, -0.89532470703125, -0.776123046875, -0.65692138671875, -0.5377197265625, -0.41851806640625, -0.29931640625, -0.18011474609375, -0.0609130859375, 0.05828857421875, 0.177490234375, 0.29669189453125, 0.4158935546875, 0.53509521484375, 0.654296875, 0.77349853515625, 0.8927001953125, 1.01190185546875, 1.131103515625, 1.25030517578125, 1.3695068359375, 1.48870849609375, 1.60791015625, 1.72711181640625, 1.8463134765625, 1.96551513671875, 2.084716796875, 2.20391845703125, 2.3231201171875, 2.44232177734375, 2.5615234375, 2.68072509765625, 2.7999267578125, 2.91912841796875, 3.038330078125, 3.15753173828125, 3.2767333984375, 3.39593505859375, 3.51513671875, 3.63433837890625, 3.7535400390625, 3.87274169921875, 3.991943359375, 4.11114501953125, 4.2303466796875, 4.34954833984375, 4.46875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 14.0, 9.0, 33.0, 47.0, 59.0, 116.0, 184.0, 317.0, 507.0, 972.0, 1786.0, 3371.0, 6347.0, 12190.0, 24481.0, 51877.0, 113925.0, 243317.0, 1343093.0, 156745.0, 70913.0, 33023.0, 16154.0, 8192.0, 4359.0, 2259.0, 1234.0, 682.0, 374.0, 222.0, 108.0, 78.0, 52.0, 36.0, 16.0, 17.0, 10.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79248046875, -0.7693099975585938, -0.7461395263671875, -0.7229690551757812, -0.699798583984375, -0.6766281127929688, -0.6534576416015625, -0.6302871704101562, -0.60711669921875, -0.5839462280273438, -0.5607757568359375, -0.5376052856445312, -0.514434814453125, -0.49126434326171875, -0.4680938720703125, -0.44492340087890625, -0.4217529296875, -0.39858245849609375, -0.3754119873046875, -0.35224151611328125, -0.329071044921875, -0.30590057373046875, -0.2827301025390625, -0.25955963134765625, -0.23638916015625, -0.21321868896484375, -0.1900482177734375, -0.16687774658203125, -0.143707275390625, -0.12053680419921875, -0.0973663330078125, -0.07419586181640625, -0.051025390625, -0.02785491943359375, -0.0046844482421875, 0.01848602294921875, 0.041656494140625, 0.06482696533203125, 0.0879974365234375, 0.11116790771484375, 0.13433837890625, 0.15750885009765625, 0.1806793212890625, 0.20384979248046875, 0.227020263671875, 0.25019073486328125, 0.2733612060546875, 0.29653167724609375, 0.3197021484375, 0.34287261962890625, 0.3660430908203125, 0.38921356201171875, 0.412384033203125, 0.43555450439453125, 0.4587249755859375, 0.48189544677734375, 0.50506591796875, 0.5282363891601562, 0.5514068603515625, 0.5745773315429688, 0.597747802734375, 0.6209182739257812, 0.6440887451171875, 0.6672592163085938, 0.6904296875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 8.0, 3.0, 6.0, 11.0, 15.0, 19.0, 19.0, 22.0, 30.0, 33.0, 34.0, 37.0, 56.0, 63.0, 49.0, 68.0, 62.0, 66.0, 60.0, 67.0, 39.0, 49.0, 38.0, 39.0, 26.0, 24.0, 15.0, 9.0, 9.0, 6.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0017576217651367188, -0.0016979724168777466, -0.0016383230686187744, -0.0015786737203598022, -0.00151902437210083, -0.001459375023841858, -0.0013997256755828857, -0.0013400763273239136, -0.0012804269790649414, -0.0012207776308059692, -0.001161128282546997, -0.001101478934288025, -0.0010418295860290527, -0.0009821802377700806, -0.0009225308895111084, -0.0008628815412521362, -0.0008032321929931641, -0.0007435828447341919, -0.0006839334964752197, -0.0006242841482162476, -0.0005646347999572754, -0.0005049854516983032, -0.00044533610343933105, -0.0003856867551803589, -0.0003260374069213867, -0.00026638805866241455, -0.00020673871040344238, -0.00014708936214447021, -8.744001388549805e-05, -2.779066562652588e-05, 3.185868263244629e-05, 9.150803089141846e-05, 0.00015115737915039062, 0.0002108067274093628, 0.00027045607566833496, 0.00033010542392730713, 0.0003897547721862793, 0.00044940412044525146, 0.0005090534687042236, 0.0005687028169631958, 0.000628352165222168, 0.0006880015134811401, 0.0007476508617401123, 0.0008073002099990845, 0.0008669495582580566, 0.0009265989065170288, 0.000986248254776001, 0.0010458976030349731, 0.0011055469512939453, 0.0011651962995529175, 0.0012248456478118896, 0.0012844949960708618, 0.001344144344329834, 0.0014037936925888062, 0.0014634430408477783, 0.0015230923891067505, 0.0015827417373657227, 0.0016423910856246948, 0.001702040433883667, 0.0017616897821426392, 0.0018213391304016113, 0.0018809884786605835, 0.0019406378269195557, 0.002000287175178528, 0.0020599365234375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 6.0, 9.0, 13.0, 18.0, 18.0, 19.0, 31.0, 41.0, 60.0, 71.0, 116.0, 191.0, 360.0, 677.0, 3511.0, 663000.0, 376312.0, 2525.0, 646.0, 280.0, 192.0, 117.0, 73.0, 59.0, 34.0, 38.0, 29.0, 21.0, 17.0, 16.0, 13.0, 5.0, 8.0, 3.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0394287109375, -0.03826713562011719, -0.037105560302734375, -0.03594398498535156, -0.03478240966796875, -0.03362083435058594, -0.032459259033203125, -0.03129768371582031, -0.0301361083984375, -0.028974533081054688, -0.027812957763671875, -0.026651382446289062, -0.02548980712890625, -0.024328231811523438, -0.023166656494140625, -0.022005081176757812, -0.020843505859375, -0.019681930541992188, -0.018520355224609375, -0.017358779907226562, -0.01619720458984375, -0.015035629272460938, -0.013874053955078125, -0.012712478637695312, -0.0115509033203125, -0.010389328002929688, -0.009227752685546875, -0.008066177368164062, -0.00690460205078125, -0.0057430267333984375, -0.004581451416015625, -0.0034198760986328125, -0.00225830078125, -0.0010967254638671875, 6.4849853515625e-05, 0.0012264251708984375, 0.00238800048828125, 0.0035495758056640625, 0.004711151123046875, 0.0058727264404296875, 0.0070343017578125, 0.008195877075195312, 0.009357452392578125, 0.010519027709960938, 0.01168060302734375, 0.012842178344726562, 0.014003753662109375, 0.015165328979492188, 0.016326904296875, 0.017488479614257812, 0.018650054931640625, 0.019811630249023438, 0.02097320556640625, 0.022134780883789062, 0.023296356201171875, 0.024457931518554688, 0.0256195068359375, 0.026781082153320312, 0.027942657470703125, 0.029104232788085938, 0.03026580810546875, 0.03142738342285156, 0.032588958740234375, 0.03375053405761719, 0.034912109375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 22.0, 93.0, 270.0, 350.0, 191.0, 66.0, 13.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006533139385282993, -0.006395274773240089, -0.0062574101611971855, -0.006119545549154282, -0.00598168047145009, -0.0058438158594071865, -0.005705951247364283, -0.005568086635321379, -0.005430222023278475, -0.005292357411235571, -0.005154492799192667, -0.005016627721488476, -0.004878763109445572, -0.004740898497402668, -0.004603033885359764, -0.00446516927331686, -0.004327304661273956, -0.004189440049231052, -0.0040515754371881485, -0.003913710825145245, -0.003775845980271697, -0.0036379811353981495, -0.0035001165233552456, -0.0033622519113123417, -0.0032243868336081505, -0.0030865222215652466, -0.002948657376691699, -0.002810792764648795, -0.0026729281526058912, -0.0025350633077323437, -0.0023971986956894398, -0.002259334083646536, -0.0021214692387729883, -0.0019836046267300844, -0.0018457398982718587, -0.001707875169813633, -0.001570010557770729, -0.0014321458293125033, -0.0012942811008542776, -0.0011564164888113737, -0.001018551760353148, -0.0008806870901025832, -0.0007428224198520184, -0.0006049576913937926, -0.0004670930211432278, -0.000329228350892663, -0.00019136362243443727, -5.349895218387246e-05, 8.436571806669235e-05, 0.0002222304028691724, 0.00036009508767165244, 0.0004979597870260477, 0.0006358244572766125, 0.0007736891275271773, 0.0009115538559854031, 0.001049418468028307, 0.0011872831964865327, 0.0013251479249447584, 0.0014630125369876623, 0.001600877265445888, 0.0017387419939041138, 0.0018766066059470177, 0.0020144712179899216, 0.002152336062863469, 0.002290200674906373]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 9.0, 6.0, 13.0, 15.0, 19.0, 18.0, 25.0, 27.0, 33.0, 37.0, 38.0, 36.0, 50.0, 37.0, 46.0, 44.0, 60.0, 48.0, 60.0, 48.0, 36.0, 37.0, 31.0, 36.0, 42.0, 27.0, 29.0, 23.0, 14.0, 12.0, 14.0, 3.0, 4.0, 6.0, 4.0, 3.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0012736916542053223, -0.0012402180582284927, -0.0012067444622516632, -0.0011732708662748337, -0.0011397972702980042, -0.0011063236743211746, -0.001072850078344345, -0.0010393764823675156, -0.001005902886390686, -0.0009724292904138565, -0.000938955694437027, -0.0009054820984601974, -0.0008720085024833679, -0.0008385349065065384, -0.0008050613105297089, -0.0007715877145528793, -0.0007381141185760498, -0.0007046405225992203, -0.0006711669266223907, -0.0006376933306455612, -0.0006042197346687317, -0.0005707461386919022, -0.0005372725427150726, -0.0005037989467382431, -0.0004703253507614136, -0.00043685175478458405, -0.0004033781588077545, -0.000369904562830925, -0.00033643096685409546, -0.00030295737087726593, -0.0002694837749004364, -0.00023601017892360687, -0.00020253658294677734, -0.00016906298696994781, -0.00013558939099311829, -0.00010211579501628876, -6.864219903945923e-05, -3.51686030626297e-05, -1.695007085800171e-06, 3.177858889102936e-05, 6.525218486785889e-05, 9.872578084468842e-05, 0.00013219937682151794, 0.00016567297279834747, 0.000199146568775177, 0.00023262016475200653, 0.00026609376072883606, 0.0002995673567056656, 0.0003330409526824951, 0.00036651454865932465, 0.0003999881446361542, 0.0004334617406129837, 0.00046693533658981323, 0.0005004089325666428, 0.0005338825285434723, 0.0005673561245203018, 0.0006008297204971313, 0.0006343033164739609, 0.0006677769124507904, 0.0007012505084276199, 0.0007347241044044495, 0.000768197700381279, 0.0008016712963581085, 0.000835144892334938, 0.0008686184883117676]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 7.0, 10.0, 15.0, 17.0, 17.0, 21.0, 29.0, 33.0, 32.0, 32.0, 40.0, 38.0, 46.0, 44.0, 42.0, 42.0, 51.0, 42.0, 46.0, 40.0, 44.0, 40.0, 35.0, 38.0, 38.0, 26.0, 26.0, 19.0, 15.0, 17.0, 15.0, 13.0, 10.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.99505615234375, -4.8260498046875, -4.65704345703125, -4.488037109375, -4.31903076171875, -4.1500244140625, -3.98101806640625, -3.81201171875, -3.64300537109375, -3.4739990234375, -3.30499267578125, -3.135986328125, -2.96697998046875, -2.7979736328125, -2.62896728515625, -2.4599609375, -2.29095458984375, -2.1219482421875, -1.95294189453125, -1.783935546875, -1.61492919921875, -1.4459228515625, -1.27691650390625, -1.10791015625, -0.93890380859375, -0.7698974609375, -0.60089111328125, -0.431884765625, -0.26287841796875, -0.0938720703125, 0.07513427734375, 0.244140625, 0.41314697265625, 0.5821533203125, 0.75115966796875, 0.920166015625, 1.08917236328125, 1.2581787109375, 1.42718505859375, 1.59619140625, 1.76519775390625, 1.9342041015625, 2.10321044921875, 2.272216796875, 2.44122314453125, 2.6102294921875, 2.77923583984375, 2.9482421875, 3.11724853515625, 3.2862548828125, 3.45526123046875, 3.624267578125, 3.79327392578125, 3.9622802734375, 4.13128662109375, 4.30029296875, 4.46929931640625, 4.6383056640625, 4.80731201171875, 4.976318359375, 5.14532470703125, 5.3143310546875, 5.48333740234375, 5.65234375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 8.0, 4.0, 17.0, 14.0, 29.0, 22.0, 60.0, 68.0, 124.0, 150.0, 259.0, 430.0, 723.0, 1161.0, 2214.0, 4652.0, 9282.0, 19245.0, 39847.0, 85007.0, 197958.0, 350414.0, 182708.0, 80820.0, 37225.0, 17993.0, 8699.0, 4274.0, 2160.0, 1161.0, 638.0, 401.0, 253.0, 148.0, 127.0, 94.0, 61.0, 29.0, 18.0, 17.0, 15.0, 10.0, 2.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-3.40625, -3.304443359375, -3.20263671875, -3.100830078125, -2.9990234375, -2.897216796875, -2.79541015625, -2.693603515625, -2.591796875, -2.489990234375, -2.38818359375, -2.286376953125, -2.1845703125, -2.082763671875, -1.98095703125, -1.879150390625, -1.77734375, -1.675537109375, -1.57373046875, -1.471923828125, -1.3701171875, -1.268310546875, -1.16650390625, -1.064697265625, -0.962890625, -0.861083984375, -0.75927734375, -0.657470703125, -0.5556640625, -0.453857421875, -0.35205078125, -0.250244140625, -0.1484375, -0.046630859375, 0.05517578125, 0.156982421875, 0.2587890625, 0.360595703125, 0.46240234375, 0.564208984375, 0.666015625, 0.767822265625, 0.86962890625, 0.971435546875, 1.0732421875, 1.175048828125, 1.27685546875, 1.378662109375, 1.48046875, 1.582275390625, 1.68408203125, 1.785888671875, 1.8876953125, 1.989501953125, 2.09130859375, 2.193115234375, 2.294921875, 2.396728515625, 2.49853515625, 2.600341796875, 2.7021484375, 2.803955078125, 2.90576171875, 3.007568359375, 3.109375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 2.0, 4.0, 9.0, 8.0, 10.0, 8.0, 16.0, 18.0, 23.0, 24.0, 25.0, 31.0, 38.0, 37.0, 49.0, 51.0, 66.0, 101.0, 354.0, 1598.0, 142.0, 69.0, 54.0, 44.0, 32.0, 40.0, 34.0, 29.0, 22.0, 22.0, 15.0, 11.0, 8.0, 12.0, 12.0, 11.0, 7.0, 6.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.96875, -20.35546875, -19.7421875, -19.12890625, -18.515625, -17.90234375, -17.2890625, -16.67578125, -16.0625, -15.44921875, -14.8359375, -14.22265625, -13.609375, -12.99609375, -12.3828125, -11.76953125, -11.15625, -10.54296875, -9.9296875, -9.31640625, -8.703125, -8.08984375, -7.4765625, -6.86328125, -6.25, -5.63671875, -5.0234375, -4.41015625, -3.796875, -3.18359375, -2.5703125, -1.95703125, -1.34375, -0.73046875, -0.1171875, 0.49609375, 1.109375, 1.72265625, 2.3359375, 2.94921875, 3.5625, 4.17578125, 4.7890625, 5.40234375, 6.015625, 6.62890625, 7.2421875, 7.85546875, 8.46875, 9.08203125, 9.6953125, 10.30859375, 10.921875, 11.53515625, 12.1484375, 12.76171875, 13.375, 13.98828125, 14.6015625, 15.21484375, 15.828125, 16.44140625, 17.0546875, 17.66796875, 18.28125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 10.0, 11.0, 15.0, 12.0, 14.0, 17.0, 17.0, 37.0, 41.0, 67.0, 83.0, 125.0, 148.0, 212.0, 343.0, 922.0, 6851.0, 2998578.0, 134317.0, 2278.0, 538.0, 320.0, 206.0, 124.0, 95.0, 66.0, 60.0, 53.0, 30.0, 18.0, 25.0, 11.0, 14.0, 9.0, 11.0, 6.0, 6.0, 6.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.25, -39.865234375, -38.48046875, -37.095703125, -35.7109375, -34.326171875, -32.94140625, -31.556640625, -30.171875, -28.787109375, -27.40234375, -26.017578125, -24.6328125, -23.248046875, -21.86328125, -20.478515625, -19.09375, -17.708984375, -16.32421875, -14.939453125, -13.5546875, -12.169921875, -10.78515625, -9.400390625, -8.015625, -6.630859375, -5.24609375, -3.861328125, -2.4765625, -1.091796875, 0.29296875, 1.677734375, 3.0625, 4.447265625, 5.83203125, 7.216796875, 8.6015625, 9.986328125, 11.37109375, 12.755859375, 14.140625, 15.525390625, 16.91015625, 18.294921875, 19.6796875, 21.064453125, 22.44921875, 23.833984375, 25.21875, 26.603515625, 27.98828125, 29.373046875, 30.7578125, 32.142578125, 33.52734375, 34.912109375, 36.296875, 37.681640625, 39.06640625, 40.451171875, 41.8359375, 43.220703125, 44.60546875, 45.990234375, 47.375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 3.0, 8.0, 15.0, 24.0, 31.0, 40.0, 65.0, 98.0, 115.0, 121.0, 111.0, 103.0, 85.0, 70.0, 43.0, 29.0, 12.0, 14.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.285987854003906, -13.757482528686523, -13.22897720336914, -12.700471878051758, -12.171966552734375, -11.643461227416992, -11.114956855773926, -10.586451530456543, -10.05794620513916, -9.529440879821777, -9.000935554504395, -8.472430229187012, -7.943925380706787, -7.415420055389404, -6.88691520690918, -6.358409881591797, -5.829904556274414, -5.301399230957031, -4.772893905639648, -4.244389057159424, -3.715883731842041, -3.187378406524658, -2.6588733196258545, -2.130368232727051, -1.601862907409668, -1.0733577013015747, -0.5448524951934814, -0.016347289085388184, 0.5121579170227051, 1.040663242340088, 1.5691683292388916, 2.0976734161376953, 2.6261768341064453, 3.154682159423828, 3.683187246322632, 4.2116923332214355, 4.740197658538818, 5.268702983856201, 5.797207832336426, 6.325713157653809, 6.854218482971191, 7.382723808288574, 7.911229133605957, 8.43973445892334, 8.968238830566406, 9.496744155883789, 10.025249481201172, 10.553754806518555, 11.082260131835938, 11.61076545715332, 12.139270782470703, 12.667776107788086, 13.196281433105469, 13.724786758422852, 14.253291130065918, 14.7817964553833, 15.310301780700684, 15.838807106018066, 16.367311477661133, 16.895816802978516, 17.4243221282959, 17.95282745361328, 18.481332778930664, 19.009838104248047, 19.53834342956543]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 13.0, 16.0, 21.0, 16.0, 28.0, 27.0, 34.0, 36.0, 36.0, 39.0, 52.0, 50.0, 33.0, 47.0, 47.0, 51.0, 42.0, 48.0, 56.0, 42.0, 42.0, 36.0, 37.0, 22.0, 18.0, 28.0, 23.0, 7.0, 12.0, 8.0, 4.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.11354064941406, -41.5509033203125, -39.98826599121094, -38.425628662109375, -36.86299133300781, -35.30035400390625, -33.73771667480469, -32.175079345703125, -30.612443923950195, -29.049806594848633, -27.48716926574707, -25.92453384399414, -24.361896514892578, -22.799259185791016, -21.236621856689453, -19.67398452758789, -18.111347198486328, -16.548709869384766, -14.986072540283203, -13.423436164855957, -11.860798835754395, -10.298161506652832, -8.735525131225586, -7.172887802124023, -5.610250473022461, -4.047613143920898, -2.484976291656494, -0.9223394393920898, 0.6402978897094727, 2.202935218811035, 3.7655715942382812, 5.328208923339844, 6.890850067138672, 8.453487396240234, 10.016124725341797, 11.578761100769043, 13.141398429870605, 14.704035758972168, 16.266672134399414, 17.829309463500977, 19.39194679260254, 20.9545841217041, 22.517221450805664, 24.079856872558594, 25.642494201660156, 27.20513153076172, 28.76776885986328, 30.330406188964844, 31.893043518066406, 33.45568084716797, 35.01831817626953, 36.580955505371094, 38.143592834472656, 39.70623016357422, 41.26886749267578, 42.831504821777344, 44.394142150878906, 45.95677947998047, 47.51941680908203, 49.082054138183594, 50.644691467285156, 52.20732879638672, 53.76996612548828, 55.332603454589844, 56.89523696899414]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 13.0, 16.0, 19.0, 25.0, 22.0, 30.0, 33.0, 39.0, 36.0, 38.0, 37.0, 38.0, 53.0, 44.0, 40.0, 49.0, 45.0, 45.0, 37.0, 50.0, 36.0, 39.0, 40.0, 24.0, 25.0, 20.0, 18.0, 15.0, 18.0, 10.0, 13.0, 5.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.27734375, -5.10015869140625, -4.9229736328125, -4.74578857421875, -4.568603515625, -4.39141845703125, -4.2142333984375, -4.03704833984375, -3.85986328125, -3.68267822265625, -3.5054931640625, -3.32830810546875, -3.151123046875, -2.97393798828125, -2.7967529296875, -2.61956787109375, -2.4423828125, -2.26519775390625, -2.0880126953125, -1.91082763671875, -1.733642578125, -1.55645751953125, -1.3792724609375, -1.20208740234375, -1.02490234375, -0.84771728515625, -0.6705322265625, -0.49334716796875, -0.316162109375, -0.13897705078125, 0.0382080078125, 0.21539306640625, 0.392578125, 0.56976318359375, 0.7469482421875, 0.92413330078125, 1.101318359375, 1.27850341796875, 1.4556884765625, 1.63287353515625, 1.81005859375, 1.98724365234375, 2.1644287109375, 2.34161376953125, 2.518798828125, 2.69598388671875, 2.8731689453125, 3.05035400390625, 3.2275390625, 3.40472412109375, 3.5819091796875, 3.75909423828125, 3.936279296875, 4.11346435546875, 4.2906494140625, 4.46783447265625, 4.64501953125, 4.82220458984375, 4.9993896484375, 5.17657470703125, 5.353759765625, 5.53094482421875, 5.7081298828125, 5.88531494140625, 6.0625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 9.0, 9.0, 19.0, 15.0, 18.0, 30.0, 20.0, 22.0, 35.0, 38.0, 36.0, 48.0, 102.0, 472.0, 4020.0, 104376.0, 3497289.0, 575300.0, 10971.0, 974.0, 139.0, 56.0, 45.0, 36.0, 37.0, 32.0, 30.0, 17.0, 19.0, 9.0, 14.0, 17.0, 12.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.46875, -18.765380859375, -18.06201171875, -17.358642578125, -16.6552734375, -15.951904296875, -15.24853515625, -14.545166015625, -13.841796875, -13.138427734375, -12.43505859375, -11.731689453125, -11.0283203125, -10.324951171875, -9.62158203125, -8.918212890625, -8.21484375, -7.511474609375, -6.80810546875, -6.104736328125, -5.4013671875, -4.697998046875, -3.99462890625, -3.291259765625, -2.587890625, -1.884521484375, -1.18115234375, -0.477783203125, 0.2255859375, 0.928955078125, 1.63232421875, 2.335693359375, 3.0390625, 3.742431640625, 4.44580078125, 5.149169921875, 5.8525390625, 6.555908203125, 7.25927734375, 7.962646484375, 8.666015625, 9.369384765625, 10.07275390625, 10.776123046875, 11.4794921875, 12.182861328125, 12.88623046875, 13.589599609375, 14.29296875, 14.996337890625, 15.69970703125, 16.403076171875, 17.1064453125, 17.809814453125, 18.51318359375, 19.216552734375, 19.919921875, 20.623291015625, 21.32666015625, 22.030029296875, 22.7333984375, 23.436767578125, 24.14013671875, 24.843505859375, 25.546875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 6.0, 5.0, 5.0, 13.0, 28.0, 32.0, 36.0, 59.0, 65.0, 88.0, 101.0, 118.0, 185.0, 232.0, 276.0, 334.0, 418.0, 407.0, 384.0, 276.0, 233.0, 173.0, 121.0, 111.0, 97.0, 69.0, 58.0, 36.0, 20.0, 16.0, 16.0, 15.0, 12.0, 3.0, 2.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.90625, -10.6041259765625, -10.302001953125, -9.9998779296875, -9.69775390625, -9.3956298828125, -9.093505859375, -8.7913818359375, -8.4892578125, -8.1871337890625, -7.885009765625, -7.5828857421875, -7.28076171875, -6.9786376953125, -6.676513671875, -6.3743896484375, -6.072265625, -5.7701416015625, -5.468017578125, -5.1658935546875, -4.86376953125, -4.5616455078125, -4.259521484375, -3.9573974609375, -3.6552734375, -3.3531494140625, -3.051025390625, -2.7489013671875, -2.44677734375, -2.1446533203125, -1.842529296875, -1.5404052734375, -1.23828125, -0.9361572265625, -0.634033203125, -0.3319091796875, -0.02978515625, 0.2723388671875, 0.574462890625, 0.8765869140625, 1.1787109375, 1.4808349609375, 1.782958984375, 2.0850830078125, 2.38720703125, 2.6893310546875, 2.991455078125, 3.2935791015625, 3.595703125, 3.8978271484375, 4.199951171875, 4.5020751953125, 4.80419921875, 5.1063232421875, 5.408447265625, 5.7105712890625, 6.0126953125, 6.3148193359375, 6.616943359375, 6.9190673828125, 7.22119140625, 7.5233154296875, 7.825439453125, 8.1275634765625, 8.4296875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 7.0, 12.0, 13.0, 19.0, 31.0, 40.0, 32.0, 44.0, 61.0, 85.0, 121.0, 167.0, 239.0, 366.0, 1059.0, 10728.0, 1523143.0, 2639264.0, 16213.0, 1192.0, 444.0, 256.0, 190.0, 133.0, 112.0, 69.0, 54.0, 34.0, 26.0, 20.0, 23.0, 15.0, 12.0, 12.0, 6.0, 7.0, 5.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.6875, -33.49365234375, -32.2998046875, -31.10595703125, -29.912109375, -28.71826171875, -27.5244140625, -26.33056640625, -25.13671875, -23.94287109375, -22.7490234375, -21.55517578125, -20.361328125, -19.16748046875, -17.9736328125, -16.77978515625, -15.5859375, -14.39208984375, -13.1982421875, -12.00439453125, -10.810546875, -9.61669921875, -8.4228515625, -7.22900390625, -6.03515625, -4.84130859375, -3.6474609375, -2.45361328125, -1.259765625, -0.06591796875, 1.1279296875, 2.32177734375, 3.515625, 4.70947265625, 5.9033203125, 7.09716796875, 8.291015625, 9.48486328125, 10.6787109375, 11.87255859375, 13.06640625, 14.26025390625, 15.4541015625, 16.64794921875, 17.841796875, 19.03564453125, 20.2294921875, 21.42333984375, 22.6171875, 23.81103515625, 25.0048828125, 26.19873046875, 27.392578125, 28.58642578125, 29.7802734375, 30.97412109375, 32.16796875, 33.36181640625, 34.5556640625, 35.74951171875, 36.943359375, 38.13720703125, 39.3310546875, 40.52490234375, 41.71875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 136.0, 400.0, 387.0, 84.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.9327507019043, -54.79733657836914, -48.66192626953125, -42.526512145996094, -36.39109802246094, -30.255687713623047, -24.12027359008789, -17.98486328125, -11.849449157714844, -5.714036464691162, 0.42137622833251953, 6.556789398193359, 12.692201614379883, 18.827613830566406, 24.963027954101562, 31.098438262939453, 37.23385238647461, 43.369266510009766, 49.504676818847656, 55.64009094238281, 61.77550506591797, 67.91091918945312, 74.04632568359375, 80.1817398071289, 86.31715393066406, 92.45256805419922, 98.58798217773438, 104.723388671875, 110.85880279541016, 116.99421691894531, 123.12963104248047, 129.26504516601562, 135.4004669189453, 141.53587341308594, 147.67129516601562, 153.80670166015625, 159.94212341308594, 166.07752990722656, 172.21295166015625, 178.34835815429688, 184.4837646484375, 190.61917114257812, 196.7545928955078, 202.88999938964844, 209.02542114257812, 215.16082763671875, 221.29623413085938, 227.43165588378906, 233.56707763671875, 239.70248413085938, 245.83790588378906, 251.9733123779297, 258.1087341308594, 264.244140625, 270.3795471191406, 276.51495361328125, 282.6503601074219, 288.7857666015625, 294.9211730957031, 301.0566101074219, 307.1920166015625, 313.3274230957031, 319.46282958984375, 325.5982360839844, 331.7336730957031]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 2.0, 8.0, 7.0, 8.0, 13.0, 9.0, 12.0, 19.0, 27.0, 22.0, 22.0, 29.0, 33.0, 27.0, 29.0, 32.0, 45.0, 45.0, 45.0, 50.0, 50.0, 43.0, 34.0, 40.0, 39.0, 31.0, 39.0, 35.0, 21.0, 19.0, 23.0, 24.0, 18.0, 15.0, 17.0, 15.0, 13.0, 11.0, 7.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-35.31499481201172, -34.24851608276367, -33.18203353881836, -32.11555480957031, -31.049074172973633, -29.982593536376953, -28.916114807128906, -27.849634170532227, -26.783153533935547, -25.716672897338867, -24.65019416809082, -23.58371353149414, -22.51723289489746, -21.45075225830078, -20.384273529052734, -19.317792892456055, -18.251314163208008, -17.184833526611328, -16.11835479736328, -15.051874160766602, -13.985393524169922, -12.918913841247559, -11.852434158325195, -10.785953521728516, -9.719473838806152, -8.652994155883789, -7.586513519287109, -6.520033836364746, -5.453553676605225, -4.387073516845703, -3.32059383392334, -2.2541136741638184, -1.1876335144042969, -0.12115347385406494, 0.945326566696167, 2.0118064880371094, 3.078286647796631, 4.144766807556152, 5.211246490478516, 6.277726650238037, 7.344206809997559, 8.410686492919922, 9.477167129516602, 10.543646812438965, 11.610126495361328, 12.676607131958008, 13.743086814880371, 14.809566497802734, 15.876047134399414, 16.942527770996094, 18.00900650024414, 19.07548713684082, 20.1419677734375, 21.208446502685547, 22.274927139282227, 23.341407775878906, 24.407886505126953, 25.474367141723633, 26.54084587097168, 27.60732650756836, 28.67380714416504, 29.74028778076172, 30.806766510009766, 31.873247146606445, 32.939727783203125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 4.0, 11.0, 10.0, 18.0, 25.0, 17.0, 20.0, 30.0, 36.0, 31.0, 47.0, 30.0, 35.0, 52.0, 51.0, 48.0, 40.0, 46.0, 38.0, 42.0, 44.0, 53.0, 35.0, 28.0, 28.0, 36.0, 30.0, 24.0, 20.0, 18.0, 12.0, 14.0, 9.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.69134521484375, -5.5115966796875, -5.33184814453125, -5.152099609375, -4.97235107421875, -4.7926025390625, -4.61285400390625, -4.43310546875, -4.25335693359375, -4.0736083984375, -3.89385986328125, -3.714111328125, -3.53436279296875, -3.3546142578125, -3.17486572265625, -2.9951171875, -2.81536865234375, -2.6356201171875, -2.45587158203125, -2.276123046875, -2.09637451171875, -1.9166259765625, -1.73687744140625, -1.55712890625, -1.37738037109375, -1.1976318359375, -1.01788330078125, -0.838134765625, -0.65838623046875, -0.4786376953125, -0.29888916015625, -0.119140625, 0.06060791015625, 0.2403564453125, 0.42010498046875, 0.599853515625, 0.77960205078125, 0.9593505859375, 1.13909912109375, 1.31884765625, 1.49859619140625, 1.6783447265625, 1.85809326171875, 2.037841796875, 2.21759033203125, 2.3973388671875, 2.57708740234375, 2.7568359375, 2.93658447265625, 3.1163330078125, 3.29608154296875, 3.475830078125, 3.65557861328125, 3.8353271484375, 4.01507568359375, 4.19482421875, 4.37457275390625, 4.5543212890625, 4.73406982421875, 4.913818359375, 5.09356689453125, 5.2733154296875, 5.45306396484375, 5.6328125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 9.0, 15.0, 20.0, 23.0, 23.0, 52.0, 72.0, 111.0, 153.0, 238.0, 294.0, 480.0, 648.0, 986.0, 1384.0, 2024.0, 2940.0, 4248.0, 6210.0, 8900.0, 12948.0, 19150.0, 28483.0, 43178.0, 68363.0, 109443.0, 166293.0, 186960.0, 136546.0, 86206.0, 53897.0, 34797.0, 23162.0, 15783.0, 10860.0, 7272.0, 5048.0, 3519.0, 2399.0, 1699.0, 1132.0, 802.0, 553.0, 382.0, 269.0, 192.0, 126.0, 92.0, 48.0, 38.0, 33.0, 29.0, 10.0, 9.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.57666015625, -0.5582046508789062, -0.5397491455078125, -0.5212936401367188, -0.502838134765625, -0.48438262939453125, -0.4659271240234375, -0.44747161865234375, -0.42901611328125, -0.41056060791015625, -0.3921051025390625, -0.37364959716796875, -0.355194091796875, -0.33673858642578125, -0.3182830810546875, -0.29982757568359375, -0.2813720703125, -0.26291656494140625, -0.2444610595703125, -0.22600555419921875, -0.207550048828125, -0.18909454345703125, -0.1706390380859375, -0.15218353271484375, -0.13372802734375, -0.11527252197265625, -0.0968170166015625, -0.07836151123046875, -0.059906005859375, -0.04145050048828125, -0.0229949951171875, -0.00453948974609375, 0.013916015625, 0.03237152099609375, 0.0508270263671875, 0.06928253173828125, 0.087738037109375, 0.10619354248046875, 0.1246490478515625, 0.14310455322265625, 0.16156005859375, 0.18001556396484375, 0.1984710693359375, 0.21692657470703125, 0.235382080078125, 0.25383758544921875, 0.2722930908203125, 0.29074859619140625, 0.3092041015625, 0.32765960693359375, 0.3461151123046875, 0.36457061767578125, 0.383026123046875, 0.40148162841796875, 0.4199371337890625, 0.43839263916015625, 0.45684814453125, 0.47530364990234375, 0.4937591552734375, 0.5122146606445312, 0.530670166015625, 0.5491256713867188, 0.5675811767578125, 0.5860366821289062, 0.6044921875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 11.0, 9.0, 8.0, 11.0, 15.0, 23.0, 14.0, 19.0, 20.0, 29.0, 19.0, 27.0, 32.0, 49.0, 24.0, 38.0, 45.0, 47.0, 1066.0, 50.0, 43.0, 49.0, 45.0, 39.0, 30.0, 33.0, 29.0, 29.0, 23.0, 30.0, 19.0, 19.0, 8.0, 8.0, 13.0, 8.0, 12.0, 6.0, 8.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.08984375, -2.986602783203125, -2.88336181640625, -2.780120849609375, -2.6768798828125, -2.573638916015625, -2.47039794921875, -2.367156982421875, -2.263916015625, -2.160675048828125, -2.05743408203125, -1.954193115234375, -1.8509521484375, -1.747711181640625, -1.64447021484375, -1.541229248046875, -1.43798828125, -1.334747314453125, -1.23150634765625, -1.128265380859375, -1.0250244140625, -0.921783447265625, -0.81854248046875, -0.715301513671875, -0.612060546875, -0.508819580078125, -0.40557861328125, -0.302337646484375, -0.1990966796875, -0.095855712890625, 0.00738525390625, 0.110626220703125, 0.2138671875, 0.317108154296875, 0.42034912109375, 0.523590087890625, 0.6268310546875, 0.730072021484375, 0.83331298828125, 0.936553955078125, 1.039794921875, 1.143035888671875, 1.24627685546875, 1.349517822265625, 1.4527587890625, 1.555999755859375, 1.65924072265625, 1.762481689453125, 1.86572265625, 1.968963623046875, 2.07220458984375, 2.175445556640625, 2.2786865234375, 2.381927490234375, 2.48516845703125, 2.588409423828125, 2.691650390625, 2.794891357421875, 2.89813232421875, 3.001373291015625, 3.1046142578125, 3.207855224609375, 3.31109619140625, 3.414337158203125, 3.517578125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 7.0, 10.0, 24.0, 28.0, 42.0, 68.0, 102.0, 140.0, 208.0, 330.0, 495.0, 800.0, 1201.0, 1952.0, 3057.0, 4865.0, 7992.0, 12920.0, 21750.0, 38247.0, 68320.0, 126175.0, 213037.0, 1271163.0, 142384.0, 77031.0, 42312.0, 24680.0, 14365.0, 8763.0, 5327.0, 3283.0, 2164.0, 1379.0, 870.0, 562.0, 362.0, 250.0, 160.0, 91.0, 80.0, 36.0, 29.0, 16.0, 13.0, 11.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5576171875, -0.5402450561523438, -0.5228729248046875, -0.5055007934570312, -0.488128662109375, -0.47075653076171875, -0.4533843994140625, -0.43601226806640625, -0.41864013671875, -0.40126800537109375, -0.3838958740234375, -0.36652374267578125, -0.349151611328125, -0.33177947998046875, -0.3144073486328125, -0.29703521728515625, -0.2796630859375, -0.26229095458984375, -0.2449188232421875, -0.22754669189453125, -0.210174560546875, -0.19280242919921875, -0.1754302978515625, -0.15805816650390625, -0.14068603515625, -0.12331390380859375, -0.1059417724609375, -0.08856964111328125, -0.071197509765625, -0.05382537841796875, -0.0364532470703125, -0.01908111572265625, -0.001708984375, 0.01566314697265625, 0.0330352783203125, 0.05040740966796875, 0.067779541015625, 0.08515167236328125, 0.1025238037109375, 0.11989593505859375, 0.13726806640625, 0.15464019775390625, 0.1720123291015625, 0.18938446044921875, 0.206756591796875, 0.22412872314453125, 0.2415008544921875, 0.25887298583984375, 0.2762451171875, 0.29361724853515625, 0.3109893798828125, 0.32836151123046875, 0.345733642578125, 0.36310577392578125, 0.3804779052734375, 0.39785003662109375, 0.41522216796875, 0.43259429931640625, 0.4499664306640625, 0.46733856201171875, 0.484710693359375, 0.5020828247070312, 0.5194549560546875, 0.5368270874023438, 0.55419921875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 0.0, 4.0, 3.0, 2.0, 1.0, 10.0, 10.0, 8.0, 14.0, 23.0, 26.0, 38.0, 46.0, 45.0, 63.0, 54.0, 57.0, 83.0, 80.0, 65.0, 75.0, 68.0, 53.0, 37.0, 24.0, 23.0, 18.0, 13.0, 9.0, 13.0, 10.0, 9.0, 3.0, 3.0, 2.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001983642578125, -0.0019269287586212158, -0.0018702149391174316, -0.0018135011196136475, -0.0017567873001098633, -0.001700073480606079, -0.001643359661102295, -0.0015866458415985107, -0.0015299320220947266, -0.0014732182025909424, -0.0014165043830871582, -0.001359790563583374, -0.0013030767440795898, -0.0012463629245758057, -0.0011896491050720215, -0.0011329352855682373, -0.0010762214660644531, -0.001019507646560669, -0.0009627938270568848, -0.0009060800075531006, -0.0008493661880493164, -0.0007926523685455322, -0.000735938549041748, -0.0006792247295379639, -0.0006225109100341797, -0.0005657970905303955, -0.0005090832710266113, -0.00045236945152282715, -0.00039565563201904297, -0.0003389418125152588, -0.0002822279930114746, -0.00022551417350769043, -0.00016880035400390625, -0.00011208653450012207, -5.537271499633789e-05, 1.341104507446289e-06, 5.805492401123047e-05, 0.00011476874351501465, 0.00017148256301879883, 0.000228196382522583, 0.0002849102020263672, 0.00034162402153015137, 0.00039833784103393555, 0.0004550516605377197, 0.0005117654800415039, 0.0005684792995452881, 0.0006251931190490723, 0.0006819069385528564, 0.0007386207580566406, 0.0007953345775604248, 0.000852048397064209, 0.0009087622165679932, 0.0009654760360717773, 0.0010221898555755615, 0.0010789036750793457, 0.0011356174945831299, 0.001192331314086914, 0.0012490451335906982, 0.0013057589530944824, 0.0013624727725982666, 0.0014191865921020508, 0.001475900411605835, 0.0015326142311096191, 0.0015893280506134033, 0.0016460418701171875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 6.0, 13.0, 15.0, 6.0, 18.0, 17.0, 29.0, 32.0, 52.0, 72.0, 90.0, 161.0, 239.0, 447.0, 1373.0, 48974.0, 986823.0, 8276.0, 842.0, 370.0, 220.0, 137.0, 100.0, 59.0, 49.0, 30.0, 31.0, 15.0, 10.0, 13.0, 8.0, 4.0, 8.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.036773681640625, -0.03563642501831055, -0.034499168395996094, -0.03336191177368164, -0.03222465515136719, -0.031087398529052734, -0.02995014190673828, -0.028812885284423828, -0.027675628662109375, -0.026538372039794922, -0.02540111541748047, -0.024263858795166016, -0.023126602172851562, -0.02198934555053711, -0.020852088928222656, -0.019714832305908203, -0.01857757568359375, -0.017440319061279297, -0.016303062438964844, -0.01516580581665039, -0.014028549194335938, -0.012891292572021484, -0.011754035949707031, -0.010616779327392578, -0.009479522705078125, -0.008342266082763672, -0.007205009460449219, -0.006067752838134766, -0.0049304962158203125, -0.0037932395935058594, -0.0026559829711914062, -0.0015187263488769531, -0.0003814697265625, 0.0007557868957519531, 0.0018930435180664062, 0.0030303001403808594, 0.0041675567626953125, 0.005304813385009766, 0.006442070007324219, 0.007579326629638672, 0.008716583251953125, 0.009853839874267578, 0.010991096496582031, 0.012128353118896484, 0.013265609741210938, 0.01440286636352539, 0.015540122985839844, 0.016677379608154297, 0.01781463623046875, 0.018951892852783203, 0.020089149475097656, 0.02122640609741211, 0.022363662719726562, 0.023500919342041016, 0.02463817596435547, 0.025775432586669922, 0.026912689208984375, 0.028049945831298828, 0.02918720245361328, 0.030324459075927734, 0.03146171569824219, 0.03259897232055664, 0.033736228942871094, 0.03487348556518555, 0.0360107421875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 461.0, 539.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02173800580203533, -0.021312225610017776, -0.02088644541800022, -0.020460665225982666, -0.02003488503396511, -0.019609104841947556, -0.01918332278728485, -0.018757542595267296, -0.01833176240324974, -0.017905982211232185, -0.01748020201921463, -0.017054421827197075, -0.01662864163517952, -0.016202859580516815, -0.01577708125114441, -0.01535130012780428, -0.014925519935786724, -0.014499739743769169, -0.014073959551751614, -0.013648178428411484, -0.013222398236393929, -0.012796618044376373, -0.012370837852358818, -0.011945057660341263, -0.011519277468323708, -0.011093497276306152, -0.010667717084288597, -0.010241936892271042, -0.009816155768930912, -0.009390375576913357, -0.008964595384895802, -0.008538815192878246, -0.008113034069538116, -0.007687253877520561, -0.007261473219841719, -0.0068356930278241634, -0.006409912370145321, -0.005984132178127766, -0.00555835198611021, -0.005132571794092655, -0.004706791136413813, -0.004281010944396257, -0.003855230286717415, -0.0034294500946998596, -0.0030036696698516607, -0.002577889245003462, -0.0021521090529859066, -0.0017263286281377077, -0.0013005482032895088, -0.0008747678366489708, -0.00044898747000843287, -2.32071615755558e-05, 0.0004025732632726431, 0.000828353688120842, 0.0012541338801383972, 0.001679914304986596, 0.002105694729834795, 0.002531475154682994, 0.0029572555795311928, 0.003383035771548748, 0.003808816196396947, 0.004234596621245146, 0.004660376813262701, 0.005086157470941544, 0.005511937662959099]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 3.0, 4.0, 10.0, 10.0, 10.0, 14.0, 22.0, 33.0, 31.0, 36.0, 35.0, 48.0, 49.0, 62.0, 61.0, 48.0, 68.0, 53.0, 54.0, 51.0, 62.0, 44.0, 45.0, 35.0, 25.0, 19.0, 19.0, 18.0, 10.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000890195369720459, -0.0008535804226994514, -0.0008169654756784439, -0.0007803505286574364, -0.0007437355816364288, -0.0007071206346154213, -0.0006705056875944138, -0.0006338907405734062, -0.0005972757935523987, -0.0005606608465313911, -0.0005240458995103836, -0.00048743095248937607, -0.00045081600546836853, -0.000414201058447361, -0.00037758611142635345, -0.0003409711644053459, -0.0003043562173843384, -0.00026774127036333084, -0.0002311263233423233, -0.00019451137632131577, -0.00015789642930030823, -0.00012128148227930069, -8.466653525829315e-05, -4.8051588237285614e-05, -1.1436641216278076e-05, 2.517830580472946e-05, 6.1793252825737e-05, 9.840819984674454e-05, 0.00013502314686775208, 0.0001716380938887596, 0.00020825304090976715, 0.0002448679879307747, 0.0002814829349517822, 0.00031809788197278976, 0.0003547128289937973, 0.00039132777601480484, 0.0004279427230358124, 0.0004645576700568199, 0.0005011726170778275, 0.000537787564098835, 0.0005744025111198425, 0.0006110174581408501, 0.0006476324051618576, 0.0006842473521828651, 0.0007208622992038727, 0.0007574772462248802, 0.0007940921932458878, 0.0008307071402668953, 0.0008673220872879028, 0.0009039370343089104, 0.0009405519813299179, 0.0009771669283509254, 0.001013781875371933, 0.0010503968223929405, 0.001087011769413948, 0.0011236267164349556, 0.0011602416634559631, 0.0011968566104769707, 0.0012334715574979782, 0.0012700865045189857, 0.0013067014515399933, 0.0013433163985610008, 0.0013799313455820084, 0.001416546292603016, 0.0014531612396240234]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 4.0, 11.0, 10.0, 18.0, 25.0, 17.0, 20.0, 30.0, 36.0, 31.0, 47.0, 30.0, 35.0, 52.0, 51.0, 48.0, 40.0, 46.0, 38.0, 42.0, 44.0, 53.0, 35.0, 28.0, 28.0, 36.0, 30.0, 24.0, 20.0, 18.0, 12.0, 14.0, 9.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.69134521484375, -5.5115966796875, -5.33184814453125, -5.152099609375, -4.97235107421875, -4.7926025390625, -4.61285400390625, -4.43310546875, -4.25335693359375, -4.0736083984375, -3.89385986328125, -3.714111328125, -3.53436279296875, -3.3546142578125, -3.17486572265625, -2.9951171875, -2.81536865234375, -2.6356201171875, -2.45587158203125, -2.276123046875, -2.09637451171875, -1.9166259765625, -1.73687744140625, -1.55712890625, -1.37738037109375, -1.1976318359375, -1.01788330078125, -0.838134765625, -0.65838623046875, -0.4786376953125, -0.29888916015625, -0.119140625, 0.06060791015625, 0.2403564453125, 0.42010498046875, 0.599853515625, 0.77960205078125, 0.9593505859375, 1.13909912109375, 1.31884765625, 1.49859619140625, 1.6783447265625, 1.85809326171875, 2.037841796875, 2.21759033203125, 2.3973388671875, 2.57708740234375, 2.7568359375, 2.93658447265625, 3.1163330078125, 3.29608154296875, 3.475830078125, 3.65557861328125, 3.8353271484375, 4.01507568359375, 4.19482421875, 4.37457275390625, 4.5543212890625, 4.73406982421875, 4.913818359375, 5.09356689453125, 5.2733154296875, 5.45306396484375, 5.6328125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 9.0, 9.0, 12.0, 16.0, 21.0, 32.0, 41.0, 71.0, 90.0, 124.0, 179.0, 326.0, 624.0, 1071.0, 1961.0, 4085.0, 8629.0, 18704.0, 42999.0, 98098.0, 236251.0, 372985.0, 145431.0, 64077.0, 28148.0, 12520.0, 5856.0, 2826.0, 1405.0, 717.0, 444.0, 276.0, 143.0, 111.0, 74.0, 48.0, 39.0, 32.0, 23.0, 16.0, 17.0, 11.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.359375, -3.248291015625, -3.13720703125, -3.026123046875, -2.9150390625, -2.803955078125, -2.69287109375, -2.581787109375, -2.470703125, -2.359619140625, -2.24853515625, -2.137451171875, -2.0263671875, -1.915283203125, -1.80419921875, -1.693115234375, -1.58203125, -1.470947265625, -1.35986328125, -1.248779296875, -1.1376953125, -1.026611328125, -0.91552734375, -0.804443359375, -0.693359375, -0.582275390625, -0.47119140625, -0.360107421875, -0.2490234375, -0.137939453125, -0.02685546875, 0.084228515625, 0.1953125, 0.306396484375, 0.41748046875, 0.528564453125, 0.6396484375, 0.750732421875, 0.86181640625, 0.972900390625, 1.083984375, 1.195068359375, 1.30615234375, 1.417236328125, 1.5283203125, 1.639404296875, 1.75048828125, 1.861572265625, 1.97265625, 2.083740234375, 2.19482421875, 2.305908203125, 2.4169921875, 2.528076171875, 2.63916015625, 2.750244140625, 2.861328125, 2.972412109375, 3.08349609375, 3.194580078125, 3.3056640625, 3.416748046875, 3.52783203125, 3.638916015625, 3.75]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 4.0, 3.0, 3.0, 7.0, 3.0, 12.0, 8.0, 8.0, 7.0, 12.0, 13.0, 22.0, 18.0, 20.0, 25.0, 29.0, 26.0, 31.0, 33.0, 41.0, 39.0, 51.0, 86.0, 213.0, 1619.0, 215.0, 85.0, 55.0, 39.0, 44.0, 40.0, 43.0, 32.0, 31.0, 22.0, 19.0, 20.0, 11.0, 11.0, 14.0, 13.0, 4.0, 8.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-19.34375, -18.82763671875, -18.3115234375, -17.79541015625, -17.279296875, -16.76318359375, -16.2470703125, -15.73095703125, -15.21484375, -14.69873046875, -14.1826171875, -13.66650390625, -13.150390625, -12.63427734375, -12.1181640625, -11.60205078125, -11.0859375, -10.56982421875, -10.0537109375, -9.53759765625, -9.021484375, -8.50537109375, -7.9892578125, -7.47314453125, -6.95703125, -6.44091796875, -5.9248046875, -5.40869140625, -4.892578125, -4.37646484375, -3.8603515625, -3.34423828125, -2.828125, -2.31201171875, -1.7958984375, -1.27978515625, -0.763671875, -0.24755859375, 0.2685546875, 0.78466796875, 1.30078125, 1.81689453125, 2.3330078125, 2.84912109375, 3.365234375, 3.88134765625, 4.3974609375, 4.91357421875, 5.4296875, 5.94580078125, 6.4619140625, 6.97802734375, 7.494140625, 8.01025390625, 8.5263671875, 9.04248046875, 9.55859375, 10.07470703125, 10.5908203125, 11.10693359375, 11.623046875, 12.13916015625, 12.6552734375, 13.17138671875, 13.6875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 5.0, 7.0, 6.0, 9.0, 15.0, 11.0, 25.0, 24.0, 24.0, 44.0, 43.0, 75.0, 99.0, 122.0, 174.0, 214.0, 283.0, 591.0, 2575.0, 341800.0, 2792408.0, 5004.0, 764.0, 343.0, 249.0, 171.0, 121.0, 102.0, 80.0, 57.0, 51.0, 31.0, 37.0, 30.0, 20.0, 10.0, 21.0, 15.0, 9.0, 6.0, 5.0, 5.0, 5.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-33.875, -32.7119140625, -31.548828125, -30.3857421875, -29.22265625, -28.0595703125, -26.896484375, -25.7333984375, -24.5703125, -23.4072265625, -22.244140625, -21.0810546875, -19.91796875, -18.7548828125, -17.591796875, -16.4287109375, -15.265625, -14.1025390625, -12.939453125, -11.7763671875, -10.61328125, -9.4501953125, -8.287109375, -7.1240234375, -5.9609375, -4.7978515625, -3.634765625, -2.4716796875, -1.30859375, -0.1455078125, 1.017578125, 2.1806640625, 3.34375, 4.5068359375, 5.669921875, 6.8330078125, 7.99609375, 9.1591796875, 10.322265625, 11.4853515625, 12.6484375, 13.8115234375, 14.974609375, 16.1376953125, 17.30078125, 18.4638671875, 19.626953125, 20.7900390625, 21.953125, 23.1162109375, 24.279296875, 25.4423828125, 26.60546875, 27.7685546875, 28.931640625, 30.0947265625, 31.2578125, 32.4208984375, 33.583984375, 34.7470703125, 35.91015625, 37.0732421875, 38.236328125, 39.3994140625, 40.5625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 11.0, 338.0, 623.0, 44.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.69039916992188, -188.60650634765625, -184.5226287841797, -180.43873596191406, -176.3548583984375, -172.27096557617188, -168.1870880126953, -164.1031951904297, -160.01931762695312, -155.9354248046875, -151.85154724121094, -147.7676544189453, -143.68377685546875, -139.59988403320312, -135.51600646972656, -131.43211364746094, -127.34822845458984, -123.26434326171875, -119.18045806884766, -115.09657287597656, -111.01268768310547, -106.92880249023438, -102.84490966796875, -98.76103210449219, -94.67713928222656, -90.59325408935547, -86.50936889648438, -82.42548370361328, -78.34159851074219, -74.2577133178711, -70.173828125, -66.08993530273438, -62.00605010986328, -57.92216491699219, -53.838279724121094, -49.75439453125, -45.670509338378906, -41.58662414550781, -37.50273513793945, -33.41884994506836, -29.334964752197266, -25.251079559326172, -21.167194366455078, -17.08330726623535, -12.999422073364258, -8.915536880493164, -4.8316497802734375, -0.7477645874023438, 3.33612060546875, 7.420006275177002, 11.503891944885254, 15.587778091430664, 19.671663284301758, 23.75554847717285, 27.839435577392578, 31.923320770263672, 36.007205963134766, 40.09109115600586, 44.17497634887695, 48.25886535644531, 52.342750549316406, 56.4266357421875, 60.510520935058594, 64.59440612792969, 68.67829132080078]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 13.0, 6.0, 8.0, 9.0, 14.0, 15.0, 21.0, 28.0, 28.0, 26.0, 35.0, 27.0, 39.0, 27.0, 36.0, 45.0, 35.0, 53.0, 53.0, 31.0, 51.0, 47.0, 36.0, 34.0, 38.0, 22.0, 23.0, 22.0, 28.0, 20.0, 23.0, 13.0, 13.0, 13.0, 14.0, 10.0, 5.0, 4.0, 4.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0], "bins": [-52.956687927246094, -51.42449188232422, -49.892295837402344, -48.36009979248047, -46.82790756225586, -45.295711517333984, -43.76351547241211, -42.231319427490234, -40.699127197265625, -39.16693115234375, -37.634735107421875, -36.1025390625, -34.57034683227539, -33.038150787353516, -31.50595474243164, -29.973758697509766, -28.44156265258789, -26.909366607666016, -25.377172470092773, -23.8449764251709, -22.312782287597656, -20.78058624267578, -19.248390197753906, -17.71619415283203, -16.18400001525879, -14.65180492401123, -13.119609832763672, -11.587413787841797, -10.055218696594238, -8.52302360534668, -6.990827560424805, -5.458632469177246, -3.926433563232422, -2.394238233566284, -0.8620429039001465, 0.6701526641845703, 2.202347755432129, 3.7345428466796875, 5.2667388916015625, 6.798933982849121, 8.33112907409668, 9.863324165344238, 11.395519256591797, 12.927715301513672, 14.45991039276123, 15.992105484008789, 17.524301528930664, 19.056495666503906, 20.58869171142578, 22.120887756347656, 23.6530818939209, 25.185277938842773, 26.717472076416016, 28.24966812133789, 29.781864166259766, 31.31406021118164, 32.84625244140625, 34.378448486328125, 35.91064453125, 37.442840576171875, 38.975032806396484, 40.50722885131836, 42.039424896240234, 43.57162094116211, 45.103816986083984]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 4.0, 1.0, 11.0, 5.0, 10.0, 13.0, 15.0, 22.0, 21.0, 27.0, 26.0, 37.0, 27.0, 37.0, 36.0, 43.0, 54.0, 46.0, 41.0, 41.0, 39.0, 35.0, 39.0, 42.0, 50.0, 36.0, 23.0, 30.0, 38.0, 27.0, 18.0, 25.0, 16.0, 16.0, 16.0, 12.0, 11.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90234375, -5.72216796875, -5.5419921875, -5.36181640625, -5.181640625, -5.00146484375, -4.8212890625, -4.64111328125, -4.4609375, -4.28076171875, -4.1005859375, -3.92041015625, -3.740234375, -3.56005859375, -3.3798828125, -3.19970703125, -3.01953125, -2.83935546875, -2.6591796875, -2.47900390625, -2.298828125, -2.11865234375, -1.9384765625, -1.75830078125, -1.578125, -1.39794921875, -1.2177734375, -1.03759765625, -0.857421875, -0.67724609375, -0.4970703125, -0.31689453125, -0.13671875, 0.04345703125, 0.2236328125, 0.40380859375, 0.583984375, 0.76416015625, 0.9443359375, 1.12451171875, 1.3046875, 1.48486328125, 1.6650390625, 1.84521484375, 2.025390625, 2.20556640625, 2.3857421875, 2.56591796875, 2.74609375, 2.92626953125, 3.1064453125, 3.28662109375, 3.466796875, 3.64697265625, 3.8271484375, 4.00732421875, 4.1875, 4.36767578125, 4.5478515625, 4.72802734375, 4.908203125, 5.08837890625, 5.2685546875, 5.44873046875, 5.62890625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 3.0, 9.0, 12.0, 12.0, 8.0, 19.0, 24.0, 21.0, 24.0, 28.0, 34.0, 47.0, 71.0, 107.0, 326.0, 1133.0, 7504.0, 179030.0, 3376288.0, 611000.0, 15817.0, 1806.0, 452.0, 166.0, 64.0, 44.0, 39.0, 28.0, 18.0, 27.0, 20.0, 21.0, 15.0, 22.0, 12.0, 6.0, 7.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.40625, -18.77294921875, -18.1396484375, -17.50634765625, -16.873046875, -16.23974609375, -15.6064453125, -14.97314453125, -14.33984375, -13.70654296875, -13.0732421875, -12.43994140625, -11.806640625, -11.17333984375, -10.5400390625, -9.90673828125, -9.2734375, -8.64013671875, -8.0068359375, -7.37353515625, -6.740234375, -6.10693359375, -5.4736328125, -4.84033203125, -4.20703125, -3.57373046875, -2.9404296875, -2.30712890625, -1.673828125, -1.04052734375, -0.4072265625, 0.22607421875, 0.859375, 1.49267578125, 2.1259765625, 2.75927734375, 3.392578125, 4.02587890625, 4.6591796875, 5.29248046875, 5.92578125, 6.55908203125, 7.1923828125, 7.82568359375, 8.458984375, 9.09228515625, 9.7255859375, 10.35888671875, 10.9921875, 11.62548828125, 12.2587890625, 12.89208984375, 13.525390625, 14.15869140625, 14.7919921875, 15.42529296875, 16.05859375, 16.69189453125, 17.3251953125, 17.95849609375, 18.591796875, 19.22509765625, 19.8583984375, 20.49169921875, 21.125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 7.0, 9.0, 19.0, 13.0, 21.0, 20.0, 29.0, 38.0, 64.0, 77.0, 84.0, 110.0, 173.0, 207.0, 249.0, 318.0, 399.0, 409.0, 371.0, 342.0, 302.0, 192.0, 136.0, 118.0, 89.0, 72.0, 44.0, 29.0, 26.0, 28.0, 17.0, 19.0, 7.0, 4.0, 4.0, 9.0, 8.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.765625, -8.45703125, -8.1484375, -7.83984375, -7.53125, -7.22265625, -6.9140625, -6.60546875, -6.296875, -5.98828125, -5.6796875, -5.37109375, -5.0625, -4.75390625, -4.4453125, -4.13671875, -3.828125, -3.51953125, -3.2109375, -2.90234375, -2.59375, -2.28515625, -1.9765625, -1.66796875, -1.359375, -1.05078125, -0.7421875, -0.43359375, -0.125, 0.18359375, 0.4921875, 0.80078125, 1.109375, 1.41796875, 1.7265625, 2.03515625, 2.34375, 2.65234375, 2.9609375, 3.26953125, 3.578125, 3.88671875, 4.1953125, 4.50390625, 4.8125, 5.12109375, 5.4296875, 5.73828125, 6.046875, 6.35546875, 6.6640625, 6.97265625, 7.28125, 7.58984375, 7.8984375, 8.20703125, 8.515625, 8.82421875, 9.1328125, 9.44140625, 9.75, 10.05859375, 10.3671875, 10.67578125, 10.984375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 3.0, 8.0, 11.0, 8.0, 11.0, 12.0, 20.0, 35.0, 41.0, 45.0, 68.0, 76.0, 106.0, 130.0, 160.0, 233.0, 285.0, 502.0, 1429.0, 37221.0, 3746124.0, 401274.0, 4369.0, 610.0, 374.0, 242.0, 179.0, 148.0, 118.0, 107.0, 59.0, 51.0, 49.0, 34.0, 26.0, 28.0, 19.0, 17.0, 10.0, 9.0, 9.0, 6.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-38.1875, -36.98388671875, -35.7802734375, -34.57666015625, -33.373046875, -32.16943359375, -30.9658203125, -29.76220703125, -28.55859375, -27.35498046875, -26.1513671875, -24.94775390625, -23.744140625, -22.54052734375, -21.3369140625, -20.13330078125, -18.9296875, -17.72607421875, -16.5224609375, -15.31884765625, -14.115234375, -12.91162109375, -11.7080078125, -10.50439453125, -9.30078125, -8.09716796875, -6.8935546875, -5.68994140625, -4.486328125, -3.28271484375, -2.0791015625, -0.87548828125, 0.328125, 1.53173828125, 2.7353515625, 3.93896484375, 5.142578125, 6.34619140625, 7.5498046875, 8.75341796875, 9.95703125, 11.16064453125, 12.3642578125, 13.56787109375, 14.771484375, 15.97509765625, 17.1787109375, 18.38232421875, 19.5859375, 20.78955078125, 21.9931640625, 23.19677734375, 24.400390625, 25.60400390625, 26.8076171875, 28.01123046875, 29.21484375, 30.41845703125, 31.6220703125, 32.82568359375, 34.029296875, 35.23291015625, 36.4365234375, 37.64013671875, 38.84375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 58.0, 220.0, 378.0, 259.0, 80.0, 12.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.08834075927734, -69.35191345214844, -64.61548614501953, -59.87905502319336, -55.14262771606445, -50.40620040893555, -45.669769287109375, -40.93334197998047, -36.19691467285156, -31.460487365722656, -26.724058151245117, -21.987628936767578, -17.251201629638672, -12.514774322509766, -7.778345108032227, -3.0419158935546875, 1.6945114135742188, 6.430939674377441, 11.167367935180664, 15.903796195983887, 20.64022445678711, 25.376651763916016, 30.113080978393555, 34.849510192871094, 39.5859375, 44.322364807128906, 49.05879211425781, 53.795223236083984, 58.53165054321289, 63.2680778503418, 68.00450897216797, 72.74093627929688, 77.47737121582031, 82.21379852294922, 86.95022583007812, 91.68665313720703, 96.42308044433594, 101.15951538085938, 105.89594268798828, 110.63236999511719, 115.3687973022461, 120.105224609375, 124.8416519165039, 129.5780792236328, 134.31451416015625, 139.05093383789062, 143.78736877441406, 148.5238037109375, 153.26022338867188, 157.9966583251953, 162.7330780029297, 167.46951293945312, 172.2059326171875, 176.94236755371094, 181.6787872314453, 186.41522216796875, 191.15164184570312, 195.88807678222656, 200.62449645996094, 205.36093139648438, 210.09735107421875, 214.8337860107422, 219.57020568847656, 224.306640625, 229.04307556152344]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 6.0, 9.0, 6.0, 7.0, 6.0, 5.0, 13.0, 13.0, 18.0, 9.0, 22.0, 21.0, 16.0, 41.0, 28.0, 34.0, 20.0, 35.0, 31.0, 30.0, 32.0, 35.0, 30.0, 44.0, 33.0, 35.0, 35.0, 39.0, 36.0, 27.0, 37.0, 35.0, 25.0, 27.0, 31.0, 17.0, 10.0, 15.0, 19.0, 10.0, 11.0, 9.0, 13.0, 7.0, 5.0, 6.0, 1.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-31.401290893554688, -30.431167602539062, -29.461044311523438, -28.49091911315918, -27.520795822143555, -26.55067253112793, -25.580547332763672, -24.610424041748047, -23.640300750732422, -22.670177459716797, -21.700054168701172, -20.729928970336914, -19.75980567932129, -18.789682388305664, -17.819557189941406, -16.84943389892578, -15.879310607910156, -14.909187316894531, -13.93906307220459, -12.968938827514648, -11.998815536499023, -11.028692245483398, -10.058568000793457, -9.088443756103516, -8.11832046508789, -7.148196697235107, -6.178072929382324, -5.207949161529541, -4.237825393676758, -3.2677016258239746, -2.2975778579711914, -1.3274540901184082, -0.357330322265625, 0.6127934455871582, 1.5829172134399414, 2.5530409812927246, 3.523164749145508, 4.493288516998291, 5.463412284851074, 6.433536052703857, 7.403659820556641, 8.373783111572266, 9.343907356262207, 10.314031600952148, 11.284154891967773, 12.254278182983398, 13.22440242767334, 14.194526672363281, 15.164649963378906, 16.13477325439453, 17.104896545410156, 18.075021743774414, 19.04514503479004, 20.015268325805664, 20.985393524169922, 21.955516815185547, 22.925640106201172, 23.895763397216797, 24.865886688232422, 25.83601188659668, 26.806135177612305, 27.77625846862793, 28.746383666992188, 29.716506958007812, 30.686630249023438]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 3.0, 5.0, 8.0, 10.0, 20.0, 17.0, 21.0, 21.0, 16.0, 34.0, 31.0, 30.0, 31.0, 26.0, 45.0, 47.0, 19.0, 41.0, 33.0, 47.0, 37.0, 40.0, 41.0, 37.0, 48.0, 37.0, 24.0, 31.0, 33.0, 28.0, 21.0, 24.0, 14.0, 14.0, 14.0, 6.0, 14.0, 6.0, 4.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.6484375, -5.484619140625, -5.32080078125, -5.156982421875, -4.9931640625, -4.829345703125, -4.66552734375, -4.501708984375, -4.337890625, -4.174072265625, -4.01025390625, -3.846435546875, -3.6826171875, -3.518798828125, -3.35498046875, -3.191162109375, -3.02734375, -2.863525390625, -2.69970703125, -2.535888671875, -2.3720703125, -2.208251953125, -2.04443359375, -1.880615234375, -1.716796875, -1.552978515625, -1.38916015625, -1.225341796875, -1.0615234375, -0.897705078125, -0.73388671875, -0.570068359375, -0.40625, -0.242431640625, -0.07861328125, 0.085205078125, 0.2490234375, 0.412841796875, 0.57666015625, 0.740478515625, 0.904296875, 1.068115234375, 1.23193359375, 1.395751953125, 1.5595703125, 1.723388671875, 1.88720703125, 2.051025390625, 2.21484375, 2.378662109375, 2.54248046875, 2.706298828125, 2.8701171875, 3.033935546875, 3.19775390625, 3.361572265625, 3.525390625, 3.689208984375, 3.85302734375, 4.016845703125, 4.1806640625, 4.344482421875, 4.50830078125, 4.672119140625, 4.8359375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 14.0, 13.0, 16.0, 28.0, 52.0, 77.0, 92.0, 140.0, 199.0, 250.0, 422.0, 546.0, 808.0, 1147.0, 1677.0, 2347.0, 3419.0, 5043.0, 7320.0, 10772.0, 15927.0, 24085.0, 36531.0, 56099.0, 88171.0, 140902.0, 190416.0, 163541.0, 104650.0, 65748.0, 42165.0, 27911.0, 18479.0, 12405.0, 8348.0, 5761.0, 4086.0, 2781.0, 1896.0, 1310.0, 873.0, 613.0, 402.0, 324.0, 239.0, 151.0, 132.0, 82.0, 56.0, 39.0, 19.0, 14.0, 11.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.58984375, -0.57061767578125, -0.5513916015625, -0.53216552734375, -0.512939453125, -0.49371337890625, -0.4744873046875, -0.45526123046875, -0.43603515625, -0.41680908203125, -0.3975830078125, -0.37835693359375, -0.359130859375, -0.33990478515625, -0.3206787109375, -0.30145263671875, -0.2822265625, -0.26300048828125, -0.2437744140625, -0.22454833984375, -0.205322265625, -0.18609619140625, -0.1668701171875, -0.14764404296875, -0.12841796875, -0.10919189453125, -0.0899658203125, -0.07073974609375, -0.051513671875, -0.03228759765625, -0.0130615234375, 0.00616455078125, 0.025390625, 0.04461669921875, 0.0638427734375, 0.08306884765625, 0.102294921875, 0.12152099609375, 0.1407470703125, 0.15997314453125, 0.17919921875, 0.19842529296875, 0.2176513671875, 0.23687744140625, 0.256103515625, 0.27532958984375, 0.2945556640625, 0.31378173828125, 0.3330078125, 0.35223388671875, 0.3714599609375, 0.39068603515625, 0.409912109375, 0.42913818359375, 0.4483642578125, 0.46759033203125, 0.48681640625, 0.50604248046875, 0.5252685546875, 0.54449462890625, 0.563720703125, 0.58294677734375, 0.6021728515625, 0.62139892578125, 0.640625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 2.0, 9.0, 6.0, 11.0, 12.0, 9.0, 8.0, 14.0, 19.0, 26.0, 25.0, 19.0, 22.0, 30.0, 35.0, 37.0, 26.0, 35.0, 30.0, 35.0, 42.0, 39.0, 1053.0, 31.0, 27.0, 37.0, 34.0, 34.0, 37.0, 31.0, 22.0, 22.0, 27.0, 17.0, 27.0, 20.0, 21.0, 12.0, 15.0, 10.0, 12.0, 5.0, 8.0, 8.0, 1.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.8046875, -2.712890625, -2.62109375, -2.529296875, -2.4375, -2.345703125, -2.25390625, -2.162109375, -2.0703125, -1.978515625, -1.88671875, -1.794921875, -1.703125, -1.611328125, -1.51953125, -1.427734375, -1.3359375, -1.244140625, -1.15234375, -1.060546875, -0.96875, -0.876953125, -0.78515625, -0.693359375, -0.6015625, -0.509765625, -0.41796875, -0.326171875, -0.234375, -0.142578125, -0.05078125, 0.041015625, 0.1328125, 0.224609375, 0.31640625, 0.408203125, 0.5, 0.591796875, 0.68359375, 0.775390625, 0.8671875, 0.958984375, 1.05078125, 1.142578125, 1.234375, 1.326171875, 1.41796875, 1.509765625, 1.6015625, 1.693359375, 1.78515625, 1.876953125, 1.96875, 2.060546875, 2.15234375, 2.244140625, 2.3359375, 2.427734375, 2.51953125, 2.611328125, 2.703125, 2.794921875, 2.88671875, 2.978515625, 3.0703125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 14.0, 18.0, 26.0, 38.0, 68.0, 84.0, 164.0, 285.0, 460.0, 729.0, 1334.0, 2289.0, 4040.0, 7042.0, 12588.0, 23941.0, 45058.0, 91186.0, 185327.0, 1320255.0, 197367.0, 98680.0, 49290.0, 25191.0, 13798.0, 7491.0, 4278.0, 2468.0, 1443.0, 886.0, 476.0, 314.0, 184.0, 109.0, 72.0, 43.0, 31.0, 12.0, 16.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.810546875, -0.7889633178710938, -0.7673797607421875, -0.7457962036132812, -0.724212646484375, -0.7026290893554688, -0.6810455322265625, -0.6594619750976562, -0.63787841796875, -0.6162948608398438, -0.5947113037109375, -0.5731277465820312, -0.551544189453125, -0.5299606323242188, -0.5083770751953125, -0.48679351806640625, -0.4652099609375, -0.44362640380859375, -0.4220428466796875, -0.40045928955078125, -0.378875732421875, -0.35729217529296875, -0.3357086181640625, -0.31412506103515625, -0.29254150390625, -0.27095794677734375, -0.2493743896484375, -0.22779083251953125, -0.206207275390625, -0.18462371826171875, -0.1630401611328125, -0.14145660400390625, -0.119873046875, -0.09828948974609375, -0.0767059326171875, -0.05512237548828125, -0.033538818359375, -0.01195526123046875, 0.0096282958984375, 0.03121185302734375, 0.05279541015625, 0.07437896728515625, 0.0959625244140625, 0.11754608154296875, 0.139129638671875, 0.16071319580078125, 0.1822967529296875, 0.20388031005859375, 0.2254638671875, 0.24704742431640625, 0.2686309814453125, 0.29021453857421875, 0.311798095703125, 0.33338165283203125, 0.3549652099609375, 0.37654876708984375, 0.39813232421875, 0.41971588134765625, 0.4412994384765625, 0.46288299560546875, 0.484466552734375, 0.5060501098632812, 0.5276336669921875, 0.5492172241210938, 0.57080078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 9.0, 10.0, 15.0, 10.0, 17.0, 22.0, 15.0, 30.0, 41.0, 33.0, 50.0, 43.0, 67.0, 61.0, 63.0, 68.0, 50.0, 56.0, 46.0, 57.0, 31.0, 29.0, 27.0, 24.0, 32.0, 18.0, 12.0, 17.0, 9.0, 6.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001987457275390625, -0.0019224882125854492, -0.0018575191497802734, -0.0017925500869750977, -0.0017275810241699219, -0.001662611961364746, -0.0015976428985595703, -0.0015326738357543945, -0.0014677047729492188, -0.001402735710144043, -0.0013377666473388672, -0.0012727975845336914, -0.0012078285217285156, -0.0011428594589233398, -0.001077890396118164, -0.0010129213333129883, -0.0009479522705078125, -0.0008829832077026367, -0.0008180141448974609, -0.0007530450820922852, -0.0006880760192871094, -0.0006231069564819336, -0.0005581378936767578, -0.000493168830871582, -0.00042819976806640625, -0.00036323070526123047, -0.0002982616424560547, -0.0002332925796508789, -0.00016832351684570312, -0.00010335445404052734, -3.838539123535156e-05, 2.658367156982422e-05, 9.1552734375e-05, 0.00015652179718017578, 0.00022149085998535156, 0.00028645992279052734, 0.0003514289855957031, 0.0004163980484008789, 0.0004813671112060547, 0.0005463361740112305, 0.0006113052368164062, 0.000676274299621582, 0.0007412433624267578, 0.0008062124252319336, 0.0008711814880371094, 0.0009361505508422852, 0.001001119613647461, 0.0010660886764526367, 0.0011310577392578125, 0.0011960268020629883, 0.001260995864868164, 0.0013259649276733398, 0.0013909339904785156, 0.0014559030532836914, 0.0015208721160888672, 0.001585841178894043, 0.0016508102416992188, 0.0017157793045043945, 0.0017807483673095703, 0.001845717430114746, 0.0019106864929199219, 0.0019756555557250977, 0.0020406246185302734, 0.0021055936813354492, 0.002170562744140625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 9.0, 2.0, 9.0, 17.0, 22.0, 24.0, 24.0, 29.0, 41.0, 68.0, 93.0, 121.0, 193.0, 383.0, 1394.0, 176131.0, 866623.0, 2189.0, 525.0, 215.0, 105.0, 71.0, 68.0, 52.0, 24.0, 23.0, 21.0, 18.0, 14.0, 18.0, 8.0, 4.0, 4.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.062347412109375, -0.060753822326660156, -0.05916023254394531, -0.05756664276123047, -0.055973052978515625, -0.05437946319580078, -0.05278587341308594, -0.051192283630371094, -0.04959869384765625, -0.048005104064941406, -0.04641151428222656, -0.04481792449951172, -0.043224334716796875, -0.04163074493408203, -0.04003715515136719, -0.038443565368652344, -0.0368499755859375, -0.035256385803222656, -0.03366279602050781, -0.03206920623779297, -0.030475616455078125, -0.02888202667236328, -0.027288436889648438, -0.025694847106933594, -0.02410125732421875, -0.022507667541503906, -0.020914077758789062, -0.01932048797607422, -0.017726898193359375, -0.01613330841064453, -0.014539718627929688, -0.012946128845214844, -0.0113525390625, -0.009758949279785156, -0.008165359497070312, -0.006571769714355469, -0.004978179931640625, -0.0033845901489257812, -0.0017910003662109375, -0.00019741058349609375, 0.00139617919921875, 0.0029897689819335938, 0.0045833587646484375, 0.006176948547363281, 0.007770538330078125, 0.009364128112792969, 0.010957717895507812, 0.012551307678222656, 0.0141448974609375, 0.015738487243652344, 0.017332077026367188, 0.01892566680908203, 0.020519256591796875, 0.02211284637451172, 0.023706436157226562, 0.025300025939941406, 0.02689361572265625, 0.028487205505371094, 0.030080795288085938, 0.03167438507080078, 0.033267974853515625, 0.03486156463623047, 0.03645515441894531, 0.038048744201660156, 0.039642333984375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 46.0, 849.0, 120.0, 1.0, 1.0], "bins": [-0.026967698708176613, -0.026522818952798843, -0.026077939197421074, -0.025633061304688454, -0.025188181549310684, -0.024743301793932915, -0.024298422038555145, -0.023853542283177376, -0.023408664390444756, -0.022963784635066986, -0.022518904879689217, -0.022074026986956596, -0.021629147231578827, -0.021184267476201057, -0.020739387720823288, -0.02029450796544552, -0.01984962821006775, -0.01940474845468998, -0.01895986869931221, -0.01851499080657959, -0.01807011105120182, -0.01762523129582405, -0.01718035154044628, -0.016735471785068512, -0.01629059389233589, -0.015845714136958122, -0.015400835312902927, -0.014955955557525158, -0.014511076733469963, -0.014066196978092194, -0.013621317222714424, -0.01317643839865923, -0.01273155864328146, -0.01228667888790369, -0.011841800063848495, -0.011396920308470726, -0.010952041484415531, -0.010507161729037762, -0.010062282904982567, -0.009617403149604797, -0.009172523394227028, -0.008727643638849258, -0.008282764814794064, -0.007837885059416294, -0.007393005769699812, -0.00694812647998333, -0.006503247190266848, -0.0060583679005503654, -0.005613488145172596, -0.005168608855456114, -0.004723729565739632, -0.004278849810361862, -0.00383397052064538, -0.003389091230928898, -0.0029442119412124157, -0.00249933241866529, -0.0020544533617794514, -0.0016095739556476474, -0.0011646945495158434, -0.0007198152597993612, -0.00027493585366755724, 0.00016994355246424675, 0.0006148228421807289, 0.0010597023647278547, 0.0015045816544443369]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 10.0, 10.0, 19.0, 23.0, 20.0, 28.0, 22.0, 43.0, 36.0, 51.0, 42.0, 47.0, 42.0, 45.0, 55.0, 35.0, 60.0, 52.0, 51.0, 52.0, 39.0, 35.0, 36.0, 27.0, 20.0, 14.0, 20.0, 17.0, 10.0, 10.0, 6.0, 2.0, 1.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001035928726196289, -0.0009940741583704948, -0.0009522195905447006, -0.0009103650227189064, -0.0008685104548931122, -0.000826655887067318, -0.0007848013192415237, -0.0007429467514157295, -0.0007010921835899353, -0.0006592376157641411, -0.0006173830479383469, -0.0005755284801125526, -0.0005336739122867584, -0.0004918193444609642, -0.00044996477663517, -0.00040811020880937576, -0.00036625564098358154, -0.0003244010731577873, -0.0002825465053319931, -0.00024069193750619888, -0.00019883736968040466, -0.00015698280185461044, -0.00011512823402881622, -7.3273666203022e-05, -3.141909837722778e-05, 1.0435469448566437e-05, 5.229003727436066e-05, 9.414460510015488e-05, 0.0001359991729259491, 0.00017785374075174332, 0.00021970830857753754, 0.00026156287640333176, 0.000303417444229126, 0.0003452720120549202, 0.0003871265798807144, 0.00042898114770650864, 0.00047083571553230286, 0.0005126902833580971, 0.0005545448511838913, 0.0005963994190096855, 0.0006382539868354797, 0.000680108554661274, 0.0007219631224870682, 0.0007638176903128624, 0.0008056722581386566, 0.0008475268259644508, 0.0008893813937902451, 0.0009312359616160393, 0.0009730905294418335, 0.0010149450972676277, 0.001056799665093422, 0.0010986542329192162, 0.0011405088007450104, 0.0011823633685708046, 0.0012242179363965988, 0.001266072504222393, 0.0013079270720481873, 0.0013497816398739815, 0.0013916362076997757, 0.00143349077552557, 0.0014753453433513641, 0.0015171999111771584, 0.0015590544790029526, 0.0016009090468287468, 0.001642763614654541]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 3.0, 5.0, 8.0, 10.0, 20.0, 17.0, 21.0, 21.0, 16.0, 34.0, 31.0, 30.0, 31.0, 26.0, 45.0, 47.0, 19.0, 41.0, 33.0, 47.0, 37.0, 40.0, 41.0, 37.0, 48.0, 37.0, 24.0, 31.0, 34.0, 27.0, 21.0, 24.0, 14.0, 14.0, 14.0, 6.0, 14.0, 6.0, 4.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.6484375, -5.484619140625, -5.32080078125, -5.156982421875, -4.9931640625, -4.829345703125, -4.66552734375, -4.501708984375, -4.337890625, -4.174072265625, -4.01025390625, -3.846435546875, -3.6826171875, -3.518798828125, -3.35498046875, -3.191162109375, -3.02734375, -2.863525390625, -2.69970703125, -2.535888671875, -2.3720703125, -2.208251953125, -2.04443359375, -1.880615234375, -1.716796875, -1.552978515625, -1.38916015625, -1.225341796875, -1.0615234375, -0.897705078125, -0.73388671875, -0.570068359375, -0.40625, -0.242431640625, -0.07861328125, 0.085205078125, 0.2490234375, 0.412841796875, 0.57666015625, 0.740478515625, 0.904296875, 1.068115234375, 1.23193359375, 1.395751953125, 1.5595703125, 1.723388671875, 1.88720703125, 2.051025390625, 2.21484375, 2.378662109375, 2.54248046875, 2.706298828125, 2.8701171875, 3.033935546875, 3.19775390625, 3.361572265625, 3.525390625, 3.689208984375, 3.85302734375, 4.016845703125, 4.1806640625, 4.344482421875, 4.50830078125, 4.672119140625, 4.8359375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 7.0, 6.0, 13.0, 15.0, 34.0, 60.0, 64.0, 85.0, 151.0, 177.0, 305.0, 478.0, 746.0, 1157.0, 1913.0, 3385.0, 5838.0, 11102.0, 21667.0, 47833.0, 115371.0, 312733.0, 314018.0, 116013.0, 47485.0, 22263.0, 11033.0, 5890.0, 3445.0, 1984.0, 1212.0, 693.0, 443.0, 315.0, 173.0, 122.0, 94.0, 74.0, 53.0, 29.0, 26.0, 15.0, 9.0, 6.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-3.86328125, -3.749664306640625, -3.63604736328125, -3.522430419921875, -3.4088134765625, -3.295196533203125, -3.18157958984375, -3.067962646484375, -2.954345703125, -2.840728759765625, -2.72711181640625, -2.613494873046875, -2.4998779296875, -2.386260986328125, -2.27264404296875, -2.159027099609375, -2.04541015625, -1.931793212890625, -1.81817626953125, -1.704559326171875, -1.5909423828125, -1.477325439453125, -1.36370849609375, -1.250091552734375, -1.136474609375, -1.022857666015625, -0.90924072265625, -0.795623779296875, -0.6820068359375, -0.568389892578125, -0.45477294921875, -0.341156005859375, -0.2275390625, -0.113922119140625, -0.00030517578125, 0.113311767578125, 0.2269287109375, 0.340545654296875, 0.45416259765625, 0.567779541015625, 0.681396484375, 0.795013427734375, 0.90863037109375, 1.022247314453125, 1.1358642578125, 1.249481201171875, 1.36309814453125, 1.476715087890625, 1.59033203125, 1.703948974609375, 1.81756591796875, 1.931182861328125, 2.0447998046875, 2.158416748046875, 2.27203369140625, 2.385650634765625, 2.499267578125, 2.612884521484375, 2.72650146484375, 2.840118408203125, 2.9537353515625, 3.067352294921875, 3.18096923828125, 3.294586181640625, 3.408203125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 6.0, 11.0, 10.0, 9.0, 14.0, 14.0, 11.0, 17.0, 26.0, 27.0, 22.0, 31.0, 43.0, 45.0, 49.0, 52.0, 82.0, 136.0, 1586.0, 268.0, 99.0, 69.0, 56.0, 37.0, 40.0, 43.0, 41.0, 31.0, 22.0, 25.0, 19.0, 23.0, 16.0, 15.0, 6.0, 9.0, 5.0, 9.0, 2.0, 2.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.5625, -18.0286865234375, -17.494873046875, -16.9610595703125, -16.42724609375, -15.8934326171875, -15.359619140625, -14.8258056640625, -14.2919921875, -13.7581787109375, -13.224365234375, -12.6905517578125, -12.15673828125, -11.6229248046875, -11.089111328125, -10.5552978515625, -10.021484375, -9.4876708984375, -8.953857421875, -8.4200439453125, -7.88623046875, -7.3524169921875, -6.818603515625, -6.2847900390625, -5.7509765625, -5.2171630859375, -4.683349609375, -4.1495361328125, -3.61572265625, -3.0819091796875, -2.548095703125, -2.0142822265625, -1.48046875, -0.9466552734375, -0.412841796875, 0.1209716796875, 0.65478515625, 1.1885986328125, 1.722412109375, 2.2562255859375, 2.7900390625, 3.3238525390625, 3.857666015625, 4.3914794921875, 4.92529296875, 5.4591064453125, 5.992919921875, 6.5267333984375, 7.060546875, 7.5943603515625, 8.128173828125, 8.6619873046875, 9.19580078125, 9.7296142578125, 10.263427734375, 10.7972412109375, 11.3310546875, 11.8648681640625, 12.398681640625, 12.9324951171875, 13.46630859375, 14.0001220703125, 14.533935546875, 15.0677490234375, 15.6015625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 11.0, 18.0, 37.0, 66.0, 119.0, 223.0, 404.0, 941.0, 2124166.0, 1018014.0, 894.0, 352.0, 197.0, 102.0, 66.0, 35.0, 28.0, 8.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.125, -115.015625, -111.90625, -108.796875, -105.6875, -102.578125, -99.46875, -96.359375, -93.25, -90.140625, -87.03125, -83.921875, -80.8125, -77.703125, -74.59375, -71.484375, -68.375, -65.265625, -62.15625, -59.046875, -55.9375, -52.828125, -49.71875, -46.609375, -43.5, -40.390625, -37.28125, -34.171875, -31.0625, -27.953125, -24.84375, -21.734375, -18.625, -15.515625, -12.40625, -9.296875, -6.1875, -3.078125, 0.03125, 3.140625, 6.25, 9.359375, 12.46875, 15.578125, 18.6875, 21.796875, 24.90625, 28.015625, 31.125, 34.234375, 37.34375, 40.453125, 43.5625, 46.671875, 49.78125, 52.890625, 56.0, 59.109375, 62.21875, 65.328125, 68.4375, 71.546875, 74.65625, 77.765625, 80.875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [912.0, 108.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.222808837890625, 2.0210132598876953, 13.264835357666016, 24.50865936279297, 35.752479553222656, 46.996299743652344, 58.24012756347656, 69.48394775390625, 80.72776794433594, 91.97158813476562, 103.21540832519531, 114.45923614501953, 125.70305633544922, 136.94686889648438, 148.19070434570312, 159.4345245361328, 170.6783447265625, 181.9221649169922, 193.16598510742188, 204.40982055664062, 215.65362548828125, 226.8974609375, 238.1412811279297, 249.38510131835938, 260.62890625, 271.87274169921875, 283.1165466308594, 294.3603820800781, 305.60418701171875, 316.8480224609375, 328.09185791015625, 339.3356628417969, 350.57952880859375, 361.8233642578125, 373.0671691894531, 384.3110046386719, 395.5548095703125, 406.79864501953125, 418.04248046875, 429.2862854003906, 440.53009033203125, 451.77392578125, 463.0177307128906, 474.2615661621094, 485.50537109375, 496.74920654296875, 507.9930419921875, 519.23681640625, 530.480712890625, 541.7245483398438, 552.9683837890625, 564.212158203125, 575.4559936523438, 586.6998291015625, 597.9436645507812, 609.1875, 620.4312744140625, 631.6751098632812, 642.9189453125, 654.1627197265625, 665.4065551757812, 676.650390625, 687.8942260742188, 699.1380615234375, 710.3818359375]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 6.0, 3.0, 4.0, 5.0, 14.0, 10.0, 7.0, 14.0, 19.0, 20.0, 25.0, 25.0, 19.0, 29.0, 26.0, 34.0, 31.0, 30.0, 45.0, 45.0, 49.0, 49.0, 43.0, 37.0, 42.0, 44.0, 44.0, 37.0, 27.0, 35.0, 32.0, 18.0, 29.0, 19.0, 29.0, 7.0, 16.0, 10.0, 12.0, 2.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.857139587402344, -52.239131927490234, -50.621124267578125, -49.003116607666016, -47.385108947753906, -45.7671012878418, -44.14909362792969, -42.531089782714844, -40.91307830810547, -39.29507064819336, -37.67706298828125, -36.05905532836914, -34.44104766845703, -32.82304000854492, -31.205034255981445, -29.587026596069336, -27.96902084350586, -26.35101318359375, -24.73300552368164, -23.11499786376953, -21.496990203857422, -19.878982543945312, -18.260976791381836, -16.642969131469727, -15.024961471557617, -13.406953811645508, -11.788946151733398, -10.170939445495605, -8.552931785583496, -6.934924125671387, -5.316917419433594, -3.6989097595214844, -2.080902099609375, -0.4628946781158447, 1.1551127433776855, 2.7731199264526367, 4.391127586364746, 6.0091352462768555, 7.627141952514648, 9.245149612426758, 10.863157272338867, 12.481164932250977, 14.099172592163086, 15.717179298400879, 17.335186004638672, 18.95319366455078, 20.57120132446289, 22.189208984375, 23.80721664428711, 25.42522430419922, 27.043231964111328, 28.661239624023438, 30.279247283935547, 31.897254943847656, 33.5152587890625, 35.133270263671875, 36.75127410888672, 38.36928176879883, 39.98728942871094, 41.60529708862305, 43.223304748535156, 44.841312408447266, 46.459320068359375, 48.07732391357422, 49.695335388183594]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 4.0, 11.0, 10.0, 13.0, 14.0, 14.0, 24.0, 30.0, 26.0, 25.0, 33.0, 28.0, 28.0, 34.0, 36.0, 46.0, 34.0, 37.0, 38.0, 46.0, 42.0, 38.0, 33.0, 48.0, 32.0, 29.0, 28.0, 24.0, 30.0, 31.0, 14.0, 20.0, 20.0, 16.0, 10.0, 11.0, 7.0, 5.0, 3.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-5.87109375, -5.7021484375, -5.533203125, -5.3642578125, -5.1953125, -5.0263671875, -4.857421875, -4.6884765625, -4.51953125, -4.3505859375, -4.181640625, -4.0126953125, -3.84375, -3.6748046875, -3.505859375, -3.3369140625, -3.16796875, -2.9990234375, -2.830078125, -2.6611328125, -2.4921875, -2.3232421875, -2.154296875, -1.9853515625, -1.81640625, -1.6474609375, -1.478515625, -1.3095703125, -1.140625, -0.9716796875, -0.802734375, -0.6337890625, -0.46484375, -0.2958984375, -0.126953125, 0.0419921875, 0.2109375, 0.3798828125, 0.548828125, 0.7177734375, 0.88671875, 1.0556640625, 1.224609375, 1.3935546875, 1.5625, 1.7314453125, 1.900390625, 2.0693359375, 2.23828125, 2.4072265625, 2.576171875, 2.7451171875, 2.9140625, 3.0830078125, 3.251953125, 3.4208984375, 3.58984375, 3.7587890625, 3.927734375, 4.0966796875, 4.265625, 4.4345703125, 4.603515625, 4.7724609375, 4.94140625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 8.0, 4.0, 7.0, 7.0, 8.0, 19.0, 11.0, 15.0, 22.0, 27.0, 19.0, 29.0, 37.0, 89.0, 105.0, 207.0, 482.0, 1284.0, 4806.0, 34978.0, 632244.0, 2877699.0, 601026.0, 33970.0, 4794.0, 1275.0, 506.0, 192.0, 110.0, 60.0, 35.0, 39.0, 21.0, 28.0, 21.0, 13.0, 19.0, 18.0, 8.0, 10.0, 10.0, 5.0, 1.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.7578125, -13.3209228515625, -12.884033203125, -12.4471435546875, -12.01025390625, -11.5733642578125, -11.136474609375, -10.6995849609375, -10.2626953125, -9.8258056640625, -9.388916015625, -8.9520263671875, -8.51513671875, -8.0782470703125, -7.641357421875, -7.2044677734375, -6.767578125, -6.3306884765625, -5.893798828125, -5.4569091796875, -5.02001953125, -4.5831298828125, -4.146240234375, -3.7093505859375, -3.2724609375, -2.8355712890625, -2.398681640625, -1.9617919921875, -1.52490234375, -1.0880126953125, -0.651123046875, -0.2142333984375, 0.22265625, 0.6595458984375, 1.096435546875, 1.5333251953125, 1.97021484375, 2.4071044921875, 2.843994140625, 3.2808837890625, 3.7177734375, 4.1546630859375, 4.591552734375, 5.0284423828125, 5.46533203125, 5.9022216796875, 6.339111328125, 6.7760009765625, 7.212890625, 7.6497802734375, 8.086669921875, 8.5235595703125, 8.96044921875, 9.3973388671875, 9.834228515625, 10.2711181640625, 10.7080078125, 11.1448974609375, 11.581787109375, 12.0186767578125, 12.45556640625, 12.8924560546875, 13.329345703125, 13.7662353515625, 14.203125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 7.0, 5.0, 12.0, 10.0, 13.0, 22.0, 34.0, 29.0, 43.0, 50.0, 69.0, 75.0, 128.0, 167.0, 189.0, 242.0, 357.0, 399.0, 373.0, 362.0, 328.0, 272.0, 221.0, 155.0, 133.0, 81.0, 70.0, 42.0, 51.0, 27.0, 32.0, 15.0, 10.0, 12.0, 9.0, 9.0, 1.0, 2.0, 6.0, 3.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.97265625, -8.6875, -8.40234375, -8.1171875, -7.83203125, -7.546875, -7.26171875, -6.9765625, -6.69140625, -6.40625, -6.12109375, -5.8359375, -5.55078125, -5.265625, -4.98046875, -4.6953125, -4.41015625, -4.125, -3.83984375, -3.5546875, -3.26953125, -2.984375, -2.69921875, -2.4140625, -2.12890625, -1.84375, -1.55859375, -1.2734375, -0.98828125, -0.703125, -0.41796875, -0.1328125, 0.15234375, 0.4375, 0.72265625, 1.0078125, 1.29296875, 1.578125, 1.86328125, 2.1484375, 2.43359375, 2.71875, 3.00390625, 3.2890625, 3.57421875, 3.859375, 4.14453125, 4.4296875, 4.71484375, 5.0, 5.28515625, 5.5703125, 5.85546875, 6.140625, 6.42578125, 6.7109375, 6.99609375, 7.28125, 7.56640625, 7.8515625, 8.13671875, 8.421875, 8.70703125, 8.9921875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 13.0, 3.0, 9.0, 13.0, 18.0, 31.0, 30.0, 39.0, 47.0, 70.0, 88.0, 129.0, 146.0, 205.0, 252.0, 384.0, 886.0, 14011.0, 3469605.0, 702230.0, 4118.0, 596.0, 332.0, 227.0, 168.0, 144.0, 95.0, 85.0, 76.0, 51.0, 34.0, 40.0, 28.0, 21.0, 16.0, 5.0, 7.0, 6.0, 2.0, 11.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.96875, -43.64013671875, -42.3115234375, -40.98291015625, -39.654296875, -38.32568359375, -36.9970703125, -35.66845703125, -34.33984375, -33.01123046875, -31.6826171875, -30.35400390625, -29.025390625, -27.69677734375, -26.3681640625, -25.03955078125, -23.7109375, -22.38232421875, -21.0537109375, -19.72509765625, -18.396484375, -17.06787109375, -15.7392578125, -14.41064453125, -13.08203125, -11.75341796875, -10.4248046875, -9.09619140625, -7.767578125, -6.43896484375, -5.1103515625, -3.78173828125, -2.453125, -1.12451171875, 0.2041015625, 1.53271484375, 2.861328125, 4.18994140625, 5.5185546875, 6.84716796875, 8.17578125, 9.50439453125, 10.8330078125, 12.16162109375, 13.490234375, 14.81884765625, 16.1474609375, 17.47607421875, 18.8046875, 20.13330078125, 21.4619140625, 22.79052734375, 24.119140625, 25.44775390625, 26.7763671875, 28.10498046875, 29.43359375, 30.76220703125, 32.0908203125, 33.41943359375, 34.748046875, 36.07666015625, 37.4052734375, 38.73388671875, 40.0625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 11.0, 18.0, 37.0, 45.0, 74.0, 104.0, 95.0, 115.0, 106.0, 118.0, 99.0, 60.0, 57.0, 28.0, 13.0, 8.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.936431884765625, -31.567873001098633, -30.199316024780273, -28.83075714111328, -27.462200164794922, -26.09364128112793, -24.725082397460938, -23.356525421142578, -21.987966537475586, -20.619407653808594, -19.250850677490234, -17.882291793823242, -16.51373291015625, -15.14517593383789, -13.776617050170898, -12.408059120178223, -11.039501190185547, -9.670943260192871, -8.302385330200195, -6.933826446533203, -5.565268516540527, -4.196710586547852, -2.8281517028808594, -1.4595937728881836, -0.09103584289550781, 1.277522325515747, 2.646080493927002, 4.014638900756836, 5.383196830749512, 6.7517547607421875, 8.12031364440918, 9.488871574401855, 10.857425689697266, 12.225983619689941, 13.594541549682617, 14.96310043334961, 16.33165740966797, 17.70021629333496, 19.068775177001953, 20.437332153320312, 21.805891036987305, 23.174449920654297, 24.543006896972656, 25.91156578063965, 27.28012466430664, 28.648681640625, 30.017240524291992, 31.385799407958984, 32.754356384277344, 34.1229133605957, 35.49147415161133, 36.86003112792969, 38.22858810424805, 39.597145080566406, 40.96570587158203, 42.33426284790039, 43.70281982421875, 45.07137680053711, 46.439937591552734, 47.808494567871094, 49.17705154418945, 50.54560852050781, 51.91416931152344, 53.2827262878418, 54.65128707885742]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 5.0, 10.0, 4.0, 5.0, 12.0, 7.0, 16.0, 20.0, 17.0, 14.0, 26.0, 19.0, 28.0, 27.0, 32.0, 29.0, 35.0, 37.0, 35.0, 48.0, 31.0, 44.0, 34.0, 36.0, 35.0, 34.0, 35.0, 41.0, 24.0, 38.0, 29.0, 27.0, 21.0, 17.0, 17.0, 19.0, 18.0, 9.0, 18.0, 9.0, 8.0, 8.0, 3.0, 3.0, 6.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.09229278564453, -31.064437866210938, -30.036582946777344, -29.00872802734375, -27.980873107910156, -26.953018188476562, -25.92516326904297, -24.897308349609375, -23.86945343017578, -22.841598510742188, -21.813743591308594, -20.785888671875, -19.758033752441406, -18.730178833007812, -17.70232391357422, -16.674468994140625, -15.646614074707031, -14.618759155273438, -13.590904235839844, -12.56304931640625, -11.535194396972656, -10.507339477539062, -9.479484558105469, -8.451629638671875, -7.423774719238281, -6.3959197998046875, -5.368064880371094, -4.3402099609375, -3.3123550415039062, -2.2845001220703125, -1.2566452026367188, -0.228790283203125, 0.7990646362304688, 1.8269195556640625, 2.8547744750976562, 3.88262939453125, 4.910484313964844, 5.9383392333984375, 6.966194152832031, 7.994049072265625, 9.021903991699219, 10.049758911132812, 11.077613830566406, 12.10546875, 13.133323669433594, 14.161178588867188, 15.189033508300781, 16.216888427734375, 17.24474334716797, 18.272598266601562, 19.300453186035156, 20.32830810546875, 21.356163024902344, 22.384017944335938, 23.41187286376953, 24.439727783203125, 25.46758270263672, 26.495437622070312, 27.523292541503906, 28.5511474609375, 29.579002380371094, 30.606857299804688, 31.63471221923828, 32.662567138671875, 33.69042205810547]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 2.0, 7.0, 10.0, 9.0, 13.0, 18.0, 15.0, 23.0, 20.0, 14.0, 29.0, 26.0, 37.0, 32.0, 24.0, 44.0, 43.0, 36.0, 43.0, 33.0, 52.0, 38.0, 47.0, 43.0, 42.0, 29.0, 32.0, 31.0, 31.0, 26.0, 14.0, 24.0, 19.0, 15.0, 16.0, 8.0, 14.0, 11.0, 8.0, 5.0, 2.0, 4.0, 1.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.703125, -5.54095458984375, -5.3787841796875, -5.21661376953125, -5.054443359375, -4.89227294921875, -4.7301025390625, -4.56793212890625, -4.40576171875, -4.24359130859375, -4.0814208984375, -3.91925048828125, -3.757080078125, -3.59490966796875, -3.4327392578125, -3.27056884765625, -3.1083984375, -2.94622802734375, -2.7840576171875, -2.62188720703125, -2.459716796875, -2.29754638671875, -2.1353759765625, -1.97320556640625, -1.81103515625, -1.64886474609375, -1.4866943359375, -1.32452392578125, -1.162353515625, -1.00018310546875, -0.8380126953125, -0.67584228515625, -0.513671875, -0.35150146484375, -0.1893310546875, -0.02716064453125, 0.135009765625, 0.29718017578125, 0.4593505859375, 0.62152099609375, 0.78369140625, 0.94586181640625, 1.1080322265625, 1.27020263671875, 1.432373046875, 1.59454345703125, 1.7567138671875, 1.91888427734375, 2.0810546875, 2.24322509765625, 2.4053955078125, 2.56756591796875, 2.729736328125, 2.89190673828125, 3.0540771484375, 3.21624755859375, 3.37841796875, 3.54058837890625, 3.7027587890625, 3.86492919921875, 4.027099609375, 4.18927001953125, 4.3514404296875, 4.51361083984375, 4.67578125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 1.0, 14.0, 5.0, 11.0, 23.0, 25.0, 54.0, 73.0, 98.0, 163.0, 280.0, 409.0, 579.0, 790.0, 1133.0, 1603.0, 2387.0, 3344.0, 4882.0, 7184.0, 10448.0, 15888.0, 24413.0, 38303.0, 60910.0, 101705.0, 169350.0, 209978.0, 150240.0, 89455.0, 54109.0, 33871.0, 21791.0, 14173.0, 9667.0, 6793.0, 4585.0, 3116.0, 2050.0, 1426.0, 999.0, 705.0, 454.0, 340.0, 222.0, 126.0, 123.0, 76.0, 67.0, 34.0, 28.0, 19.0, 22.0, 6.0, 8.0, 1.0, 2.0], "bins": [-0.69970703125, -0.679351806640625, -0.65899658203125, -0.638641357421875, -0.6182861328125, -0.597930908203125, -0.57757568359375, -0.557220458984375, -0.536865234375, -0.516510009765625, -0.49615478515625, -0.475799560546875, -0.4554443359375, -0.435089111328125, -0.41473388671875, -0.394378662109375, -0.3740234375, -0.353668212890625, -0.33331298828125, -0.312957763671875, -0.2926025390625, -0.272247314453125, -0.25189208984375, -0.231536865234375, -0.211181640625, -0.190826416015625, -0.17047119140625, -0.150115966796875, -0.1297607421875, -0.109405517578125, -0.08905029296875, -0.068695068359375, -0.04833984375, -0.027984619140625, -0.00762939453125, 0.012725830078125, 0.0330810546875, 0.053436279296875, 0.07379150390625, 0.094146728515625, 0.114501953125, 0.134857177734375, 0.15521240234375, 0.175567626953125, 0.1959228515625, 0.216278076171875, 0.23663330078125, 0.256988525390625, 0.27734375, 0.297698974609375, 0.31805419921875, 0.338409423828125, 0.3587646484375, 0.379119873046875, 0.39947509765625, 0.419830322265625, 0.440185546875, 0.460540771484375, 0.48089599609375, 0.501251220703125, 0.5216064453125, 0.541961669921875, 0.56231689453125, 0.582672119140625, 0.60302734375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 8.0, 11.0, 8.0, 14.0, 7.0, 13.0, 16.0, 22.0, 25.0, 26.0, 33.0, 27.0, 31.0, 29.0, 23.0, 29.0, 39.0, 47.0, 43.0, 43.0, 1064.0, 39.0, 37.0, 34.0, 23.0, 33.0, 39.0, 31.0, 28.0, 24.0, 24.0, 24.0, 19.0, 15.0, 14.0, 14.0, 11.0, 14.0, 8.0, 6.0, 8.0, 6.0, 2.0, 5.0, 2.0, 0.0, 3.0], "bins": [-3.62890625, -3.531341552734375, -3.43377685546875, -3.336212158203125, -3.2386474609375, -3.141082763671875, -3.04351806640625, -2.945953369140625, -2.848388671875, -2.750823974609375, -2.65325927734375, -2.555694580078125, -2.4581298828125, -2.360565185546875, -2.26300048828125, -2.165435791015625, -2.06787109375, -1.970306396484375, -1.87274169921875, -1.775177001953125, -1.6776123046875, -1.580047607421875, -1.48248291015625, -1.384918212890625, -1.287353515625, -1.189788818359375, -1.09222412109375, -0.994659423828125, -0.8970947265625, -0.799530029296875, -0.70196533203125, -0.604400634765625, -0.5068359375, -0.409271240234375, -0.31170654296875, -0.214141845703125, -0.1165771484375, -0.019012451171875, 0.07855224609375, 0.176116943359375, 0.273681640625, 0.371246337890625, 0.46881103515625, 0.566375732421875, 0.6639404296875, 0.761505126953125, 0.85906982421875, 0.956634521484375, 1.05419921875, 1.151763916015625, 1.24932861328125, 1.346893310546875, 1.4444580078125, 1.542022705078125, 1.63958740234375, 1.737152099609375, 1.834716796875, 1.932281494140625, 2.02984619140625, 2.127410888671875, 2.2249755859375, 2.322540283203125, 2.42010498046875, 2.517669677734375, 2.615234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 12.0, 8.0, 8.0, 18.0, 33.0, 50.0, 62.0, 91.0, 143.0, 220.0, 379.0, 591.0, 946.0, 1561.0, 2542.0, 4224.0, 7150.0, 12628.0, 23002.0, 42090.0, 79174.0, 151165.0, 1287787.0, 216355.0, 122861.0, 64728.0, 34763.0, 18684.0, 10523.0, 6013.0, 3559.0, 2113.0, 1290.0, 842.0, 538.0, 342.0, 244.0, 137.0, 96.0, 45.0, 38.0, 34.0, 18.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.64990234375, -0.6301116943359375, -0.610321044921875, -0.5905303955078125, -0.57073974609375, -0.5509490966796875, -0.531158447265625, -0.5113677978515625, -0.4915771484375, -0.4717864990234375, -0.451995849609375, -0.4322052001953125, -0.41241455078125, -0.3926239013671875, -0.372833251953125, -0.3530426025390625, -0.333251953125, -0.3134613037109375, -0.293670654296875, -0.2738800048828125, -0.25408935546875, -0.2342987060546875, -0.214508056640625, -0.1947174072265625, -0.1749267578125, -0.1551361083984375, -0.135345458984375, -0.1155548095703125, -0.09576416015625, -0.0759735107421875, -0.056182861328125, -0.0363922119140625, -0.0166015625, 0.0031890869140625, 0.022979736328125, 0.0427703857421875, 0.06256103515625, 0.0823516845703125, 0.102142333984375, 0.1219329833984375, 0.1417236328125, 0.1615142822265625, 0.181304931640625, 0.2010955810546875, 0.22088623046875, 0.2406768798828125, 0.260467529296875, 0.2802581787109375, 0.300048828125, 0.3198394775390625, 0.339630126953125, 0.3594207763671875, 0.37921142578125, 0.3990020751953125, 0.418792724609375, 0.4385833740234375, 0.4583740234375, 0.4781646728515625, 0.497955322265625, 0.5177459716796875, 0.53753662109375, 0.5573272705078125, 0.577117919921875, 0.5969085693359375, 0.61669921875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 11.0, 12.0, 10.0, 11.0, 13.0, 25.0, 10.0, 22.0, 27.0, 30.0, 39.0, 42.0, 38.0, 39.0, 57.0, 56.0, 48.0, 58.0, 57.0, 46.0, 41.0, 50.0, 37.0, 32.0, 35.0, 27.0, 15.0, 24.0, 14.0, 8.0, 10.0, 10.0, 12.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.002185821533203125, -0.002126649022102356, -0.002067476511001587, -0.002008303999900818, -0.0019491314888000488, -0.0018899589776992798, -0.0018307864665985107, -0.0017716139554977417, -0.0017124414443969727, -0.0016532689332962036, -0.0015940964221954346, -0.0015349239110946655, -0.0014757513999938965, -0.0014165788888931274, -0.0013574063777923584, -0.0012982338666915894, -0.0012390613555908203, -0.0011798888444900513, -0.0011207163333892822, -0.0010615438222885132, -0.0010023713111877441, -0.0009431988000869751, -0.0008840262889862061, -0.000824853777885437, -0.000765681266784668, -0.0007065087556838989, -0.0006473362445831299, -0.0005881637334823608, -0.0005289912223815918, -0.00046981871128082275, -0.0004106462001800537, -0.00035147368907928467, -0.0002923011779785156, -0.00023312866687774658, -0.00017395615577697754, -0.0001147836446762085, -5.561113357543945e-05, 3.56137752532959e-06, 6.273388862609863e-05, 0.00012190639972686768, 0.00018107891082763672, 0.00024025142192840576, 0.0002994239330291748, 0.00035859644412994385, 0.0004177689552307129, 0.00047694146633148193, 0.000536113977432251, 0.00059528648853302, 0.0006544589996337891, 0.0007136315107345581, 0.0007728040218353271, 0.0008319765329360962, 0.0008911490440368652, 0.0009503215551376343, 0.0010094940662384033, 0.0010686665773391724, 0.0011278390884399414, 0.0011870115995407104, 0.0012461841106414795, 0.0013053566217422485, 0.0013645291328430176, 0.0014237016439437866, 0.0014828741550445557, 0.0015420466661453247, 0.0016012191772460938]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 3.0, 7.0, 11.0, 21.0, 22.0, 20.0, 29.0, 29.0, 42.0, 66.0, 58.0, 85.0, 127.0, 209.0, 439.0, 1140.0, 29294.0, 1001116.0, 13762.0, 937.0, 383.0, 175.0, 128.0, 99.0, 58.0, 52.0, 51.0, 39.0, 29.0, 22.0, 19.0, 10.0, 12.0, 12.0, 9.0, 10.0, 6.0, 4.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.034637451171875, -0.033374786376953125, -0.03211212158203125, -0.030849456787109375, -0.0295867919921875, -0.028324127197265625, -0.02706146240234375, -0.025798797607421875, -0.0245361328125, -0.023273468017578125, -0.02201080322265625, -0.020748138427734375, -0.0194854736328125, -0.018222808837890625, -0.01696014404296875, -0.015697479248046875, -0.014434814453125, -0.013172149658203125, -0.01190948486328125, -0.010646820068359375, -0.0093841552734375, -0.008121490478515625, -0.00685882568359375, -0.005596160888671875, -0.00433349609375, -0.003070831298828125, -0.00180816650390625, -0.000545501708984375, 0.0007171630859375, 0.001979827880859375, 0.00324249267578125, 0.004505157470703125, 0.005767822265625, 0.007030487060546875, 0.00829315185546875, 0.009555816650390625, 0.0108184814453125, 0.012081146240234375, 0.01334381103515625, 0.014606475830078125, 0.015869140625, 0.017131805419921875, 0.01839447021484375, 0.019657135009765625, 0.0209197998046875, 0.022182464599609375, 0.02344512939453125, 0.024707794189453125, 0.025970458984375, 0.027233123779296875, 0.02849578857421875, 0.029758453369140625, 0.0310211181640625, 0.032283782958984375, 0.03354644775390625, 0.034809112548828125, 0.03607177734375, 0.037334442138671875, 0.03859710693359375, 0.039859771728515625, 0.0411224365234375, 0.042385101318359375, 0.04364776611328125, 0.044910430908203125, 0.046173095703125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 35.0, 958.0, 23.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03621470928192139, -0.03551113232970238, -0.034807559102773666, -0.03410398215055466, -0.03340040519833565, -0.03269682824611664, -0.03199325501918793, -0.03128967806696892, -0.03058610111474991, -0.02988252602517605, -0.02917894907295704, -0.02847537398338318, -0.02777179703116417, -0.02706822194159031, -0.02636464685201645, -0.02566106989979744, -0.02495749481022358, -0.02425391972064972, -0.02355034276843071, -0.02284676767885685, -0.02214319072663784, -0.02143961563706398, -0.02073603868484497, -0.02003246359527111, -0.01932888850569725, -0.01862531341612339, -0.01792173646390438, -0.01721816137433052, -0.01651458442211151, -0.01581100933253765, -0.015107433311641216, -0.014403857290744781, -0.013700282201170921, -0.012996706180274487, -0.012293130159378052, -0.011589555069804192, -0.010885978117585182, -0.010182403028011322, -0.009478827007114887, -0.008775250986218452, -0.008071674965322018, -0.007368098944425583, -0.006664522923529148, -0.005960947368294001, -0.005257371347397566, -0.004553795326501131, -0.0038502197712659836, -0.003146643750369549, -0.002443067729473114, -0.001739491824992001, -0.001035915920510888, -0.00033234013244509697, 0.0003712358884513378, 0.0010748119093477726, 0.00177838746458292, 0.002481963485479355, 0.0031855395063757896, 0.0038891155272722244, 0.004592691548168659, 0.005296267103403807, 0.0059998431243002415, 0.006703419145196676, 0.007406994700431824, 0.008110570721328259, 0.008814146742224693]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 2.0, 6.0, 2.0, 9.0, 7.0, 9.0, 15.0, 15.0, 19.0, 29.0, 32.0, 30.0, 43.0, 48.0, 41.0, 58.0, 63.0, 61.0, 48.0, 51.0, 49.0, 50.0, 55.0, 50.0, 41.0, 38.0, 23.0, 28.0, 17.0, 12.0, 14.0, 14.0, 5.0, 6.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000955045223236084, -0.0009106993675231934, -0.0008663535118103027, -0.0008220076560974121, -0.0007776618003845215, -0.0007333159446716309, -0.0006889700889587402, -0.0006446242332458496, -0.000600278377532959, -0.0005559325218200684, -0.0005115866661071777, -0.0004672408103942871, -0.0004228949546813965, -0.00037854909896850586, -0.00033420324325561523, -0.0002898573875427246, -0.000245511531829834, -0.00020116567611694336, -0.00015681982040405273, -0.00011247396469116211, -6.812810897827148e-05, -2.378225326538086e-05, 2.0563602447509766e-05, 6.490945816040039e-05, 0.00010925531387329102, 0.00015360116958618164, 0.00019794702529907227, 0.0002422928810119629, 0.0002866387367248535, 0.00033098459243774414, 0.00037533044815063477, 0.0004196763038635254, 0.000464022159576416, 0.0005083680152893066, 0.0005527138710021973, 0.0005970597267150879, 0.0006414055824279785, 0.0006857514381408691, 0.0007300972938537598, 0.0007744431495666504, 0.000818789005279541, 0.0008631348609924316, 0.0009074807167053223, 0.0009518265724182129, 0.0009961724281311035, 0.0010405182838439941, 0.0010848641395568848, 0.0011292099952697754, 0.001173555850982666, 0.0012179017066955566, 0.0012622475624084473, 0.0013065934181213379, 0.0013509392738342285, 0.0013952851295471191, 0.0014396309852600098, 0.0014839768409729004, 0.001528322696685791, 0.0015726685523986816, 0.0016170144081115723, 0.0016613602638244629, 0.0017057061195373535, 0.0017500519752502441, 0.0017943978309631348, 0.0018387436866760254, 0.001883089542388916]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 2.0, 7.0, 10.0, 9.0, 13.0, 18.0, 15.0, 23.0, 20.0, 14.0, 29.0, 26.0, 37.0, 32.0, 24.0, 44.0, 43.0, 36.0, 43.0, 33.0, 52.0, 38.0, 47.0, 43.0, 42.0, 29.0, 32.0, 31.0, 31.0, 26.0, 14.0, 24.0, 19.0, 15.0, 16.0, 8.0, 14.0, 11.0, 8.0, 5.0, 2.0, 4.0, 1.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.703125, -5.54095458984375, -5.3787841796875, -5.21661376953125, -5.054443359375, -4.89227294921875, -4.7301025390625, -4.56793212890625, -4.40576171875, -4.24359130859375, -4.0814208984375, -3.91925048828125, -3.757080078125, -3.59490966796875, -3.4327392578125, -3.27056884765625, -3.1083984375, -2.94622802734375, -2.7840576171875, -2.62188720703125, -2.459716796875, -2.29754638671875, -2.1353759765625, -1.97320556640625, -1.81103515625, -1.64886474609375, -1.4866943359375, -1.32452392578125, -1.162353515625, -1.00018310546875, -0.8380126953125, -0.67584228515625, -0.513671875, -0.35150146484375, -0.1893310546875, -0.02716064453125, 0.135009765625, 0.29718017578125, 0.4593505859375, 0.62152099609375, 0.78369140625, 0.94586181640625, 1.1080322265625, 1.27020263671875, 1.432373046875, 1.59454345703125, 1.7567138671875, 1.91888427734375, 2.0810546875, 2.24322509765625, 2.4053955078125, 2.56756591796875, 2.729736328125, 2.89190673828125, 3.0540771484375, 3.21624755859375, 3.37841796875, 3.54058837890625, 3.7027587890625, 3.86492919921875, 4.027099609375, 4.18927001953125, 4.3514404296875, 4.51361083984375, 4.67578125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 3.0, 8.0, 10.0, 15.0, 33.0, 26.0, 28.0, 62.0, 81.0, 94.0, 150.0, 274.0, 387.0, 708.0, 1530.0, 3003.0, 7127.0, 20471.0, 72841.0, 304327.0, 470563.0, 118014.0, 30724.0, 9897.0, 4008.0, 1896.0, 901.0, 512.0, 290.0, 188.0, 109.0, 76.0, 49.0, 27.0, 25.0, 20.0, 20.0, 18.0, 11.0, 6.0, 4.0, 4.0, 1.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.50390625, -5.347412109375, -5.19091796875, -5.034423828125, -4.8779296875, -4.721435546875, -4.56494140625, -4.408447265625, -4.251953125, -4.095458984375, -3.93896484375, -3.782470703125, -3.6259765625, -3.469482421875, -3.31298828125, -3.156494140625, -3.0, -2.843505859375, -2.68701171875, -2.530517578125, -2.3740234375, -2.217529296875, -2.06103515625, -1.904541015625, -1.748046875, -1.591552734375, -1.43505859375, -1.278564453125, -1.1220703125, -0.965576171875, -0.80908203125, -0.652587890625, -0.49609375, -0.339599609375, -0.18310546875, -0.026611328125, 0.1298828125, 0.286376953125, 0.44287109375, 0.599365234375, 0.755859375, 0.912353515625, 1.06884765625, 1.225341796875, 1.3818359375, 1.538330078125, 1.69482421875, 1.851318359375, 2.0078125, 2.164306640625, 2.32080078125, 2.477294921875, 2.6337890625, 2.790283203125, 2.94677734375, 3.103271484375, 3.259765625, 3.416259765625, 3.57275390625, 3.729248046875, 3.8857421875, 4.042236328125, 4.19873046875, 4.355224609375, 4.51171875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 6.0, 7.0, 4.0, 8.0, 10.0, 5.0, 14.0, 17.0, 15.0, 22.0, 21.0, 25.0, 38.0, 33.0, 38.0, 51.0, 35.0, 49.0, 73.0, 154.0, 1685.0, 263.0, 75.0, 48.0, 45.0, 35.0, 37.0, 29.0, 21.0, 27.0, 41.0, 17.0, 16.0, 23.0, 9.0, 11.0, 11.0, 10.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.578125, -18.00927734375, -17.4404296875, -16.87158203125, -16.302734375, -15.73388671875, -15.1650390625, -14.59619140625, -14.02734375, -13.45849609375, -12.8896484375, -12.32080078125, -11.751953125, -11.18310546875, -10.6142578125, -10.04541015625, -9.4765625, -8.90771484375, -8.3388671875, -7.77001953125, -7.201171875, -6.63232421875, -6.0634765625, -5.49462890625, -4.92578125, -4.35693359375, -3.7880859375, -3.21923828125, -2.650390625, -2.08154296875, -1.5126953125, -0.94384765625, -0.375, 0.19384765625, 0.7626953125, 1.33154296875, 1.900390625, 2.46923828125, 3.0380859375, 3.60693359375, 4.17578125, 4.74462890625, 5.3134765625, 5.88232421875, 6.451171875, 7.02001953125, 7.5888671875, 8.15771484375, 8.7265625, 9.29541015625, 9.8642578125, 10.43310546875, 11.001953125, 11.57080078125, 12.1396484375, 12.70849609375, 13.27734375, 13.84619140625, 14.4150390625, 14.98388671875, 15.552734375, 16.12158203125, 16.6904296875, 17.25927734375, 17.828125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 3.0, 6.0, 9.0, 14.0, 21.0, 22.0, 35.0, 34.0, 74.0, 94.0, 120.0, 209.0, 304.0, 584.0, 2475.0, 2533494.0, 604698.0, 2002.0, 559.0, 299.0, 185.0, 140.0, 97.0, 52.0, 42.0, 32.0, 24.0, 20.0, 12.0, 8.0, 7.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.46875, -47.76025390625, -46.0517578125, -44.34326171875, -42.634765625, -40.92626953125, -39.2177734375, -37.50927734375, -35.80078125, -34.09228515625, -32.3837890625, -30.67529296875, -28.966796875, -27.25830078125, -25.5498046875, -23.84130859375, -22.1328125, -20.42431640625, -18.7158203125, -17.00732421875, -15.298828125, -13.59033203125, -11.8818359375, -10.17333984375, -8.46484375, -6.75634765625, -5.0478515625, -3.33935546875, -1.630859375, 0.07763671875, 1.7861328125, 3.49462890625, 5.203125, 6.91162109375, 8.6201171875, 10.32861328125, 12.037109375, 13.74560546875, 15.4541015625, 17.16259765625, 18.87109375, 20.57958984375, 22.2880859375, 23.99658203125, 25.705078125, 27.41357421875, 29.1220703125, 30.83056640625, 32.5390625, 34.24755859375, 35.9560546875, 37.66455078125, 39.373046875, 41.08154296875, 42.7900390625, 44.49853515625, 46.20703125, 47.91552734375, 49.6240234375, 51.33251953125, 53.041015625, 54.74951171875, 56.4580078125, 58.16650390625, 59.875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 3.0, 1004.0, 11.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.21566390991211, -16.800312042236328, -6.38496208190918, 4.030387878417969, 14.44573974609375, 24.86109161376953, 35.27643966674805, 45.69179153442383, 56.10714340209961, 66.52249145507812, 76.9378433227539, 87.35319519042969, 97.76854705810547, 108.18389892578125, 118.5992431640625, 129.0146026611328, 139.42994689941406, 149.8452911376953, 160.26065063476562, 170.67599487304688, 181.0913543701172, 191.50669860839844, 201.92205810546875, 212.33740234375, 222.7527618408203, 233.16810607910156, 243.58346557617188, 253.99880981445312, 264.4141540527344, 274.82952880859375, 285.244873046875, 295.66021728515625, 306.0755920410156, 316.4909362792969, 326.9062805175781, 337.3216552734375, 347.73699951171875, 358.15234375, 368.56768798828125, 378.9830322265625, 389.3984069824219, 399.8137512207031, 410.2290954589844, 420.64447021484375, 431.059814453125, 441.47515869140625, 451.8905029296875, 462.30584716796875, 472.72119140625, 483.13653564453125, 493.5518798828125, 503.9672546386719, 514.382568359375, 524.7979736328125, 535.2133178710938, 545.628662109375, 556.0440063476562, 566.4593505859375, 576.8746948242188, 587.2900390625, 597.7053833007812, 608.1207885742188, 618.5361328125, 628.9514770507812, 639.3668212890625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 4.0, 7.0, 5.0, 6.0, 4.0, 8.0, 17.0, 16.0, 27.0, 21.0, 28.0, 17.0, 28.0, 36.0, 37.0, 45.0, 32.0, 37.0, 37.0, 44.0, 40.0, 42.0, 36.0, 41.0, 46.0, 43.0, 29.0, 35.0, 29.0, 24.0, 29.0, 29.0, 21.0, 18.0, 14.0, 17.0, 6.0, 7.0, 13.0, 9.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.68431854248047, -48.079673767089844, -46.475032806396484, -44.87038803100586, -43.2657470703125, -41.661102294921875, -40.05645751953125, -38.45181655883789, -36.847171783447266, -35.24252700805664, -33.63788604736328, -32.033241271972656, -30.428598403930664, -28.823955535888672, -27.21931266784668, -25.614669799804688, -24.010026931762695, -22.405384063720703, -20.80074119567871, -19.19609832763672, -17.591453552246094, -15.986810684204102, -14.38216781616211, -12.7775239944458, -11.172881126403809, -9.568238258361816, -7.963594436645508, -6.358951568603516, -4.754308223724365, -3.149664878845215, -1.5450220108032227, 0.05962181091308594, 1.6642646789550781, 3.2689080238342285, 4.873551368713379, 6.478194236755371, 8.08283805847168, 9.687480926513672, 11.292123794555664, 12.896767616271973, 14.501410484313965, 16.106054306030273, 17.710697174072266, 19.315340042114258, 20.91998291015625, 22.524627685546875, 24.129268646240234, 25.73391342163086, 27.33855628967285, 28.943199157714844, 30.547842025756836, 32.15248489379883, 33.75712966918945, 35.36177062988281, 36.96641540527344, 38.57106018066406, 40.17570114135742, 41.78034591674805, 43.384986877441406, 44.98963165283203, 46.59427261352539, 48.198917388916016, 49.803558349609375, 51.408203125, 53.012847900390625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 9.0, 5.0, 5.0, 5.0, 13.0, 8.0, 16.0, 24.0, 22.0, 10.0, 26.0, 20.0, 23.0, 33.0, 37.0, 33.0, 43.0, 43.0, 36.0, 38.0, 45.0, 40.0, 50.0, 47.0, 29.0, 35.0, 41.0, 34.0, 28.0, 26.0, 21.0, 18.0, 23.0, 19.0, 22.0, 10.0, 18.0, 12.0, 10.0, 2.0, 8.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.5234375, -5.3568115234375, -5.190185546875, -5.0235595703125, -4.85693359375, -4.6903076171875, -4.523681640625, -4.3570556640625, -4.1904296875, -4.0238037109375, -3.857177734375, -3.6905517578125, -3.52392578125, -3.3572998046875, -3.190673828125, -3.0240478515625, -2.857421875, -2.6907958984375, -2.524169921875, -2.3575439453125, -2.19091796875, -2.0242919921875, -1.857666015625, -1.6910400390625, -1.5244140625, -1.3577880859375, -1.191162109375, -1.0245361328125, -0.85791015625, -0.6912841796875, -0.524658203125, -0.3580322265625, -0.19140625, -0.0247802734375, 0.141845703125, 0.3084716796875, 0.47509765625, 0.6417236328125, 0.808349609375, 0.9749755859375, 1.1416015625, 1.3082275390625, 1.474853515625, 1.6414794921875, 1.80810546875, 1.9747314453125, 2.141357421875, 2.3079833984375, 2.474609375, 2.6412353515625, 2.807861328125, 2.9744873046875, 3.14111328125, 3.3077392578125, 3.474365234375, 3.6409912109375, 3.8076171875, 3.9742431640625, 4.140869140625, 4.3074951171875, 4.47412109375, 4.6407470703125, 4.807373046875, 4.9739990234375, 5.140625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 4.0, 5.0, 14.0, 8.0, 19.0, 19.0, 22.0, 25.0, 22.0, 35.0, 43.0, 46.0, 58.0, 81.0, 101.0, 158.0, 237.0, 443.0, 1048.0, 3939.0, 21826.0, 259746.0, 2247692.0, 1522723.0, 118231.0, 12930.0, 2739.0, 878.0, 354.0, 197.0, 129.0, 95.0, 73.0, 59.0, 43.0, 46.0, 24.0, 39.0, 31.0, 23.0, 16.0, 10.0, 10.0, 6.0, 8.0, 7.0, 1.0, 6.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0], "bins": [-12.7265625, -12.3271484375, -11.927734375, -11.5283203125, -11.12890625, -10.7294921875, -10.330078125, -9.9306640625, -9.53125, -9.1318359375, -8.732421875, -8.3330078125, -7.93359375, -7.5341796875, -7.134765625, -6.7353515625, -6.3359375, -5.9365234375, -5.537109375, -5.1376953125, -4.73828125, -4.3388671875, -3.939453125, -3.5400390625, -3.140625, -2.7412109375, -2.341796875, -1.9423828125, -1.54296875, -1.1435546875, -0.744140625, -0.3447265625, 0.0546875, 0.4541015625, 0.853515625, 1.2529296875, 1.65234375, 2.0517578125, 2.451171875, 2.8505859375, 3.25, 3.6494140625, 4.048828125, 4.4482421875, 4.84765625, 5.2470703125, 5.646484375, 6.0458984375, 6.4453125, 6.8447265625, 7.244140625, 7.6435546875, 8.04296875, 8.4423828125, 8.841796875, 9.2412109375, 9.640625, 10.0400390625, 10.439453125, 10.8388671875, 11.23828125, 11.6376953125, 12.037109375, 12.4365234375, 12.8359375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 8.0, 12.0, 12.0, 23.0, 31.0, 34.0, 51.0, 53.0, 96.0, 126.0, 178.0, 247.0, 345.0, 449.0, 495.0, 438.0, 393.0, 313.0, 177.0, 154.0, 134.0, 57.0, 69.0, 46.0, 30.0, 24.0, 20.0, 13.0, 7.0, 10.0, 7.0, 9.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.231689453125, -7.88525390625, -7.538818359375, -7.1923828125, -6.845947265625, -6.49951171875, -6.153076171875, -5.806640625, -5.460205078125, -5.11376953125, -4.767333984375, -4.4208984375, -4.074462890625, -3.72802734375, -3.381591796875, -3.03515625, -2.688720703125, -2.34228515625, -1.995849609375, -1.6494140625, -1.302978515625, -0.95654296875, -0.610107421875, -0.263671875, 0.082763671875, 0.42919921875, 0.775634765625, 1.1220703125, 1.468505859375, 1.81494140625, 2.161376953125, 2.5078125, 2.854248046875, 3.20068359375, 3.547119140625, 3.8935546875, 4.239990234375, 4.58642578125, 4.932861328125, 5.279296875, 5.625732421875, 5.97216796875, 6.318603515625, 6.6650390625, 7.011474609375, 7.35791015625, 7.704345703125, 8.05078125, 8.397216796875, 8.74365234375, 9.090087890625, 9.4365234375, 9.782958984375, 10.12939453125, 10.475830078125, 10.822265625, 11.168701171875, 11.51513671875, 11.861572265625, 12.2080078125, 12.554443359375, 12.90087890625, 13.247314453125, 13.59375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 6.0, 14.0, 13.0, 18.0, 17.0, 25.0, 36.0, 44.0, 61.0, 93.0, 114.0, 149.0, 199.0, 244.0, 342.0, 596.0, 6030.0, 3808409.0, 374606.0, 1519.0, 496.0, 333.0, 209.0, 163.0, 156.0, 82.0, 81.0, 46.0, 57.0, 30.0, 22.0, 26.0, 18.0, 11.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-61.71875, -60.0419921875, -58.365234375, -56.6884765625, -55.01171875, -53.3349609375, -51.658203125, -49.9814453125, -48.3046875, -46.6279296875, -44.951171875, -43.2744140625, -41.59765625, -39.9208984375, -38.244140625, -36.5673828125, -34.890625, -33.2138671875, -31.537109375, -29.8603515625, -28.18359375, -26.5068359375, -24.830078125, -23.1533203125, -21.4765625, -19.7998046875, -18.123046875, -16.4462890625, -14.76953125, -13.0927734375, -11.416015625, -9.7392578125, -8.0625, -6.3857421875, -4.708984375, -3.0322265625, -1.35546875, 0.3212890625, 1.998046875, 3.6748046875, 5.3515625, 7.0283203125, 8.705078125, 10.3818359375, 12.05859375, 13.7353515625, 15.412109375, 17.0888671875, 18.765625, 20.4423828125, 22.119140625, 23.7958984375, 25.47265625, 27.1494140625, 28.826171875, 30.5029296875, 32.1796875, 33.8564453125, 35.533203125, 37.2099609375, 38.88671875, 40.5634765625, 42.240234375, 43.9169921875, 45.59375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 19.0, 125.0, 527.0, 316.0, 30.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.33722686767578, -102.78571319580078, -96.23420715332031, -89.68269348144531, -83.13117980957031, -76.57967376708984, -70.02816009521484, -63.47665023803711, -56.925140380859375, -50.37363052368164, -43.822120666503906, -37.270606994628906, -30.719097137451172, -24.167587280273438, -17.616073608398438, -11.064563751220703, -4.513053894042969, 2.038456916809082, 8.589967727661133, 15.1414794921875, 21.692989349365234, 28.24449920654297, 34.79601287841797, 41.3475227355957, 47.89903259277344, 54.45054244995117, 61.002052307128906, 67.5535659790039, 74.10507202148438, 80.65658569335938, 87.20809936523438, 93.75961303710938, 100.31112670898438, 106.86264038085938, 113.41414642333984, 119.96566009521484, 126.51716613769531, 133.0686798095703, 139.6201934814453, 146.1717071533203, 152.72320556640625, 159.27471923828125, 165.82623291015625, 172.37774658203125, 178.9292449951172, 185.4807586669922, 192.0322723388672, 198.5837860107422, 205.1352996826172, 211.6868133544922, 218.2383270263672, 224.78982543945312, 231.34133911132812, 237.89285278320312, 244.44436645507812, 250.99588012695312, 257.5473937988281, 264.0989074707031, 270.6504211425781, 277.2019348144531, 283.7534484863281, 290.304931640625, 296.8564453125, 303.407958984375, 309.95947265625]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 2.0, 6.0, 11.0, 6.0, 16.0, 9.0, 13.0, 26.0, 14.0, 21.0, 24.0, 22.0, 23.0, 24.0, 34.0, 27.0, 39.0, 36.0, 36.0, 52.0, 56.0, 46.0, 38.0, 35.0, 45.0, 35.0, 38.0, 36.0, 24.0, 20.0, 30.0, 28.0, 25.0, 15.0, 12.0, 17.0, 14.0, 11.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-37.34490966796875, -36.23625946044922, -35.12760925292969, -34.018959045410156, -32.910308837890625, -31.80165672302246, -30.693004608154297, -29.584354400634766, -28.475704193115234, -27.367053985595703, -26.258403778076172, -25.149751663208008, -24.041101455688477, -22.932451248168945, -21.82379913330078, -20.71514892578125, -19.60649871826172, -18.497848510742188, -17.389198303222656, -16.280546188354492, -15.171895980834961, -14.06324577331543, -12.954594612121582, -11.845943450927734, -10.737293243408203, -9.628643035888672, -8.519991874694824, -7.411341190338135, -6.302690505981445, -5.194039821624756, -4.085389137268066, -2.976738452911377, -1.8680877685546875, -0.759437084197998, 0.3492136001586914, 1.4578642845153809, 2.5665149688720703, 3.6751656532287598, 4.783816337585449, 5.892467021942139, 7.001117706298828, 8.10976791381836, 9.218419075012207, 10.327070236206055, 11.435720443725586, 12.544370651245117, 13.653021812438965, 14.761672973632812, 15.870323181152344, 16.978973388671875, 18.087623596191406, 19.19627571105957, 20.3049259185791, 21.413576126098633, 22.522228240966797, 23.630878448486328, 24.73952865600586, 25.84817886352539, 26.956829071044922, 28.065481185913086, 29.174131393432617, 30.28278160095215, 31.391433715820312, 32.500083923339844, 33.608734130859375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 10.0, 6.0, 12.0, 22.0, 10.0, 15.0, 21.0, 25.0, 23.0, 18.0, 26.0, 32.0, 23.0, 29.0, 30.0, 32.0, 42.0, 40.0, 38.0, 34.0, 31.0, 43.0, 43.0, 40.0, 27.0, 16.0, 32.0, 41.0, 18.0, 26.0, 27.0, 26.0, 18.0, 15.0, 16.0, 13.0, 10.0, 9.0, 10.0, 13.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.671875, -4.526611328125, -4.38134765625, -4.236083984375, -4.0908203125, -3.945556640625, -3.80029296875, -3.655029296875, -3.509765625, -3.364501953125, -3.21923828125, -3.073974609375, -2.9287109375, -2.783447265625, -2.63818359375, -2.492919921875, -2.34765625, -2.202392578125, -2.05712890625, -1.911865234375, -1.7666015625, -1.621337890625, -1.47607421875, -1.330810546875, -1.185546875, -1.040283203125, -0.89501953125, -0.749755859375, -0.6044921875, -0.459228515625, -0.31396484375, -0.168701171875, -0.0234375, 0.121826171875, 0.26708984375, 0.412353515625, 0.5576171875, 0.702880859375, 0.84814453125, 0.993408203125, 1.138671875, 1.283935546875, 1.42919921875, 1.574462890625, 1.7197265625, 1.864990234375, 2.01025390625, 2.155517578125, 2.30078125, 2.446044921875, 2.59130859375, 2.736572265625, 2.8818359375, 3.027099609375, 3.17236328125, 3.317626953125, 3.462890625, 3.608154296875, 3.75341796875, 3.898681640625, 4.0439453125, 4.189208984375, 4.33447265625, 4.479736328125, 4.625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 4.0, 12.0, 17.0, 29.0, 40.0, 54.0, 86.0, 122.0, 194.0, 265.0, 437.0, 562.0, 895.0, 1354.0, 2100.0, 2997.0, 4568.0, 6866.0, 10777.0, 16516.0, 26236.0, 42613.0, 73164.0, 129326.0, 210061.0, 207301.0, 126241.0, 70735.0, 41969.0, 25780.0, 16534.0, 10366.0, 6884.0, 4438.0, 2972.0, 2016.0, 1304.0, 897.0, 586.0, 423.0, 266.0, 167.0, 129.0, 82.0, 63.0, 37.0, 25.0, 14.0, 13.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.68115234375, -0.6591644287109375, -0.637176513671875, -0.6151885986328125, -0.59320068359375, -0.5712127685546875, -0.549224853515625, -0.5272369384765625, -0.5052490234375, -0.4832611083984375, -0.461273193359375, -0.4392852783203125, -0.41729736328125, -0.3953094482421875, -0.373321533203125, -0.3513336181640625, -0.329345703125, -0.3073577880859375, -0.285369873046875, -0.2633819580078125, -0.24139404296875, -0.2194061279296875, -0.197418212890625, -0.1754302978515625, -0.1534423828125, -0.1314544677734375, -0.109466552734375, -0.0874786376953125, -0.06549072265625, -0.0435028076171875, -0.021514892578125, 0.0004730224609375, 0.0224609375, 0.0444488525390625, 0.066436767578125, 0.0884246826171875, 0.11041259765625, 0.1324005126953125, 0.154388427734375, 0.1763763427734375, 0.1983642578125, 0.2203521728515625, 0.242340087890625, 0.2643280029296875, 0.28631591796875, 0.3083038330078125, 0.330291748046875, 0.3522796630859375, 0.374267578125, 0.3962554931640625, 0.418243408203125, 0.4402313232421875, 0.46221923828125, 0.4842071533203125, 0.506195068359375, 0.5281829833984375, 0.5501708984375, 0.5721588134765625, 0.594146728515625, 0.6161346435546875, 0.63812255859375, 0.6601104736328125, 0.682098388671875, 0.7040863037109375, 0.72607421875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 3.0, 4.0, 11.0, 11.0, 3.0, 12.0, 8.0, 16.0, 17.0, 25.0, 24.0, 27.0, 41.0, 24.0, 34.0, 37.0, 51.0, 35.0, 51.0, 38.0, 47.0, 1066.0, 45.0, 36.0, 46.0, 42.0, 30.0, 29.0, 29.0, 29.0, 19.0, 19.0, 24.0, 17.0, 19.0, 11.0, 10.0, 7.0, 2.0, 7.0, 6.0, 8.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.198974609375, -3.08544921875, -2.971923828125, -2.8583984375, -2.744873046875, -2.63134765625, -2.517822265625, -2.404296875, -2.290771484375, -2.17724609375, -2.063720703125, -1.9501953125, -1.836669921875, -1.72314453125, -1.609619140625, -1.49609375, -1.382568359375, -1.26904296875, -1.155517578125, -1.0419921875, -0.928466796875, -0.81494140625, -0.701416015625, -0.587890625, -0.474365234375, -0.36083984375, -0.247314453125, -0.1337890625, -0.020263671875, 0.09326171875, 0.206787109375, 0.3203125, 0.433837890625, 0.54736328125, 0.660888671875, 0.7744140625, 0.887939453125, 1.00146484375, 1.114990234375, 1.228515625, 1.342041015625, 1.45556640625, 1.569091796875, 1.6826171875, 1.796142578125, 1.90966796875, 2.023193359375, 2.13671875, 2.250244140625, 2.36376953125, 2.477294921875, 2.5908203125, 2.704345703125, 2.81787109375, 2.931396484375, 3.044921875, 3.158447265625, 3.27197265625, 3.385498046875, 3.4990234375, 3.612548828125, 3.72607421875, 3.839599609375, 3.953125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 14.0, 24.0, 26.0, 36.0, 49.0, 85.0, 146.0, 221.0, 298.0, 519.0, 837.0, 1309.0, 2011.0, 3260.0, 5034.0, 8227.0, 13573.0, 21872.0, 36436.0, 60063.0, 101874.0, 166994.0, 1259746.0, 163842.0, 99929.0, 59143.0, 35438.0, 21571.0, 12990.0, 7913.0, 4995.0, 3178.0, 1939.0, 1259.0, 765.0, 537.0, 345.0, 233.0, 127.0, 97.0, 57.0, 39.0, 25.0, 15.0, 14.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.5380859375, -0.52099609375, -0.50390625, -0.48681640625, -0.4697265625, -0.45263671875, -0.435546875, -0.41845703125, -0.4013671875, -0.38427734375, -0.3671875, -0.35009765625, -0.3330078125, -0.31591796875, -0.298828125, -0.28173828125, -0.2646484375, -0.24755859375, -0.23046875, -0.21337890625, -0.1962890625, -0.17919921875, -0.162109375, -0.14501953125, -0.1279296875, -0.11083984375, -0.09375, -0.07666015625, -0.0595703125, -0.04248046875, -0.025390625, -0.00830078125, 0.0087890625, 0.02587890625, 0.04296875, 0.06005859375, 0.0771484375, 0.09423828125, 0.111328125, 0.12841796875, 0.1455078125, 0.16259765625, 0.1796875, 0.19677734375, 0.2138671875, 0.23095703125, 0.248046875, 0.26513671875, 0.2822265625, 0.29931640625, 0.31640625, 0.33349609375, 0.3505859375, 0.36767578125, 0.384765625, 0.40185546875, 0.4189453125, 0.43603515625, 0.453125, 0.47021484375, 0.4873046875, 0.50439453125, 0.521484375, 0.53857421875, 0.5556640625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 2.0, 10.0, 11.0, 16.0, 28.0, 31.0, 51.0, 61.0, 68.0, 74.0, 115.0, 118.0, 94.0, 81.0, 62.0, 52.0, 42.0, 26.0, 17.0, 11.0, 8.0, 5.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.00383758544921875, -0.0037343502044677734, -0.003631114959716797, -0.0035278797149658203, -0.0034246444702148438, -0.003321409225463867, -0.0032181739807128906, -0.003114938735961914, -0.0030117034912109375, -0.002908468246459961, -0.0028052330017089844, -0.002701997756958008, -0.0025987625122070312, -0.0024955272674560547, -0.002392292022705078, -0.0022890567779541016, -0.002185821533203125, -0.0020825862884521484, -0.001979351043701172, -0.0018761157989501953, -0.0017728805541992188, -0.0016696453094482422, -0.0015664100646972656, -0.001463174819946289, -0.0013599395751953125, -0.001256704330444336, -0.0011534690856933594, -0.0010502338409423828, -0.0009469985961914062, -0.0008437633514404297, -0.0007405281066894531, -0.0006372928619384766, -0.0005340576171875, -0.00043082237243652344, -0.0003275871276855469, -0.0002243518829345703, -0.00012111663818359375, -1.7881393432617188e-05, 8.535385131835938e-05, 0.00018858909606933594, 0.0002918243408203125, 0.00039505958557128906, 0.0004982948303222656, 0.0006015300750732422, 0.0007047653198242188, 0.0008080005645751953, 0.0009112358093261719, 0.0010144710540771484, 0.001117706298828125, 0.0012209415435791016, 0.0013241767883300781, 0.0014274120330810547, 0.0015306472778320312, 0.0016338825225830078, 0.0017371177673339844, 0.001840353012084961, 0.0019435882568359375, 0.002046823501586914, 0.0021500587463378906, 0.002253293991088867, 0.0023565292358398438, 0.0024597644805908203, 0.002562999725341797, 0.0026662349700927734, 0.00276947021484375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 13.0, 10.0, 18.0, 28.0, 26.0, 27.0, 79.0, 88.0, 105.0, 237.0, 747.0, 131584.0, 913597.0, 1223.0, 260.0, 166.0, 102.0, 51.0, 36.0, 39.0, 34.0, 16.0, 10.0, 12.0, 10.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053619384765625, -0.05156564712524414, -0.04951190948486328, -0.04745817184448242, -0.04540443420410156, -0.0433506965637207, -0.041296958923339844, -0.039243221282958984, -0.037189483642578125, -0.035135746002197266, -0.033082008361816406, -0.031028270721435547, -0.028974533081054688, -0.026920795440673828, -0.02486705780029297, -0.02281332015991211, -0.02075958251953125, -0.01870584487915039, -0.01665210723876953, -0.014598369598388672, -0.012544631958007812, -0.010490894317626953, -0.008437156677246094, -0.006383419036865234, -0.004329681396484375, -0.0022759437561035156, -0.00022220611572265625, 0.0018315315246582031, 0.0038852691650390625, 0.005939006805419922, 0.007992744445800781, 0.01004648208618164, 0.0121002197265625, 0.01415395736694336, 0.01620769500732422, 0.018261432647705078, 0.020315170288085938, 0.022368907928466797, 0.024422645568847656, 0.026476383209228516, 0.028530120849609375, 0.030583858489990234, 0.032637596130371094, 0.03469133377075195, 0.03674507141113281, 0.03879880905151367, 0.04085254669189453, 0.04290628433227539, 0.04496002197265625, 0.04701375961303711, 0.04906749725341797, 0.05112123489379883, 0.05317497253417969, 0.05522871017456055, 0.057282447814941406, 0.059336185455322266, 0.061389923095703125, 0.06344366073608398, 0.06549739837646484, 0.0675511360168457, 0.06960487365722656, 0.07165861129760742, 0.07371234893798828, 0.07576608657836914, 0.07781982421875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 17.0, 76.0, 247.0, 429.0, 196.0, 38.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020997445099055767, -0.001942525035701692, -0.0017853055614978075, -0.001628085970878601, -0.0014708664966747165, -0.0013136470224708319, -0.0011564274318516254, -0.0009992079576477408, -0.0008419884834438562, -0.0006847690092399716, -0.0005275494768284261, -0.00037032997352071106, -0.000213110470212996, -5.5890996009111404e-05, 0.00010132853640243411, 0.0002585480688139796, 0.00041576754301786423, 0.0005729870172217488, 0.0007302065496332943, 0.0008874260820448399, 0.0010446455562487245, 0.001201865030452609, 0.0013590846210718155, 0.0015163040952757, 0.0016735235694795847, 0.0018307430436834693, 0.001987962517887354, 0.0021451821085065603, 0.0023024016991257668, 0.0024596210569143295, 0.002616840647533536, 0.0027740602381527424, 0.002931279130280018, 0.0030884987208992243, 0.003245718078687787, 0.0034029376693069935, 0.0035601570270955563, 0.0037173766177147627, 0.003874596208333969, 0.004031815566122532, 0.004189034923911095, 0.0043462542816996574, 0.0045034741051495075, 0.00466069346293807, 0.004817912820726633, 0.004975132644176483, 0.005132352001965046, 0.005289571359753609, 0.005446791183203459, 0.0056040105409920216, 0.005761230364441872, 0.005918449722230434, 0.006075669080018997, 0.00623288843780756, 0.00639010826125741, 0.006547327619045973, 0.006704547442495823, 0.006861766800284386, 0.007018986623734236, 0.0071762059815227985, 0.007333425339311361, 0.007490645162761211, 0.007647864520549774, 0.007805083878338337, 0.0079623032361269]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 9.0, 5.0, 4.0, 3.0, 3.0, 7.0, 8.0, 8.0, 18.0, 13.0, 15.0, 25.0, 26.0, 28.0, 26.0, 27.0, 34.0, 35.0, 34.0, 41.0, 40.0, 38.0, 58.0, 36.0, 37.0, 61.0, 46.0, 27.0, 49.0, 34.0, 32.0, 32.0, 25.0, 21.0, 19.0, 14.0, 15.0, 6.0, 10.0, 7.0, 3.0, 7.0, 3.0, 8.0, 12.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0012882351875305176, -0.0012522926554083824, -0.0012163501232862473, -0.001180407591164112, -0.001144465059041977, -0.0011085225269198418, -0.0010725799947977066, -0.0010366374626755714, -0.0010006949305534363, -0.0009647523984313011, -0.000928809866309166, -0.0008928673341870308, -0.0008569248020648956, -0.0008209822699427605, -0.0007850397378206253, -0.0007490972056984901, -0.000713154673576355, -0.0006772121414542198, -0.0006412696093320847, -0.0006053270772099495, -0.0005693845450878143, -0.0005334420129656792, -0.000497499480843544, -0.00046155694872140884, -0.0004256144165992737, -0.0003896718844771385, -0.00035372935235500336, -0.0003177868202328682, -0.00028184428811073303, -0.00024590175598859787, -0.0002099592238664627, -0.00017401669174432755, -0.00013807415962219238, -0.00010213162750005722, -6.618909537792206e-05, -3.0246563255786896e-05, 5.695968866348267e-06, 4.163850098848343e-05, 7.758103311061859e-05, 0.00011352356523275375, 0.00014946609735488892, 0.00018540862947702408, 0.00022135116159915924, 0.0002572936937212944, 0.00029323622584342957, 0.00032917875796556473, 0.0003651212900876999, 0.00040106382220983505, 0.0004370063543319702, 0.0004729488864541054, 0.0005088914185762405, 0.0005448339506983757, 0.0005807764828205109, 0.000616719014942646, 0.0006526615470647812, 0.0006886040791869164, 0.0007245466113090515, 0.0007604891434311867, 0.0007964316755533218, 0.000832374207675457, 0.0008683167397975922, 0.0009042592719197273, 0.0009402018040418625, 0.0009761443361639977, 0.0010120868682861328]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 5.0, 9.0, 6.0, 12.0, 22.0, 10.0, 15.0, 21.0, 25.0, 23.0, 18.0, 27.0, 31.0, 23.0, 29.0, 30.0, 32.0, 42.0, 40.0, 38.0, 34.0, 31.0, 43.0, 43.0, 40.0, 27.0, 16.0, 32.0, 41.0, 18.0, 26.0, 27.0, 26.0, 18.0, 15.0, 16.0, 13.0, 10.0, 9.0, 10.0, 13.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.671875, -4.526611328125, -4.38134765625, -4.236083984375, -4.0908203125, -3.945556640625, -3.80029296875, -3.655029296875, -3.509765625, -3.364501953125, -3.21923828125, -3.073974609375, -2.9287109375, -2.783447265625, -2.63818359375, -2.492919921875, -2.34765625, -2.202392578125, -2.05712890625, -1.911865234375, -1.7666015625, -1.621337890625, -1.47607421875, -1.330810546875, -1.185546875, -1.040283203125, -0.89501953125, -0.749755859375, -0.6044921875, -0.459228515625, -0.31396484375, -0.168701171875, -0.0234375, 0.121826171875, 0.26708984375, 0.412353515625, 0.5576171875, 0.702880859375, 0.84814453125, 0.993408203125, 1.138671875, 1.283935546875, 1.42919921875, 1.574462890625, 1.7197265625, 1.864990234375, 2.01025390625, 2.155517578125, 2.30078125, 2.446044921875, 2.59130859375, 2.736572265625, 2.8818359375, 3.027099609375, 3.17236328125, 3.317626953125, 3.462890625, 3.608154296875, 3.75341796875, 3.898681640625, 4.0439453125, 4.189208984375, 4.33447265625, 4.479736328125, 4.625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 2.0, 3.0, 0.0, 5.0, 6.0, 10.0, 10.0, 12.0, 19.0, 24.0, 30.0, 43.0, 76.0, 118.0, 234.0, 391.0, 717.0, 1266.0, 2344.0, 4497.0, 8878.0, 17892.0, 39031.0, 91389.0, 229988.0, 372269.0, 158668.0, 64371.0, 28452.0, 13532.0, 6610.0, 3503.0, 1777.0, 996.0, 532.0, 342.0, 191.0, 110.0, 64.0, 48.0, 23.0, 20.0, 17.0, 9.0, 6.0, 7.0, 7.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0], "bins": [-3.458984375, -3.351898193359375, -3.24481201171875, -3.137725830078125, -3.0306396484375, -2.923553466796875, -2.81646728515625, -2.709381103515625, -2.602294921875, -2.495208740234375, -2.38812255859375, -2.281036376953125, -2.1739501953125, -2.066864013671875, -1.95977783203125, -1.852691650390625, -1.74560546875, -1.638519287109375, -1.53143310546875, -1.424346923828125, -1.3172607421875, -1.210174560546875, -1.10308837890625, -0.996002197265625, -0.888916015625, -0.781829833984375, -0.67474365234375, -0.567657470703125, -0.4605712890625, -0.353485107421875, -0.24639892578125, -0.139312744140625, -0.0322265625, 0.074859619140625, 0.18194580078125, 0.289031982421875, 0.3961181640625, 0.503204345703125, 0.61029052734375, 0.717376708984375, 0.824462890625, 0.931549072265625, 1.03863525390625, 1.145721435546875, 1.2528076171875, 1.359893798828125, 1.46697998046875, 1.574066162109375, 1.68115234375, 1.788238525390625, 1.89532470703125, 2.002410888671875, 2.1094970703125, 2.216583251953125, 2.32366943359375, 2.430755615234375, 2.537841796875, 2.644927978515625, 2.75201416015625, 2.859100341796875, 2.9661865234375, 3.073272705078125, 3.18035888671875, 3.287445068359375, 3.39453125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 8.0, 13.0, 3.0, 27.0, 19.0, 14.0, 13.0, 23.0, 35.0, 26.0, 38.0, 46.0, 50.0, 51.0, 87.0, 164.0, 1587.0, 300.0, 92.0, 59.0, 64.0, 49.0, 45.0, 25.0, 33.0, 26.0, 23.0, 31.0, 21.0, 12.0, 10.0, 7.0, 7.0, 7.0, 3.0, 4.0, 6.0, 5.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.984375, -17.417236328125, -16.85009765625, -16.282958984375, -15.7158203125, -15.148681640625, -14.58154296875, -14.014404296875, -13.447265625, -12.880126953125, -12.31298828125, -11.745849609375, -11.1787109375, -10.611572265625, -10.04443359375, -9.477294921875, -8.91015625, -8.343017578125, -7.77587890625, -7.208740234375, -6.6416015625, -6.074462890625, -5.50732421875, -4.940185546875, -4.373046875, -3.805908203125, -3.23876953125, -2.671630859375, -2.1044921875, -1.537353515625, -0.97021484375, -0.403076171875, 0.1640625, 0.731201171875, 1.29833984375, 1.865478515625, 2.4326171875, 2.999755859375, 3.56689453125, 4.134033203125, 4.701171875, 5.268310546875, 5.83544921875, 6.402587890625, 6.9697265625, 7.536865234375, 8.10400390625, 8.671142578125, 9.23828125, 9.805419921875, 10.37255859375, 10.939697265625, 11.5068359375, 12.073974609375, 12.64111328125, 13.208251953125, 13.775390625, 14.342529296875, 14.90966796875, 15.476806640625, 16.0439453125, 16.611083984375, 17.17822265625, 17.745361328125, 18.3125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 0.0, 4.0, 6.0, 6.0, 6.0, 6.0, 9.0, 9.0, 11.0, 19.0, 29.0, 37.0, 48.0, 58.0, 64.0, 72.0, 123.0, 148.0, 237.0, 341.0, 680.0, 3343.0, 2052661.0, 1082959.0, 3023.0, 625.0, 326.0, 233.0, 139.0, 131.0, 99.0, 56.0, 40.0, 22.0, 23.0, 33.0, 21.0, 8.0, 21.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.21875, -42.8779296875, -41.537109375, -40.1962890625, -38.85546875, -37.5146484375, -36.173828125, -34.8330078125, -33.4921875, -32.1513671875, -30.810546875, -29.4697265625, -28.12890625, -26.7880859375, -25.447265625, -24.1064453125, -22.765625, -21.4248046875, -20.083984375, -18.7431640625, -17.40234375, -16.0615234375, -14.720703125, -13.3798828125, -12.0390625, -10.6982421875, -9.357421875, -8.0166015625, -6.67578125, -5.3349609375, -3.994140625, -2.6533203125, -1.3125, 0.0283203125, 1.369140625, 2.7099609375, 4.05078125, 5.3916015625, 6.732421875, 8.0732421875, 9.4140625, 10.7548828125, 12.095703125, 13.4365234375, 14.77734375, 16.1181640625, 17.458984375, 18.7998046875, 20.140625, 21.4814453125, 22.822265625, 24.1630859375, 25.50390625, 26.8447265625, 28.185546875, 29.5263671875, 30.8671875, 32.2080078125, 33.548828125, 34.8896484375, 36.23046875, 37.5712890625, 38.912109375, 40.2529296875, 41.59375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 139.0, 506.0, 322.0, 38.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.318716049194336, -15.096857070922852, -12.874998092651367, -10.653138160705566, -8.431279182434082, -6.209420204162598, -3.987560272216797, -1.7657012939453125, 0.4561576843261719, 2.6780169010162354, 4.899876117706299, 7.121735572814941, 9.343594551086426, 11.56545352935791, 13.787313461303711, 16.009172439575195, 18.23103141784668, 20.452890396118164, 22.67474937438965, 24.896610260009766, 27.11846923828125, 29.340328216552734, 31.56218719482422, 33.7840461730957, 36.00590515136719, 38.22776412963867, 40.449623107910156, 42.67148208618164, 44.893341064453125, 47.11520004272461, 49.337059020996094, 51.558921813964844, 53.78077697753906, 56.00263595581055, 58.22449493408203, 60.446353912353516, 62.668212890625, 64.89007568359375, 67.11193084716797, 69.33379364013672, 71.55564880371094, 73.77751159667969, 75.9993667602539, 78.22122955322266, 80.44308471679688, 82.66494750976562, 84.88680267333984, 87.1086654663086, 89.33052062988281, 91.55238342285156, 93.77423858642578, 95.99610137939453, 98.21795654296875, 100.4398193359375, 102.66167449951172, 104.88353729248047, 107.10540008544922, 109.32726287841797, 111.54911804199219, 113.77098083496094, 115.99283599853516, 118.2146987915039, 120.43655395507812, 122.65841674804688, 124.8802719116211]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 6.0, 8.0, 6.0, 8.0, 12.0, 9.0, 12.0, 10.0, 22.0, 25.0, 33.0, 26.0, 33.0, 20.0, 24.0, 36.0, 35.0, 42.0, 38.0, 32.0, 35.0, 26.0, 30.0, 39.0, 32.0, 43.0, 38.0, 29.0, 28.0, 21.0, 23.0, 23.0, 31.0, 10.0, 20.0, 21.0, 18.0, 14.0, 15.0, 14.0, 11.0, 6.0, 7.0, 6.0, 3.0, 3.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-38.85610580444336, -37.63048553466797, -36.40486145019531, -35.17924118041992, -33.95362091064453, -32.72800064086914, -31.502378463745117, -30.276756286621094, -29.051136016845703, -27.825515747070312, -26.59989356994629, -25.374271392822266, -24.148651123046875, -22.923030853271484, -21.69740867614746, -20.471786499023438, -19.246166229248047, -18.020545959472656, -16.794923782348633, -15.569302558898926, -14.343681335449219, -13.118060111999512, -11.892438888549805, -10.666817665100098, -9.44119644165039, -8.215575218200684, -6.989953994750977, -5.7643327713012695, -4.5387115478515625, -3.3130903244018555, -2.0874691009521484, -0.8618478775024414, 0.36377716064453125, 1.5893983840942383, 2.8150196075439453, 4.040640830993652, 5.266262054443359, 6.491883277893066, 7.717504501342773, 8.94312572479248, 10.168746948242188, 11.394368171691895, 12.619989395141602, 13.845610618591309, 15.071231842041016, 16.296852111816406, 17.52247428894043, 18.748096466064453, 19.973716735839844, 21.199337005615234, 22.424959182739258, 23.65058135986328, 24.876201629638672, 26.101821899414062, 27.327444076538086, 28.55306625366211, 29.7786865234375, 31.00430679321289, 32.22992706298828, 33.45555114746094, 34.68117141723633, 35.90679168701172, 37.132415771484375, 38.358036041259766, 39.583656311035156]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 4.0, 9.0, 14.0, 10.0, 9.0, 14.0, 14.0, 19.0, 35.0, 23.0, 28.0, 19.0, 25.0, 33.0, 38.0, 41.0, 24.0, 37.0, 33.0, 40.0, 46.0, 34.0, 44.0, 31.0, 34.0, 24.0, 24.0, 37.0, 25.0, 34.0, 14.0, 29.0, 24.0, 24.0, 12.0, 10.0, 8.0, 17.0, 11.0, 14.0, 8.0, 4.0, 5.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.8828125, -4.72821044921875, -4.5736083984375, -4.41900634765625, -4.264404296875, -4.10980224609375, -3.9552001953125, -3.80059814453125, -3.64599609375, -3.49139404296875, -3.3367919921875, -3.18218994140625, -3.027587890625, -2.87298583984375, -2.7183837890625, -2.56378173828125, -2.4091796875, -2.25457763671875, -2.0999755859375, -1.94537353515625, -1.790771484375, -1.63616943359375, -1.4815673828125, -1.32696533203125, -1.17236328125, -1.01776123046875, -0.8631591796875, -0.70855712890625, -0.553955078125, -0.39935302734375, -0.2447509765625, -0.09014892578125, 0.064453125, 0.21905517578125, 0.3736572265625, 0.52825927734375, 0.682861328125, 0.83746337890625, 0.9920654296875, 1.14666748046875, 1.30126953125, 1.45587158203125, 1.6104736328125, 1.76507568359375, 1.919677734375, 2.07427978515625, 2.2288818359375, 2.38348388671875, 2.5380859375, 2.69268798828125, 2.8472900390625, 3.00189208984375, 3.156494140625, 3.31109619140625, 3.4656982421875, 3.62030029296875, 3.77490234375, 3.92950439453125, 4.0841064453125, 4.23870849609375, 4.393310546875, 4.54791259765625, 4.7025146484375, 4.85711669921875, 5.01171875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 7.0, 7.0, 9.0, 12.0, 13.0, 12.0, 11.0, 19.0, 22.0, 26.0, 31.0, 38.0, 46.0, 61.0, 133.0, 294.0, 543.0, 1902.0, 9547.0, 128996.0, 2484533.0, 1501858.0, 57332.0, 6230.0, 1378.0, 510.0, 260.0, 120.0, 61.0, 43.0, 36.0, 27.0, 14.0, 25.0, 18.0, 17.0, 12.0, 17.0, 14.0, 6.0, 7.0, 9.0, 6.0, 5.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.9453125, -15.4288330078125, -14.912353515625, -14.3958740234375, -13.87939453125, -13.3629150390625, -12.846435546875, -12.3299560546875, -11.8134765625, -11.2969970703125, -10.780517578125, -10.2640380859375, -9.74755859375, -9.2310791015625, -8.714599609375, -8.1981201171875, -7.681640625, -7.1651611328125, -6.648681640625, -6.1322021484375, -5.61572265625, -5.0992431640625, -4.582763671875, -4.0662841796875, -3.5498046875, -3.0333251953125, -2.516845703125, -2.0003662109375, -1.48388671875, -0.9674072265625, -0.450927734375, 0.0655517578125, 0.58203125, 1.0985107421875, 1.614990234375, 2.1314697265625, 2.64794921875, 3.1644287109375, 3.680908203125, 4.1973876953125, 4.7138671875, 5.2303466796875, 5.746826171875, 6.2633056640625, 6.77978515625, 7.2962646484375, 7.812744140625, 8.3292236328125, 8.845703125, 9.3621826171875, 9.878662109375, 10.3951416015625, 10.91162109375, 11.4281005859375, 11.944580078125, 12.4610595703125, 12.9775390625, 13.4940185546875, 14.010498046875, 14.5269775390625, 15.04345703125, 15.5599365234375, 16.076416015625, 16.5928955078125, 17.109375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 7.0, 13.0, 18.0, 17.0, 37.0, 51.0, 65.0, 100.0, 164.0, 212.0, 342.0, 447.0, 616.0, 559.0, 434.0, 298.0, 206.0, 158.0, 111.0, 55.0, 56.0, 31.0, 26.0, 16.0, 10.0, 8.0, 4.0, 1.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.5234375, -15.1141357421875, -14.704833984375, -14.2955322265625, -13.88623046875, -13.4769287109375, -13.067626953125, -12.6583251953125, -12.2490234375, -11.8397216796875, -11.430419921875, -11.0211181640625, -10.61181640625, -10.2025146484375, -9.793212890625, -9.3839111328125, -8.974609375, -8.5653076171875, -8.156005859375, -7.7467041015625, -7.33740234375, -6.9281005859375, -6.518798828125, -6.1094970703125, -5.7001953125, -5.2908935546875, -4.881591796875, -4.4722900390625, -4.06298828125, -3.6536865234375, -3.244384765625, -2.8350830078125, -2.42578125, -2.0164794921875, -1.607177734375, -1.1978759765625, -0.78857421875, -0.3792724609375, 0.030029296875, 0.4393310546875, 0.8486328125, 1.2579345703125, 1.667236328125, 2.0765380859375, 2.48583984375, 2.8951416015625, 3.304443359375, 3.7137451171875, 4.123046875, 4.5323486328125, 4.941650390625, 5.3509521484375, 5.76025390625, 6.1695556640625, 6.578857421875, 6.9881591796875, 7.3974609375, 7.8067626953125, 8.216064453125, 8.6253662109375, 9.03466796875, 9.4439697265625, 9.853271484375, 10.2625732421875, 10.671875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 11.0, 7.0, 17.0, 24.0, 36.0, 56.0, 76.0, 102.0, 166.0, 241.0, 325.0, 473.0, 1738.0, 2380961.0, 1806839.0, 1692.0, 495.0, 279.0, 225.0, 151.0, 122.0, 84.0, 52.0, 36.0, 28.0, 22.0, 13.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.875, -64.716796875, -62.55859375, -60.400390625, -58.2421875, -56.083984375, -53.92578125, -51.767578125, -49.609375, -47.451171875, -45.29296875, -43.134765625, -40.9765625, -38.818359375, -36.66015625, -34.501953125, -32.34375, -30.185546875, -28.02734375, -25.869140625, -23.7109375, -21.552734375, -19.39453125, -17.236328125, -15.078125, -12.919921875, -10.76171875, -8.603515625, -6.4453125, -4.287109375, -2.12890625, 0.029296875, 2.1875, 4.345703125, 6.50390625, 8.662109375, 10.8203125, 12.978515625, 15.13671875, 17.294921875, 19.453125, 21.611328125, 23.76953125, 25.927734375, 28.0859375, 30.244140625, 32.40234375, 34.560546875, 36.71875, 38.876953125, 41.03515625, 43.193359375, 45.3515625, 47.509765625, 49.66796875, 51.826171875, 53.984375, 56.142578125, 58.30078125, 60.458984375, 62.6171875, 64.775390625, 66.93359375, 69.091796875, 71.25]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 15.0, 150.0, 313.0, 374.0, 133.0, 27.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.8953399658203, -167.4841766357422, -163.072998046875, -158.66183471679688, -154.2506561279297, -149.83949279785156, -145.42831420898438, -141.01715087890625, -136.60598754882812, -132.19482421875, -127.78364562988281, -123.37247467041016, -118.9613037109375, -114.55014038085938, -110.13896942138672, -105.72779846191406, -101.31661987304688, -96.90544891357422, -92.49427795410156, -88.0831069946289, -83.67193603515625, -79.26077270507812, -74.84960174560547, -70.43843078613281, -66.02725982666016, -61.6160888671875, -57.204917907714844, -52.79375076293945, -48.3825798034668, -43.97140884399414, -39.56024169921875, -35.149070739746094, -30.737884521484375, -26.32671356201172, -21.915544509887695, -17.504375457763672, -13.093204498291016, -8.68203353881836, -4.270864486694336, 0.1403045654296875, 4.551475524902344, 8.962645530700684, 13.373815536499023, 17.784984588623047, 22.196155548095703, 26.60732650756836, 31.018495559692383, 35.429664611816406, 39.84083557128906, 44.25200653076172, 48.663177490234375, 53.074344635009766, 57.48551559448242, 61.89668655395508, 66.30785369873047, 70.71902465820312, 75.13019561767578, 79.54136657714844, 83.9525375366211, 88.36370849609375, 92.77487182617188, 97.18605041503906, 101.59721374511719, 106.00838470458984, 110.4195556640625]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 9.0, 3.0, 2.0, 8.0, 7.0, 14.0, 15.0, 14.0, 16.0, 20.0, 21.0, 24.0, 13.0, 21.0, 31.0, 33.0, 24.0, 34.0, 27.0, 25.0, 33.0, 39.0, 50.0, 46.0, 44.0, 37.0, 28.0, 42.0, 37.0, 30.0, 26.0, 27.0, 26.0, 17.0, 17.0, 19.0, 26.0, 17.0, 13.0, 15.0, 8.0, 15.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-32.211605072021484, -31.25213050842285, -30.29265785217285, -29.33318328857422, -28.373708724975586, -27.414234161376953, -26.454761505126953, -25.49528694152832, -24.535812377929688, -23.576337814331055, -22.616865158081055, -21.657390594482422, -20.69791603088379, -19.738441467285156, -18.778968811035156, -17.819494247436523, -16.86001968383789, -15.900546073913574, -14.941071510314941, -13.981597900390625, -13.022123336791992, -12.062649726867676, -11.10317611694336, -10.143701553344727, -9.184228897094727, -8.22475528717041, -7.265280723571777, -6.305807113647461, -5.346332550048828, -4.386858940124512, -3.427384853363037, -2.4679107666015625, -1.5084362030029297, -0.5489621758460999, 0.41051185131073, 1.369985818862915, 2.3294599056243896, 3.288933753967285, 4.24840784072876, 5.207881927490234, 6.167356014251709, 7.126830101013184, 8.0863037109375, 9.045778274536133, 10.00525188446045, 10.964725494384766, 11.924200057983398, 12.883674621582031, 13.843148231506348, 14.802621841430664, 15.762096405029297, 16.72157096862793, 17.68104362487793, 18.640518188476562, 19.599992752075195, 20.559467315673828, 21.518939971923828, 22.47841453552246, 23.43788719177246, 24.397361755371094, 25.356836318969727, 26.31631088256836, 27.27578353881836, 28.235258102416992, 29.194732666015625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 9.0, 5.0, 11.0, 11.0, 7.0, 9.0, 15.0, 20.0, 21.0, 27.0, 26.0, 19.0, 33.0, 35.0, 30.0, 26.0, 37.0, 40.0, 36.0, 45.0, 42.0, 36.0, 39.0, 42.0, 40.0, 38.0, 19.0, 35.0, 30.0, 28.0, 33.0, 22.0, 18.0, 17.0, 15.0, 19.0, 9.0, 10.0, 10.0, 12.0, 5.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.08984375, -4.93060302734375, -4.7713623046875, -4.61212158203125, -4.452880859375, -4.29364013671875, -4.1343994140625, -3.97515869140625, -3.81591796875, -3.65667724609375, -3.4974365234375, -3.33819580078125, -3.178955078125, -3.01971435546875, -2.8604736328125, -2.70123291015625, -2.5419921875, -2.38275146484375, -2.2235107421875, -2.06427001953125, -1.905029296875, -1.74578857421875, -1.5865478515625, -1.42730712890625, -1.26806640625, -1.10882568359375, -0.9495849609375, -0.79034423828125, -0.631103515625, -0.47186279296875, -0.3126220703125, -0.15338134765625, 0.005859375, 0.16510009765625, 0.3243408203125, 0.48358154296875, 0.642822265625, 0.80206298828125, 0.9613037109375, 1.12054443359375, 1.27978515625, 1.43902587890625, 1.5982666015625, 1.75750732421875, 1.916748046875, 2.07598876953125, 2.2352294921875, 2.39447021484375, 2.5537109375, 2.71295166015625, 2.8721923828125, 3.03143310546875, 3.190673828125, 3.34991455078125, 3.5091552734375, 3.66839599609375, 3.82763671875, 3.98687744140625, 4.1461181640625, 4.30535888671875, 4.464599609375, 4.62384033203125, 4.7830810546875, 4.94232177734375, 5.1015625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 7.0, 7.0, 6.0, 10.0, 30.0, 31.0, 66.0, 78.0, 125.0, 168.0, 226.0, 348.0, 507.0, 659.0, 953.0, 1333.0, 1930.0, 2742.0, 4001.0, 5730.0, 8002.0, 11863.0, 18048.0, 27550.0, 43047.0, 67855.0, 109272.0, 166491.0, 188395.0, 140193.0, 88111.0, 55328.0, 34726.0, 22698.0, 15370.0, 9985.0, 6825.0, 4697.0, 3250.0, 2343.0, 1644.0, 1180.0, 825.0, 583.0, 408.0, 294.0, 185.0, 159.0, 82.0, 62.0, 65.0, 24.0, 14.0, 14.0, 10.0, 4.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.6044921875, -0.5857620239257812, -0.5670318603515625, -0.5483016967773438, -0.529571533203125, -0.5108413696289062, -0.4921112060546875, -0.47338104248046875, -0.45465087890625, -0.43592071533203125, -0.4171905517578125, -0.39846038818359375, -0.379730224609375, -0.36100006103515625, -0.3422698974609375, -0.32353973388671875, -0.3048095703125, -0.28607940673828125, -0.2673492431640625, -0.24861907958984375, -0.229888916015625, -0.21115875244140625, -0.1924285888671875, -0.17369842529296875, -0.15496826171875, -0.13623809814453125, -0.1175079345703125, -0.09877777099609375, -0.080047607421875, -0.06131744384765625, -0.0425872802734375, -0.02385711669921875, -0.005126953125, 0.01360321044921875, 0.0323333740234375, 0.05106353759765625, 0.069793701171875, 0.08852386474609375, 0.1072540283203125, 0.12598419189453125, 0.14471435546875, 0.16344451904296875, 0.1821746826171875, 0.20090484619140625, 0.219635009765625, 0.23836517333984375, 0.2570953369140625, 0.27582550048828125, 0.2945556640625, 0.31328582763671875, 0.3320159912109375, 0.35074615478515625, 0.369476318359375, 0.38820648193359375, 0.4069366455078125, 0.42566680908203125, 0.44439697265625, 0.46312713623046875, 0.4818572998046875, 0.5005874633789062, 0.519317626953125, 0.5380477905273438, 0.5567779541015625, 0.5755081176757812, 0.59423828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 5.0, 9.0, 10.0, 9.0, 18.0, 19.0, 23.0, 22.0, 20.0, 26.0, 27.0, 31.0, 41.0, 36.0, 49.0, 41.0, 45.0, 48.0, 1077.0, 32.0, 44.0, 42.0, 30.0, 31.0, 38.0, 27.0, 27.0, 34.0, 21.0, 23.0, 21.0, 12.0, 17.0, 19.0, 7.0, 12.0, 8.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.267578125, -3.155242919921875, -3.04290771484375, -2.930572509765625, -2.8182373046875, -2.705902099609375, -2.59356689453125, -2.481231689453125, -2.368896484375, -2.256561279296875, -2.14422607421875, -2.031890869140625, -1.9195556640625, -1.807220458984375, -1.69488525390625, -1.582550048828125, -1.47021484375, -1.357879638671875, -1.24554443359375, -1.133209228515625, -1.0208740234375, -0.908538818359375, -0.79620361328125, -0.683868408203125, -0.571533203125, -0.459197998046875, -0.34686279296875, -0.234527587890625, -0.1221923828125, -0.009857177734375, 0.10247802734375, 0.214813232421875, 0.3271484375, 0.439483642578125, 0.55181884765625, 0.664154052734375, 0.7764892578125, 0.888824462890625, 1.00115966796875, 1.113494873046875, 1.225830078125, 1.338165283203125, 1.45050048828125, 1.562835693359375, 1.6751708984375, 1.787506103515625, 1.89984130859375, 2.012176513671875, 2.12451171875, 2.236846923828125, 2.34918212890625, 2.461517333984375, 2.5738525390625, 2.686187744140625, 2.79852294921875, 2.910858154296875, 3.023193359375, 3.135528564453125, 3.24786376953125, 3.360198974609375, 3.4725341796875, 3.584869384765625, 3.69720458984375, 3.809539794921875, 3.921875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 8.0, 16.0, 13.0, 23.0, 36.0, 62.0, 98.0, 119.0, 184.0, 320.0, 473.0, 819.0, 1387.0, 2196.0, 3568.0, 5995.0, 10509.0, 17943.0, 31681.0, 56319.0, 102264.0, 182842.0, 1287907.0, 172185.0, 95889.0, 52859.0, 30062.0, 16790.0, 9908.0, 5733.0, 3442.0, 2028.0, 1228.0, 782.0, 520.0, 316.0, 211.0, 127.0, 83.0, 56.0, 31.0, 44.0, 16.0, 12.0, 6.0, 9.0, 0.0, 1.0, 5.0, 0.0, 1.0], "bins": [-0.6884765625, -0.6690521240234375, -0.649627685546875, -0.6302032470703125, -0.61077880859375, -0.5913543701171875, -0.571929931640625, -0.5525054931640625, -0.5330810546875, -0.5136566162109375, -0.494232177734375, -0.4748077392578125, -0.45538330078125, -0.4359588623046875, -0.416534423828125, -0.3971099853515625, -0.377685546875, -0.3582611083984375, -0.338836669921875, -0.3194122314453125, -0.29998779296875, -0.2805633544921875, -0.261138916015625, -0.2417144775390625, -0.2222900390625, -0.2028656005859375, -0.183441162109375, -0.1640167236328125, -0.14459228515625, -0.1251678466796875, -0.105743408203125, -0.0863189697265625, -0.06689453125, -0.0474700927734375, -0.028045654296875, -0.0086212158203125, 0.01080322265625, 0.0302276611328125, 0.049652099609375, 0.0690765380859375, 0.0885009765625, 0.1079254150390625, 0.127349853515625, 0.1467742919921875, 0.16619873046875, 0.1856231689453125, 0.205047607421875, 0.2244720458984375, 0.243896484375, 0.2633209228515625, 0.282745361328125, 0.3021697998046875, 0.32159423828125, 0.3410186767578125, 0.360443115234375, 0.3798675537109375, 0.3992919921875, 0.4187164306640625, 0.438140869140625, 0.4575653076171875, 0.47698974609375, 0.4964141845703125, 0.515838623046875, 0.5352630615234375, 0.5546875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 7.0, 10.0, 9.0, 12.0, 11.0, 12.0, 17.0, 33.0, 33.0, 32.0, 52.0, 32.0, 38.0, 59.0, 60.0, 60.0, 65.0, 71.0, 57.0, 55.0, 36.0, 45.0, 35.0, 29.0, 29.0, 22.0, 12.0, 12.0, 13.0, 10.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00212860107421875, -0.0020547211170196533, -0.0019808411598205566, -0.00190696120262146, -0.0018330812454223633, -0.0017592012882232666, -0.00168532133102417, -0.0016114413738250732, -0.0015375614166259766, -0.0014636814594268799, -0.0013898015022277832, -0.0013159215450286865, -0.0012420415878295898, -0.0011681616306304932, -0.0010942816734313965, -0.0010204017162322998, -0.0009465217590332031, -0.0008726418018341064, -0.0007987618446350098, -0.0007248818874359131, -0.0006510019302368164, -0.0005771219730377197, -0.000503242015838623, -0.00042936205863952637, -0.0003554821014404297, -0.000281602144241333, -0.00020772218704223633, -0.00013384222984313965, -5.996227264404297e-05, 1.3917684555053711e-05, 8.779764175415039e-05, 0.00016167759895324707, 0.00023555755615234375, 0.00030943751335144043, 0.0003833174705505371, 0.0004571974277496338, 0.0005310773849487305, 0.0006049573421478271, 0.0006788372993469238, 0.0007527172565460205, 0.0008265972137451172, 0.0009004771709442139, 0.0009743571281433105, 0.0010482370853424072, 0.001122117042541504, 0.0011959969997406006, 0.0012698769569396973, 0.001343756914138794, 0.0014176368713378906, 0.0014915168285369873, 0.001565396785736084, 0.0016392767429351807, 0.0017131567001342773, 0.001787036657333374, 0.0018609166145324707, 0.0019347965717315674, 0.002008676528930664, 0.0020825564861297607, 0.0021564364433288574, 0.002230316400527954, 0.0023041963577270508, 0.0023780763149261475, 0.002451956272125244, 0.002525836229324341, 0.0025997161865234375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 8.0, 8.0, 13.0, 15.0, 23.0, 21.0, 22.0, 29.0, 46.0, 62.0, 84.0, 102.0, 127.0, 261.0, 478.0, 2157.0, 951446.0, 91648.0, 1013.0, 332.0, 170.0, 108.0, 79.0, 64.0, 65.0, 40.0, 25.0, 23.0, 16.0, 13.0, 17.0, 8.0, 5.0, 1.0, 4.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.05810546875, -0.056527137756347656, -0.05494880676269531, -0.05337047576904297, -0.051792144775390625, -0.05021381378173828, -0.04863548278808594, -0.047057151794433594, -0.04547882080078125, -0.043900489807128906, -0.04232215881347656, -0.04074382781982422, -0.039165496826171875, -0.03758716583251953, -0.03600883483886719, -0.034430503845214844, -0.0328521728515625, -0.031273841857910156, -0.029695510864257812, -0.02811717987060547, -0.026538848876953125, -0.02496051788330078, -0.023382186889648438, -0.021803855895996094, -0.02022552490234375, -0.018647193908691406, -0.017068862915039062, -0.015490531921386719, -0.013912200927734375, -0.012333869934082031, -0.010755538940429688, -0.009177207946777344, -0.007598876953125, -0.006020545959472656, -0.0044422149658203125, -0.0028638839721679688, -0.001285552978515625, 0.00029277801513671875, 0.0018711090087890625, 0.0034494400024414062, 0.00502777099609375, 0.006606101989746094, 0.008184432983398438, 0.009762763977050781, 0.011341094970703125, 0.012919425964355469, 0.014497756958007812, 0.016076087951660156, 0.0176544189453125, 0.019232749938964844, 0.020811080932617188, 0.02238941192626953, 0.023967742919921875, 0.02554607391357422, 0.027124404907226562, 0.028702735900878906, 0.03028106689453125, 0.031859397888183594, 0.03343772888183594, 0.03501605987548828, 0.036594390869140625, 0.03817272186279297, 0.03975105285644531, 0.041329383850097656, 0.04290771484375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 65.0, 936.0, 18.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0337277427315712, -0.033129896968603134, -0.03253204748034477, -0.03193420171737671, -0.031336355954408646, -0.030738508328795433, -0.03014066256582737, -0.029542814940214157, -0.028944969177246094, -0.02834712155163288, -0.027749275788664818, -0.027151428163051605, -0.026553582400083542, -0.02595573477447033, -0.025357889011502266, -0.024760041385889053, -0.02416219376027584, -0.023564346134662628, -0.022966500371694565, -0.022368652746081352, -0.02177080698311329, -0.021172959357500076, -0.020575113594532013, -0.0199772659689188, -0.019379418343305588, -0.018781570717692375, -0.018183724954724312, -0.0175858773291111, -0.016988031566143036, -0.016390183940529823, -0.01579233817756176, -0.015194490551948547, -0.014596642926335335, -0.013998796232044697, -0.013400949537754059, -0.012803102843463421, -0.012205256149172783, -0.01160740852355957, -0.011009561829268932, -0.010411715134978294, -0.009813869372010231, -0.009216022677719593, -0.008618175983428955, -0.008020329289138317, -0.007422482129186392, -0.006824635434895754, -0.006226788274943829, -0.005628941580653191, -0.005031094420701265, -0.004433247726410627, -0.0038354007992893457, -0.003237553872168064, -0.002639707177877426, -0.002041860483586788, -0.0014440135564655066, -0.0008461666293442249, -0.00024831993505358696, 0.00034952687565237284, 0.0009473736863583326, 0.0015452204970642924, 0.0021430673077702522, 0.00274091400206089, 0.003338760929182172, 0.0039366078563034534, 0.004534454550594091]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 6.0, 12.0, 7.0, 14.0, 24.0, 11.0, 23.0, 37.0, 36.0, 38.0, 33.0, 46.0, 52.0, 54.0, 46.0, 43.0, 47.0, 51.0, 46.0, 46.0, 56.0, 42.0, 32.0, 23.0, 32.0, 30.0, 18.0, 20.0, 19.0, 14.0, 10.0, 10.0, 6.0, 5.0, 8.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012114644050598145, -0.001164414919912815, -0.0011173654347658157, -0.0010703159496188164, -0.001023266464471817, -0.0009762169793248177, -0.0009291674941778183, -0.0008821180090308189, -0.0008350685238838196, -0.0007880190387368202, -0.0007409695535898209, -0.0006939200684428215, -0.0006468705832958221, -0.0005998210981488228, -0.0005527716130018234, -0.0005057221278548241, -0.0004586726427078247, -0.00041162315756082535, -0.000364573672413826, -0.00031752418726682663, -0.00027047470211982727, -0.0002234252169728279, -0.00017637573182582855, -0.0001293262466788292, -8.227676153182983e-05, -3.5227276384830475e-05, 1.1822208762168884e-05, 5.8871693909168243e-05, 0.0001059211790561676, 0.00015297066420316696, 0.00020002014935016632, 0.0002470696344971657, 0.00029411911964416504, 0.0003411686047911644, 0.00038821808993816376, 0.0004352675750851631, 0.0004823170602321625, 0.0005293665453791618, 0.0005764160305261612, 0.0006234655156731606, 0.0006705150008201599, 0.0007175644859671593, 0.0007646139711141586, 0.000811663456261158, 0.0008587129414081573, 0.0009057624265551567, 0.0009528119117021561, 0.0009998613968491554, 0.0010469108819961548, 0.0010939603671431541, 0.0011410098522901535, 0.0011880593374371529, 0.0012351088225841522, 0.0012821583077311516, 0.001329207792878151, 0.0013762572780251503, 0.0014233067631721497, 0.001470356248319149, 0.0015174057334661484, 0.0015644552186131477, 0.001611504703760147, 0.0016585541889071465, 0.0017056036740541458, 0.0017526531592011452, 0.0017997026443481445]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 9.0, 5.0, 11.0, 11.0, 7.0, 9.0, 15.0, 20.0, 21.0, 27.0, 26.0, 19.0, 33.0, 35.0, 30.0, 26.0, 37.0, 41.0, 35.0, 45.0, 42.0, 36.0, 39.0, 42.0, 41.0, 37.0, 19.0, 35.0, 30.0, 28.0, 33.0, 22.0, 18.0, 17.0, 15.0, 19.0, 9.0, 10.0, 10.0, 12.0, 5.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.08984375, -4.93060302734375, -4.7713623046875, -4.61212158203125, -4.452880859375, -4.29364013671875, -4.1343994140625, -3.97515869140625, -3.81591796875, -3.65667724609375, -3.4974365234375, -3.33819580078125, -3.178955078125, -3.01971435546875, -2.8604736328125, -2.70123291015625, -2.5419921875, -2.38275146484375, -2.2235107421875, -2.06427001953125, -1.905029296875, -1.74578857421875, -1.5865478515625, -1.42730712890625, -1.26806640625, -1.10882568359375, -0.9495849609375, -0.79034423828125, -0.631103515625, -0.47186279296875, -0.3126220703125, -0.15338134765625, 0.005859375, 0.16510009765625, 0.3243408203125, 0.48358154296875, 0.642822265625, 0.80206298828125, 0.9613037109375, 1.12054443359375, 1.27978515625, 1.43902587890625, 1.5982666015625, 1.75750732421875, 1.916748046875, 2.07598876953125, 2.2352294921875, 2.39447021484375, 2.5537109375, 2.71295166015625, 2.8721923828125, 3.03143310546875, 3.190673828125, 3.34991455078125, 3.5091552734375, 3.66839599609375, 3.82763671875, 3.98687744140625, 4.1461181640625, 4.30535888671875, 4.464599609375, 4.62384033203125, 4.7830810546875, 4.94232177734375, 5.1015625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 9.0, 8.0, 15.0, 19.0, 39.0, 33.0, 39.0, 43.0, 69.0, 90.0, 149.0, 205.0, 293.0, 543.0, 1281.0, 2963.0, 7343.0, 20230.0, 56617.0, 170653.0, 474360.0, 206738.0, 67361.0, 24017.0, 8846.0, 3436.0, 1432.0, 676.0, 327.0, 186.0, 130.0, 80.0, 67.0, 53.0, 39.0, 42.0, 33.0, 17.0, 14.0, 13.0, 9.0, 4.0, 7.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.144287109375, -4.97607421875, -4.807861328125, -4.6396484375, -4.471435546875, -4.30322265625, -4.135009765625, -3.966796875, -3.798583984375, -3.63037109375, -3.462158203125, -3.2939453125, -3.125732421875, -2.95751953125, -2.789306640625, -2.62109375, -2.452880859375, -2.28466796875, -2.116455078125, -1.9482421875, -1.780029296875, -1.61181640625, -1.443603515625, -1.275390625, -1.107177734375, -0.93896484375, -0.770751953125, -0.6025390625, -0.434326171875, -0.26611328125, -0.097900390625, 0.0703125, 0.238525390625, 0.40673828125, 0.574951171875, 0.7431640625, 0.911376953125, 1.07958984375, 1.247802734375, 1.416015625, 1.584228515625, 1.75244140625, 1.920654296875, 2.0888671875, 2.257080078125, 2.42529296875, 2.593505859375, 2.76171875, 2.929931640625, 3.09814453125, 3.266357421875, 3.4345703125, 3.602783203125, 3.77099609375, 3.939208984375, 4.107421875, 4.275634765625, 4.44384765625, 4.612060546875, 4.7802734375, 4.948486328125, 5.11669921875, 5.284912109375, 5.453125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 9.0, 12.0, 13.0, 17.0, 19.0, 24.0, 23.0, 31.0, 28.0, 40.0, 33.0, 44.0, 54.0, 54.0, 69.0, 282.0, 1711.0, 136.0, 59.0, 53.0, 41.0, 41.0, 40.0, 33.0, 32.0, 22.0, 24.0, 16.0, 23.0, 13.0, 12.0, 10.0, 4.0, 5.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.765625, -18.201416015625, -17.63720703125, -17.072998046875, -16.5087890625, -15.944580078125, -15.38037109375, -14.816162109375, -14.251953125, -13.687744140625, -13.12353515625, -12.559326171875, -11.9951171875, -11.430908203125, -10.86669921875, -10.302490234375, -9.73828125, -9.174072265625, -8.60986328125, -8.045654296875, -7.4814453125, -6.917236328125, -6.35302734375, -5.788818359375, -5.224609375, -4.660400390625, -4.09619140625, -3.531982421875, -2.9677734375, -2.403564453125, -1.83935546875, -1.275146484375, -0.7109375, -0.146728515625, 0.41748046875, 0.981689453125, 1.5458984375, 2.110107421875, 2.67431640625, 3.238525390625, 3.802734375, 4.366943359375, 4.93115234375, 5.495361328125, 6.0595703125, 6.623779296875, 7.18798828125, 7.752197265625, 8.31640625, 8.880615234375, 9.44482421875, 10.009033203125, 10.5732421875, 11.137451171875, 11.70166015625, 12.265869140625, 12.830078125, 13.394287109375, 13.95849609375, 14.522705078125, 15.0869140625, 15.651123046875, 16.21533203125, 16.779541015625, 17.34375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 11.0, 13.0, 20.0, 25.0, 35.0, 52.0, 51.0, 74.0, 96.0, 163.0, 233.0, 397.0, 901.0, 6749.0, 3099277.0, 34907.0, 1262.0, 529.0, 279.0, 166.0, 117.0, 87.0, 60.0, 50.0, 36.0, 30.0, 16.0, 21.0, 11.0, 10.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.0625, -40.541015625, -39.01953125, -37.498046875, -35.9765625, -34.455078125, -32.93359375, -31.412109375, -29.890625, -28.369140625, -26.84765625, -25.326171875, -23.8046875, -22.283203125, -20.76171875, -19.240234375, -17.71875, -16.197265625, -14.67578125, -13.154296875, -11.6328125, -10.111328125, -8.58984375, -7.068359375, -5.546875, -4.025390625, -2.50390625, -0.982421875, 0.5390625, 2.060546875, 3.58203125, 5.103515625, 6.625, 8.146484375, 9.66796875, 11.189453125, 12.7109375, 14.232421875, 15.75390625, 17.275390625, 18.796875, 20.318359375, 21.83984375, 23.361328125, 24.8828125, 26.404296875, 27.92578125, 29.447265625, 30.96875, 32.490234375, 34.01171875, 35.533203125, 37.0546875, 38.576171875, 40.09765625, 41.619140625, 43.140625, 44.662109375, 46.18359375, 47.705078125, 49.2265625, 50.748046875, 52.26953125, 53.791015625, 55.3125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 100.0, 843.0, 68.0, 3.0, 1.0, 0.0, 1.0], "bins": [-263.8231506347656, -259.3093566894531, -254.79559326171875, -250.2818145751953, -245.76803588867188, -241.25425720214844, -236.740478515625, -232.2266845703125, -227.71292114257812, -223.1991424560547, -218.68536376953125, -214.1715850830078, -209.65780639648438, -205.14402770996094, -200.6302490234375, -196.116455078125, -191.60267639160156, -187.08889770507812, -182.5751190185547, -178.06134033203125, -173.5475616455078, -169.03378295898438, -164.52000427246094, -160.0062255859375, -155.492431640625, -150.97865295410156, -146.46487426757812, -141.9510955810547, -137.43731689453125, -132.9235382080078, -128.40975952148438, -123.8959732055664, -119.38220977783203, -114.8684310913086, -110.35465240478516, -105.84087371826172, -101.32708740234375, -96.81330871582031, -92.29953002929688, -87.78575134277344, -83.27197265625, -78.75819396972656, -74.24441528320312, -69.73063659667969, -65.21685791015625, -60.70307540893555, -56.189292907714844, -51.675514221191406, -47.16173553466797, -42.64795684814453, -38.134178161621094, -33.62039566040039, -29.106616973876953, -24.592838287353516, -20.079057693481445, -15.565277099609375, -11.051496505737305, -6.537716865539551, -2.023937225341797, 2.489842414855957, 7.003622055053711, 11.517400741577148, 16.03118133544922, 20.54496192932129, 25.058740615844727]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 4.0, 4.0, 7.0, 12.0, 5.0, 19.0, 17.0, 11.0, 17.0, 17.0, 13.0, 42.0, 36.0, 46.0, 35.0, 37.0, 38.0, 29.0, 38.0, 43.0, 34.0, 52.0, 48.0, 37.0, 39.0, 33.0, 39.0, 29.0, 26.0, 21.0, 26.0, 24.0, 15.0, 29.0, 12.0, 9.0, 10.0, 15.0, 7.0, 5.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-47.05217742919922, -45.647544860839844, -44.242916107177734, -42.838287353515625, -41.43365478515625, -40.029022216796875, -38.624393463134766, -37.219764709472656, -35.81513214111328, -34.410499572753906, -33.0058708190918, -31.601240158081055, -30.196609497070312, -28.79197883605957, -27.387348175048828, -25.982717514038086, -24.578086853027344, -23.1734561920166, -21.76882553100586, -20.364194869995117, -18.959564208984375, -17.554933547973633, -16.15030288696289, -14.745672225952148, -13.341041564941406, -11.936410903930664, -10.531780242919922, -9.12714958190918, -7.7225189208984375, -6.317888259887695, -4.913257598876953, -3.508626937866211, -2.1039962768554688, -0.6993656158447266, 0.7052650451660156, 2.109895706176758, 3.5145263671875, 4.919157028198242, 6.323787689208984, 7.728418350219727, 9.133049011230469, 10.537679672241211, 11.942310333251953, 13.346940994262695, 14.751571655273438, 16.15620231628418, 17.560832977294922, 18.965463638305664, 20.370094299316406, 21.77472496032715, 23.17935562133789, 24.583986282348633, 25.988616943359375, 27.393247604370117, 28.79787826538086, 30.2025089263916, 31.607139587402344, 33.01177215576172, 34.41640090942383, 35.82102966308594, 37.22566223144531, 38.63029479980469, 40.0349235534668, 41.439552307128906, 42.84418487548828]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 5.0, 3.0, 7.0, 8.0, 11.0, 11.0, 18.0, 21.0, 19.0, 20.0, 29.0, 29.0, 33.0, 33.0, 25.0, 40.0, 35.0, 35.0, 36.0, 45.0, 41.0, 37.0, 33.0, 36.0, 33.0, 34.0, 40.0, 25.0, 25.0, 34.0, 27.0, 30.0, 15.0, 19.0, 14.0, 23.0, 12.0, 10.0, 11.0, 6.0, 6.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.2265625, -5.06298828125, -4.8994140625, -4.73583984375, -4.572265625, -4.40869140625, -4.2451171875, -4.08154296875, -3.91796875, -3.75439453125, -3.5908203125, -3.42724609375, -3.263671875, -3.10009765625, -2.9365234375, -2.77294921875, -2.609375, -2.44580078125, -2.2822265625, -2.11865234375, -1.955078125, -1.79150390625, -1.6279296875, -1.46435546875, -1.30078125, -1.13720703125, -0.9736328125, -0.81005859375, -0.646484375, -0.48291015625, -0.3193359375, -0.15576171875, 0.0078125, 0.17138671875, 0.3349609375, 0.49853515625, 0.662109375, 0.82568359375, 0.9892578125, 1.15283203125, 1.31640625, 1.47998046875, 1.6435546875, 1.80712890625, 1.970703125, 2.13427734375, 2.2978515625, 2.46142578125, 2.625, 2.78857421875, 2.9521484375, 3.11572265625, 3.279296875, 3.44287109375, 3.6064453125, 3.77001953125, 3.93359375, 4.09716796875, 4.2607421875, 4.42431640625, 4.587890625, 4.75146484375, 4.9150390625, 5.07861328125, 5.2421875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 6.0, 10.0, 9.0, 15.0, 14.0, 21.0, 21.0, 39.0, 48.0, 45.0, 64.0, 103.0, 157.0, 298.0, 559.0, 1736.0, 11092.0, 286637.0, 3385640.0, 487788.0, 16158.0, 2198.0, 659.0, 316.0, 175.0, 131.0, 85.0, 61.0, 41.0, 25.0, 19.0, 24.0, 14.0, 14.0, 10.0, 12.0, 10.0, 12.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.21875, -18.646240234375, -18.07373046875, -17.501220703125, -16.9287109375, -16.356201171875, -15.78369140625, -15.211181640625, -14.638671875, -14.066162109375, -13.49365234375, -12.921142578125, -12.3486328125, -11.776123046875, -11.20361328125, -10.631103515625, -10.05859375, -9.486083984375, -8.91357421875, -8.341064453125, -7.7685546875, -7.196044921875, -6.62353515625, -6.051025390625, -5.478515625, -4.906005859375, -4.33349609375, -3.760986328125, -3.1884765625, -2.615966796875, -2.04345703125, -1.470947265625, -0.8984375, -0.325927734375, 0.24658203125, 0.819091796875, 1.3916015625, 1.964111328125, 2.53662109375, 3.109130859375, 3.681640625, 4.254150390625, 4.82666015625, 5.399169921875, 5.9716796875, 6.544189453125, 7.11669921875, 7.689208984375, 8.26171875, 8.834228515625, 9.40673828125, 9.979248046875, 10.5517578125, 11.124267578125, 11.69677734375, 12.269287109375, 12.841796875, 13.414306640625, 13.98681640625, 14.559326171875, 15.1318359375, 15.704345703125, 16.27685546875, 16.849365234375, 17.421875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 8.0, 17.0, 22.0, 34.0, 43.0, 58.0, 78.0, 129.0, 143.0, 174.0, 253.0, 402.0, 478.0, 550.0, 484.0, 334.0, 277.0, 176.0, 124.0, 72.0, 64.0, 34.0, 36.0, 18.0, 21.0, 10.0, 3.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-15.1484375, -14.79852294921875, -14.4486083984375, -14.09869384765625, -13.748779296875, -13.39886474609375, -13.0489501953125, -12.69903564453125, -12.34912109375, -11.99920654296875, -11.6492919921875, -11.29937744140625, -10.949462890625, -10.59954833984375, -10.2496337890625, -9.89971923828125, -9.5498046875, -9.19989013671875, -8.8499755859375, -8.50006103515625, -8.150146484375, -7.80023193359375, -7.4503173828125, -7.10040283203125, -6.75048828125, -6.40057373046875, -6.0506591796875, -5.70074462890625, -5.350830078125, -5.00091552734375, -4.6510009765625, -4.30108642578125, -3.951171875, -3.60125732421875, -3.2513427734375, -2.90142822265625, -2.551513671875, -2.20159912109375, -1.8516845703125, -1.50177001953125, -1.15185546875, -0.80194091796875, -0.4520263671875, -0.10211181640625, 0.247802734375, 0.59771728515625, 0.9476318359375, 1.29754638671875, 1.6474609375, 1.99737548828125, 2.3472900390625, 2.69720458984375, 3.047119140625, 3.39703369140625, 3.7469482421875, 4.09686279296875, 4.44677734375, 4.79669189453125, 5.1466064453125, 5.49652099609375, 5.846435546875, 6.19635009765625, 6.5462646484375, 6.89617919921875, 7.24609375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 8.0, 16.0, 19.0, 28.0, 25.0, 47.0, 70.0, 88.0, 129.0, 168.0, 252.0, 329.0, 576.0, 2973.0, 2841722.0, 1343952.0, 2163.0, 478.0, 293.0, 226.0, 183.0, 134.0, 100.0, 74.0, 77.0, 58.0, 33.0, 21.0, 12.0, 8.0, 8.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.6875, -38.74609375, -36.8046875, -34.86328125, -32.921875, -30.98046875, -29.0390625, -27.09765625, -25.15625, -23.21484375, -21.2734375, -19.33203125, -17.390625, -15.44921875, -13.5078125, -11.56640625, -9.625, -7.68359375, -5.7421875, -3.80078125, -1.859375, 0.08203125, 2.0234375, 3.96484375, 5.90625, 7.84765625, 9.7890625, 11.73046875, 13.671875, 15.61328125, 17.5546875, 19.49609375, 21.4375, 23.37890625, 25.3203125, 27.26171875, 29.203125, 31.14453125, 33.0859375, 35.02734375, 36.96875, 38.91015625, 40.8515625, 42.79296875, 44.734375, 46.67578125, 48.6171875, 50.55859375, 52.5, 54.44140625, 56.3828125, 58.32421875, 60.265625, 62.20703125, 64.1484375, 66.08984375, 68.03125, 69.97265625, 71.9140625, 73.85546875, 75.796875, 77.73828125, 79.6796875, 81.62109375, 83.5625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 40.0, 206.0, 373.0, 276.0, 86.0, 22.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-197.3533935546875, -193.31011962890625, -189.266845703125, -185.2235870361328, -181.18031311035156, -177.1370391845703, -173.09378051757812, -169.05050659179688, -165.00723266601562, -160.96395874023438, -156.92068481445312, -152.87742614746094, -148.8341522216797, -144.79087829589844, -140.74761962890625, -136.704345703125, -132.66107177734375, -128.6177978515625, -124.57453155517578, -120.53126525878906, -116.48799133300781, -112.44471740722656, -108.40145111083984, -104.35818481445312, -100.31491088867188, -96.27163696289062, -92.2283706665039, -88.18510437011719, -84.14183044433594, -80.09855651855469, -76.05529022216797, -72.01202392578125, -67.96876525878906, -63.92549514770508, -59.882225036621094, -55.83895492553711, -51.795684814453125, -47.75241470336914, -43.709144592285156, -39.66587448120117, -35.62260437011719, -31.579334259033203, -27.53606414794922, -23.492794036865234, -19.44952392578125, -15.406253814697266, -11.362983703613281, -7.319713592529297, -3.2764434814453125, 0.7668266296386719, 4.810096740722656, 8.85336685180664, 12.896636962890625, 16.93990707397461, 20.983177185058594, 25.026447296142578, 29.069717407226562, 33.11298751831055, 37.15625762939453, 41.199527740478516, 45.2427978515625, 49.286067962646484, 53.32933807373047, 57.37260818481445, 61.41587829589844]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 1.0, 3.0, 3.0, 5.0, 8.0, 8.0, 11.0, 8.0, 12.0, 13.0, 17.0, 29.0, 25.0, 25.0, 38.0, 31.0, 24.0, 29.0, 50.0, 41.0, 35.0, 44.0, 42.0, 42.0, 31.0, 45.0, 43.0, 38.0, 33.0, 35.0, 37.0, 25.0, 31.0, 20.0, 24.0, 18.0, 15.0, 12.0, 11.0, 10.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.54911804199219, -32.466426849365234, -31.38373565673828, -30.301042556762695, -29.218351364135742, -28.13566017150879, -27.052967071533203, -25.97027587890625, -24.887584686279297, -23.804893493652344, -22.72220230102539, -21.639509201049805, -20.55681800842285, -19.4741268157959, -18.391433715820312, -17.30874252319336, -16.226051330566406, -15.143360137939453, -14.060667991638184, -12.977975845336914, -11.895284652709961, -10.812593460083008, -9.729901313781738, -8.647209167480469, -7.564517974853516, -6.481826305389404, -5.399134635925293, -4.316442966461182, -3.2337512969970703, -2.151059627532959, -1.0683679580688477, 0.014323711395263672, 1.097015380859375, 2.1797070503234863, 3.2623987197875977, 4.345090389251709, 5.42778205871582, 6.510473728179932, 7.593165397644043, 8.675857543945312, 9.758548736572266, 10.841239929199219, 11.923932075500488, 13.006624221801758, 14.089315414428711, 15.172006607055664, 16.25469970703125, 17.337390899658203, 18.420082092285156, 19.50277328491211, 20.585464477539062, 21.66815757751465, 22.7508487701416, 23.833539962768555, 24.91623306274414, 25.998924255371094, 27.081615447998047, 28.164306640625, 29.246997833251953, 30.32969093322754, 31.412382125854492, 32.49507522583008, 33.57776641845703, 34.660457611083984, 35.74314880371094]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 6.0, 13.0, 13.0, 14.0, 13.0, 23.0, 21.0, 23.0, 20.0, 28.0, 42.0, 33.0, 27.0, 40.0, 25.0, 33.0, 48.0, 40.0, 46.0, 30.0, 38.0, 40.0, 36.0, 31.0, 36.0, 23.0, 28.0, 28.0, 26.0, 14.0, 18.0, 25.0, 13.0, 16.0, 18.0, 15.0, 12.0, 10.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.2578125, -5.0916748046875, -4.925537109375, -4.7593994140625, -4.59326171875, -4.4271240234375, -4.260986328125, -4.0948486328125, -3.9287109375, -3.7625732421875, -3.596435546875, -3.4302978515625, -3.26416015625, -3.0980224609375, -2.931884765625, -2.7657470703125, -2.599609375, -2.4334716796875, -2.267333984375, -2.1011962890625, -1.93505859375, -1.7689208984375, -1.602783203125, -1.4366455078125, -1.2705078125, -1.1043701171875, -0.938232421875, -0.7720947265625, -0.60595703125, -0.4398193359375, -0.273681640625, -0.1075439453125, 0.05859375, 0.2247314453125, 0.390869140625, 0.5570068359375, 0.72314453125, 0.8892822265625, 1.055419921875, 1.2215576171875, 1.3876953125, 1.5538330078125, 1.719970703125, 1.8861083984375, 2.05224609375, 2.2183837890625, 2.384521484375, 2.5506591796875, 2.716796875, 2.8829345703125, 3.049072265625, 3.2152099609375, 3.38134765625, 3.5474853515625, 3.713623046875, 3.8797607421875, 4.0458984375, 4.2120361328125, 4.378173828125, 4.5443115234375, 4.71044921875, 4.8765869140625, 5.042724609375, 5.2088623046875, 5.375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 9.0, 8.0, 19.0, 33.0, 38.0, 52.0, 69.0, 112.0, 148.0, 235.0, 310.0, 489.0, 757.0, 1045.0, 1591.0, 2262.0, 3584.0, 5496.0, 8264.0, 12830.0, 20145.0, 32901.0, 55481.0, 96681.0, 168643.0, 227572.0, 168357.0, 96104.0, 54918.0, 32943.0, 20173.0, 12959.0, 8320.0, 5273.0, 3536.0, 2320.0, 1572.0, 1066.0, 738.0, 457.0, 345.0, 216.0, 151.0, 102.0, 63.0, 61.0, 34.0, 25.0, 18.0, 13.0, 8.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.7509765625, -0.7278671264648438, -0.7047576904296875, -0.6816482543945312, -0.658538818359375, -0.6354293823242188, -0.6123199462890625, -0.5892105102539062, -0.56610107421875, -0.5429916381835938, -0.5198822021484375, -0.49677276611328125, -0.473663330078125, -0.45055389404296875, -0.4274444580078125, -0.40433502197265625, -0.3812255859375, -0.35811614990234375, -0.3350067138671875, -0.31189727783203125, -0.288787841796875, -0.26567840576171875, -0.2425689697265625, -0.21945953369140625, -0.19635009765625, -0.17324066162109375, -0.1501312255859375, -0.12702178955078125, -0.103912353515625, -0.08080291748046875, -0.0576934814453125, -0.03458404541015625, -0.011474609375, 0.01163482666015625, 0.0347442626953125, 0.05785369873046875, 0.080963134765625, 0.10407257080078125, 0.1271820068359375, 0.15029144287109375, 0.17340087890625, 0.19651031494140625, 0.2196197509765625, 0.24272918701171875, 0.265838623046875, 0.28894805908203125, 0.3120574951171875, 0.33516693115234375, 0.3582763671875, 0.38138580322265625, 0.4044952392578125, 0.42760467529296875, 0.450714111328125, 0.47382354736328125, 0.4969329833984375, 0.5200424194335938, 0.54315185546875, 0.5662612915039062, 0.5893707275390625, 0.6124801635742188, 0.635589599609375, 0.6586990356445312, 0.6818084716796875, 0.7049179077148438, 0.72802734375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 7.0, 20.0, 16.0, 13.0, 23.0, 21.0, 20.0, 18.0, 29.0, 30.0, 28.0, 42.0, 43.0, 43.0, 40.0, 41.0, 1073.0, 54.0, 48.0, 37.0, 43.0, 38.0, 26.0, 34.0, 38.0, 28.0, 27.0, 23.0, 23.0, 16.0, 21.0, 13.0, 7.0, 9.0, 4.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.03125, -2.9140625, -2.796875, -2.6796875, -2.5625, -2.4453125, -2.328125, -2.2109375, -2.09375, -1.9765625, -1.859375, -1.7421875, -1.625, -1.5078125, -1.390625, -1.2734375, -1.15625, -1.0390625, -0.921875, -0.8046875, -0.6875, -0.5703125, -0.453125, -0.3359375, -0.21875, -0.1015625, 0.015625, 0.1328125, 0.25, 0.3671875, 0.484375, 0.6015625, 0.71875, 0.8359375, 0.953125, 1.0703125, 1.1875, 1.3046875, 1.421875, 1.5390625, 1.65625, 1.7734375, 1.890625, 2.0078125, 2.125, 2.2421875, 2.359375, 2.4765625, 2.59375, 2.7109375, 2.828125, 2.9453125, 3.0625, 3.1796875, 3.296875, 3.4140625, 3.53125, 3.6484375, 3.765625, 3.8828125, 4.0, 4.1171875, 4.234375, 4.3515625, 4.46875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 2.0, 8.0, 22.0, 18.0, 33.0, 51.0, 77.0, 115.0, 185.0, 322.0, 479.0, 800.0, 1231.0, 2086.0, 3654.0, 6430.0, 11224.0, 20418.0, 38084.0, 72566.0, 139336.0, 1172916.0, 338844.0, 135115.0, 69967.0, 37096.0, 19972.0, 11091.0, 6100.0, 3491.0, 2074.0, 1291.0, 762.0, 479.0, 303.0, 166.0, 102.0, 92.0, 47.0, 20.0, 20.0, 12.0, 14.0, 4.0, 5.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68115234375, -0.6591644287109375, -0.637176513671875, -0.6151885986328125, -0.59320068359375, -0.5712127685546875, -0.549224853515625, -0.5272369384765625, -0.5052490234375, -0.4832611083984375, -0.461273193359375, -0.4392852783203125, -0.41729736328125, -0.3953094482421875, -0.373321533203125, -0.3513336181640625, -0.329345703125, -0.3073577880859375, -0.285369873046875, -0.2633819580078125, -0.24139404296875, -0.2194061279296875, -0.197418212890625, -0.1754302978515625, -0.1534423828125, -0.1314544677734375, -0.109466552734375, -0.0874786376953125, -0.06549072265625, -0.0435028076171875, -0.021514892578125, 0.0004730224609375, 0.0224609375, 0.0444488525390625, 0.066436767578125, 0.0884246826171875, 0.11041259765625, 0.1324005126953125, 0.154388427734375, 0.1763763427734375, 0.1983642578125, 0.2203521728515625, 0.242340087890625, 0.2643280029296875, 0.28631591796875, 0.3083038330078125, 0.330291748046875, 0.3522796630859375, 0.374267578125, 0.3962554931640625, 0.418243408203125, 0.4402313232421875, 0.46221923828125, 0.4842071533203125, 0.506195068359375, 0.5281829833984375, 0.5501708984375, 0.5721588134765625, 0.594146728515625, 0.6161346435546875, 0.63812255859375, 0.6601104736328125, 0.682098388671875, 0.7040863037109375, 0.72607421875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 2.0, 4.0, 6.0, 9.0, 13.0, 16.0, 20.0, 31.0, 45.0, 44.0, 54.0, 53.0, 57.0, 62.0, 67.0, 79.0, 54.0, 61.0, 52.0, 49.0, 39.0, 40.0, 24.0, 35.0, 19.0, 15.0, 15.0, 11.0, 6.0, 6.0, 4.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.002292633056640625, -0.0022272467613220215, -0.002161860466003418, -0.0020964741706848145, -0.002031087875366211, -0.0019657015800476074, -0.001900315284729004, -0.0018349289894104004, -0.0017695426940917969, -0.0017041563987731934, -0.0016387701034545898, -0.0015733838081359863, -0.0015079975128173828, -0.0014426112174987793, -0.0013772249221801758, -0.0013118386268615723, -0.0012464523315429688, -0.0011810660362243652, -0.0011156797409057617, -0.0010502934455871582, -0.0009849071502685547, -0.0009195208549499512, -0.0008541345596313477, -0.0007887482643127441, -0.0007233619689941406, -0.0006579756736755371, -0.0005925893783569336, -0.0005272030830383301, -0.00046181678771972656, -0.00039643049240112305, -0.00033104419708251953, -0.000265657901763916, -0.0002002716064453125, -0.00013488531112670898, -6.949901580810547e-05, -4.112720489501953e-06, 6.127357482910156e-05, 0.00012665987014770508, 0.0001920461654663086, 0.0002574324607849121, 0.0003228187561035156, 0.00038820505142211914, 0.00045359134674072266, 0.0005189776420593262, 0.0005843639373779297, 0.0006497502326965332, 0.0007151365280151367, 0.0007805228233337402, 0.0008459091186523438, 0.0009112954139709473, 0.0009766817092895508, 0.0010420680046081543, 0.0011074542999267578, 0.0011728405952453613, 0.0012382268905639648, 0.0013036131858825684, 0.0013689994812011719, 0.0014343857765197754, 0.001499772071838379, 0.0015651583671569824, 0.001630544662475586, 0.0016959309577941895, 0.001761317253112793, 0.0018267035484313965, 0.00189208984375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 11.0, 17.0, 19.0, 16.0, 30.0, 52.0, 52.0, 82.0, 80.0, 134.0, 243.0, 618.0, 10582.0, 1026347.0, 9007.0, 524.0, 229.0, 145.0, 97.0, 58.0, 55.0, 41.0, 23.0, 22.0, 17.0, 10.0, 7.0, 6.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05224609375, -0.050685882568359375, -0.04912567138671875, -0.047565460205078125, -0.0460052490234375, -0.044445037841796875, -0.04288482666015625, -0.041324615478515625, -0.039764404296875, -0.038204193115234375, -0.03664398193359375, -0.035083770751953125, -0.0335235595703125, -0.031963348388671875, -0.03040313720703125, -0.028842926025390625, -0.02728271484375, -0.025722503662109375, -0.02416229248046875, -0.022602081298828125, -0.0210418701171875, -0.019481658935546875, -0.01792144775390625, -0.016361236572265625, -0.014801025390625, -0.013240814208984375, -0.01168060302734375, -0.010120391845703125, -0.0085601806640625, -0.006999969482421875, -0.00543975830078125, -0.003879547119140625, -0.0023193359375, -0.000759124755859375, 0.00080108642578125, 0.002361297607421875, 0.0039215087890625, 0.005481719970703125, 0.00704193115234375, 0.008602142333984375, 0.010162353515625, 0.011722564697265625, 0.01328277587890625, 0.014842987060546875, 0.0164031982421875, 0.017963409423828125, 0.01952362060546875, 0.021083831787109375, 0.02264404296875, 0.024204254150390625, 0.02576446533203125, 0.027324676513671875, 0.0288848876953125, 0.030445098876953125, 0.03200531005859375, 0.033565521240234375, 0.035125732421875, 0.036685943603515625, 0.03824615478515625, 0.039806365966796875, 0.0413665771484375, 0.042926788330078125, 0.04448699951171875, 0.046047210693359375, 0.047607421875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 18.0, 34.0, 96.0, 187.0, 239.0, 222.0, 125.0, 58.0, 14.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004594548139721155, -0.0045001995749771595, -0.004405851010233164, -0.0043115029111504555, -0.00421715434640646, -0.004122805781662464, -0.0040284572169184685, -0.003934108652174473, -0.003839760320261121, -0.003745411755517125, -0.003651063423603773, -0.0035567148588597775, -0.0034623665269464254, -0.0033680179622024298, -0.0032736696302890778, -0.003179321065545082, -0.0030849725008010864, -0.0029906239360570908, -0.0028962756041437387, -0.002801927039399743, -0.002707578707486391, -0.0026132301427423954, -0.0025188815779983997, -0.0024245332460850477, -0.0023301849141716957, -0.0022358363494277, -0.002141488017514348, -0.0020471394527703524, -0.0019527910044416785, -0.0018584425561130047, -0.0017640941077843308, -0.001669745659455657, -0.0015753972111269832, -0.0014810487627983093, -0.0013867003144696355, -0.0012923518661409616, -0.001198003301396966, -0.0011036548530682921, -0.0010093064047396183, -0.0009149578982032835, -0.0008206094498746097, -0.0007262610015459359, -0.0006319124950096011, -0.0005375640466809273, -0.000443215569248423, -0.0003488670918159187, -0.00025451864348724484, -0.0001601701369509101, -6.582168862223625e-05, 2.852678153431043e-05, 0.0001228752516908571, 0.00021722371457144618, 0.0003115721920039505, 0.0004059206694364548, 0.0005002691177651286, 0.0005946176243014634, 0.0006889660726301372, 0.000783314520958811, 0.0008776630274951458, 0.0009720114758238196, 0.0010663599241524935, 0.0011607084888964891, 0.0012550568208098412, 0.0013494053855538368, 0.0014437538338825107]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 5.0, 9.0, 10.0, 14.0, 16.0, 18.0, 21.0, 23.0, 25.0, 28.0, 25.0, 39.0, 48.0, 38.0, 42.0, 39.0, 40.0, 40.0, 35.0, 40.0, 35.0, 42.0, 39.0, 38.0, 40.0, 31.0, 36.0, 32.0, 22.0, 17.0, 15.0, 23.0, 23.0, 7.0, 9.0, 10.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009667873382568359, -0.0009367233142256737, -0.0009066592901945114, -0.0008765952661633492, -0.0008465312421321869, -0.0008164672181010246, -0.0007864031940698624, -0.0007563391700387001, -0.0007262751460075378, -0.0006962111219763756, -0.0006661470979452133, -0.0006360830739140511, -0.0006060190498828888, -0.0005759550258517265, -0.0005458910018205643, -0.000515826977789402, -0.00048576295375823975, -0.0004556989297270775, -0.0004256349056959152, -0.00039557088166475296, -0.0003655068576335907, -0.00033544283360242844, -0.0003053788095712662, -0.0002753147855401039, -0.00024525076150894165, -0.0002151867374777794, -0.00018512271344661713, -0.00015505868941545486, -0.0001249946653842926, -9.493064135313034e-05, -6.486661732196808e-05, -3.480259329080582e-05, -4.738569259643555e-06, 2.5325454771518707e-05, 5.538947880268097e-05, 8.545350283384323e-05, 0.00011551752686500549, 0.00014558155089616776, 0.00017564557492733002, 0.00020570959895849228, 0.00023577362298965454, 0.0002658376470208168, 0.00029590167105197906, 0.0003259656950831413, 0.0003560297191143036, 0.00038609374314546585, 0.0004161577671766281, 0.0004462217912077904, 0.00047628581523895264, 0.0005063498392701149, 0.0005364138633012772, 0.0005664778873324394, 0.0005965419113636017, 0.000626605935394764, 0.0006566699594259262, 0.0006867339834570885, 0.0007167980074882507, 0.000746862031519413, 0.0007769260555505753, 0.0008069900795817375, 0.0008370541036128998, 0.000867118127644062, 0.0008971821516752243, 0.0009272461757063866, 0.0009573101997375488]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 6.0, 13.0, 13.0, 14.0, 13.0, 23.0, 21.0, 23.0, 20.0, 28.0, 42.0, 33.0, 27.0, 40.0, 25.0, 33.0, 48.0, 40.0, 46.0, 30.0, 38.0, 40.0, 36.0, 31.0, 36.0, 23.0, 28.0, 28.0, 26.0, 14.0, 18.0, 25.0, 13.0, 16.0, 18.0, 15.0, 12.0, 10.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.2578125, -5.0916748046875, -4.925537109375, -4.7593994140625, -4.59326171875, -4.4271240234375, -4.260986328125, -4.0948486328125, -3.9287109375, -3.7625732421875, -3.596435546875, -3.4302978515625, -3.26416015625, -3.0980224609375, -2.931884765625, -2.7657470703125, -2.599609375, -2.4334716796875, -2.267333984375, -2.1011962890625, -1.93505859375, -1.7689208984375, -1.602783203125, -1.4366455078125, -1.2705078125, -1.1043701171875, -0.938232421875, -0.7720947265625, -0.60595703125, -0.4398193359375, -0.273681640625, -0.1075439453125, 0.05859375, 0.2247314453125, 0.390869140625, 0.5570068359375, 0.72314453125, 0.8892822265625, 1.055419921875, 1.2215576171875, 1.3876953125, 1.5538330078125, 1.719970703125, 1.8861083984375, 2.05224609375, 2.2183837890625, 2.384521484375, 2.5506591796875, 2.716796875, 2.8829345703125, 3.049072265625, 3.2152099609375, 3.38134765625, 3.5474853515625, 3.713623046875, 3.8797607421875, 4.0458984375, 4.2120361328125, 4.378173828125, 4.5443115234375, 4.71044921875, 4.8765869140625, 5.042724609375, 5.2088623046875, 5.375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 13.0, 11.0, 17.0, 18.0, 20.0, 25.0, 42.0, 46.0, 75.0, 78.0, 112.0, 168.0, 220.0, 334.0, 583.0, 992.0, 2986.0, 15867.0, 120079.0, 753048.0, 130858.0, 16948.0, 3156.0, 1088.0, 598.0, 318.0, 211.0, 158.0, 101.0, 83.0, 59.0, 51.0, 43.0, 23.0, 28.0, 24.0, 15.0, 16.0, 10.0, 7.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.734375, -9.425537109375, -9.11669921875, -8.807861328125, -8.4990234375, -8.190185546875, -7.88134765625, -7.572509765625, -7.263671875, -6.954833984375, -6.64599609375, -6.337158203125, -6.0283203125, -5.719482421875, -5.41064453125, -5.101806640625, -4.79296875, -4.484130859375, -4.17529296875, -3.866455078125, -3.5576171875, -3.248779296875, -2.93994140625, -2.631103515625, -2.322265625, -2.013427734375, -1.70458984375, -1.395751953125, -1.0869140625, -0.778076171875, -0.46923828125, -0.160400390625, 0.1484375, 0.457275390625, 0.76611328125, 1.074951171875, 1.3837890625, 1.692626953125, 2.00146484375, 2.310302734375, 2.619140625, 2.927978515625, 3.23681640625, 3.545654296875, 3.8544921875, 4.163330078125, 4.47216796875, 4.781005859375, 5.08984375, 5.398681640625, 5.70751953125, 6.016357421875, 6.3251953125, 6.634033203125, 6.94287109375, 7.251708984375, 7.560546875, 7.869384765625, 8.17822265625, 8.487060546875, 8.7958984375, 9.104736328125, 9.41357421875, 9.722412109375, 10.03125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 2.0, 5.0, 4.0, 10.0, 11.0, 9.0, 7.0, 12.0, 8.0, 18.0, 18.0, 25.0, 29.0, 34.0, 27.0, 24.0, 37.0, 46.0, 45.0, 50.0, 67.0, 214.0, 1698.0, 154.0, 76.0, 47.0, 45.0, 41.0, 29.0, 24.0, 34.0, 28.0, 26.0, 21.0, 19.0, 16.0, 12.0, 12.0, 11.0, 10.0, 9.0, 12.0, 9.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.828125, -15.307373046875, -14.78662109375, -14.265869140625, -13.7451171875, -13.224365234375, -12.70361328125, -12.182861328125, -11.662109375, -11.141357421875, -10.62060546875, -10.099853515625, -9.5791015625, -9.058349609375, -8.53759765625, -8.016845703125, -7.49609375, -6.975341796875, -6.45458984375, -5.933837890625, -5.4130859375, -4.892333984375, -4.37158203125, -3.850830078125, -3.330078125, -2.809326171875, -2.28857421875, -1.767822265625, -1.2470703125, -0.726318359375, -0.20556640625, 0.315185546875, 0.8359375, 1.356689453125, 1.87744140625, 2.398193359375, 2.9189453125, 3.439697265625, 3.96044921875, 4.481201171875, 5.001953125, 5.522705078125, 6.04345703125, 6.564208984375, 7.0849609375, 7.605712890625, 8.12646484375, 8.647216796875, 9.16796875, 9.688720703125, 10.20947265625, 10.730224609375, 11.2509765625, 11.771728515625, 12.29248046875, 12.813232421875, 13.333984375, 13.854736328125, 14.37548828125, 14.896240234375, 15.4169921875, 15.937744140625, 16.45849609375, 16.979248046875, 17.5]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 4.0, 14.0, 13.0, 10.0, 17.0, 16.0, 20.0, 19.0, 28.0, 35.0, 43.0, 41.0, 70.0, 87.0, 121.0, 204.0, 388.0, 926.0, 23779.0, 3112229.0, 5998.0, 656.0, 282.0, 187.0, 121.0, 79.0, 49.0, 50.0, 47.0, 30.0, 23.0, 19.0, 14.0, 13.0, 8.0, 10.0, 8.0, 14.0, 4.0, 6.0, 2.0, 3.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-52.5, -50.8779296875, -49.255859375, -47.6337890625, -46.01171875, -44.3896484375, -42.767578125, -41.1455078125, -39.5234375, -37.9013671875, -36.279296875, -34.6572265625, -33.03515625, -31.4130859375, -29.791015625, -28.1689453125, -26.546875, -24.9248046875, -23.302734375, -21.6806640625, -20.05859375, -18.4365234375, -16.814453125, -15.1923828125, -13.5703125, -11.9482421875, -10.326171875, -8.7041015625, -7.08203125, -5.4599609375, -3.837890625, -2.2158203125, -0.59375, 1.0283203125, 2.650390625, 4.2724609375, 5.89453125, 7.5166015625, 9.138671875, 10.7607421875, 12.3828125, 14.0048828125, 15.626953125, 17.2490234375, 18.87109375, 20.4931640625, 22.115234375, 23.7373046875, 25.359375, 26.9814453125, 28.603515625, 30.2255859375, 31.84765625, 33.4697265625, 35.091796875, 36.7138671875, 38.3359375, 39.9580078125, 41.580078125, 43.2021484375, 44.82421875, 46.4462890625, 48.068359375, 49.6904296875, 51.3125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 47.0, 208.0, 376.0, 272.0, 86.0, 15.0, 3.0], "bins": [-83.17974853515625, -81.78570556640625, -80.39166259765625, -78.99762725830078, -77.60358428955078, -76.20954132080078, -74.81549835205078, -73.42146301269531, -72.02742004394531, -70.63337707519531, -69.23933410644531, -67.84529876708984, -66.45125579833984, -65.05721282958984, -63.66317367553711, -62.26913070678711, -60.875091552734375, -59.481048583984375, -58.08700942993164, -56.69296646118164, -55.298927307128906, -53.904884338378906, -52.51084518432617, -51.11680221557617, -49.72275924682617, -48.32871627807617, -46.93467712402344, -45.54063415527344, -44.1465950012207, -42.7525520324707, -41.35851287841797, -39.96446990966797, -38.570430755615234, -37.176387786865234, -35.7823486328125, -34.3883056640625, -32.994266510009766, -31.6002254486084, -30.20618438720703, -28.81214141845703, -27.418100357055664, -26.024059295654297, -24.63001823425293, -23.235977172851562, -21.841936111450195, -20.447895050048828, -19.053852081298828, -17.659812927246094, -16.265769958496094, -14.871728897094727, -13.47768783569336, -12.083646774291992, -10.689605712890625, -9.295564651489258, -7.901522636413574, -6.507481575012207, -5.113441467285156, -3.719400405883789, -2.3253591060638428, -0.9313178062438965, 0.4627232551574707, 1.856764316558838, 3.2508058547973633, 4.6448469161987305, 6.038887977600098]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 4.0, 7.0, 4.0, 7.0, 6.0, 13.0, 14.0, 8.0, 14.0, 12.0, 16.0, 21.0, 21.0, 26.0, 30.0, 25.0, 23.0, 25.0, 24.0, 34.0, 37.0, 32.0, 35.0, 49.0, 50.0, 35.0, 27.0, 38.0, 29.0, 26.0, 22.0, 27.0, 29.0, 31.0, 24.0, 24.0, 18.0, 27.0, 18.0, 18.0, 20.0, 9.0, 9.0, 8.0, 6.0, 11.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-46.25877380371094, -44.89012145996094, -43.52146911621094, -42.15281677246094, -40.78416061401367, -39.41550827026367, -38.04685592651367, -36.67820358276367, -35.309547424316406, -33.940895080566406, -32.572242736816406, -31.203588485717773, -29.83493423461914, -28.46628189086914, -27.09762954711914, -25.72897720336914, -24.36032485961914, -22.99167251586914, -21.623018264770508, -20.254365921020508, -18.885711669921875, -17.517059326171875, -16.148406982421875, -14.779753684997559, -13.411100387573242, -12.042447090148926, -10.67379379272461, -9.30514144897461, -7.936488151550293, -6.567834854125977, -5.199182510375977, -3.83052921295166, -2.461872100830078, -1.0932190418243408, 0.2754340171813965, 1.6440868377685547, 3.012740135192871, 4.3813934326171875, 5.7500457763671875, 7.118699073791504, 8.48735237121582, 9.856005668640137, 11.224658966064453, 12.593311309814453, 13.96196460723877, 15.330617904663086, 16.699270248413086, 18.06792449951172, 19.43657684326172, 20.80522918701172, 22.17388343811035, 23.54253578186035, 24.911190032958984, 26.279842376708984, 27.648494720458984, 29.017147064208984, 30.385801315307617, 31.754453659057617, 33.12310791015625, 34.49176025390625, 35.86041259765625, 37.22906494140625, 38.59771728515625, 39.966373443603516, 41.335025787353516]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 5.0, 6.0, 9.0, 7.0, 15.0, 11.0, 18.0, 18.0, 24.0, 19.0, 27.0, 31.0, 23.0, 32.0, 32.0, 33.0, 35.0, 38.0, 37.0, 37.0, 45.0, 47.0, 49.0, 34.0, 29.0, 37.0, 31.0, 20.0, 33.0, 20.0, 33.0, 24.0, 15.0, 14.0, 19.0, 20.0, 12.0, 13.0, 16.0, 7.0, 10.0, 2.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.05859375, -5.8802490234375, -5.701904296875, -5.5235595703125, -5.34521484375, -5.1668701171875, -4.988525390625, -4.8101806640625, -4.6318359375, -4.4534912109375, -4.275146484375, -4.0968017578125, -3.91845703125, -3.7401123046875, -3.561767578125, -3.3834228515625, -3.205078125, -3.0267333984375, -2.848388671875, -2.6700439453125, -2.49169921875, -2.3133544921875, -2.135009765625, -1.9566650390625, -1.7783203125, -1.5999755859375, -1.421630859375, -1.2432861328125, -1.06494140625, -0.8865966796875, -0.708251953125, -0.5299072265625, -0.3515625, -0.1732177734375, 0.005126953125, 0.1834716796875, 0.36181640625, 0.5401611328125, 0.718505859375, 0.8968505859375, 1.0751953125, 1.2535400390625, 1.431884765625, 1.6102294921875, 1.78857421875, 1.9669189453125, 2.145263671875, 2.3236083984375, 2.501953125, 2.6802978515625, 2.858642578125, 3.0369873046875, 3.21533203125, 3.3936767578125, 3.572021484375, 3.7503662109375, 3.9287109375, 4.1070556640625, 4.285400390625, 4.4637451171875, 4.64208984375, 4.8204345703125, 4.998779296875, 5.1771240234375, 5.35546875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 7.0, 16.0, 23.0, 29.0, 37.0, 53.0, 83.0, 95.0, 178.0, 320.0, 632.0, 1495.0, 4136.0, 12722.0, 50101.0, 276236.0, 1176925.0, 1796704.0, 703808.0, 128885.0, 28331.0, 8126.0, 2880.0, 1162.0, 532.0, 267.0, 171.0, 87.0, 67.0, 53.0, 40.0, 15.0, 22.0, 19.0, 11.0, 7.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-10.6171875, -10.34698486328125, -10.0767822265625, -9.80657958984375, -9.536376953125, -9.26617431640625, -8.9959716796875, -8.72576904296875, -8.45556640625, -8.18536376953125, -7.9151611328125, -7.64495849609375, -7.374755859375, -7.10455322265625, -6.8343505859375, -6.56414794921875, -6.2939453125, -6.02374267578125, -5.7535400390625, -5.48333740234375, -5.213134765625, -4.94293212890625, -4.6727294921875, -4.40252685546875, -4.13232421875, -3.86212158203125, -3.5919189453125, -3.32171630859375, -3.051513671875, -2.78131103515625, -2.5111083984375, -2.24090576171875, -1.970703125, -1.70050048828125, -1.4302978515625, -1.16009521484375, -0.889892578125, -0.61968994140625, -0.3494873046875, -0.07928466796875, 0.19091796875, 0.46112060546875, 0.7313232421875, 1.00152587890625, 1.271728515625, 1.54193115234375, 1.8121337890625, 2.08233642578125, 2.3525390625, 2.62274169921875, 2.8929443359375, 3.16314697265625, 3.433349609375, 3.70355224609375, 3.9737548828125, 4.24395751953125, 4.51416015625, 4.78436279296875, 5.0545654296875, 5.32476806640625, 5.594970703125, 5.86517333984375, 6.1353759765625, 6.40557861328125, 6.67578125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 8.0, 9.0, 13.0, 18.0, 24.0, 40.0, 36.0, 52.0, 87.0, 103.0, 125.0, 189.0, 214.0, 265.0, 363.0, 384.0, 407.0, 392.0, 318.0, 276.0, 179.0, 123.0, 111.0, 76.0, 57.0, 41.0, 39.0, 27.0, 30.0, 16.0, 15.0, 15.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.46875, -12.1422119140625, -11.815673828125, -11.4891357421875, -11.16259765625, -10.8360595703125, -10.509521484375, -10.1829833984375, -9.8564453125, -9.5299072265625, -9.203369140625, -8.8768310546875, -8.55029296875, -8.2237548828125, -7.897216796875, -7.5706787109375, -7.244140625, -6.9176025390625, -6.591064453125, -6.2645263671875, -5.93798828125, -5.6114501953125, -5.284912109375, -4.9583740234375, -4.6318359375, -4.3052978515625, -3.978759765625, -3.6522216796875, -3.32568359375, -2.9991455078125, -2.672607421875, -2.3460693359375, -2.01953125, -1.6929931640625, -1.366455078125, -1.0399169921875, -0.71337890625, -0.3868408203125, -0.060302734375, 0.2662353515625, 0.5927734375, 0.9193115234375, 1.245849609375, 1.5723876953125, 1.89892578125, 2.2254638671875, 2.552001953125, 2.8785400390625, 3.205078125, 3.5316162109375, 3.858154296875, 4.1846923828125, 4.51123046875, 4.8377685546875, 5.164306640625, 5.4908447265625, 5.8173828125, 6.1439208984375, 6.470458984375, 6.7969970703125, 7.12353515625, 7.4500732421875, 7.776611328125, 8.1031494140625, 8.4296875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 7.0, 13.0, 27.0, 16.0, 36.0, 28.0, 66.0, 75.0, 91.0, 127.0, 139.0, 199.0, 266.0, 384.0, 654.0, 1538.0, 15070.0, 3276531.0, 889409.0, 6631.0, 1026.0, 528.0, 325.0, 277.0, 209.0, 135.0, 102.0, 95.0, 66.0, 49.0, 40.0, 33.0, 25.0, 14.0, 15.0, 12.0, 1.0, 7.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.75, -31.43359375, -30.1171875, -28.80078125, -27.484375, -26.16796875, -24.8515625, -23.53515625, -22.21875, -20.90234375, -19.5859375, -18.26953125, -16.953125, -15.63671875, -14.3203125, -13.00390625, -11.6875, -10.37109375, -9.0546875, -7.73828125, -6.421875, -5.10546875, -3.7890625, -2.47265625, -1.15625, 0.16015625, 1.4765625, 2.79296875, 4.109375, 5.42578125, 6.7421875, 8.05859375, 9.375, 10.69140625, 12.0078125, 13.32421875, 14.640625, 15.95703125, 17.2734375, 18.58984375, 19.90625, 21.22265625, 22.5390625, 23.85546875, 25.171875, 26.48828125, 27.8046875, 29.12109375, 30.4375, 31.75390625, 33.0703125, 34.38671875, 35.703125, 37.01953125, 38.3359375, 39.65234375, 40.96875, 42.28515625, 43.6015625, 44.91796875, 46.234375, 47.55078125, 48.8671875, 50.18359375, 51.5]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 436.0, 532.0, 30.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-486.7415466308594, -477.9002685546875, -469.0589904785156, -460.21771240234375, -451.3764343261719, -442.53515625, -433.6938781738281, -424.85260009765625, -416.0113220214844, -407.1700439453125, -398.3287658691406, -389.48748779296875, -380.6462097167969, -371.804931640625, -362.9636535644531, -354.12237548828125, -345.2811279296875, -336.4398498535156, -327.59857177734375, -318.7572937011719, -309.916015625, -301.0747375488281, -292.23345947265625, -283.3921813964844, -274.5509033203125, -265.7096252441406, -256.86834716796875, -248.02706909179688, -239.185791015625, -230.34451293945312, -221.50323486328125, -212.66195678710938, -203.82070922851562, -194.97943115234375, -186.13815307617188, -177.296875, -168.45559692382812, -159.61431884765625, -150.77304077148438, -141.9317626953125, -133.09048461914062, -124.24920654296875, -115.40792846679688, -106.566650390625, -97.72537231445312, -88.88409423828125, -80.0428237915039, -71.20154571533203, -62.360267639160156, -53.51898956298828, -44.677711486816406, -35.8364372253418, -26.995159149169922, -18.153881072998047, -9.312606811523438, -0.4713287353515625, 8.369949340820312, 17.211227416992188, 26.05250358581543, 34.89377975463867, 43.73505783081055, 52.57633590698242, 61.41761016845703, 70.2588882446289, 79.10016632080078]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 4.0, 8.0, 10.0, 16.0, 12.0, 9.0, 25.0, 17.0, 21.0, 22.0, 21.0, 28.0, 27.0, 47.0, 49.0, 34.0, 56.0, 31.0, 39.0, 32.0, 44.0, 39.0, 43.0, 27.0, 33.0, 33.0, 25.0, 32.0, 21.0, 28.0, 28.0, 14.0, 25.0, 26.0, 11.0, 11.0, 11.0, 6.0, 3.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-36.28489685058594, -35.20779037475586, -34.13068389892578, -33.0535774230957, -31.976472854614258, -30.89936637878418, -29.822261810302734, -28.745155334472656, -27.668048858642578, -26.5909423828125, -25.513835906982422, -24.436731338500977, -23.3596248626709, -22.28251838684082, -21.205413818359375, -20.128307342529297, -19.05120086669922, -17.97409439086914, -16.896987915039062, -15.819883346557617, -14.742776870727539, -13.665670394897461, -12.5885648727417, -11.511459350585938, -10.43435287475586, -9.357246398925781, -8.28014087677002, -7.2030348777771, -6.12592887878418, -5.04882287979126, -3.97171688079834, -2.89461088180542, -1.8175048828125, -0.7403988838195801, 0.33670711517333984, 1.4138131141662598, 2.4909191131591797, 3.5680251121520996, 4.6451311111450195, 5.7222371101379395, 6.799343109130859, 7.876449108123779, 8.9535551071167, 10.030660629272461, 11.107767105102539, 12.184873580932617, 13.261979103088379, 14.33908462524414, 15.416191101074219, 16.493297576904297, 17.570404052734375, 18.64750862121582, 19.7246150970459, 20.801721572875977, 21.878826141357422, 22.9559326171875, 24.033039093017578, 25.110145568847656, 26.187252044677734, 27.26435661315918, 28.341463088989258, 29.418569564819336, 30.49567413330078, 31.57278060913086, 32.64988708496094]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 7.0, 9.0, 8.0, 8.0, 13.0, 14.0, 12.0, 13.0, 13.0, 18.0, 13.0, 24.0, 26.0, 39.0, 17.0, 31.0, 24.0, 28.0, 33.0, 48.0, 36.0, 34.0, 43.0, 37.0, 32.0, 34.0, 27.0, 31.0, 32.0, 28.0, 36.0, 23.0, 23.0, 19.0, 21.0, 18.0, 18.0, 15.0, 19.0, 15.0, 13.0, 13.0, 9.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-5.20703125, -5.04876708984375, -4.8905029296875, -4.73223876953125, -4.573974609375, -4.41571044921875, -4.2574462890625, -4.09918212890625, -3.94091796875, -3.78265380859375, -3.6243896484375, -3.46612548828125, -3.307861328125, -3.14959716796875, -2.9913330078125, -2.83306884765625, -2.6748046875, -2.51654052734375, -2.3582763671875, -2.20001220703125, -2.041748046875, -1.88348388671875, -1.7252197265625, -1.56695556640625, -1.40869140625, -1.25042724609375, -1.0921630859375, -0.93389892578125, -0.775634765625, -0.61737060546875, -0.4591064453125, -0.30084228515625, -0.142578125, 0.01568603515625, 0.1739501953125, 0.33221435546875, 0.490478515625, 0.64874267578125, 0.8070068359375, 0.96527099609375, 1.12353515625, 1.28179931640625, 1.4400634765625, 1.59832763671875, 1.756591796875, 1.91485595703125, 2.0731201171875, 2.23138427734375, 2.3896484375, 2.54791259765625, 2.7061767578125, 2.86444091796875, 3.022705078125, 3.18096923828125, 3.3392333984375, 3.49749755859375, 3.65576171875, 3.81402587890625, 3.9722900390625, 4.13055419921875, 4.288818359375, 4.44708251953125, 4.6053466796875, 4.76361083984375, 4.921875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 7.0, 10.0, 29.0, 37.0, 41.0, 45.0, 89.0, 112.0, 187.0, 258.0, 423.0, 654.0, 866.0, 1303.0, 1878.0, 2717.0, 4190.0, 6313.0, 9689.0, 15092.0, 23952.0, 39169.0, 66442.0, 116878.0, 198392.0, 218805.0, 139022.0, 78785.0, 45588.0, 27660.0, 17194.0, 11044.0, 7196.0, 4774.0, 3161.0, 2106.0, 1414.0, 978.0, 672.0, 445.0, 296.0, 197.0, 143.0, 93.0, 79.0, 37.0, 27.0, 25.0, 20.0, 7.0, 4.0, 2.0, 7.0, 2.0, 3.0, 1.0], "bins": [-0.767578125, -0.7444229125976562, -0.7212677001953125, -0.6981124877929688, -0.674957275390625, -0.6518020629882812, -0.6286468505859375, -0.6054916381835938, -0.58233642578125, -0.5591812133789062, -0.5360260009765625, -0.5128707885742188, -0.489715576171875, -0.46656036376953125, -0.4434051513671875, -0.42024993896484375, -0.3970947265625, -0.37393951416015625, -0.3507843017578125, -0.32762908935546875, -0.304473876953125, -0.28131866455078125, -0.2581634521484375, -0.23500823974609375, -0.21185302734375, -0.18869781494140625, -0.1655426025390625, -0.14238739013671875, -0.119232177734375, -0.09607696533203125, -0.0729217529296875, -0.04976654052734375, -0.026611328125, -0.00345611572265625, 0.0196990966796875, 0.04285430908203125, 0.066009521484375, 0.08916473388671875, 0.1123199462890625, 0.13547515869140625, 0.15863037109375, 0.18178558349609375, 0.2049407958984375, 0.22809600830078125, 0.251251220703125, 0.27440643310546875, 0.2975616455078125, 0.32071685791015625, 0.3438720703125, 0.36702728271484375, 0.3901824951171875, 0.41333770751953125, 0.436492919921875, 0.45964813232421875, 0.4828033447265625, 0.5059585571289062, 0.52911376953125, 0.5522689819335938, 0.5754241943359375, 0.5985794067382812, 0.621734619140625, 0.6448898315429688, 0.6680450439453125, 0.6912002563476562, 0.71435546875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 9.0, 8.0, 17.0, 10.0, 24.0, 14.0, 21.0, 29.0, 17.0, 20.0, 31.0, 39.0, 30.0, 45.0, 46.0, 42.0, 49.0, 37.0, 1068.0, 42.0, 36.0, 31.0, 46.0, 30.0, 36.0, 35.0, 32.0, 29.0, 22.0, 12.0, 18.0, 13.0, 12.0, 19.0, 13.0, 7.0, 6.0, 11.0, 1.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.486328125, -3.363861083984375, -3.24139404296875, -3.118927001953125, -2.9964599609375, -2.873992919921875, -2.75152587890625, -2.629058837890625, -2.506591796875, -2.384124755859375, -2.26165771484375, -2.139190673828125, -2.0167236328125, -1.894256591796875, -1.77178955078125, -1.649322509765625, -1.52685546875, -1.404388427734375, -1.28192138671875, -1.159454345703125, -1.0369873046875, -0.914520263671875, -0.79205322265625, -0.669586181640625, -0.547119140625, -0.424652099609375, -0.30218505859375, -0.179718017578125, -0.0572509765625, 0.065216064453125, 0.18768310546875, 0.310150146484375, 0.4326171875, 0.555084228515625, 0.67755126953125, 0.800018310546875, 0.9224853515625, 1.044952392578125, 1.16741943359375, 1.289886474609375, 1.412353515625, 1.534820556640625, 1.65728759765625, 1.779754638671875, 1.9022216796875, 2.024688720703125, 2.14715576171875, 2.269622802734375, 2.39208984375, 2.514556884765625, 2.63702392578125, 2.759490966796875, 2.8819580078125, 3.004425048828125, 3.12689208984375, 3.249359130859375, 3.371826171875, 3.494293212890625, 3.61676025390625, 3.739227294921875, 3.8616943359375, 3.984161376953125, 4.10662841796875, 4.229095458984375, 4.3515625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 10.0, 18.0, 27.0, 51.0, 87.0, 129.0, 194.0, 329.0, 579.0, 996.0, 1629.0, 2829.0, 4889.0, 8850.0, 15937.0, 29633.0, 55331.0, 107766.0, 200992.0, 1304456.0, 172160.0, 88494.0, 46477.0, 24829.0, 13304.0, 7356.0, 4132.0, 2327.0, 1300.0, 762.0, 462.0, 279.0, 173.0, 111.0, 71.0, 46.0, 37.0, 18.0, 15.0, 18.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.84716796875, -0.8238677978515625, -0.800567626953125, -0.7772674560546875, -0.75396728515625, -0.7306671142578125, -0.707366943359375, -0.6840667724609375, -0.6607666015625, -0.6374664306640625, -0.614166259765625, -0.5908660888671875, -0.56756591796875, -0.5442657470703125, -0.520965576171875, -0.4976654052734375, -0.474365234375, -0.4510650634765625, -0.427764892578125, -0.4044647216796875, -0.38116455078125, -0.3578643798828125, -0.334564208984375, -0.3112640380859375, -0.2879638671875, -0.2646636962890625, -0.241363525390625, -0.2180633544921875, -0.19476318359375, -0.1714630126953125, -0.148162841796875, -0.1248626708984375, -0.1015625, -0.0782623291015625, -0.054962158203125, -0.0316619873046875, -0.00836181640625, 0.0149383544921875, 0.038238525390625, 0.0615386962890625, 0.0848388671875, 0.1081390380859375, 0.131439208984375, 0.1547393798828125, 0.17803955078125, 0.2013397216796875, 0.224639892578125, 0.2479400634765625, 0.271240234375, 0.2945404052734375, 0.317840576171875, 0.3411407470703125, 0.36444091796875, 0.3877410888671875, 0.411041259765625, 0.4343414306640625, 0.4576416015625, 0.4809417724609375, 0.504241943359375, 0.5275421142578125, 0.55084228515625, 0.5741424560546875, 0.597442626953125, 0.6207427978515625, 0.64404296875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 17.0, 17.0, 20.0, 18.0, 29.0, 21.0, 34.0, 43.0, 50.0, 58.0, 74.0, 74.0, 53.0, 67.0, 69.0, 48.0, 49.0, 37.0, 48.0, 26.0, 20.0, 27.0, 21.0, 15.0, 8.0, 11.0, 8.0, 3.0, 3.0, 3.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.002773284912109375, -0.002696692943572998, -0.002620100975036621, -0.002543509006500244, -0.002466917037963867, -0.0023903250694274902, -0.0023137331008911133, -0.0022371411323547363, -0.0021605491638183594, -0.0020839571952819824, -0.0020073652267456055, -0.0019307732582092285, -0.0018541812896728516, -0.0017775893211364746, -0.0017009973526000977, -0.0016244053840637207, -0.0015478134155273438, -0.0014712214469909668, -0.0013946294784545898, -0.0013180375099182129, -0.001241445541381836, -0.001164853572845459, -0.001088261604309082, -0.001011669635772705, -0.0009350776672363281, -0.0008584856986999512, -0.0007818937301635742, -0.0007053017616271973, -0.0006287097930908203, -0.0005521178245544434, -0.0004755258560180664, -0.00039893388748168945, -0.0003223419189453125, -0.00024574995040893555, -0.0001691579818725586, -9.256601333618164e-05, -1.5974044799804688e-05, 6.0617923736572266e-05, 0.00013720989227294922, 0.00021380186080932617, 0.0002903938293457031, 0.0003669857978820801, 0.00044357776641845703, 0.000520169734954834, 0.0005967617034912109, 0.0006733536720275879, 0.0007499456405639648, 0.0008265376091003418, 0.0009031295776367188, 0.0009797215461730957, 0.0010563135147094727, 0.0011329054832458496, 0.0012094974517822266, 0.0012860894203186035, 0.0013626813888549805, 0.0014392733573913574, 0.0015158653259277344, 0.0015924572944641113, 0.0016690492630004883, 0.0017456412315368652, 0.0018222332000732422, 0.0018988251686096191, 0.001975417137145996, 0.002052009105682373, 0.00212860107421875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 2.0, 1.0, 3.0, 8.0, 7.0, 11.0, 13.0, 17.0, 19.0, 24.0, 47.0, 56.0, 81.0, 77.0, 124.0, 194.0, 511.0, 2013.0, 1008521.0, 35279.0, 748.0, 278.0, 153.0, 89.0, 59.0, 52.0, 36.0, 36.0, 28.0, 18.0, 16.0, 4.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05291748046875, -0.05107593536376953, -0.04923439025878906, -0.047392845153808594, -0.045551300048828125, -0.043709754943847656, -0.04186820983886719, -0.04002666473388672, -0.03818511962890625, -0.03634357452392578, -0.03450202941894531, -0.032660484313964844, -0.030818939208984375, -0.028977394104003906, -0.027135848999023438, -0.02529430389404297, -0.0234527587890625, -0.02161121368408203, -0.019769668579101562, -0.017928123474121094, -0.016086578369140625, -0.014245033264160156, -0.012403488159179688, -0.010561943054199219, -0.00872039794921875, -0.006878852844238281, -0.0050373077392578125, -0.0031957626342773438, -0.001354217529296875, 0.00048732757568359375, 0.0023288726806640625, 0.004170417785644531, 0.006011962890625, 0.007853507995605469, 0.009695053100585938, 0.011536598205566406, 0.013378143310546875, 0.015219688415527344, 0.017061233520507812, 0.01890277862548828, 0.02074432373046875, 0.02258586883544922, 0.024427413940429688, 0.026268959045410156, 0.028110504150390625, 0.029952049255371094, 0.03179359436035156, 0.03363513946533203, 0.0354766845703125, 0.03731822967529297, 0.03915977478027344, 0.041001319885253906, 0.042842864990234375, 0.044684410095214844, 0.04652595520019531, 0.04836750030517578, 0.05020904541015625, 0.05205059051513672, 0.05389213562011719, 0.055733680725097656, 0.057575225830078125, 0.059416770935058594, 0.06125831604003906, 0.06309986114501953, 0.06494140625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 24.0, 98.0, 347.0, 360.0, 142.0, 34.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027707030531018972, -0.0026084640994668007, -0.0024462249130010605, -0.0022839857265353203, -0.0021217467729002237, -0.001959507819265127, -0.001797268632799387, -0.0016350295627489686, -0.0014727904926985502, -0.0013105514226481318, -0.0011483123525977135, -0.000986073282547295, -0.0008238342124968767, -0.0006615951424464583, -0.00049935607239604, -0.0003371170023456216, -0.0001748779322952032, -1.2638862244784832e-05, 0.00014960020780563354, 0.0003118392778560519, 0.0004740783479064703, 0.0006363174179568887, 0.000798556488007307, 0.0009607955580577254, 0.0011230346281081438, 0.0012852736981585622, 0.0014475127682089806, 0.001609751838259399, 0.0017719909083098173, 0.0019342299783602357, 0.002096469048410654, 0.0022587082348763943, 0.0024209474213421345, 0.0025831866078078747, 0.0027454255614429712, 0.0029076645150780678, 0.003069903701543808, 0.003232142888009548, 0.0033943818416446447, 0.0035566207952797413, 0.0037188599817454815, 0.0038810991682112217, 0.004043337889015675, 0.004205577075481415, 0.004367816261947155, 0.004530055448412895, 0.004692294634878635, 0.004854533355683088, 0.0050167725421488285, 0.005179011728614569, 0.005341250449419022, 0.005503489635884762, 0.005665728822350502, 0.005827968008816242, 0.005990207195281982, 0.006152445916086435, 0.0063146851025521755, 0.006476924289017916, 0.006639163009822369, 0.006801402196288109, 0.006963641382753849, 0.007125880569219589, 0.0072881197556853294, 0.007450358476489782, 0.0076125976629555225]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 10.0, 16.0, 6.0, 14.0, 15.0, 14.0, 17.0, 25.0, 30.0, 27.0, 31.0, 31.0, 32.0, 38.0, 38.0, 31.0, 39.0, 28.0, 25.0, 45.0, 37.0, 37.0, 43.0, 31.0, 37.0, 24.0, 43.0, 36.0, 25.0, 29.0, 24.0, 15.0, 16.0, 20.0, 10.0, 13.0, 7.0, 7.0, 9.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.001285254955291748, -0.0012497790157794952, -0.0012143030762672424, -0.0011788271367549896, -0.0011433511972427368, -0.001107875257730484, -0.0010723993182182312, -0.0010369233787059784, -0.0010014474391937256, -0.0009659714996814728, -0.00093049556016922, -0.0008950196206569672, -0.0008595436811447144, -0.0008240677416324615, -0.0007885918021202087, -0.0007531158626079559, -0.0007176399230957031, -0.0006821639835834503, -0.0006466880440711975, -0.0006112121045589447, -0.0005757361650466919, -0.0005402602255344391, -0.0005047842860221863, -0.00046930834650993347, -0.00043383240699768066, -0.00039835646748542786, -0.00036288052797317505, -0.00032740458846092224, -0.00029192864894866943, -0.0002564527094364166, -0.00022097676992416382, -0.000185500830411911, -0.0001500248908996582, -0.0001145489513874054, -7.907301187515259e-05, -4.359707236289978e-05, -8.121132850646973e-06, 2.7354806661605835e-05, 6.283074617385864e-05, 9.830668568611145e-05, 0.00013378262519836426, 0.00016925856471061707, 0.00020473450422286987, 0.00024021044373512268, 0.0002756863832473755, 0.0003111623227596283, 0.0003466382622718811, 0.0003821142017841339, 0.0004175901412963867, 0.0004530660808086395, 0.0004885420203208923, 0.0005240179598331451, 0.000559493899345398, 0.0005949698388576508, 0.0006304457783699036, 0.0006659217178821564, 0.0007013976573944092, 0.000736873596906662, 0.0007723495364189148, 0.0008078254759311676, 0.0008433014154434204, 0.0008787773549556732, 0.000914253294467926, 0.0009497292339801788, 0.0009852051734924316]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 7.0, 9.0, 8.0, 8.0, 13.0, 14.0, 12.0, 13.0, 13.0, 18.0, 13.0, 24.0, 26.0, 39.0, 17.0, 31.0, 24.0, 28.0, 33.0, 48.0, 36.0, 34.0, 43.0, 37.0, 32.0, 34.0, 27.0, 31.0, 32.0, 28.0, 36.0, 23.0, 23.0, 19.0, 21.0, 18.0, 18.0, 15.0, 19.0, 15.0, 13.0, 13.0, 9.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-5.20703125, -5.04876708984375, -4.8905029296875, -4.73223876953125, -4.573974609375, -4.41571044921875, -4.2574462890625, -4.09918212890625, -3.94091796875, -3.78265380859375, -3.6243896484375, -3.46612548828125, -3.307861328125, -3.14959716796875, -2.9913330078125, -2.83306884765625, -2.6748046875, -2.51654052734375, -2.3582763671875, -2.20001220703125, -2.041748046875, -1.88348388671875, -1.7252197265625, -1.56695556640625, -1.40869140625, -1.25042724609375, -1.0921630859375, -0.93389892578125, -0.775634765625, -0.61737060546875, -0.4591064453125, -0.30084228515625, -0.142578125, 0.01568603515625, 0.1739501953125, 0.33221435546875, 0.490478515625, 0.64874267578125, 0.8070068359375, 0.96527099609375, 1.12353515625, 1.28179931640625, 1.4400634765625, 1.59832763671875, 1.756591796875, 1.91485595703125, 2.0731201171875, 2.23138427734375, 2.3896484375, 2.54791259765625, 2.7061767578125, 2.86444091796875, 3.022705078125, 3.18096923828125, 3.3392333984375, 3.49749755859375, 3.65576171875, 3.81402587890625, 3.9722900390625, 4.13055419921875, 4.288818359375, 4.44708251953125, 4.6053466796875, 4.76361083984375, 4.921875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 2.0, 9.0, 7.0, 6.0, 16.0, 19.0, 20.0, 26.0, 26.0, 30.0, 45.0, 73.0, 104.0, 196.0, 358.0, 712.0, 1455.0, 3194.0, 7179.0, 16085.0, 35281.0, 81149.0, 217841.0, 391580.0, 171807.0, 66966.0, 29733.0, 13318.0, 5899.0, 2730.0, 1238.0, 586.0, 303.0, 165.0, 113.0, 71.0, 40.0, 30.0, 39.0, 10.0, 24.0, 12.0, 11.0, 16.0, 4.0, 8.0, 6.0, 4.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.890625, -4.7396240234375, -4.588623046875, -4.4376220703125, -4.28662109375, -4.1356201171875, -3.984619140625, -3.8336181640625, -3.6826171875, -3.5316162109375, -3.380615234375, -3.2296142578125, -3.07861328125, -2.9276123046875, -2.776611328125, -2.6256103515625, -2.474609375, -2.3236083984375, -2.172607421875, -2.0216064453125, -1.87060546875, -1.7196044921875, -1.568603515625, -1.4176025390625, -1.2666015625, -1.1156005859375, -0.964599609375, -0.8135986328125, -0.66259765625, -0.5115966796875, -0.360595703125, -0.2095947265625, -0.05859375, 0.0924072265625, 0.243408203125, 0.3944091796875, 0.54541015625, 0.6964111328125, 0.847412109375, 0.9984130859375, 1.1494140625, 1.3004150390625, 1.451416015625, 1.6024169921875, 1.75341796875, 1.9044189453125, 2.055419921875, 2.2064208984375, 2.357421875, 2.5084228515625, 2.659423828125, 2.8104248046875, 2.96142578125, 3.1124267578125, 3.263427734375, 3.4144287109375, 3.5654296875, 3.7164306640625, 3.867431640625, 4.0184326171875, 4.16943359375, 4.3204345703125, 4.471435546875, 4.6224365234375, 4.7734375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 8.0, 3.0, 5.0, 12.0, 10.0, 16.0, 15.0, 22.0, 14.0, 23.0, 29.0, 19.0, 33.0, 30.0, 37.0, 48.0, 56.0, 64.0, 134.0, 1480.0, 392.0, 112.0, 65.0, 51.0, 46.0, 32.0, 34.0, 31.0, 21.0, 22.0, 31.0, 29.0, 15.0, 19.0, 15.0, 19.0, 8.0, 5.0, 9.0, 11.0, 7.0, 5.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.734375, -18.165283203125, -17.59619140625, -17.027099609375, -16.4580078125, -15.888916015625, -15.31982421875, -14.750732421875, -14.181640625, -13.612548828125, -13.04345703125, -12.474365234375, -11.9052734375, -11.336181640625, -10.76708984375, -10.197998046875, -9.62890625, -9.059814453125, -8.49072265625, -7.921630859375, -7.3525390625, -6.783447265625, -6.21435546875, -5.645263671875, -5.076171875, -4.507080078125, -3.93798828125, -3.368896484375, -2.7998046875, -2.230712890625, -1.66162109375, -1.092529296875, -0.5234375, 0.045654296875, 0.61474609375, 1.183837890625, 1.7529296875, 2.322021484375, 2.89111328125, 3.460205078125, 4.029296875, 4.598388671875, 5.16748046875, 5.736572265625, 6.3056640625, 6.874755859375, 7.44384765625, 8.012939453125, 8.58203125, 9.151123046875, 9.72021484375, 10.289306640625, 10.8583984375, 11.427490234375, 11.99658203125, 12.565673828125, 13.134765625, 13.703857421875, 14.27294921875, 14.842041015625, 15.4111328125, 15.980224609375, 16.54931640625, 17.118408203125, 17.6875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 2.0, 5.0, 6.0, 13.0, 11.0, 14.0, 11.0, 24.0, 25.0, 31.0, 50.0, 55.0, 72.0, 76.0, 104.0, 134.0, 180.0, 260.0, 421.0, 911.0, 8723.0, 2652769.0, 475527.0, 4230.0, 795.0, 395.0, 215.0, 156.0, 106.0, 82.0, 65.0, 54.0, 34.0, 32.0, 29.0, 21.0, 13.0, 8.0, 8.0, 11.0, 11.0, 3.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.984375, -30.948974609375, -29.91357421875, -28.878173828125, -27.8427734375, -26.807373046875, -25.77197265625, -24.736572265625, -23.701171875, -22.665771484375, -21.63037109375, -20.594970703125, -19.5595703125, -18.524169921875, -17.48876953125, -16.453369140625, -15.41796875, -14.382568359375, -13.34716796875, -12.311767578125, -11.2763671875, -10.240966796875, -9.20556640625, -8.170166015625, -7.134765625, -6.099365234375, -5.06396484375, -4.028564453125, -2.9931640625, -1.957763671875, -0.92236328125, 0.113037109375, 1.1484375, 2.183837890625, 3.21923828125, 4.254638671875, 5.2900390625, 6.325439453125, 7.36083984375, 8.396240234375, 9.431640625, 10.467041015625, 11.50244140625, 12.537841796875, 13.5732421875, 14.608642578125, 15.64404296875, 16.679443359375, 17.71484375, 18.750244140625, 19.78564453125, 20.821044921875, 21.8564453125, 22.891845703125, 23.92724609375, 24.962646484375, 25.998046875, 27.033447265625, 28.06884765625, 29.104248046875, 30.1396484375, 31.175048828125, 32.21044921875, 33.245849609375, 34.28125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 9.0, 164.0, 597.0, 227.0, 19.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.780529022216797, -10.007795333862305, -7.235060691833496, -4.4623260498046875, -1.6895923614501953, 1.0831413269042969, 3.855876922607422, 6.628610610961914, 9.401344299316406, 12.174077987670898, 14.946812629699707, 17.719547271728516, 20.492280960083008, 23.2650146484375, 26.037750244140625, 28.810483932495117, 31.58321762084961, 34.355953216552734, 37.128684997558594, 39.90142059326172, 42.674156188964844, 45.4468879699707, 48.21962356567383, 50.99235534667969, 53.76509094238281, 56.53782653808594, 59.3105583190918, 62.08329391479492, 64.85602569580078, 67.6287612915039, 70.40149688720703, 73.17423248291016, 75.94696044921875, 78.71969604492188, 81.492431640625, 84.26516723632812, 87.03789520263672, 89.81063079833984, 92.58336639404297, 95.3561019897461, 98.12882995605469, 100.90156555175781, 103.67430114746094, 106.44703674316406, 109.21976470947266, 111.99250030517578, 114.7652359008789, 117.53797149658203, 120.31070709228516, 123.08344268798828, 125.8561782836914, 128.62890625, 131.40164184570312, 134.17437744140625, 136.94711303710938, 139.7198486328125, 142.49258422851562, 145.26531982421875, 148.03805541992188, 150.810791015625, 153.58352661132812, 156.35626220703125, 159.12899780273438, 161.90171813964844, 164.67445373535156]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 5.0, 3.0, 4.0, 6.0, 8.0, 7.0, 13.0, 8.0, 11.0, 12.0, 12.0, 19.0, 19.0, 27.0, 29.0, 31.0, 42.0, 38.0, 39.0, 37.0, 36.0, 39.0, 54.0, 45.0, 42.0, 42.0, 34.0, 30.0, 44.0, 42.0, 32.0, 24.0, 27.0, 21.0, 22.0, 18.0, 14.0, 9.0, 15.0, 12.0, 7.0, 5.0, 6.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-53.05552291870117, -51.49504089355469, -49.93455505371094, -48.37407302856445, -46.81359100341797, -45.253108978271484, -43.692623138427734, -42.13214111328125, -40.571659088134766, -39.01117706298828, -37.45069122314453, -35.89020919799805, -34.32972717285156, -32.76924514770508, -31.208759307861328, -29.648277282714844, -28.087793350219727, -26.52730941772461, -24.966827392578125, -23.406343460083008, -21.845861434936523, -20.285377502441406, -18.724895477294922, -17.164411544799805, -15.603928565979004, -14.043445587158203, -12.482962608337402, -10.922479629516602, -9.361995697021484, -7.801513195037842, -6.241029739379883, -4.680546760559082, -3.1200637817382812, -1.559580683708191, 0.0009024143218994141, 1.5613856315612793, 3.12186861038208, 4.682351589202881, 6.24283504486084, 7.803318023681641, 9.363801002502441, 10.924283981323242, 12.484766960144043, 14.045249938964844, 15.605733871459961, 17.166215896606445, 18.726699829101562, 20.287181854248047, 21.847665786743164, 23.40814971923828, 24.968631744384766, 26.529115676879883, 28.089597702026367, 29.650081634521484, 31.21056365966797, 32.77104949951172, 34.3315315246582, 35.89201354980469, 37.45249938964844, 39.01298141479492, 40.573463439941406, 42.13394546508789, 43.69443130493164, 45.254913330078125, 46.81539535522461]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 3.0, 5.0, 7.0, 7.0, 11.0, 13.0, 14.0, 16.0, 9.0, 16.0, 17.0, 18.0, 32.0, 24.0, 23.0, 27.0, 27.0, 43.0, 36.0, 40.0, 33.0, 38.0, 41.0, 30.0, 31.0, 34.0, 41.0, 34.0, 26.0, 36.0, 25.0, 25.0, 32.0, 21.0, 16.0, 24.0, 10.0, 18.0, 22.0, 8.0, 9.0, 9.0, 12.0, 9.0, 6.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.10546875, -4.94158935546875, -4.7777099609375, -4.61383056640625, -4.449951171875, -4.28607177734375, -4.1221923828125, -3.95831298828125, -3.79443359375, -3.63055419921875, -3.4666748046875, -3.30279541015625, -3.138916015625, -2.97503662109375, -2.8111572265625, -2.64727783203125, -2.4833984375, -2.31951904296875, -2.1556396484375, -1.99176025390625, -1.827880859375, -1.66400146484375, -1.5001220703125, -1.33624267578125, -1.17236328125, -1.00848388671875, -0.8446044921875, -0.68072509765625, -0.516845703125, -0.35296630859375, -0.1890869140625, -0.02520751953125, 0.138671875, 0.30255126953125, 0.4664306640625, 0.63031005859375, 0.794189453125, 0.95806884765625, 1.1219482421875, 1.28582763671875, 1.44970703125, 1.61358642578125, 1.7774658203125, 1.94134521484375, 2.105224609375, 2.26910400390625, 2.4329833984375, 2.59686279296875, 2.7607421875, 2.92462158203125, 3.0885009765625, 3.25238037109375, 3.416259765625, 3.58013916015625, 3.7440185546875, 3.90789794921875, 4.07177734375, 4.23565673828125, 4.3995361328125, 4.56341552734375, 4.727294921875, 4.89117431640625, 5.0550537109375, 5.21893310546875, 5.3828125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 12.0, 13.0, 11.0, 12.0, 14.0, 25.0, 25.0, 31.0, 24.0, 38.0, 51.0, 66.0, 84.0, 147.0, 234.0, 738.0, 4486.0, 47685.0, 1295290.0, 2696876.0, 136426.0, 9594.0, 1432.0, 342.0, 145.0, 99.0, 84.0, 42.0, 37.0, 40.0, 32.0, 24.0, 20.0, 21.0, 16.0, 12.0, 7.0, 14.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-17.578125, -17.03173828125, -16.4853515625, -15.93896484375, -15.392578125, -14.84619140625, -14.2998046875, -13.75341796875, -13.20703125, -12.66064453125, -12.1142578125, -11.56787109375, -11.021484375, -10.47509765625, -9.9287109375, -9.38232421875, -8.8359375, -8.28955078125, -7.7431640625, -7.19677734375, -6.650390625, -6.10400390625, -5.5576171875, -5.01123046875, -4.46484375, -3.91845703125, -3.3720703125, -2.82568359375, -2.279296875, -1.73291015625, -1.1865234375, -0.64013671875, -0.09375, 0.45263671875, 0.9990234375, 1.54541015625, 2.091796875, 2.63818359375, 3.1845703125, 3.73095703125, 4.27734375, 4.82373046875, 5.3701171875, 5.91650390625, 6.462890625, 7.00927734375, 7.5556640625, 8.10205078125, 8.6484375, 9.19482421875, 9.7412109375, 10.28759765625, 10.833984375, 11.38037109375, 11.9267578125, 12.47314453125, 13.01953125, 13.56591796875, 14.1123046875, 14.65869140625, 15.205078125, 15.75146484375, 16.2978515625, 16.84423828125, 17.390625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 5.0, 7.0, 13.0, 15.0, 23.0, 36.0, 47.0, 67.0, 99.0, 134.0, 189.0, 237.0, 304.0, 406.0, 473.0, 523.0, 392.0, 300.0, 208.0, 140.0, 113.0, 87.0, 68.0, 37.0, 43.0, 28.0, 24.0, 16.0, 11.0, 8.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.796875, -10.46728515625, -10.1376953125, -9.80810546875, -9.478515625, -9.14892578125, -8.8193359375, -8.48974609375, -8.16015625, -7.83056640625, -7.5009765625, -7.17138671875, -6.841796875, -6.51220703125, -6.1826171875, -5.85302734375, -5.5234375, -5.19384765625, -4.8642578125, -4.53466796875, -4.205078125, -3.87548828125, -3.5458984375, -3.21630859375, -2.88671875, -2.55712890625, -2.2275390625, -1.89794921875, -1.568359375, -1.23876953125, -0.9091796875, -0.57958984375, -0.25, 0.07958984375, 0.4091796875, 0.73876953125, 1.068359375, 1.39794921875, 1.7275390625, 2.05712890625, 2.38671875, 2.71630859375, 3.0458984375, 3.37548828125, 3.705078125, 4.03466796875, 4.3642578125, 4.69384765625, 5.0234375, 5.35302734375, 5.6826171875, 6.01220703125, 6.341796875, 6.67138671875, 7.0009765625, 7.33056640625, 7.66015625, 7.98974609375, 8.3193359375, 8.64892578125, 8.978515625, 9.30810546875, 9.6376953125, 9.96728515625, 10.296875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 4.0, 12.0, 14.0, 13.0, 28.0, 24.0, 34.0, 49.0, 63.0, 71.0, 97.0, 113.0, 172.0, 210.0, 278.0, 437.0, 1140.0, 17167.0, 3690034.0, 477878.0, 4369.0, 712.0, 357.0, 243.0, 169.0, 130.0, 110.0, 76.0, 69.0, 37.0, 40.0, 32.0, 29.0, 18.0, 15.0, 9.0, 8.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.96875, -45.537109375, -44.10546875, -42.673828125, -41.2421875, -39.810546875, -38.37890625, -36.947265625, -35.515625, -34.083984375, -32.65234375, -31.220703125, -29.7890625, -28.357421875, -26.92578125, -25.494140625, -24.0625, -22.630859375, -21.19921875, -19.767578125, -18.3359375, -16.904296875, -15.47265625, -14.041015625, -12.609375, -11.177734375, -9.74609375, -8.314453125, -6.8828125, -5.451171875, -4.01953125, -2.587890625, -1.15625, 0.275390625, 1.70703125, 3.138671875, 4.5703125, 6.001953125, 7.43359375, 8.865234375, 10.296875, 11.728515625, 13.16015625, 14.591796875, 16.0234375, 17.455078125, 18.88671875, 20.318359375, 21.75, 23.181640625, 24.61328125, 26.044921875, 27.4765625, 28.908203125, 30.33984375, 31.771484375, 33.203125, 34.634765625, 36.06640625, 37.498046875, 38.9296875, 40.361328125, 41.79296875, 43.224609375, 44.65625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 25.0, 143.0, 448.0, 324.0, 67.0, 10.0, 0.0, 2.0], "bins": [-276.5811767578125, -271.86993408203125, -267.1587219238281, -262.447509765625, -257.73626708984375, -253.02503967285156, -248.31381225585938, -243.6025848388672, -238.891357421875, -234.1801300048828, -229.46890258789062, -224.75767517089844, -220.04644775390625, -215.33522033691406, -210.62399291992188, -205.9127655029297, -201.2015380859375, -196.4903106689453, -191.77908325195312, -187.06785583496094, -182.35662841796875, -177.64540100097656, -172.93417358398438, -168.2229461669922, -163.51171875, -158.8004913330078, -154.08926391601562, -149.37803649902344, -144.66680908203125, -139.95558166503906, -135.24435424804688, -130.5331268310547, -125.82190704345703, -121.11067962646484, -116.39945220947266, -111.68822479248047, -106.97699737548828, -102.2657699584961, -97.5545425415039, -92.84331512451172, -88.13208770751953, -83.42086029052734, -78.70963287353516, -73.99840545654297, -69.28717803955078, -64.5759506225586, -59.864723205566406, -55.15349578857422, -50.44226837158203, -45.731040954589844, -41.019813537597656, -36.30858612060547, -31.59735870361328, -26.886131286621094, -22.174903869628906, -17.46367645263672, -12.752447128295898, -8.041219711303711, -3.3299922943115234, 1.381235122680664, 6.092462539672852, 10.803689956665039, 15.514917373657227, 20.226144790649414, 24.9373722076416]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 5.0, 7.0, 5.0, 6.0, 9.0, 9.0, 9.0, 16.0, 16.0, 23.0, 25.0, 30.0, 27.0, 34.0, 37.0, 41.0, 34.0, 40.0, 47.0, 39.0, 35.0, 51.0, 45.0, 41.0, 49.0, 24.0, 35.0, 31.0, 37.0, 31.0, 27.0, 25.0, 22.0, 23.0, 15.0, 12.0, 13.0, 5.0, 7.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.204925537109375, -32.067684173583984, -30.930438995361328, -29.793197631835938, -28.655954360961914, -27.51871109008789, -26.3814697265625, -25.244226455688477, -24.106983184814453, -22.96973991394043, -21.832496643066406, -20.695255279541016, -19.558012008666992, -18.42076873779297, -17.283527374267578, -16.146284103393555, -15.009040832519531, -13.871797561645508, -12.7345552444458, -11.597312927246094, -10.46006965637207, -9.322826385498047, -8.18558406829834, -7.048341274261475, -5.911098480224609, -4.773855686187744, -3.636612892150879, -2.4993700981140137, -1.3621273040771484, -0.2248845100402832, 0.912358283996582, 2.0496010780334473, 3.1868438720703125, 4.324086666107178, 5.461329460144043, 6.598572254180908, 7.735815048217773, 8.873058319091797, 10.010300636291504, 11.147542953491211, 12.284786224365234, 13.422029495239258, 14.559271812438965, 15.696514129638672, 16.833757400512695, 17.97100067138672, 19.10824203491211, 20.245485305786133, 21.382728576660156, 22.51997184753418, 23.657215118408203, 24.794456481933594, 25.931699752807617, 27.06894302368164, 28.20618438720703, 29.343427658081055, 30.480670928955078, 31.6179141998291, 32.755157470703125, 33.892398834228516, 35.029640197753906, 36.16688537597656, 37.30412673950195, 38.44137191772461, 39.57861328125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 5.0, 9.0, 12.0, 14.0, 8.0, 12.0, 23.0, 20.0, 14.0, 21.0, 25.0, 39.0, 26.0, 47.0, 32.0, 36.0, 30.0, 30.0, 42.0, 34.0, 37.0, 42.0, 36.0, 47.0, 30.0, 32.0, 38.0, 28.0, 33.0, 23.0, 21.0, 23.0, 13.0, 16.0, 19.0, 15.0, 11.0, 11.0, 5.0, 11.0, 6.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.6796875, -5.50750732421875, -5.3353271484375, -5.16314697265625, -4.990966796875, -4.81878662109375, -4.6466064453125, -4.47442626953125, -4.30224609375, -4.13006591796875, -3.9578857421875, -3.78570556640625, -3.613525390625, -3.44134521484375, -3.2691650390625, -3.09698486328125, -2.9248046875, -2.75262451171875, -2.5804443359375, -2.40826416015625, -2.236083984375, -2.06390380859375, -1.8917236328125, -1.71954345703125, -1.54736328125, -1.37518310546875, -1.2030029296875, -1.03082275390625, -0.858642578125, -0.68646240234375, -0.5142822265625, -0.34210205078125, -0.169921875, 0.00225830078125, 0.1744384765625, 0.34661865234375, 0.518798828125, 0.69097900390625, 0.8631591796875, 1.03533935546875, 1.20751953125, 1.37969970703125, 1.5518798828125, 1.72406005859375, 1.896240234375, 2.06842041015625, 2.2406005859375, 2.41278076171875, 2.5849609375, 2.75714111328125, 2.9293212890625, 3.10150146484375, 3.273681640625, 3.44586181640625, 3.6180419921875, 3.79022216796875, 3.96240234375, 4.13458251953125, 4.3067626953125, 4.47894287109375, 4.651123046875, 4.82330322265625, 4.9954833984375, 5.16766357421875, 5.33984375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 13.0, 17.0, 39.0, 41.0, 49.0, 89.0, 97.0, 194.0, 285.0, 390.0, 578.0, 879.0, 1193.0, 1874.0, 2462.0, 3613.0, 5122.0, 7358.0, 10337.0, 15077.0, 21832.0, 33213.0, 50357.0, 78240.0, 125765.0, 181695.0, 173662.0, 115995.0, 73240.0, 46882.0, 30613.0, 20553.0, 14029.0, 9908.0, 6824.0, 4770.0, 3564.0, 2363.0, 1698.0, 1162.0, 813.0, 523.0, 366.0, 253.0, 178.0, 111.0, 67.0, 57.0, 40.0, 29.0, 21.0, 7.0, 9.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.65478515625, -0.6342697143554688, -0.6137542724609375, -0.5932388305664062, -0.572723388671875, -0.5522079467773438, -0.5316925048828125, -0.5111770629882812, -0.49066162109375, -0.47014617919921875, -0.4496307373046875, -0.42911529541015625, -0.408599853515625, -0.38808441162109375, -0.3675689697265625, -0.34705352783203125, -0.3265380859375, -0.30602264404296875, -0.2855072021484375, -0.26499176025390625, -0.244476318359375, -0.22396087646484375, -0.2034454345703125, -0.18292999267578125, -0.16241455078125, -0.14189910888671875, -0.1213836669921875, -0.10086822509765625, -0.080352783203125, -0.05983734130859375, -0.0393218994140625, -0.01880645751953125, 0.001708984375, 0.02222442626953125, 0.0427398681640625, 0.06325531005859375, 0.083770751953125, 0.10428619384765625, 0.1248016357421875, 0.14531707763671875, 0.16583251953125, 0.18634796142578125, 0.2068634033203125, 0.22737884521484375, 0.247894287109375, 0.26840972900390625, 0.2889251708984375, 0.30944061279296875, 0.3299560546875, 0.35047149658203125, 0.3709869384765625, 0.39150238037109375, 0.412017822265625, 0.43253326416015625, 0.4530487060546875, 0.47356414794921875, 0.49407958984375, 0.5145950317382812, 0.5351104736328125, 0.5556259155273438, 0.576141357421875, 0.5966567993164062, 0.6171722412109375, 0.6376876831054688, 0.658203125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 11.0, 5.0, 13.0, 12.0, 12.0, 11.0, 23.0, 15.0, 22.0, 27.0, 19.0, 29.0, 43.0, 46.0, 40.0, 36.0, 35.0, 46.0, 41.0, 1061.0, 42.0, 40.0, 33.0, 44.0, 37.0, 38.0, 33.0, 36.0, 23.0, 20.0, 26.0, 18.0, 12.0, 15.0, 12.0, 9.0, 10.0, 5.0, 8.0, 6.0, 2.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.09375, -3.970977783203125, -3.84820556640625, -3.725433349609375, -3.6026611328125, -3.479888916015625, -3.35711669921875, -3.234344482421875, -3.111572265625, -2.988800048828125, -2.86602783203125, -2.743255615234375, -2.6204833984375, -2.497711181640625, -2.37493896484375, -2.252166748046875, -2.12939453125, -2.006622314453125, -1.88385009765625, -1.761077880859375, -1.6383056640625, -1.515533447265625, -1.39276123046875, -1.269989013671875, -1.147216796875, -1.024444580078125, -0.90167236328125, -0.778900146484375, -0.6561279296875, -0.533355712890625, -0.41058349609375, -0.287811279296875, -0.1650390625, -0.042266845703125, 0.08050537109375, 0.203277587890625, 0.3260498046875, 0.448822021484375, 0.57159423828125, 0.694366455078125, 0.817138671875, 0.939910888671875, 1.06268310546875, 1.185455322265625, 1.3082275390625, 1.430999755859375, 1.55377197265625, 1.676544189453125, 1.79931640625, 1.922088623046875, 2.04486083984375, 2.167633056640625, 2.2904052734375, 2.413177490234375, 2.53594970703125, 2.658721923828125, 2.781494140625, 2.904266357421875, 3.02703857421875, 3.149810791015625, 3.2725830078125, 3.395355224609375, 3.51812744140625, 3.640899658203125, 3.763671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 12.0, 3.0, 13.0, 14.0, 25.0, 35.0, 50.0, 90.0, 139.0, 243.0, 393.0, 673.0, 1019.0, 1683.0, 2877.0, 4872.0, 8283.0, 14103.0, 24256.0, 43485.0, 78151.0, 146047.0, 1281594.0, 212865.0, 122995.0, 65772.0, 36871.0, 20979.0, 12051.0, 7149.0, 4118.0, 2398.0, 1483.0, 871.0, 563.0, 337.0, 229.0, 131.0, 81.0, 51.0, 54.0, 24.0, 16.0, 8.0, 8.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7685546875, -0.7458572387695312, -0.7231597900390625, -0.7004623413085938, -0.677764892578125, -0.6550674438476562, -0.6323699951171875, -0.6096725463867188, -0.58697509765625, -0.5642776489257812, -0.5415802001953125, -0.5188827514648438, -0.496185302734375, -0.47348785400390625, -0.4507904052734375, -0.42809295654296875, -0.4053955078125, -0.38269805908203125, -0.3600006103515625, -0.33730316162109375, -0.314605712890625, -0.29190826416015625, -0.2692108154296875, -0.24651336669921875, -0.22381591796875, -0.20111846923828125, -0.1784210205078125, -0.15572357177734375, -0.133026123046875, -0.11032867431640625, -0.0876312255859375, -0.06493377685546875, -0.042236328125, -0.01953887939453125, 0.0031585693359375, 0.02585601806640625, 0.048553466796875, 0.07125091552734375, 0.0939483642578125, 0.11664581298828125, 0.13934326171875, 0.16204071044921875, 0.1847381591796875, 0.20743560791015625, 0.230133056640625, 0.25283050537109375, 0.2755279541015625, 0.29822540283203125, 0.3209228515625, 0.34362030029296875, 0.3663177490234375, 0.38901519775390625, 0.411712646484375, 0.43441009521484375, 0.4571075439453125, 0.47980499267578125, 0.50250244140625, 0.5251998901367188, 0.5478973388671875, 0.5705947875976562, 0.593292236328125, 0.6159896850585938, 0.6386871337890625, 0.6613845825195312, 0.68408203125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 0.0, 4.0, 1.0, 4.0, 1.0, 8.0, 4.0, 14.0, 8.0, 14.0, 10.0, 16.0, 23.0, 25.0, 32.0, 37.0, 42.0, 37.0, 48.0, 55.0, 52.0, 59.0, 39.0, 69.0, 59.0, 46.0, 37.0, 31.0, 41.0, 37.0, 34.0, 20.0, 15.0, 12.0, 11.0, 8.0, 9.0, 8.0, 8.0, 7.0, 2.0, 4.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019006729125976562, -0.0018430203199386597, -0.001785367727279663, -0.0017277151346206665, -0.00167006254196167, -0.0016124099493026733, -0.0015547573566436768, -0.0014971047639846802, -0.0014394521713256836, -0.001381799578666687, -0.0013241469860076904, -0.0012664943933486938, -0.0012088418006896973, -0.0011511892080307007, -0.001093536615371704, -0.0010358840227127075, -0.000978231430053711, -0.0009205788373947144, -0.0008629262447357178, -0.0008052736520767212, -0.0007476210594177246, -0.000689968466758728, -0.0006323158740997314, -0.0005746632814407349, -0.0005170106887817383, -0.0004593580961227417, -0.0004017055034637451, -0.00034405291080474854, -0.00028640031814575195, -0.00022874772548675537, -0.0001710951328277588, -0.00011344254016876221, -5.5789947509765625e-05, 1.862645149230957e-06, 5.951523780822754e-05, 0.00011716783046722412, 0.0001748204231262207, 0.00023247301578521729, 0.00029012560844421387, 0.00034777820110321045, 0.00040543079376220703, 0.0004630833864212036, 0.0005207359790802002, 0.0005783885717391968, 0.0006360411643981934, 0.0006936937570571899, 0.0007513463497161865, 0.0008089989423751831, 0.0008666515350341797, 0.0009243041276931763, 0.0009819567203521729, 0.0010396093130111694, 0.001097261905670166, 0.0011549144983291626, 0.0012125670909881592, 0.0012702196836471558, 0.0013278722763061523, 0.001385524868965149, 0.0014431774616241455, 0.001500830054283142, 0.0015584826469421387, 0.0016161352396011353, 0.0016737878322601318, 0.0017314404249191284, 0.001789093017578125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 9.0, 8.0, 8.0, 14.0, 13.0, 18.0, 26.0, 31.0, 33.0, 43.0, 56.0, 69.0, 98.0, 131.0, 213.0, 368.0, 980.0, 49957.0, 990377.0, 4551.0, 605.0, 279.0, 156.0, 135.0, 77.0, 53.0, 43.0, 35.0, 30.0, 40.0, 15.0, 19.0, 12.0, 11.0, 7.0, 6.0, 8.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.04083251953125, -0.03952789306640625, -0.0382232666015625, -0.03691864013671875, -0.035614013671875, -0.03430938720703125, -0.0330047607421875, -0.03170013427734375, -0.0303955078125, -0.02909088134765625, -0.0277862548828125, -0.02648162841796875, -0.025177001953125, -0.02387237548828125, -0.0225677490234375, -0.02126312255859375, -0.01995849609375, -0.01865386962890625, -0.0173492431640625, -0.01604461669921875, -0.014739990234375, -0.01343536376953125, -0.0121307373046875, -0.01082611083984375, -0.009521484375, -0.00821685791015625, -0.0069122314453125, -0.00560760498046875, -0.004302978515625, -0.00299835205078125, -0.0016937255859375, -0.00038909912109375, 0.00091552734375, 0.00222015380859375, 0.0035247802734375, 0.00482940673828125, 0.006134033203125, 0.00743865966796875, 0.0087432861328125, 0.01004791259765625, 0.0113525390625, 0.01265716552734375, 0.0139617919921875, 0.01526641845703125, 0.016571044921875, 0.01787567138671875, 0.0191802978515625, 0.02048492431640625, 0.02178955078125, 0.02309417724609375, 0.0243988037109375, 0.02570343017578125, 0.027008056640625, 0.02831268310546875, 0.0296173095703125, 0.03092193603515625, 0.0322265625, 0.03353118896484375, 0.0348358154296875, 0.03614044189453125, 0.037445068359375, 0.03874969482421875, 0.0400543212890625, 0.04135894775390625, 0.04266357421875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 24.0, 943.0, 48.0, 1.0, 0.0, 1.0], "bins": [-0.036522723734378815, -0.035909418016672134, -0.035296108573675156, -0.034682802855968475, -0.0340694934129715, -0.033456187695264816, -0.032842881977558136, -0.03222957253456116, -0.03161626681685448, -0.031002959236502647, -0.030389651656150818, -0.029776345938444138, -0.029163038358092308, -0.02854973077774048, -0.027936425060033798, -0.02732311747968197, -0.02670980989933014, -0.02609650231897831, -0.02548319473862648, -0.0248698890209198, -0.02425658144056797, -0.02364327386021614, -0.02302996814250946, -0.02241666056215763, -0.0218033529818058, -0.021190045401453972, -0.020576737821102142, -0.019963432103395462, -0.019350124523043633, -0.018736816942691803, -0.018123511224985123, -0.017510203644633293, -0.016896894201636314, -0.016283586621284485, -0.015670280903577805, -0.015056973323225975, -0.014443665742874146, -0.013830358162522316, -0.013217051513493061, -0.012603744864463806, -0.011990437284111977, -0.011377129703760147, -0.010763823054730892, -0.010150516405701637, -0.009537208825349808, -0.008923901244997978, -0.008310594595968723, -0.007697287481278181, -0.007083980366587639, -0.006470673251897097, -0.005857366137206554, -0.005244059022516012, -0.00463075190782547, -0.004017444793134928, -0.0034041376784443855, -0.0027908305637538433, -0.002177523449063301, -0.0015642163343727589, -0.0009509092196822166, -0.0003376021049916744, 0.0002757050096988678, 0.00088901212438941, 0.0015023192390799522, 0.0021156263537704945, 0.0027289334684610367]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 12.0, 15.0, 26.0, 29.0, 32.0, 43.0, 53.0, 65.0, 54.0, 64.0, 70.0, 62.0, 70.0, 69.0, 54.0, 49.0, 55.0, 37.0, 25.0, 25.0, 30.0, 24.0, 8.0, 7.0, 11.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011633038520812988, -0.0011096522212028503, -0.0010560005903244019, -0.0010023489594459534, -0.0009486973285675049, -0.0008950456976890564, -0.0008413940668106079, -0.0007877424359321594, -0.0007340908050537109, -0.0006804391741752625, -0.000626787543296814, -0.0005731359124183655, -0.000519484281539917, -0.0004658326506614685, -0.00041218101978302, -0.00035852938890457153, -0.00030487775802612305, -0.00025122612714767456, -0.00019757449626922607, -0.0001439228653907776, -9.02712345123291e-05, -3.6619603633880615e-05, 1.703202724456787e-05, 7.068365812301636e-05, 0.00012433528900146484, 0.00017798691987991333, 0.00023163855075836182, 0.0002852901816368103, 0.0003389418125152588, 0.0003925934433937073, 0.00044624507427215576, 0.0004998967051506042, 0.0005535483360290527, 0.0006071999669075012, 0.0006608515977859497, 0.0007145032286643982, 0.0007681548595428467, 0.0008218064904212952, 0.0008754581212997437, 0.0009291097521781921, 0.0009827613830566406, 0.0010364130139350891, 0.0010900646448135376, 0.001143716275691986, 0.0011973679065704346, 0.001251019537448883, 0.0013046711683273315, 0.00135832279920578, 0.0014119744300842285, 0.001465626060962677, 0.0015192776918411255, 0.001572929322719574, 0.0016265809535980225, 0.001680232584476471, 0.0017338842153549194, 0.001787535846233368, 0.0018411874771118164, 0.001894839107990265, 0.0019484907388687134, 0.002002142369747162, 0.0020557940006256104, 0.002109445631504059, 0.0021630972623825073, 0.002216748893260956, 0.0022704005241394043]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 5.0, 9.0, 12.0, 14.0, 8.0, 12.0, 23.0, 20.0, 14.0, 21.0, 25.0, 39.0, 26.0, 47.0, 32.0, 36.0, 30.0, 30.0, 42.0, 34.0, 37.0, 42.0, 36.0, 47.0, 30.0, 32.0, 38.0, 28.0, 33.0, 24.0, 20.0, 23.0, 13.0, 16.0, 19.0, 15.0, 11.0, 11.0, 5.0, 11.0, 6.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.6796875, -5.50750732421875, -5.3353271484375, -5.16314697265625, -4.990966796875, -4.81878662109375, -4.6466064453125, -4.47442626953125, -4.30224609375, -4.13006591796875, -3.9578857421875, -3.78570556640625, -3.613525390625, -3.44134521484375, -3.2691650390625, -3.09698486328125, -2.9248046875, -2.75262451171875, -2.5804443359375, -2.40826416015625, -2.236083984375, -2.06390380859375, -1.8917236328125, -1.71954345703125, -1.54736328125, -1.37518310546875, -1.2030029296875, -1.03082275390625, -0.858642578125, -0.68646240234375, -0.5142822265625, -0.34210205078125, -0.169921875, 0.00225830078125, 0.1744384765625, 0.34661865234375, 0.518798828125, 0.69097900390625, 0.8631591796875, 1.03533935546875, 1.20751953125, 1.37969970703125, 1.5518798828125, 1.72406005859375, 1.896240234375, 2.06842041015625, 2.2406005859375, 2.41278076171875, 2.5849609375, 2.75714111328125, 2.9293212890625, 3.10150146484375, 3.273681640625, 3.44586181640625, 3.6180419921875, 3.79022216796875, 3.96240234375, 4.13458251953125, 4.3067626953125, 4.47894287109375, 4.651123046875, 4.82330322265625, 4.9954833984375, 5.16766357421875, 5.33984375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 8.0, 4.0, 4.0, 10.0, 16.0, 17.0, 18.0, 18.0, 21.0, 40.0, 39.0, 54.0, 81.0, 115.0, 140.0, 201.0, 311.0, 513.0, 1314.0, 5655.0, 30810.0, 254706.0, 667732.0, 70710.0, 11662.0, 2338.0, 727.0, 382.0, 239.0, 157.0, 131.0, 89.0, 53.0, 46.0, 43.0, 28.0, 26.0, 23.0, 18.0, 12.0, 9.0, 8.0, 7.0, 4.0, 3.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.2890625, -10.94921875, -10.609375, -10.26953125, -9.9296875, -9.58984375, -9.25, -8.91015625, -8.5703125, -8.23046875, -7.890625, -7.55078125, -7.2109375, -6.87109375, -6.53125, -6.19140625, -5.8515625, -5.51171875, -5.171875, -4.83203125, -4.4921875, -4.15234375, -3.8125, -3.47265625, -3.1328125, -2.79296875, -2.453125, -2.11328125, -1.7734375, -1.43359375, -1.09375, -0.75390625, -0.4140625, -0.07421875, 0.265625, 0.60546875, 0.9453125, 1.28515625, 1.625, 1.96484375, 2.3046875, 2.64453125, 2.984375, 3.32421875, 3.6640625, 4.00390625, 4.34375, 4.68359375, 5.0234375, 5.36328125, 5.703125, 6.04296875, 6.3828125, 6.72265625, 7.0625, 7.40234375, 7.7421875, 8.08203125, 8.421875, 8.76171875, 9.1015625, 9.44140625, 9.78125, 10.12109375, 10.4609375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 6.0, 8.0, 7.0, 8.0, 7.0, 8.0, 14.0, 11.0, 16.0, 19.0, 23.0, 20.0, 14.0, 43.0, 28.0, 47.0, 43.0, 43.0, 56.0, 53.0, 198.0, 1722.0, 206.0, 62.0, 48.0, 49.0, 29.0, 41.0, 24.0, 33.0, 29.0, 22.0, 19.0, 23.0, 16.0, 20.0, 10.0, 6.0, 4.0, 4.0, 9.0, 2.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.890625, -19.278564453125, -18.66650390625, -18.054443359375, -17.4423828125, -16.830322265625, -16.21826171875, -15.606201171875, -14.994140625, -14.382080078125, -13.77001953125, -13.157958984375, -12.5458984375, -11.933837890625, -11.32177734375, -10.709716796875, -10.09765625, -9.485595703125, -8.87353515625, -8.261474609375, -7.6494140625, -7.037353515625, -6.42529296875, -5.813232421875, -5.201171875, -4.589111328125, -3.97705078125, -3.364990234375, -2.7529296875, -2.140869140625, -1.52880859375, -0.916748046875, -0.3046875, 0.307373046875, 0.91943359375, 1.531494140625, 2.1435546875, 2.755615234375, 3.36767578125, 3.979736328125, 4.591796875, 5.203857421875, 5.81591796875, 6.427978515625, 7.0400390625, 7.652099609375, 8.26416015625, 8.876220703125, 9.48828125, 10.100341796875, 10.71240234375, 11.324462890625, 11.9365234375, 12.548583984375, 13.16064453125, 13.772705078125, 14.384765625, 14.996826171875, 15.60888671875, 16.220947265625, 16.8330078125, 17.445068359375, 18.05712890625, 18.669189453125, 19.28125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 5.0, 5.0, 5.0, 11.0, 17.0, 22.0, 25.0, 29.0, 25.0, 43.0, 52.0, 50.0, 60.0, 121.0, 205.0, 406.0, 1088.0, 28455.0, 3104010.0, 9225.0, 816.0, 351.0, 176.0, 113.0, 91.0, 55.0, 42.0, 33.0, 29.0, 33.0, 18.0, 16.0, 14.0, 11.0, 8.0, 10.0, 5.0, 6.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.5, -43.08251953125, -41.6650390625, -40.24755859375, -38.830078125, -37.41259765625, -35.9951171875, -34.57763671875, -33.16015625, -31.74267578125, -30.3251953125, -28.90771484375, -27.490234375, -26.07275390625, -24.6552734375, -23.23779296875, -21.8203125, -20.40283203125, -18.9853515625, -17.56787109375, -16.150390625, -14.73291015625, -13.3154296875, -11.89794921875, -10.48046875, -9.06298828125, -7.6455078125, -6.22802734375, -4.810546875, -3.39306640625, -1.9755859375, -0.55810546875, 0.859375, 2.27685546875, 3.6943359375, 5.11181640625, 6.529296875, 7.94677734375, 9.3642578125, 10.78173828125, 12.19921875, 13.61669921875, 15.0341796875, 16.45166015625, 17.869140625, 19.28662109375, 20.7041015625, 22.12158203125, 23.5390625, 24.95654296875, 26.3740234375, 27.79150390625, 29.208984375, 30.62646484375, 32.0439453125, 33.46142578125, 34.87890625, 36.29638671875, 37.7138671875, 39.13134765625, 40.548828125, 41.96630859375, 43.3837890625, 44.80126953125, 46.21875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 164.0, 781.0, 69.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.91584014892578, -17.040651321411133, -13.1654634475708, -9.290275573730469, -5.41508674621582, -1.5398979187011719, 2.3352890014648438, 6.210477828979492, 10.08566665649414, 13.960855484008789, 17.836044311523438, 21.711231231689453, 25.5864200592041, 29.46160888671875, 33.336795806884766, 37.21198272705078, 41.08717346191406, 44.96236038208008, 48.83755111694336, 52.712738037109375, 56.587928771972656, 60.46311569213867, 64.33830261230469, 68.21349334716797, 72.08868408203125, 75.96387481689453, 79.83905792236328, 83.71424865722656, 87.58943939208984, 91.46463012695312, 95.33981323242188, 99.21500396728516, 103.09017944335938, 106.96537017822266, 110.8405532836914, 114.71574401855469, 118.59093475341797, 122.46612548828125, 126.34130859375, 130.21649169921875, 134.09169006347656, 137.9668731689453, 141.84207153320312, 145.71725463867188, 149.59243774414062, 153.46763610839844, 157.3428192138672, 161.21800231933594, 165.09320068359375, 168.9683837890625, 172.8435821533203, 176.71876525878906, 180.5939483642578, 184.46914672851562, 188.34432983398438, 192.21951293945312, 196.09469604492188, 199.96987915039062, 203.84507751464844, 207.7202606201172, 211.59544372558594, 215.47064208984375, 219.3458251953125, 223.22100830078125, 227.09620666503906]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 6.0, 7.0, 9.0, 13.0, 9.0, 12.0, 11.0, 12.0, 18.0, 22.0, 33.0, 40.0, 35.0, 45.0, 37.0, 38.0, 48.0, 46.0, 38.0, 50.0, 39.0, 48.0, 32.0, 34.0, 37.0, 32.0, 38.0, 36.0, 32.0, 24.0, 21.0, 16.0, 13.0, 17.0, 14.0, 7.0, 5.0, 4.0, 4.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-55.597747802734375, -54.0280876159668, -52.45842742919922, -50.88876724243164, -49.31910705566406, -47.749446868896484, -46.179786682128906, -44.61012649536133, -43.04046630859375, -41.47080612182617, -39.901145935058594, -38.331485748291016, -36.76182556152344, -35.19216537475586, -33.62250518798828, -32.0528450012207, -30.483186721801758, -28.91352653503418, -27.3438663482666, -25.774206161499023, -24.204545974731445, -22.634885787963867, -21.065227508544922, -19.495567321777344, -17.925907135009766, -16.356246948242188, -14.78658676147461, -13.216926574707031, -11.647266387939453, -10.077606201171875, -8.507946968078613, -6.938286781311035, -5.368625640869141, -3.7989654541015625, -2.2293055057525635, -0.6596455574035645, 0.9100146293640137, 2.479674816131592, 4.049334526062012, 5.61899471282959, 7.188654899597168, 8.758315086364746, 10.327975273132324, 11.897634506225586, 13.467294692993164, 15.036954879760742, 16.60661506652832, 18.1762752532959, 19.745935440063477, 21.315595626831055, 22.885255813598633, 24.45491600036621, 26.02457618713379, 27.594236373901367, 29.163894653320312, 30.73355484008789, 32.30321502685547, 33.87287521362305, 35.442535400390625, 37.0121955871582, 38.58185577392578, 40.15151596069336, 41.72117614746094, 43.290836334228516, 44.860496520996094]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 8.0, 14.0, 6.0, 9.0, 9.0, 14.0, 15.0, 18.0, 18.0, 18.0, 24.0, 34.0, 34.0, 29.0, 37.0, 36.0, 40.0, 41.0, 31.0, 42.0, 27.0, 39.0, 42.0, 44.0, 37.0, 29.0, 31.0, 31.0, 33.0, 36.0, 31.0, 19.0, 17.0, 9.0, 20.0, 16.0, 6.0, 10.0, 8.0, 10.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.62109375, -5.44287109375, -5.2646484375, -5.08642578125, -4.908203125, -4.72998046875, -4.5517578125, -4.37353515625, -4.1953125, -4.01708984375, -3.8388671875, -3.66064453125, -3.482421875, -3.30419921875, -3.1259765625, -2.94775390625, -2.76953125, -2.59130859375, -2.4130859375, -2.23486328125, -2.056640625, -1.87841796875, -1.7001953125, -1.52197265625, -1.34375, -1.16552734375, -0.9873046875, -0.80908203125, -0.630859375, -0.45263671875, -0.2744140625, -0.09619140625, 0.08203125, 0.26025390625, 0.4384765625, 0.61669921875, 0.794921875, 0.97314453125, 1.1513671875, 1.32958984375, 1.5078125, 1.68603515625, 1.8642578125, 2.04248046875, 2.220703125, 2.39892578125, 2.5771484375, 2.75537109375, 2.93359375, 3.11181640625, 3.2900390625, 3.46826171875, 3.646484375, 3.82470703125, 4.0029296875, 4.18115234375, 4.359375, 4.53759765625, 4.7158203125, 4.89404296875, 5.072265625, 5.25048828125, 5.4287109375, 5.60693359375, 5.78515625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 11.0, 9.0, 9.0, 7.0, 16.0, 13.0, 18.0, 29.0, 32.0, 42.0, 54.0, 97.0, 170.0, 331.0, 748.0, 2147.0, 8288.0, 54691.0, 830426.0, 2865569.0, 392151.0, 30708.0, 5633.0, 1689.0, 607.0, 278.0, 153.0, 92.0, 47.0, 56.0, 25.0, 24.0, 23.0, 16.0, 12.0, 7.0, 10.0, 9.0, 4.0, 3.0, 2.0, 7.0, 8.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-15.0859375, -14.619873046875, -14.15380859375, -13.687744140625, -13.2216796875, -12.755615234375, -12.28955078125, -11.823486328125, -11.357421875, -10.891357421875, -10.42529296875, -9.959228515625, -9.4931640625, -9.027099609375, -8.56103515625, -8.094970703125, -7.62890625, -7.162841796875, -6.69677734375, -6.230712890625, -5.7646484375, -5.298583984375, -4.83251953125, -4.366455078125, -3.900390625, -3.434326171875, -2.96826171875, -2.502197265625, -2.0361328125, -1.570068359375, -1.10400390625, -0.637939453125, -0.171875, 0.294189453125, 0.76025390625, 1.226318359375, 1.6923828125, 2.158447265625, 2.62451171875, 3.090576171875, 3.556640625, 4.022705078125, 4.48876953125, 4.954833984375, 5.4208984375, 5.886962890625, 6.35302734375, 6.819091796875, 7.28515625, 7.751220703125, 8.21728515625, 8.683349609375, 9.1494140625, 9.615478515625, 10.08154296875, 10.547607421875, 11.013671875, 11.479736328125, 11.94580078125, 12.411865234375, 12.8779296875, 13.343994140625, 13.81005859375, 14.276123046875, 14.7421875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 6.0, 6.0, 11.0, 14.0, 14.0, 30.0, 23.0, 36.0, 44.0, 60.0, 81.0, 119.0, 138.0, 207.0, 263.0, 304.0, 421.0, 434.0, 408.0, 343.0, 292.0, 199.0, 146.0, 101.0, 92.0, 77.0, 51.0, 41.0, 27.0, 15.0, 13.0, 13.0, 11.0, 8.0, 5.0, 6.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.84375, -9.551025390625, -9.25830078125, -8.965576171875, -8.6728515625, -8.380126953125, -8.08740234375, -7.794677734375, -7.501953125, -7.209228515625, -6.91650390625, -6.623779296875, -6.3310546875, -6.038330078125, -5.74560546875, -5.452880859375, -5.16015625, -4.867431640625, -4.57470703125, -4.281982421875, -3.9892578125, -3.696533203125, -3.40380859375, -3.111083984375, -2.818359375, -2.525634765625, -2.23291015625, -1.940185546875, -1.6474609375, -1.354736328125, -1.06201171875, -0.769287109375, -0.4765625, -0.183837890625, 0.10888671875, 0.401611328125, 0.6943359375, 0.987060546875, 1.27978515625, 1.572509765625, 1.865234375, 2.157958984375, 2.45068359375, 2.743408203125, 3.0361328125, 3.328857421875, 3.62158203125, 3.914306640625, 4.20703125, 4.499755859375, 4.79248046875, 5.085205078125, 5.3779296875, 5.670654296875, 5.96337890625, 6.256103515625, 6.548828125, 6.841552734375, 7.13427734375, 7.427001953125, 7.7197265625, 8.012451171875, 8.30517578125, 8.597900390625, 8.890625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 9.0, 3.0, 3.0, 8.0, 11.0, 15.0, 21.0, 26.0, 48.0, 63.0, 88.0, 98.0, 144.0, 206.0, 352.0, 732.0, 4715.0, 432507.0, 3735104.0, 17516.0, 1290.0, 471.0, 261.0, 170.0, 106.0, 89.0, 60.0, 57.0, 31.0, 29.0, 15.0, 13.0, 4.0, 6.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.28125, -41.798828125, -40.31640625, -38.833984375, -37.3515625, -35.869140625, -34.38671875, -32.904296875, -31.421875, -29.939453125, -28.45703125, -26.974609375, -25.4921875, -24.009765625, -22.52734375, -21.044921875, -19.5625, -18.080078125, -16.59765625, -15.115234375, -13.6328125, -12.150390625, -10.66796875, -9.185546875, -7.703125, -6.220703125, -4.73828125, -3.255859375, -1.7734375, -0.291015625, 1.19140625, 2.673828125, 4.15625, 5.638671875, 7.12109375, 8.603515625, 10.0859375, 11.568359375, 13.05078125, 14.533203125, 16.015625, 17.498046875, 18.98046875, 20.462890625, 21.9453125, 23.427734375, 24.91015625, 26.392578125, 27.875, 29.357421875, 30.83984375, 32.322265625, 33.8046875, 35.287109375, 36.76953125, 38.251953125, 39.734375, 41.216796875, 42.69921875, 44.181640625, 45.6640625, 47.146484375, 48.62890625, 50.111328125, 51.59375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 13.0, 39.0, 76.0, 136.0, 173.0, 203.0, 139.0, 110.0, 59.0, 36.0, 12.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.45834350585938, -71.72279357910156, -69.98724365234375, -68.2516860961914, -66.5161361694336, -64.78058624267578, -63.0450325012207, -61.30948257446289, -59.57392883300781, -57.83837890625, -56.10282516479492, -54.36727523803711, -52.63172149658203, -50.89617156982422, -49.16061782836914, -47.42506790161133, -45.68951416015625, -43.95396423339844, -42.21841049194336, -40.48286056518555, -38.74730682373047, -37.011756896972656, -35.27620315551758, -33.540653228759766, -31.805103302001953, -30.069551467895508, -28.333999633789062, -26.598447799682617, -24.862895965576172, -23.12734603881836, -21.39179229736328, -19.65624237060547, -17.92068862915039, -16.185136795043945, -14.4495849609375, -12.714033126831055, -10.97848129272461, -9.24293041229248, -7.507378578186035, -5.77182674407959, -4.0362749099731445, -2.300723075866699, -0.565171480178833, 1.1703801155090332, 2.9059319496154785, 4.641483306884766, 6.377035140991211, 8.112586975097656, 9.848138809204102, 11.583690643310547, 13.319242477416992, 15.054794311523438, 16.790346145629883, 18.525897979736328, 20.26144790649414, 21.99700164794922, 23.73255157470703, 25.468103408813477, 27.203655242919922, 28.939207077026367, 30.674758911132812, 32.410308837890625, 34.1458625793457, 35.881412506103516, 37.616966247558594]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 2.0, 7.0, 12.0, 11.0, 11.0, 15.0, 14.0, 20.0, 20.0, 20.0, 27.0, 36.0, 29.0, 34.0, 35.0, 35.0, 40.0, 44.0, 49.0, 49.0, 43.0, 44.0, 42.0, 44.0, 39.0, 37.0, 34.0, 11.0, 27.0, 27.0, 25.0, 22.0, 14.0, 22.0, 19.0, 11.0, 7.0, 1.0, 5.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.78478240966797, -26.771011352539062, -25.75724220275879, -24.743471145629883, -23.72970199584961, -22.715930938720703, -21.702159881591797, -20.688390731811523, -19.67462158203125, -18.660850524902344, -17.64708137512207, -16.633310317993164, -15.61954116821289, -14.605770111083984, -13.592000007629395, -12.578229904174805, -11.564458847045898, -10.550688743591309, -9.536918640136719, -8.523147583007812, -7.509377956390381, -6.495607852935791, -5.481837272644043, -4.468067169189453, -3.4542970657348633, -2.4405269622802734, -1.4267566204071045, -0.41298627853393555, 0.6007838249206543, 1.6145539283752441, 2.628324508666992, 3.642094612121582, 4.655864715576172, 5.669634819030762, 6.683404922485352, 7.6971755027771, 8.710945129394531, 9.724716186523438, 10.738486289978027, 11.752256393432617, 12.766026496887207, 13.779796600341797, 14.793566703796387, 15.807336807250977, 16.821107864379883, 17.834877014160156, 18.848648071289062, 19.86241912841797, 20.876188278198242, 21.88995933532715, 22.903728485107422, 23.917499542236328, 24.9312686920166, 25.945039749145508, 26.95880889892578, 27.972579956054688, 28.986351013183594, 30.0001220703125, 31.013891220092773, 32.02766036987305, 33.04143142700195, 34.05520248413086, 35.068973541259766, 36.082740783691406, 37.09651184082031]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 7.0, 5.0, 4.0, 9.0, 11.0, 13.0, 11.0, 23.0, 15.0, 20.0, 20.0, 22.0, 21.0, 40.0, 40.0, 40.0, 35.0, 42.0, 39.0, 43.0, 32.0, 32.0, 43.0, 36.0, 32.0, 52.0, 34.0, 35.0, 43.0, 26.0, 29.0, 20.0, 15.0, 19.0, 14.0, 16.0, 11.0, 11.0, 11.0, 10.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.1328125, -5.9410400390625, -5.749267578125, -5.5574951171875, -5.36572265625, -5.1739501953125, -4.982177734375, -4.7904052734375, -4.5986328125, -4.4068603515625, -4.215087890625, -4.0233154296875, -3.83154296875, -3.6397705078125, -3.447998046875, -3.2562255859375, -3.064453125, -2.8726806640625, -2.680908203125, -2.4891357421875, -2.29736328125, -2.1055908203125, -1.913818359375, -1.7220458984375, -1.5302734375, -1.3385009765625, -1.146728515625, -0.9549560546875, -0.76318359375, -0.5714111328125, -0.379638671875, -0.1878662109375, 0.00390625, 0.1956787109375, 0.387451171875, 0.5792236328125, 0.77099609375, 0.9627685546875, 1.154541015625, 1.3463134765625, 1.5380859375, 1.7298583984375, 1.921630859375, 2.1134033203125, 2.30517578125, 2.4969482421875, 2.688720703125, 2.8804931640625, 3.072265625, 3.2640380859375, 3.455810546875, 3.6475830078125, 3.83935546875, 4.0311279296875, 4.222900390625, 4.4146728515625, 4.6064453125, 4.7982177734375, 4.989990234375, 5.1817626953125, 5.37353515625, 5.5653076171875, 5.757080078125, 5.9488525390625, 6.140625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 5.0, 11.0, 6.0, 21.0, 23.0, 34.0, 56.0, 89.0, 99.0, 148.0, 196.0, 316.0, 455.0, 622.0, 946.0, 1322.0, 1878.0, 2712.0, 4100.0, 5902.0, 9062.0, 13616.0, 21094.0, 33239.0, 53658.0, 88902.0, 143349.0, 196758.0, 172948.0, 111615.0, 67700.0, 41399.0, 25999.0, 16603.0, 10907.0, 7288.0, 4797.0, 3336.0, 2238.0, 1559.0, 1046.0, 789.0, 506.0, 356.0, 275.0, 189.0, 113.0, 100.0, 53.0, 43.0, 36.0, 19.0, 14.0, 6.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.72509765625, -0.7022476196289062, -0.6793975830078125, -0.6565475463867188, -0.633697509765625, -0.6108474731445312, -0.5879974365234375, -0.5651473999023438, -0.54229736328125, -0.5194473266601562, -0.4965972900390625, -0.47374725341796875, -0.450897216796875, -0.42804718017578125, -0.4051971435546875, -0.38234710693359375, -0.3594970703125, -0.33664703369140625, -0.3137969970703125, -0.29094696044921875, -0.268096923828125, -0.24524688720703125, -0.2223968505859375, -0.19954681396484375, -0.17669677734375, -0.15384674072265625, -0.1309967041015625, -0.10814666748046875, -0.085296630859375, -0.06244659423828125, -0.0395965576171875, -0.01674652099609375, 0.006103515625, 0.02895355224609375, 0.0518035888671875, 0.07465362548828125, 0.097503662109375, 0.12035369873046875, 0.1432037353515625, 0.16605377197265625, 0.18890380859375, 0.21175384521484375, 0.2346038818359375, 0.25745391845703125, 0.280303955078125, 0.30315399169921875, 0.3260040283203125, 0.34885406494140625, 0.3717041015625, 0.39455413818359375, 0.4174041748046875, 0.44025421142578125, 0.463104248046875, 0.48595428466796875, 0.5088043212890625, 0.5316543579101562, 0.55450439453125, 0.5773544311523438, 0.6002044677734375, 0.6230545043945312, 0.645904541015625, 0.6687545776367188, 0.6916046142578125, 0.7144546508789062, 0.7373046875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 9.0, 5.0, 8.0, 11.0, 9.0, 13.0, 12.0, 15.0, 16.0, 19.0, 22.0, 29.0, 41.0, 40.0, 37.0, 44.0, 40.0, 50.0, 35.0, 45.0, 1075.0, 36.0, 41.0, 37.0, 31.0, 44.0, 29.0, 31.0, 32.0, 28.0, 18.0, 23.0, 20.0, 14.0, 5.0, 8.0, 8.0, 12.0, 10.0, 4.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44140625, -3.3153076171875, -3.189208984375, -3.0631103515625, -2.93701171875, -2.8109130859375, -2.684814453125, -2.5587158203125, -2.4326171875, -2.3065185546875, -2.180419921875, -2.0543212890625, -1.92822265625, -1.8021240234375, -1.676025390625, -1.5499267578125, -1.423828125, -1.2977294921875, -1.171630859375, -1.0455322265625, -0.91943359375, -0.7933349609375, -0.667236328125, -0.5411376953125, -0.4150390625, -0.2889404296875, -0.162841796875, -0.0367431640625, 0.08935546875, 0.2154541015625, 0.341552734375, 0.4676513671875, 0.59375, 0.7198486328125, 0.845947265625, 0.9720458984375, 1.09814453125, 1.2242431640625, 1.350341796875, 1.4764404296875, 1.6025390625, 1.7286376953125, 1.854736328125, 1.9808349609375, 2.10693359375, 2.2330322265625, 2.359130859375, 2.4852294921875, 2.611328125, 2.7374267578125, 2.863525390625, 2.9896240234375, 3.11572265625, 3.2418212890625, 3.367919921875, 3.4940185546875, 3.6201171875, 3.7462158203125, 3.872314453125, 3.9984130859375, 4.12451171875, 4.2506103515625, 4.376708984375, 4.5028076171875, 4.62890625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 9.0, 9.0, 12.0, 25.0, 24.0, 31.0, 54.0, 85.0, 139.0, 200.0, 297.0, 485.0, 823.0, 1252.0, 1875.0, 2963.0, 4738.0, 7548.0, 12423.0, 20174.0, 33448.0, 56621.0, 98612.0, 169206.0, 1268386.0, 171093.0, 100774.0, 57353.0, 34441.0, 20428.0, 12262.0, 7731.0, 4920.0, 3098.0, 2037.0, 1283.0, 772.0, 548.0, 325.0, 207.0, 135.0, 114.0, 64.0, 39.0, 21.0, 16.0, 11.0, 10.0, 5.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.7119140625, -0.690673828125, -0.66943359375, -0.648193359375, -0.626953125, -0.605712890625, -0.58447265625, -0.563232421875, -0.5419921875, -0.520751953125, -0.49951171875, -0.478271484375, -0.45703125, -0.435791015625, -0.41455078125, -0.393310546875, -0.3720703125, -0.350830078125, -0.32958984375, -0.308349609375, -0.287109375, -0.265869140625, -0.24462890625, -0.223388671875, -0.2021484375, -0.180908203125, -0.15966796875, -0.138427734375, -0.1171875, -0.095947265625, -0.07470703125, -0.053466796875, -0.0322265625, -0.010986328125, 0.01025390625, 0.031494140625, 0.052734375, 0.073974609375, 0.09521484375, 0.116455078125, 0.1376953125, 0.158935546875, 0.18017578125, 0.201416015625, 0.22265625, 0.243896484375, 0.26513671875, 0.286376953125, 0.3076171875, 0.328857421875, 0.35009765625, 0.371337890625, 0.392578125, 0.413818359375, 0.43505859375, 0.456298828125, 0.4775390625, 0.498779296875, 0.52001953125, 0.541259765625, 0.5625, 0.583740234375, 0.60498046875, 0.626220703125, 0.6474609375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 4.0, 5.0, 4.0, 8.0, 3.0, 8.0, 16.0, 26.0, 21.0, 29.0, 37.0, 67.0, 60.0, 85.0, 82.0, 82.0, 73.0, 74.0, 73.0, 51.0, 47.0, 31.0, 24.0, 20.0, 20.0, 5.0, 7.0, 12.0, 4.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026187896728515625, -0.002526789903640747, -0.0024347901344299316, -0.002342790365219116, -0.0022507905960083008, -0.0021587908267974854, -0.00206679105758667, -0.0019747912883758545, -0.001882791519165039, -0.0017907917499542236, -0.0016987919807434082, -0.0016067922115325928, -0.0015147924423217773, -0.001422792673110962, -0.0013307929039001465, -0.001238793134689331, -0.0011467933654785156, -0.0010547935962677002, -0.0009627938270568848, -0.0008707940578460693, -0.0007787942886352539, -0.0006867945194244385, -0.000594794750213623, -0.0005027949810028076, -0.0004107952117919922, -0.00031879544258117676, -0.00022679567337036133, -0.0001347959041595459, -4.279613494873047e-05, 4.920363426208496e-05, 0.0001412034034729004, 0.00023320317268371582, 0.00032520294189453125, 0.0004172027111053467, 0.0005092024803161621, 0.0006012022495269775, 0.000693202018737793, 0.0007852017879486084, 0.0008772015571594238, 0.0009692013263702393, 0.0010612010955810547, 0.0011532008647918701, 0.0012452006340026855, 0.001337200403213501, 0.0014292001724243164, 0.0015211999416351318, 0.0016131997108459473, 0.0017051994800567627, 0.0017971992492675781, 0.0018891990184783936, 0.001981198787689209, 0.0020731985569000244, 0.00216519832611084, 0.0022571980953216553, 0.0023491978645324707, 0.002441197633743286, 0.0025331974029541016, 0.002625197172164917, 0.0027171969413757324, 0.002809196710586548, 0.0029011964797973633, 0.0029931962490081787, 0.003085196018218994, 0.0031771957874298096, 0.003269195556640625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 8.0, 5.0, 14.0, 11.0, 14.0, 15.0, 35.0, 38.0, 71.0, 82.0, 122.0, 180.0, 349.0, 940.0, 182603.0, 861744.0, 1258.0, 422.0, 213.0, 128.0, 82.0, 52.0, 37.0, 36.0, 19.0, 14.0, 17.0, 8.0, 7.0, 5.0, 2.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0687255859375, -0.06676721572875977, -0.06480884552001953, -0.0628504753112793, -0.06089210510253906, -0.05893373489379883, -0.056975364685058594, -0.05501699447631836, -0.053058624267578125, -0.05110025405883789, -0.049141883850097656, -0.04718351364135742, -0.04522514343261719, -0.04326677322387695, -0.04130840301513672, -0.039350032806396484, -0.03739166259765625, -0.035433292388916016, -0.03347492218017578, -0.03151655197143555, -0.029558181762695312, -0.027599811553955078, -0.025641441345214844, -0.02368307113647461, -0.021724700927734375, -0.01976633071899414, -0.017807960510253906, -0.015849590301513672, -0.013891220092773438, -0.011932849884033203, -0.009974479675292969, -0.008016109466552734, -0.0060577392578125, -0.004099369049072266, -0.0021409988403320312, -0.00018262863159179688, 0.0017757415771484375, 0.003734111785888672, 0.005692481994628906, 0.007650852203369141, 0.009609222412109375, 0.01156759262084961, 0.013525962829589844, 0.015484333038330078, 0.017442703247070312, 0.019401073455810547, 0.02135944366455078, 0.023317813873291016, 0.02527618408203125, 0.027234554290771484, 0.02919292449951172, 0.031151294708251953, 0.03310966491699219, 0.03506803512573242, 0.037026405334472656, 0.03898477554321289, 0.040943145751953125, 0.04290151596069336, 0.044859886169433594, 0.04681825637817383, 0.04877662658691406, 0.0507349967956543, 0.05269336700439453, 0.054651737213134766, 0.056610107421875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 366.0, 651.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054013825953006744, -0.052995696663856506, -0.05197757109999657, -0.05095944181084633, -0.04994131252169609, -0.04892318695783615, -0.04790505766868591, -0.046886928379535675, -0.045868802815675735, -0.0448506735265255, -0.04383254796266556, -0.04281441867351532, -0.04179628938436508, -0.04077816382050514, -0.039760034531354904, -0.038741905242204666, -0.03772377967834473, -0.03670565038919449, -0.03568752482533455, -0.03466939553618431, -0.03365126624703407, -0.03263314068317413, -0.031615011394023895, -0.030596883967518806, -0.02957875281572342, -0.02856062538921833, -0.027542496100068092, -0.026524368673563004, -0.025506241247057915, -0.024488113820552826, -0.023469984531402588, -0.0224518571048975, -0.02143372967839241, -0.02041560225188732, -0.019397472962737083, -0.018379345536231995, -0.017361218109726906, -0.016343090683221817, -0.015324961394071579, -0.01430683396756649, -0.013288704678416252, -0.012270576320588589, -0.0112524488940835, -0.010234320536255836, -0.009216193109750748, -0.008198064751923084, -0.007179936394095421, -0.006161808501929045, -0.005143680609762669, -0.0041255527175962925, -0.0031074245925992727, -0.002089296467602253, -0.0010711685754358768, -5.304068326950073e-05, 0.0009650876745581627, 0.001983215566724539, 0.003001343458890915, 0.004019471351057291, 0.005037599243223667, 0.006055727601051331, 0.007073855493217707, 0.008091983385384083, 0.009110111743211746, 0.010128239169716835, 0.011146367527544498]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 5.0, 5.0, 9.0, 11.0, 11.0, 11.0, 20.0, 25.0, 25.0, 40.0, 38.0, 44.0, 44.0, 51.0, 45.0, 64.0, 65.0, 64.0, 67.0, 59.0, 53.0, 54.0, 41.0, 41.0, 28.0, 24.0, 19.0, 15.0, 13.0, 8.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001131296157836914, -0.0010736426338553429, -0.0010159891098737717, -0.0009583355858922005, -0.0009006820619106293, -0.0008430285379290581, -0.0007853750139474869, -0.0007277214899659157, -0.0006700679659843445, -0.0006124144420027733, -0.0005547609180212021, -0.0004971073940396309, -0.0004394538700580597, -0.0003818003460764885, -0.0003241468220949173, -0.0002664932981133461, -0.0002088397741317749, -0.0001511862501502037, -9.353272616863251e-05, -3.587920218706131e-05, 2.1774321794509888e-05, 7.942784577608109e-05, 0.00013708136975765228, 0.00019473489373922348, 0.0002523884177207947, 0.0003100419417023659, 0.00036769546568393707, 0.00042534898966550827, 0.00048300251364707947, 0.0005406560376286507, 0.0005983095616102219, 0.0006559630855917931, 0.0007136166095733643, 0.0007712701335549355, 0.0008289236575365067, 0.0008865771815180779, 0.000944230705499649, 0.0010018842294812202, 0.0010595377534627914, 0.0011171912774443626, 0.0011748448014259338, 0.001232498325407505, 0.0012901518493890762, 0.0013478053733706474, 0.0014054588973522186, 0.0014631124213337898, 0.001520765945315361, 0.0015784194692969322, 0.0016360729932785034, 0.0016937265172600746, 0.0017513800412416458, 0.001809033565223217, 0.0018666870892047882, 0.0019243406131863594, 0.0019819941371679306, 0.002039647661149502, 0.002097301185131073, 0.002154954709112644, 0.0022126082330942154, 0.0022702617570757866, 0.002327915281057358, 0.002385568805038929, 0.0024432223290205, 0.0025008758530020714, 0.0025585293769836426]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 7.0, 5.0, 4.0, 9.0, 11.0, 13.0, 11.0, 23.0, 15.0, 20.0, 20.0, 22.0, 21.0, 40.0, 40.0, 40.0, 35.0, 42.0, 39.0, 43.0, 32.0, 32.0, 43.0, 36.0, 32.0, 52.0, 34.0, 35.0, 43.0, 26.0, 29.0, 20.0, 15.0, 19.0, 14.0, 16.0, 11.0, 11.0, 11.0, 10.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.1328125, -5.9410400390625, -5.749267578125, -5.5574951171875, -5.36572265625, -5.1739501953125, -4.982177734375, -4.7904052734375, -4.5986328125, -4.4068603515625, -4.215087890625, -4.0233154296875, -3.83154296875, -3.6397705078125, -3.447998046875, -3.2562255859375, -3.064453125, -2.8726806640625, -2.680908203125, -2.4891357421875, -2.29736328125, -2.1055908203125, -1.913818359375, -1.7220458984375, -1.5302734375, -1.3385009765625, -1.146728515625, -0.9549560546875, -0.76318359375, -0.5714111328125, -0.379638671875, -0.1878662109375, 0.00390625, 0.1956787109375, 0.387451171875, 0.5792236328125, 0.77099609375, 0.9627685546875, 1.154541015625, 1.3463134765625, 1.5380859375, 1.7298583984375, 1.921630859375, 2.1134033203125, 2.30517578125, 2.4969482421875, 2.688720703125, 2.8804931640625, 3.072265625, 3.2640380859375, 3.455810546875, 3.6475830078125, 3.83935546875, 4.0311279296875, 4.222900390625, 4.4146728515625, 4.6064453125, 4.7982177734375, 4.989990234375, 5.1817626953125, 5.37353515625, 5.5653076171875, 5.757080078125, 5.9488525390625, 6.140625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 7.0, 12.0, 14.0, 9.0, 15.0, 15.0, 36.0, 31.0, 47.0, 64.0, 68.0, 119.0, 146.0, 201.0, 297.0, 368.0, 495.0, 736.0, 1585.0, 5292.0, 28112.0, 505408.0, 468650.0, 27465.0, 5066.0, 1565.0, 770.0, 484.0, 389.0, 279.0, 209.0, 137.0, 121.0, 74.0, 54.0, 39.0, 37.0, 37.0, 24.0, 23.0, 17.0, 6.0, 12.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-15.46875, -14.9852294921875, -14.501708984375, -14.0181884765625, -13.53466796875, -13.0511474609375, -12.567626953125, -12.0841064453125, -11.6005859375, -11.1170654296875, -10.633544921875, -10.1500244140625, -9.66650390625, -9.1829833984375, -8.699462890625, -8.2159423828125, -7.732421875, -7.2489013671875, -6.765380859375, -6.2818603515625, -5.79833984375, -5.3148193359375, -4.831298828125, -4.3477783203125, -3.8642578125, -3.3807373046875, -2.897216796875, -2.4136962890625, -1.93017578125, -1.4466552734375, -0.963134765625, -0.4796142578125, 0.00390625, 0.4874267578125, 0.970947265625, 1.4544677734375, 1.93798828125, 2.4215087890625, 2.905029296875, 3.3885498046875, 3.8720703125, 4.3555908203125, 4.839111328125, 5.3226318359375, 5.80615234375, 6.2896728515625, 6.773193359375, 7.2567138671875, 7.740234375, 8.2237548828125, 8.707275390625, 9.1907958984375, 9.67431640625, 10.1578369140625, 10.641357421875, 11.1248779296875, 11.6083984375, 12.0919189453125, 12.575439453125, 13.0589599609375, 13.54248046875, 14.0260009765625, 14.509521484375, 14.9930419921875, 15.4765625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 1.0, 7.0, 5.0, 5.0, 3.0, 6.0, 7.0, 11.0, 8.0, 11.0, 15.0, 23.0, 15.0, 31.0, 25.0, 27.0, 32.0, 37.0, 34.0, 29.0, 52.0, 39.0, 84.0, 444.0, 1526.0, 101.0, 54.0, 45.0, 41.0, 41.0, 34.0, 32.0, 33.0, 36.0, 16.0, 22.0, 24.0, 16.0, 7.0, 16.0, 14.0, 10.0, 8.0, 5.0, 4.0, 4.0, 4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.734375, -16.195068359375, -15.65576171875, -15.116455078125, -14.5771484375, -14.037841796875, -13.49853515625, -12.959228515625, -12.419921875, -11.880615234375, -11.34130859375, -10.802001953125, -10.2626953125, -9.723388671875, -9.18408203125, -8.644775390625, -8.10546875, -7.566162109375, -7.02685546875, -6.487548828125, -5.9482421875, -5.408935546875, -4.86962890625, -4.330322265625, -3.791015625, -3.251708984375, -2.71240234375, -2.173095703125, -1.6337890625, -1.094482421875, -0.55517578125, -0.015869140625, 0.5234375, 1.062744140625, 1.60205078125, 2.141357421875, 2.6806640625, 3.219970703125, 3.75927734375, 4.298583984375, 4.837890625, 5.377197265625, 5.91650390625, 6.455810546875, 6.9951171875, 7.534423828125, 8.07373046875, 8.613037109375, 9.15234375, 9.691650390625, 10.23095703125, 10.770263671875, 11.3095703125, 11.848876953125, 12.38818359375, 12.927490234375, 13.466796875, 14.006103515625, 14.54541015625, 15.084716796875, 15.6240234375, 16.163330078125, 16.70263671875, 17.241943359375, 17.78125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 4.0, 4.0, 2.0, 4.0, 8.0, 11.0, 12.0, 14.0, 14.0, 19.0, 24.0, 24.0, 24.0, 37.0, 40.0, 39.0, 58.0, 78.0, 117.0, 206.0, 443.0, 1490.0, 84206.0, 3052228.0, 5100.0, 647.0, 285.0, 133.0, 78.0, 61.0, 49.0, 37.0, 32.0, 39.0, 19.0, 22.0, 20.0, 11.0, 11.0, 10.0, 11.0, 7.0, 6.0, 4.0, 3.0, 7.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-50.09375, -48.58544921875, -47.0771484375, -45.56884765625, -44.060546875, -42.55224609375, -41.0439453125, -39.53564453125, -38.02734375, -36.51904296875, -35.0107421875, -33.50244140625, -31.994140625, -30.48583984375, -28.9775390625, -27.46923828125, -25.9609375, -24.45263671875, -22.9443359375, -21.43603515625, -19.927734375, -18.41943359375, -16.9111328125, -15.40283203125, -13.89453125, -12.38623046875, -10.8779296875, -9.36962890625, -7.861328125, -6.35302734375, -4.8447265625, -3.33642578125, -1.828125, -0.31982421875, 1.1884765625, 2.69677734375, 4.205078125, 5.71337890625, 7.2216796875, 8.72998046875, 10.23828125, 11.74658203125, 13.2548828125, 14.76318359375, 16.271484375, 17.77978515625, 19.2880859375, 20.79638671875, 22.3046875, 23.81298828125, 25.3212890625, 26.82958984375, 28.337890625, 29.84619140625, 31.3544921875, 32.86279296875, 34.37109375, 35.87939453125, 37.3876953125, 38.89599609375, 40.404296875, 41.91259765625, 43.4208984375, 44.92919921875, 46.4375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 89.0, 619.0, 290.0, 15.0], "bins": [-155.8143768310547, -153.29119873046875, -150.7680206298828, -148.2448272705078, -145.72164916992188, -143.19847106933594, -140.67529296875, -138.15211486816406, -135.62893676757812, -133.1057586669922, -130.58258056640625, -128.05938720703125, -125.53620910644531, -123.01303100585938, -120.48985290527344, -117.9666748046875, -115.4434814453125, -112.92030334472656, -110.3971176147461, -107.87393951416016, -105.35075378417969, -102.82757568359375, -100.30439758300781, -97.78121948242188, -95.2580337524414, -92.73485565185547, -90.211669921875, -87.68849182128906, -85.16531372070312, -82.64212799072266, -80.11894989013672, -77.59576416015625, -75.07258605957031, -72.54940795898438, -70.0262222290039, -67.50304412841797, -64.9798583984375, -62.45668029785156, -59.933502197265625, -57.41032028198242, -54.887142181396484, -52.36396026611328, -49.840782165527344, -47.31760025024414, -44.79441833496094, -42.271236419677734, -39.74805450439453, -37.224876403808594, -34.70169448852539, -32.17851257324219, -29.655332565307617, -27.132152557373047, -24.608970642089844, -22.08578872680664, -19.56260871887207, -17.0394287109375, -14.516246795654297, -11.99306583404541, -9.469884872436523, -6.946703910827637, -4.42352294921875, -1.9003419876098633, 0.6228389739990234, 3.1460189819335938, 5.669201374053955]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 9.0, 8.0, 8.0, 11.0, 15.0, 13.0, 17.0, 27.0, 24.0, 31.0, 39.0, 34.0, 43.0, 51.0, 55.0, 50.0, 51.0, 50.0, 51.0, 28.0, 46.0, 41.0, 47.0, 39.0, 27.0, 37.0, 29.0, 24.0, 15.0, 17.0, 14.0, 14.0, 10.0, 4.0, 5.0, 6.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.079185485839844, -51.39681625366211, -49.71445083618164, -48.032081604003906, -46.34971237182617, -44.66734313964844, -42.98497772216797, -41.302608489990234, -39.6202392578125, -37.937870025634766, -36.2555046081543, -34.57313537597656, -32.89076614379883, -31.208398818969727, -29.526031494140625, -27.84366226196289, -26.16129493713379, -24.478927612304688, -22.796558380126953, -21.11419105529785, -19.431821823120117, -17.749454498291016, -16.06708526611328, -14.38471794128418, -12.702349662780762, -11.019981384277344, -9.337613105773926, -7.655245304107666, -5.972877025604248, -4.290509223937988, -2.6081409454345703, -0.9257726669311523, 0.7565956115722656, 2.4389638900756836, 4.121332168579102, 5.803699970245361, 7.486068248748779, 9.168436050415039, 10.850804328918457, 12.533172607421875, 14.215540885925293, 15.897909164428711, 17.580276489257812, 19.262645721435547, 20.94501304626465, 22.62738037109375, 24.309749603271484, 25.99211883544922, 27.67448616027832, 29.356853485107422, 31.039222717285156, 32.72159194946289, 34.40395736694336, 36.086326599121094, 37.76869583129883, 39.45106506347656, 41.13343048095703, 42.815799713134766, 44.498165130615234, 46.18053436279297, 47.8629035949707, 49.54527282714844, 51.227638244628906, 52.91000747680664, 54.592376708984375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 12.0, 6.0, 7.0, 10.0, 12.0, 8.0, 18.0, 21.0, 13.0, 30.0, 18.0, 28.0, 31.0, 33.0, 29.0, 34.0, 34.0, 36.0, 43.0, 43.0, 34.0, 38.0, 39.0, 33.0, 40.0, 33.0, 41.0, 42.0, 25.0, 27.0, 30.0, 22.0, 17.0, 10.0, 22.0, 13.0, 10.0, 9.0, 14.0, 8.0, 5.0, 3.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.73828125, -5.55059814453125, -5.3629150390625, -5.17523193359375, -4.987548828125, -4.79986572265625, -4.6121826171875, -4.42449951171875, -4.23681640625, -4.04913330078125, -3.8614501953125, -3.67376708984375, -3.486083984375, -3.29840087890625, -3.1107177734375, -2.92303466796875, -2.7353515625, -2.54766845703125, -2.3599853515625, -2.17230224609375, -1.984619140625, -1.79693603515625, -1.6092529296875, -1.42156982421875, -1.23388671875, -1.04620361328125, -0.8585205078125, -0.67083740234375, -0.483154296875, -0.29547119140625, -0.1077880859375, 0.07989501953125, 0.267578125, 0.45526123046875, 0.6429443359375, 0.83062744140625, 1.018310546875, 1.20599365234375, 1.3936767578125, 1.58135986328125, 1.76904296875, 1.95672607421875, 2.1444091796875, 2.33209228515625, 2.519775390625, 2.70745849609375, 2.8951416015625, 3.08282470703125, 3.2705078125, 3.45819091796875, 3.6458740234375, 3.83355712890625, 4.021240234375, 4.20892333984375, 4.3966064453125, 4.58428955078125, 4.77197265625, 4.95965576171875, 5.1473388671875, 5.33502197265625, 5.522705078125, 5.71038818359375, 5.8980712890625, 6.08575439453125, 6.2734375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 5.0, 8.0, 10.0, 8.0, 12.0, 14.0, 24.0, 34.0, 40.0, 55.0, 68.0, 83.0, 109.0, 169.0, 247.0, 363.0, 575.0, 988.0, 1994.0, 4455.0, 12646.0, 55269.0, 477440.0, 2410576.0, 1078947.0, 117347.0, 20490.0, 6321.0, 2597.0, 1285.0, 641.0, 446.0, 291.0, 159.0, 134.0, 101.0, 74.0, 50.0, 42.0, 37.0, 29.0, 26.0, 17.0, 12.0, 15.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.515625, -11.140380859375, -10.76513671875, -10.389892578125, -10.0146484375, -9.639404296875, -9.26416015625, -8.888916015625, -8.513671875, -8.138427734375, -7.76318359375, -7.387939453125, -7.0126953125, -6.637451171875, -6.26220703125, -5.886962890625, -5.51171875, -5.136474609375, -4.76123046875, -4.385986328125, -4.0107421875, -3.635498046875, -3.26025390625, -2.885009765625, -2.509765625, -2.134521484375, -1.75927734375, -1.384033203125, -1.0087890625, -0.633544921875, -0.25830078125, 0.116943359375, 0.4921875, 0.867431640625, 1.24267578125, 1.617919921875, 1.9931640625, 2.368408203125, 2.74365234375, 3.118896484375, 3.494140625, 3.869384765625, 4.24462890625, 4.619873046875, 4.9951171875, 5.370361328125, 5.74560546875, 6.120849609375, 6.49609375, 6.871337890625, 7.24658203125, 7.621826171875, 7.9970703125, 8.372314453125, 8.74755859375, 9.122802734375, 9.498046875, 9.873291015625, 10.24853515625, 10.623779296875, 10.9990234375, 11.374267578125, 11.74951171875, 12.124755859375, 12.5]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 12.0, 9.0, 15.0, 37.0, 51.0, 85.0, 127.0, 204.0, 330.0, 524.0, 770.0, 698.0, 473.0, 283.0, 166.0, 124.0, 58.0, 45.0, 23.0, 16.0, 10.0, 6.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8125, -12.317138671875, -11.82177734375, -11.326416015625, -10.8310546875, -10.335693359375, -9.84033203125, -9.344970703125, -8.849609375, -8.354248046875, -7.85888671875, -7.363525390625, -6.8681640625, -6.372802734375, -5.87744140625, -5.382080078125, -4.88671875, -4.391357421875, -3.89599609375, -3.400634765625, -2.9052734375, -2.409912109375, -1.91455078125, -1.419189453125, -0.923828125, -0.428466796875, 0.06689453125, 0.562255859375, 1.0576171875, 1.552978515625, 2.04833984375, 2.543701171875, 3.0390625, 3.534423828125, 4.02978515625, 4.525146484375, 5.0205078125, 5.515869140625, 6.01123046875, 6.506591796875, 7.001953125, 7.497314453125, 7.99267578125, 8.488037109375, 8.9833984375, 9.478759765625, 9.97412109375, 10.469482421875, 10.96484375, 11.460205078125, 11.95556640625, 12.450927734375, 12.9462890625, 13.441650390625, 13.93701171875, 14.432373046875, 14.927734375, 15.423095703125, 15.91845703125, 16.413818359375, 16.9091796875, 17.404541015625, 17.89990234375, 18.395263671875, 18.890625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 5.0, 8.0, 7.0, 12.0, 15.0, 28.0, 33.0, 38.0, 85.0, 101.0, 138.0, 211.0, 357.0, 1047.0, 5324.0, 153336.0, 3960594.0, 67407.0, 3640.0, 856.0, 355.0, 200.0, 147.0, 91.0, 74.0, 42.0, 44.0, 30.0, 22.0, 12.0, 9.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-50.65625, -49.33740234375, -48.0185546875, -46.69970703125, -45.380859375, -44.06201171875, -42.7431640625, -41.42431640625, -40.10546875, -38.78662109375, -37.4677734375, -36.14892578125, -34.830078125, -33.51123046875, -32.1923828125, -30.87353515625, -29.5546875, -28.23583984375, -26.9169921875, -25.59814453125, -24.279296875, -22.96044921875, -21.6416015625, -20.32275390625, -19.00390625, -17.68505859375, -16.3662109375, -15.04736328125, -13.728515625, -12.40966796875, -11.0908203125, -9.77197265625, -8.453125, -7.13427734375, -5.8154296875, -4.49658203125, -3.177734375, -1.85888671875, -0.5400390625, 0.77880859375, 2.09765625, 3.41650390625, 4.7353515625, 6.05419921875, 7.373046875, 8.69189453125, 10.0107421875, 11.32958984375, 12.6484375, 13.96728515625, 15.2861328125, 16.60498046875, 17.923828125, 19.24267578125, 20.5615234375, 21.88037109375, 23.19921875, 24.51806640625, 25.8369140625, 27.15576171875, 28.474609375, 29.79345703125, 31.1123046875, 32.43115234375, 33.75]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 22.0, 116.0, 324.0, 368.0, 138.0, 37.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.95913696289062, -206.14895629882812, -202.33877563476562, -198.52859497070312, -194.7184295654297, -190.9082489013672, -187.0980682373047, -183.2878875732422, -179.4777069091797, -175.6675262451172, -171.8573455810547, -168.04718017578125, -164.23699951171875, -160.42681884765625, -156.61663818359375, -152.80645751953125, -148.99627685546875, -145.18609619140625, -141.37591552734375, -137.56573486328125, -133.7555694580078, -129.9453887939453, -126.13520812988281, -122.32502746582031, -118.51486206054688, -114.70468139648438, -110.8945083618164, -107.0843276977539, -103.2741470336914, -99.46397399902344, -95.65379333496094, -91.84361267089844, -88.0334243774414, -84.2232437133789, -80.41307067871094, -76.60289001464844, -72.79270935058594, -68.98252868652344, -65.17235565185547, -61.36217498779297, -57.551998138427734, -53.7418212890625, -49.931640625, -46.121463775634766, -42.31128692626953, -38.50110626220703, -34.6909294128418, -30.88075065612793, -27.070571899414062, -23.260393142700195, -19.450214385986328, -15.640037536621094, -11.829858779907227, -8.01968002319336, -4.209503173828125, -0.3993244171142578, 3.4108543395996094, 7.221032619476318, 11.031210899353027, 14.841388702392578, 18.651567459106445, 22.461746215820312, 26.271923065185547, 30.082101821899414, 33.89228057861328]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 3.0, 9.0, 11.0, 19.0, 16.0, 18.0, 32.0, 21.0, 20.0, 28.0, 29.0, 40.0, 28.0, 38.0, 41.0, 44.0, 40.0, 31.0, 40.0, 29.0, 43.0, 35.0, 36.0, 43.0, 40.0, 35.0, 32.0, 31.0, 29.0, 19.0, 16.0, 23.0, 7.0, 14.0, 9.0, 10.0, 9.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-31.353004455566406, -30.33247184753418, -29.311941146850586, -28.29140853881836, -27.270875930786133, -26.250343322753906, -25.229812622070312, -24.209280014038086, -23.18874740600586, -22.168214797973633, -21.14768409729004, -20.127151489257812, -19.106618881225586, -18.08608627319336, -17.065555572509766, -16.04502296447754, -15.024492263793945, -14.003960609436035, -12.983428001403809, -11.962896347045898, -10.942363739013672, -9.921832084655762, -8.901300430297852, -7.880768299102783, -6.860236167907715, -5.8397040367126465, -4.819171905517578, -3.798640251159668, -2.7781081199645996, -1.7575759887695312, -0.7370443344116211, 0.28348779678344727, 1.3040199279785156, 2.324552059173584, 3.3450839519500732, 4.3656158447265625, 5.386147975921631, 6.406680107116699, 7.427211761474609, 8.447744369506836, 9.468276023864746, 10.488807678222656, 11.509340286254883, 12.529871940612793, 13.550403594970703, 14.57093620300293, 15.59146785736084, 16.61199951171875, 17.632532119750977, 18.653064727783203, 19.673595428466797, 20.694128036499023, 21.71466064453125, 22.735191345214844, 23.75572395324707, 24.776256561279297, 25.79678726196289, 26.817319869995117, 27.83785057067871, 28.858383178710938, 29.878915786743164, 30.89944839477539, 31.919979095458984, 32.94050979614258, 33.96104431152344]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 1.0, 7.0, 8.0, 9.0, 6.0, 8.0, 8.0, 7.0, 17.0, 13.0, 13.0, 16.0, 20.0, 24.0, 25.0, 26.0, 40.0, 37.0, 26.0, 31.0, 32.0, 34.0, 48.0, 52.0, 34.0, 34.0, 33.0, 33.0, 38.0, 35.0, 21.0, 30.0, 30.0, 28.0, 20.0, 24.0, 26.0, 12.0, 12.0, 16.0, 20.0, 9.0, 6.0, 5.0, 6.0, 9.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.45703125, -5.27044677734375, -5.0838623046875, -4.89727783203125, -4.710693359375, -4.52410888671875, -4.3375244140625, -4.15093994140625, -3.96435546875, -3.77777099609375, -3.5911865234375, -3.40460205078125, -3.218017578125, -3.03143310546875, -2.8448486328125, -2.65826416015625, -2.4716796875, -2.28509521484375, -2.0985107421875, -1.91192626953125, -1.725341796875, -1.53875732421875, -1.3521728515625, -1.16558837890625, -0.97900390625, -0.79241943359375, -0.6058349609375, -0.41925048828125, -0.232666015625, -0.04608154296875, 0.1405029296875, 0.32708740234375, 0.513671875, 0.70025634765625, 0.8868408203125, 1.07342529296875, 1.260009765625, 1.44659423828125, 1.6331787109375, 1.81976318359375, 2.00634765625, 2.19293212890625, 2.3795166015625, 2.56610107421875, 2.752685546875, 2.93927001953125, 3.1258544921875, 3.31243896484375, 3.4990234375, 3.68560791015625, 3.8721923828125, 4.05877685546875, 4.245361328125, 4.43194580078125, 4.6185302734375, 4.80511474609375, 4.99169921875, 5.17828369140625, 5.3648681640625, 5.55145263671875, 5.738037109375, 5.92462158203125, 6.1112060546875, 6.29779052734375, 6.484375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [6.0, 7.0, 7.0, 20.0, 22.0, 25.0, 43.0, 56.0, 80.0, 108.0, 171.0, 234.0, 318.0, 407.0, 634.0, 806.0, 1071.0, 1497.0, 2147.0, 2800.0, 3999.0, 5301.0, 7361.0, 10102.0, 14267.0, 19917.0, 28532.0, 41355.0, 61103.0, 91951.0, 133345.0, 163429.0, 141535.0, 99005.0, 66043.0, 43882.0, 30687.0, 21282.0, 15326.0, 10950.0, 7771.0, 5585.0, 4157.0, 3108.0, 2230.0, 1577.0, 1187.0, 876.0, 642.0, 484.0, 335.0, 227.0, 171.0, 111.0, 94.0, 57.0, 54.0, 26.0, 20.0, 12.0, 8.0, 7.0, 3.0, 3.0], "bins": [-0.60888671875, -0.5896148681640625, -0.570343017578125, -0.5510711669921875, -0.53179931640625, -0.5125274658203125, -0.493255615234375, -0.4739837646484375, -0.4547119140625, -0.4354400634765625, -0.416168212890625, -0.3968963623046875, -0.37762451171875, -0.3583526611328125, -0.339080810546875, -0.3198089599609375, -0.300537109375, -0.2812652587890625, -0.261993408203125, -0.2427215576171875, -0.22344970703125, -0.2041778564453125, -0.184906005859375, -0.1656341552734375, -0.1463623046875, -0.1270904541015625, -0.107818603515625, -0.0885467529296875, -0.06927490234375, -0.0500030517578125, -0.030731201171875, -0.0114593505859375, 0.0078125, 0.0270843505859375, 0.046356201171875, 0.0656280517578125, 0.08489990234375, 0.1041717529296875, 0.123443603515625, 0.1427154541015625, 0.1619873046875, 0.1812591552734375, 0.200531005859375, 0.2198028564453125, 0.23907470703125, 0.2583465576171875, 0.277618408203125, 0.2968902587890625, 0.316162109375, 0.3354339599609375, 0.354705810546875, 0.3739776611328125, 0.39324951171875, 0.4125213623046875, 0.431793212890625, 0.4510650634765625, 0.4703369140625, 0.4896087646484375, 0.508880615234375, 0.5281524658203125, 0.54742431640625, 0.5666961669921875, 0.585968017578125, 0.6052398681640625, 0.62451171875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 12.0, 13.0, 12.0, 14.0, 16.0, 11.0, 22.0, 35.0, 25.0, 28.0, 38.0, 31.0, 32.0, 30.0, 30.0, 38.0, 28.0, 43.0, 1067.0, 38.0, 25.0, 40.0, 35.0, 27.0, 42.0, 33.0, 31.0, 28.0, 19.0, 19.0, 19.0, 13.0, 15.0, 15.0, 12.0, 13.0, 13.0, 8.0, 8.0, 7.0, 9.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-4.26171875, -4.13787841796875, -4.0140380859375, -3.89019775390625, -3.766357421875, -3.64251708984375, -3.5186767578125, -3.39483642578125, -3.27099609375, -3.14715576171875, -3.0233154296875, -2.89947509765625, -2.775634765625, -2.65179443359375, -2.5279541015625, -2.40411376953125, -2.2802734375, -2.15643310546875, -2.0325927734375, -1.90875244140625, -1.784912109375, -1.66107177734375, -1.5372314453125, -1.41339111328125, -1.28955078125, -1.16571044921875, -1.0418701171875, -0.91802978515625, -0.794189453125, -0.67034912109375, -0.5465087890625, -0.42266845703125, -0.298828125, -0.17498779296875, -0.0511474609375, 0.07269287109375, 0.196533203125, 0.32037353515625, 0.4442138671875, 0.56805419921875, 0.69189453125, 0.81573486328125, 0.9395751953125, 1.06341552734375, 1.187255859375, 1.31109619140625, 1.4349365234375, 1.55877685546875, 1.6826171875, 1.80645751953125, 1.9302978515625, 2.05413818359375, 2.177978515625, 2.30181884765625, 2.4256591796875, 2.54949951171875, 2.67333984375, 2.79718017578125, 2.9210205078125, 3.04486083984375, 3.168701171875, 3.29254150390625, 3.4163818359375, 3.54022216796875, 3.6640625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 14.0, 17.0, 21.0, 37.0, 61.0, 89.0, 124.0, 183.0, 264.0, 431.0, 647.0, 934.0, 1583.0, 2535.0, 4115.0, 6734.0, 11350.0, 19119.0, 32732.0, 57040.0, 102086.0, 179617.0, 1283590.0, 169082.0, 95050.0, 53464.0, 30684.0, 17941.0, 10523.0, 6415.0, 3942.0, 2518.0, 1529.0, 980.0, 584.0, 376.0, 243.0, 174.0, 109.0, 62.0, 31.0, 34.0, 18.0, 16.0, 5.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.7041015625, -0.6801834106445312, -0.6562652587890625, -0.6323471069335938, -0.608428955078125, -0.5845108032226562, -0.5605926513671875, -0.5366744995117188, -0.51275634765625, -0.48883819580078125, -0.4649200439453125, -0.44100189208984375, -0.417083740234375, -0.39316558837890625, -0.3692474365234375, -0.34532928466796875, -0.3214111328125, -0.29749298095703125, -0.2735748291015625, -0.24965667724609375, -0.225738525390625, -0.20182037353515625, -0.1779022216796875, -0.15398406982421875, -0.13006591796875, -0.10614776611328125, -0.0822296142578125, -0.05831146240234375, -0.034393310546875, -0.01047515869140625, 0.0134429931640625, 0.03736114501953125, 0.061279296875, 0.08519744873046875, 0.1091156005859375, 0.13303375244140625, 0.156951904296875, 0.18087005615234375, 0.2047882080078125, 0.22870635986328125, 0.25262451171875, 0.27654266357421875, 0.3004608154296875, 0.32437896728515625, 0.348297119140625, 0.37221527099609375, 0.3961334228515625, 0.42005157470703125, 0.4439697265625, 0.46788787841796875, 0.4918060302734375, 0.5157241821289062, 0.539642333984375, 0.5635604858398438, 0.5874786376953125, 0.6113967895507812, 0.63531494140625, 0.6592330932617188, 0.6831512451171875, 0.7070693969726562, 0.730987548828125, 0.7549057006835938, 0.7788238525390625, 0.8027420043945312, 0.82666015625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 11.0, 5.0, 4.0, 7.0, 15.0, 18.0, 29.0, 26.0, 32.0, 21.0, 32.0, 60.0, 41.0, 66.0, 58.0, 56.0, 64.0, 53.0, 52.0, 59.0, 36.0, 42.0, 31.0, 29.0, 41.0, 26.0, 22.0, 14.0, 9.0, 8.0, 4.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0027141571044921875, -0.002634882926940918, -0.0025556087493896484, -0.002476334571838379, -0.0023970603942871094, -0.00231778621673584, -0.0022385120391845703, -0.0021592378616333008, -0.0020799636840820312, -0.0020006895065307617, -0.0019214153289794922, -0.0018421411514282227, -0.0017628669738769531, -0.0016835927963256836, -0.001604318618774414, -0.0015250444412231445, -0.001445770263671875, -0.0013664960861206055, -0.001287221908569336, -0.0012079477310180664, -0.0011286735534667969, -0.0010493993759155273, -0.0009701251983642578, -0.0008908510208129883, -0.0008115768432617188, -0.0007323026657104492, -0.0006530284881591797, -0.0005737543106079102, -0.0004944801330566406, -0.0004152059555053711, -0.00033593177795410156, -0.00025665760040283203, -0.0001773834228515625, -9.810924530029297e-05, -1.8835067749023438e-05, 6.0439109802246094e-05, 0.00013971328735351562, 0.00021898746490478516, 0.0002982616424560547, 0.0003775358200073242, 0.00045680999755859375, 0.0005360841751098633, 0.0006153583526611328, 0.0006946325302124023, 0.0007739067077636719, 0.0008531808853149414, 0.0009324550628662109, 0.0010117292404174805, 0.00109100341796875, 0.0011702775955200195, 0.001249551773071289, 0.0013288259506225586, 0.0014081001281738281, 0.0014873743057250977, 0.0015666484832763672, 0.0016459226608276367, 0.0017251968383789062, 0.0018044710159301758, 0.0018837451934814453, 0.001963019371032715, 0.0020422935485839844, 0.002121567726135254, 0.0022008419036865234, 0.002280116081237793, 0.0023593902587890625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 10.0, 6.0, 15.0, 27.0, 27.0, 34.0, 46.0, 76.0, 82.0, 77.0, 126.0, 174.0, 318.0, 609.0, 2237.0, 859854.0, 182102.0, 1234.0, 498.0, 280.0, 176.0, 118.0, 98.0, 69.0, 50.0, 39.0, 24.0, 37.0, 21.0, 14.0, 13.0, 12.0, 8.0, 6.0, 7.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04827880859375, -0.04671478271484375, -0.0451507568359375, -0.04358673095703125, -0.042022705078125, -0.04045867919921875, -0.0388946533203125, -0.03733062744140625, -0.0357666015625, -0.03420257568359375, -0.0326385498046875, -0.03107452392578125, -0.029510498046875, -0.02794647216796875, -0.0263824462890625, -0.02481842041015625, -0.02325439453125, -0.02169036865234375, -0.0201263427734375, -0.01856231689453125, -0.016998291015625, -0.01543426513671875, -0.0138702392578125, -0.01230621337890625, -0.0107421875, -0.00917816162109375, -0.0076141357421875, -0.00605010986328125, -0.004486083984375, -0.00292205810546875, -0.0013580322265625, 0.00020599365234375, 0.00177001953125, 0.00333404541015625, 0.0048980712890625, 0.00646209716796875, 0.008026123046875, 0.00959014892578125, 0.0111541748046875, 0.01271820068359375, 0.0142822265625, 0.01584625244140625, 0.0174102783203125, 0.01897430419921875, 0.020538330078125, 0.02210235595703125, 0.0236663818359375, 0.02523040771484375, 0.02679443359375, 0.02835845947265625, 0.0299224853515625, 0.03148651123046875, 0.033050537109375, 0.03461456298828125, 0.0361785888671875, 0.03774261474609375, 0.039306640625, 0.04087066650390625, 0.0424346923828125, 0.04399871826171875, 0.045562744140625, 0.04712677001953125, 0.0486907958984375, 0.05025482177734375, 0.05181884765625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 981.0, 32.0], "bins": [-0.057560306042432785, -0.056641124188899994, -0.0557219460606575, -0.05480276420712471, -0.05388358607888222, -0.052964404225349426, -0.052045226097106934, -0.05112604424357414, -0.05020686611533165, -0.04928768426179886, -0.048368506133556366, -0.047449324280023575, -0.04653014615178108, -0.04561096429824829, -0.0446917861700058, -0.04377260431647301, -0.042853426188230515, -0.04193424433469772, -0.04101506620645523, -0.04009588435292244, -0.03917670622467995, -0.038257524371147156, -0.03733834624290466, -0.03641916438937187, -0.03549998626112938, -0.03458080440759659, -0.033661626279354095, -0.032742444425821304, -0.03182326629757881, -0.03090408630669117, -0.029984906315803528, -0.029065726324915886, -0.028146542608737946, -0.027227362617850304, -0.026308182626962662, -0.02538900263607502, -0.024469822645187378, -0.023550642654299736, -0.022631462663412094, -0.021712282672524452, -0.02079310268163681, -0.01987392269074917, -0.018954742699861526, -0.018035562708973885, -0.017116382718086243, -0.0161972027271986, -0.015278022736310959, -0.014358842745423317, -0.0134396618232131, -0.012520481832325459, -0.011601301841437817, -0.010682121850550175, -0.009762941859662533, -0.008843760937452316, -0.007924580946564674, -0.00700540142133832, -0.006086221896111965, -0.005167041905224323, -0.004247861914336681, -0.003328681690618396, -0.002409501699730754, -0.0014903214760124683, -0.0005711414851248264, 0.0003480385057628155, 0.0012672186130657792]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 9.0, 17.0, 29.0, 31.0, 29.0, 45.0, 41.0, 61.0, 76.0, 59.0, 79.0, 89.0, 67.0, 80.0, 72.0, 67.0, 34.0, 32.0, 23.0, 26.0, 18.0, 8.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014080405235290527, -0.0013303542509675026, -0.0012526679784059525, -0.0011749817058444023, -0.0010972954332828522, -0.001019609160721302, -0.0009419228881597519, -0.0008642366155982018, -0.0007865503430366516, -0.0007088640704751015, -0.0006311777979135513, -0.0005534915253520012, -0.00047580525279045105, -0.0003981189802289009, -0.00032043270766735077, -0.00024274643510580063, -0.0001650601625442505, -8.737388998270035e-05, -9.687617421150208e-06, 6.799865514039993e-05, 0.00014568492770195007, 0.00022337120026350021, 0.00030105747282505035, 0.0003787437453866005, 0.00045643001794815063, 0.0005341162905097008, 0.0006118025630712509, 0.0006894888356328011, 0.0007671751081943512, 0.0008448613807559013, 0.0009225476533174515, 0.0010002339258790016, 0.0010779201984405518, 0.001155606471002102, 0.001233292743563652, 0.0013109790161252022, 0.0013886652886867523, 0.0014663515612483025, 0.0015440378338098526, 0.0016217241063714027, 0.0016994103789329529, 0.001777096651494503, 0.0018547829240560532, 0.0019324691966176033, 0.0020101554691791534, 0.0020878417417407036, 0.0021655280143022537, 0.002243214286863804, 0.002320900559425354, 0.002398586831986904, 0.0024762731045484543, 0.0025539593771100044, 0.0026316456496715546, 0.0027093319222331047, 0.002787018194794655, 0.002864704467356205, 0.002942390739917755, 0.0030200770124793053, 0.0030977632850408554, 0.0031754495576024055, 0.0032531358301639557, 0.003330822102725506, 0.003408508375287056, 0.003486194647848606, 0.0035638809204101562]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 1.0, 7.0, 8.0, 9.0, 6.0, 8.0, 7.0, 8.0, 17.0, 13.0, 13.0, 16.0, 20.0, 24.0, 25.0, 26.0, 40.0, 37.0, 26.0, 31.0, 32.0, 34.0, 47.0, 53.0, 34.0, 34.0, 33.0, 33.0, 38.0, 35.0, 21.0, 30.0, 30.0, 28.0, 20.0, 24.0, 26.0, 12.0, 12.0, 16.0, 20.0, 9.0, 6.0, 5.0, 6.0, 9.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.45703125, -5.27044677734375, -5.0838623046875, -4.89727783203125, -4.710693359375, -4.52410888671875, -4.3375244140625, -4.15093994140625, -3.96435546875, -3.77777099609375, -3.5911865234375, -3.40460205078125, -3.218017578125, -3.03143310546875, -2.8448486328125, -2.65826416015625, -2.4716796875, -2.28509521484375, -2.0985107421875, -1.91192626953125, -1.725341796875, -1.53875732421875, -1.3521728515625, -1.16558837890625, -0.97900390625, -0.79241943359375, -0.6058349609375, -0.41925048828125, -0.232666015625, -0.04608154296875, 0.1405029296875, 0.32708740234375, 0.513671875, 0.70025634765625, 0.8868408203125, 1.07342529296875, 1.260009765625, 1.44659423828125, 1.6331787109375, 1.81976318359375, 2.00634765625, 2.19293212890625, 2.3795166015625, 2.56610107421875, 2.752685546875, 2.93927001953125, 3.1258544921875, 3.31243896484375, 3.4990234375, 3.68560791015625, 3.8721923828125, 4.05877685546875, 4.245361328125, 4.43194580078125, 4.6185302734375, 4.80511474609375, 4.99169921875, 5.17828369140625, 5.3648681640625, 5.55145263671875, 5.738037109375, 5.92462158203125, 6.1112060546875, 6.29779052734375, 6.484375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 10.0, 12.0, 16.0, 17.0, 24.0, 26.0, 32.0, 48.0, 41.0, 69.0, 83.0, 113.0, 157.0, 275.0, 392.0, 700.0, 1315.0, 2563.0, 5607.0, 12830.0, 31776.0, 88536.0, 303733.0, 410432.0, 118732.0, 41176.0, 16071.0, 6819.0, 3154.0, 1491.0, 794.0, 494.0, 275.0, 178.0, 144.0, 107.0, 66.0, 55.0, 33.0, 41.0, 27.0, 14.0, 17.0, 12.0, 12.0, 5.0, 10.0, 6.0, 2.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.95703125, -6.71820068359375, -6.4793701171875, -6.24053955078125, -6.001708984375, -5.76287841796875, -5.5240478515625, -5.28521728515625, -5.04638671875, -4.80755615234375, -4.5687255859375, -4.32989501953125, -4.091064453125, -3.85223388671875, -3.6134033203125, -3.37457275390625, -3.1357421875, -2.89691162109375, -2.6580810546875, -2.41925048828125, -2.180419921875, -1.94158935546875, -1.7027587890625, -1.46392822265625, -1.22509765625, -0.98626708984375, -0.7474365234375, -0.50860595703125, -0.269775390625, -0.03094482421875, 0.2078857421875, 0.44671630859375, 0.685546875, 0.92437744140625, 1.1632080078125, 1.40203857421875, 1.640869140625, 1.87969970703125, 2.1185302734375, 2.35736083984375, 2.59619140625, 2.83502197265625, 3.0738525390625, 3.31268310546875, 3.551513671875, 3.79034423828125, 4.0291748046875, 4.26800537109375, 4.5068359375, 4.74566650390625, 4.9844970703125, 5.22332763671875, 5.462158203125, 5.70098876953125, 5.9398193359375, 6.17864990234375, 6.41748046875, 6.65631103515625, 6.8951416015625, 7.13397216796875, 7.372802734375, 7.61163330078125, 7.8504638671875, 8.08929443359375, 8.328125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 1.0, 5.0, 7.0, 16.0, 14.0, 7.0, 20.0, 19.0, 20.0, 14.0, 32.0, 35.0, 29.0, 42.0, 41.0, 44.0, 51.0, 75.0, 111.0, 313.0, 1510.0, 147.0, 86.0, 76.0, 49.0, 37.0, 42.0, 26.0, 20.0, 24.0, 17.0, 23.0, 18.0, 7.0, 16.0, 8.0, 7.0, 8.0, 6.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.8125, -16.23583984375, -15.6591796875, -15.08251953125, -14.505859375, -13.92919921875, -13.3525390625, -12.77587890625, -12.19921875, -11.62255859375, -11.0458984375, -10.46923828125, -9.892578125, -9.31591796875, -8.7392578125, -8.16259765625, -7.5859375, -7.00927734375, -6.4326171875, -5.85595703125, -5.279296875, -4.70263671875, -4.1259765625, -3.54931640625, -2.97265625, -2.39599609375, -1.8193359375, -1.24267578125, -0.666015625, -0.08935546875, 0.4873046875, 1.06396484375, 1.640625, 2.21728515625, 2.7939453125, 3.37060546875, 3.947265625, 4.52392578125, 5.1005859375, 5.67724609375, 6.25390625, 6.83056640625, 7.4072265625, 7.98388671875, 8.560546875, 9.13720703125, 9.7138671875, 10.29052734375, 10.8671875, 11.44384765625, 12.0205078125, 12.59716796875, 13.173828125, 13.75048828125, 14.3271484375, 14.90380859375, 15.48046875, 16.05712890625, 16.6337890625, 17.21044921875, 17.787109375, 18.36376953125, 18.9404296875, 19.51708984375, 20.09375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 4.0, 9.0, 7.0, 10.0, 16.0, 23.0, 39.0, 29.0, 52.0, 95.0, 131.0, 198.0, 364.0, 793.0, 6256.0, 583838.0, 2540141.0, 11527.0, 1013.0, 421.0, 258.0, 155.0, 89.0, 63.0, 59.0, 28.0, 25.0, 17.0, 20.0, 8.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.4375, -29.27099609375, -28.1044921875, -26.93798828125, -25.771484375, -24.60498046875, -23.4384765625, -22.27197265625, -21.10546875, -19.93896484375, -18.7724609375, -17.60595703125, -16.439453125, -15.27294921875, -14.1064453125, -12.93994140625, -11.7734375, -10.60693359375, -9.4404296875, -8.27392578125, -7.107421875, -5.94091796875, -4.7744140625, -3.60791015625, -2.44140625, -1.27490234375, -0.1083984375, 1.05810546875, 2.224609375, 3.39111328125, 4.5576171875, 5.72412109375, 6.890625, 8.05712890625, 9.2236328125, 10.39013671875, 11.556640625, 12.72314453125, 13.8896484375, 15.05615234375, 16.22265625, 17.38916015625, 18.5556640625, 19.72216796875, 20.888671875, 22.05517578125, 23.2216796875, 24.38818359375, 25.5546875, 26.72119140625, 27.8876953125, 29.05419921875, 30.220703125, 31.38720703125, 32.5537109375, 33.72021484375, 34.88671875, 36.05322265625, 37.2197265625, 38.38623046875, 39.552734375, 40.71923828125, 41.8857421875, 43.05224609375, 44.21875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 514.0, 474.0, 18.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.32444763183594, -55.664268493652344, -51.004093170166016, -46.34391784667969, -41.683738708496094, -37.0235595703125, -32.36338424682617, -27.703208923339844, -23.04302978515625, -18.38285255432129, -13.722675323486328, -9.062498092651367, -4.402320861816406, 0.2578563690185547, 4.918033599853516, 9.578208923339844, 14.238388061523438, 18.8985652923584, 23.55874252319336, 28.21891975402832, 32.87909698486328, 37.539276123046875, 42.1994514465332, 46.85962677001953, 51.519805908203125, 56.17998504638672, 60.84016036987305, 65.50033569335938, 70.16051483154297, 74.82069396972656, 79.48086547851562, 84.14104461669922, 88.80122375488281, 93.4614028930664, 98.12158203125, 102.78175354003906, 107.44193267822266, 112.10211181640625, 116.76228332519531, 121.4224624633789, 126.0826416015625, 130.74281311035156, 135.4029998779297, 140.06317138671875, 144.72335815429688, 149.38352966308594, 154.043701171875, 158.70388793945312, 163.3640594482422, 168.02423095703125, 172.68441772460938, 177.34458923339844, 182.0047607421875, 186.66494750976562, 191.3251190185547, 195.98529052734375, 200.64547729492188, 205.30564880371094, 209.96583557128906, 214.62600708007812, 219.28619384765625, 223.9463653564453, 228.60653686523438, 233.2667236328125, 237.92689514160156]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 4.0, 9.0, 3.0, 9.0, 9.0, 8.0, 12.0, 15.0, 19.0, 20.0, 25.0, 24.0, 24.0, 16.0, 20.0, 26.0, 25.0, 36.0, 36.0, 39.0, 34.0, 35.0, 38.0, 46.0, 38.0, 33.0, 33.0, 32.0, 31.0, 35.0, 20.0, 36.0, 23.0, 24.0, 23.0, 24.0, 13.0, 14.0, 12.0, 6.0, 7.0, 9.0, 7.0, 7.0, 9.0, 4.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0], "bins": [-34.837284088134766, -33.746849060058594, -32.65641784667969, -31.56598472595215, -30.47555160522461, -29.38511848449707, -28.29468536376953, -27.20425033569336, -26.113819122314453, -25.023386001586914, -23.932952880859375, -22.842519760131836, -21.752086639404297, -20.661653518676758, -19.57122039794922, -18.480785369873047, -17.390352249145508, -16.29991912841797, -15.20948600769043, -14.11905288696289, -13.028619766235352, -11.938186645507812, -10.847752571105957, -9.757319450378418, -8.666886329650879, -7.57645320892334, -6.486020088195801, -5.3955864906311035, -4.3051533699035645, -3.2147202491760254, -2.124286651611328, -1.033853530883789, 0.05657958984375, 1.1470128297805786, 2.2374460697174072, 3.3278794288635254, 4.4183125495910645, 5.5087456703186035, 6.599179267883301, 7.68961238861084, 8.780045509338379, 9.870478630065918, 10.960911750793457, 12.051345825195312, 13.141778945922852, 14.23221206665039, 15.32264518737793, 16.41307830810547, 17.503511428833008, 18.593944549560547, 19.684377670288086, 20.774810791015625, 21.865243911743164, 22.955677032470703, 24.046112060546875, 25.13654327392578, 26.226978302001953, 27.317411422729492, 28.40784454345703, 29.49827766418457, 30.58871078491211, 31.67914390563965, 32.76957702636719, 33.86001205444336, 34.950443267822266]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 5.0, 6.0, 7.0, 14.0, 8.0, 7.0, 15.0, 11.0, 17.0, 21.0, 14.0, 23.0, 27.0, 31.0, 37.0, 32.0, 36.0, 40.0, 26.0, 40.0, 46.0, 42.0, 33.0, 35.0, 34.0, 31.0, 38.0, 33.0, 29.0, 28.0, 31.0, 24.0, 27.0, 18.0, 18.0, 14.0, 14.0, 17.0, 16.0, 6.0, 8.0, 9.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78125, -5.5869140625, -5.392578125, -5.1982421875, -5.00390625, -4.8095703125, -4.615234375, -4.4208984375, -4.2265625, -4.0322265625, -3.837890625, -3.6435546875, -3.44921875, -3.2548828125, -3.060546875, -2.8662109375, -2.671875, -2.4775390625, -2.283203125, -2.0888671875, -1.89453125, -1.7001953125, -1.505859375, -1.3115234375, -1.1171875, -0.9228515625, -0.728515625, -0.5341796875, -0.33984375, -0.1455078125, 0.048828125, 0.2431640625, 0.4375, 0.6318359375, 0.826171875, 1.0205078125, 1.21484375, 1.4091796875, 1.603515625, 1.7978515625, 1.9921875, 2.1865234375, 2.380859375, 2.5751953125, 2.76953125, 2.9638671875, 3.158203125, 3.3525390625, 3.546875, 3.7412109375, 3.935546875, 4.1298828125, 4.32421875, 4.5185546875, 4.712890625, 4.9072265625, 5.1015625, 5.2958984375, 5.490234375, 5.6845703125, 5.87890625, 6.0732421875, 6.267578125, 6.4619140625, 6.65625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 7.0, 8.0, 17.0, 10.0, 12.0, 25.0, 27.0, 36.0, 45.0, 88.0, 124.0, 272.0, 562.0, 1310.0, 3861.0, 14236.0, 111318.0, 2352079.0, 1626123.0, 68044.0, 10808.0, 3115.0, 1116.0, 457.0, 196.0, 126.0, 66.0, 36.0, 27.0, 23.0, 19.0, 17.0, 17.0, 10.0, 11.0, 6.0, 5.0, 7.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.484375, -16.879638671875, -16.27490234375, -15.670166015625, -15.0654296875, -14.460693359375, -13.85595703125, -13.251220703125, -12.646484375, -12.041748046875, -11.43701171875, -10.832275390625, -10.2275390625, -9.622802734375, -9.01806640625, -8.413330078125, -7.80859375, -7.203857421875, -6.59912109375, -5.994384765625, -5.3896484375, -4.784912109375, -4.18017578125, -3.575439453125, -2.970703125, -2.365966796875, -1.76123046875, -1.156494140625, -0.5517578125, 0.052978515625, 0.65771484375, 1.262451171875, 1.8671875, 2.471923828125, 3.07666015625, 3.681396484375, 4.2861328125, 4.890869140625, 5.49560546875, 6.100341796875, 6.705078125, 7.309814453125, 7.91455078125, 8.519287109375, 9.1240234375, 9.728759765625, 10.33349609375, 10.938232421875, 11.54296875, 12.147705078125, 12.75244140625, 13.357177734375, 13.9619140625, 14.566650390625, 15.17138671875, 15.776123046875, 16.380859375, 16.985595703125, 17.59033203125, 18.195068359375, 18.7998046875, 19.404541015625, 20.00927734375, 20.614013671875, 21.21875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 9.0, 3.0, 8.0, 8.0, 11.0, 13.0, 12.0, 28.0, 25.0, 29.0, 41.0, 59.0, 88.0, 127.0, 172.0, 243.0, 333.0, 471.0, 533.0, 502.0, 408.0, 267.0, 179.0, 131.0, 96.0, 73.0, 49.0, 35.0, 34.0, 18.0, 16.0, 17.0, 8.0, 11.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.696044921875, -8.39208984375, -8.088134765625, -7.7841796875, -7.480224609375, -7.17626953125, -6.872314453125, -6.568359375, -6.264404296875, -5.96044921875, -5.656494140625, -5.3525390625, -5.048583984375, -4.74462890625, -4.440673828125, -4.13671875, -3.832763671875, -3.52880859375, -3.224853515625, -2.9208984375, -2.616943359375, -2.31298828125, -2.009033203125, -1.705078125, -1.401123046875, -1.09716796875, -0.793212890625, -0.4892578125, -0.185302734375, 0.11865234375, 0.422607421875, 0.7265625, 1.030517578125, 1.33447265625, 1.638427734375, 1.9423828125, 2.246337890625, 2.55029296875, 2.854248046875, 3.158203125, 3.462158203125, 3.76611328125, 4.070068359375, 4.3740234375, 4.677978515625, 4.98193359375, 5.285888671875, 5.58984375, 5.893798828125, 6.19775390625, 6.501708984375, 6.8056640625, 7.109619140625, 7.41357421875, 7.717529296875, 8.021484375, 8.325439453125, 8.62939453125, 8.933349609375, 9.2373046875, 9.541259765625, 9.84521484375, 10.149169921875, 10.453125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 12.0, 10.0, 9.0, 18.0, 22.0, 27.0, 47.0, 68.0, 122.0, 199.0, 462.0, 951.0, 2524.0, 9882.0, 64205.0, 1255360.0, 2729127.0, 111346.0, 14171.0, 3314.0, 1189.0, 543.0, 268.0, 128.0, 87.0, 61.0, 37.0, 19.0, 25.0, 16.0, 11.0, 6.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.734375, -21.0576171875, -20.380859375, -19.7041015625, -19.02734375, -18.3505859375, -17.673828125, -16.9970703125, -16.3203125, -15.6435546875, -14.966796875, -14.2900390625, -13.61328125, -12.9365234375, -12.259765625, -11.5830078125, -10.90625, -10.2294921875, -9.552734375, -8.8759765625, -8.19921875, -7.5224609375, -6.845703125, -6.1689453125, -5.4921875, -4.8154296875, -4.138671875, -3.4619140625, -2.78515625, -2.1083984375, -1.431640625, -0.7548828125, -0.078125, 0.5986328125, 1.275390625, 1.9521484375, 2.62890625, 3.3056640625, 3.982421875, 4.6591796875, 5.3359375, 6.0126953125, 6.689453125, 7.3662109375, 8.04296875, 8.7197265625, 9.396484375, 10.0732421875, 10.75, 11.4267578125, 12.103515625, 12.7802734375, 13.45703125, 14.1337890625, 14.810546875, 15.4873046875, 16.1640625, 16.8408203125, 17.517578125, 18.1943359375, 18.87109375, 19.5478515625, 20.224609375, 20.9013671875, 21.578125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 8.0, 14.0, 63.0, 195.0, 365.0, 249.0, 94.0, 23.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.16478729248047, -119.70677185058594, -116.2487564086914, -112.79074096679688, -109.33272552490234, -105.87471008300781, -102.41669464111328, -98.95867919921875, -95.50066375732422, -92.04264831542969, -88.58463287353516, -85.12661743164062, -81.6686019897461, -78.21058654785156, -74.75257110595703, -71.2945556640625, -67.83654022216797, -64.37852478027344, -60.920509338378906, -57.462493896484375, -54.004478454589844, -50.54646301269531, -47.08844757080078, -43.63043212890625, -40.17241668701172, -36.71440124511719, -33.256385803222656, -29.798370361328125, -26.340354919433594, -22.882339477539062, -19.42432403564453, -15.96630859375, -12.508293151855469, -9.050277709960938, -5.592262268066406, -2.134246826171875, 1.3237686157226562, 4.7817840576171875, 8.239799499511719, 11.69781494140625, 15.155830383300781, 18.613845825195312, 22.071861267089844, 25.529876708984375, 28.987892150878906, 32.44590759277344, 35.90392303466797, 39.3619384765625, 42.81995391845703, 46.27796936035156, 49.735984802246094, 53.194000244140625, 56.652015686035156, 60.11003112792969, 63.56804656982422, 67.02606201171875, 70.48407745361328, 73.94209289550781, 77.40010833740234, 80.85812377929688, 84.3161392211914, 87.77415466308594, 91.23217010498047, 94.690185546875, 98.14820098876953]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 11.0, 10.0, 9.0, 8.0, 9.0, 17.0, 18.0, 23.0, 21.0, 24.0, 23.0, 26.0, 32.0, 21.0, 29.0, 29.0, 36.0, 24.0, 30.0, 48.0, 32.0, 40.0, 40.0, 38.0, 37.0, 30.0, 36.0, 29.0, 22.0, 23.0, 32.0, 33.0, 23.0, 17.0, 23.0, 18.0, 14.0, 13.0, 3.0, 11.0, 9.0, 9.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-26.51313018798828, -25.61332893371582, -24.713525772094727, -23.813724517822266, -22.913921356201172, -22.01412010192871, -21.11431884765625, -20.214515686035156, -19.314714431762695, -18.414913177490234, -17.51511001586914, -16.61530876159668, -15.715506553649902, -14.815704345703125, -13.915903091430664, -13.016100883483887, -12.11629867553711, -11.216496467590332, -10.316694259643555, -9.416893005371094, -8.517090797424316, -7.617288589477539, -6.71748685836792, -5.817685127258301, -4.917882919311523, -4.018080711364746, -3.118278980255127, -2.2184770107269287, -1.3186750411987305, -0.4188728332519531, 0.480928897857666, 1.3807306289672852, 2.2805328369140625, 3.1803348064422607, 4.080136775970459, 4.979938507080078, 5.8797407150268555, 6.779542922973633, 7.679344654083252, 8.579146385192871, 9.478948593139648, 10.378750801086426, 11.278553009033203, 12.178354263305664, 13.078156471252441, 13.977958679199219, 14.87775993347168, 15.777562141418457, 16.677364349365234, 17.577165603637695, 18.47696876525879, 19.37677001953125, 20.276573181152344, 21.176374435424805, 22.076175689697266, 22.97597885131836, 23.87578010559082, 24.77558135986328, 25.675384521484375, 26.575185775756836, 27.474987030029297, 28.37479019165039, 29.27459144592285, 30.174392700195312, 31.074195861816406]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 9.0, 15.0, 17.0, 9.0, 11.0, 14.0, 21.0, 17.0, 32.0, 21.0, 32.0, 28.0, 18.0, 40.0, 40.0, 38.0, 36.0, 39.0, 32.0, 32.0, 41.0, 33.0, 38.0, 41.0, 37.0, 32.0, 27.0, 32.0, 26.0, 28.0, 21.0, 17.0, 17.0, 13.0, 17.0, 12.0, 9.0, 7.0, 8.0, 11.0, 4.0, 8.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.234375, -6.03515625, -5.8359375, -5.63671875, -5.4375, -5.23828125, -5.0390625, -4.83984375, -4.640625, -4.44140625, -4.2421875, -4.04296875, -3.84375, -3.64453125, -3.4453125, -3.24609375, -3.046875, -2.84765625, -2.6484375, -2.44921875, -2.25, -2.05078125, -1.8515625, -1.65234375, -1.453125, -1.25390625, -1.0546875, -0.85546875, -0.65625, -0.45703125, -0.2578125, -0.05859375, 0.140625, 0.33984375, 0.5390625, 0.73828125, 0.9375, 1.13671875, 1.3359375, 1.53515625, 1.734375, 1.93359375, 2.1328125, 2.33203125, 2.53125, 2.73046875, 2.9296875, 3.12890625, 3.328125, 3.52734375, 3.7265625, 3.92578125, 4.125, 4.32421875, 4.5234375, 4.72265625, 4.921875, 5.12109375, 5.3203125, 5.51953125, 5.71875, 5.91796875, 6.1171875, 6.31640625, 6.515625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 9.0, 15.0, 25.0, 29.0, 33.0, 70.0, 97.0, 161.0, 222.0, 325.0, 479.0, 764.0, 1124.0, 1699.0, 2473.0, 3792.0, 5855.0, 8868.0, 13828.0, 21026.0, 33838.0, 55115.0, 91566.0, 150865.0, 209461.0, 170818.0, 105179.0, 63770.0, 38976.0, 23965.0, 15091.0, 9728.0, 6466.0, 4293.0, 2856.0, 1822.0, 1255.0, 837.0, 574.0, 400.0, 256.0, 180.0, 131.0, 78.0, 45.0, 34.0, 26.0, 14.0, 5.0, 9.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8173828125, -0.7907028198242188, -0.7640228271484375, -0.7373428344726562, -0.710662841796875, -0.6839828491210938, -0.6573028564453125, -0.6306228637695312, -0.60394287109375, -0.5772628784179688, -0.5505828857421875, -0.5239028930664062, -0.497222900390625, -0.47054290771484375, -0.4438629150390625, -0.41718292236328125, -0.3905029296875, -0.36382293701171875, -0.3371429443359375, -0.31046295166015625, -0.283782958984375, -0.25710296630859375, -0.2304229736328125, -0.20374298095703125, -0.17706298828125, -0.15038299560546875, -0.1237030029296875, -0.09702301025390625, -0.070343017578125, -0.04366302490234375, -0.0169830322265625, 0.00969696044921875, 0.036376953125, 0.06305694580078125, 0.0897369384765625, 0.11641693115234375, 0.143096923828125, 0.16977691650390625, 0.1964569091796875, 0.22313690185546875, 0.24981689453125, 0.27649688720703125, 0.3031768798828125, 0.32985687255859375, 0.356536865234375, 0.38321685791015625, 0.4098968505859375, 0.43657684326171875, 0.4632568359375, 0.48993682861328125, 0.5166168212890625, 0.5432968139648438, 0.569976806640625, 0.5966567993164062, 0.6233367919921875, 0.6500167846679688, 0.67669677734375, 0.7033767700195312, 0.7300567626953125, 0.7567367553710938, 0.783416748046875, 0.8100967407226562, 0.8367767333984375, 0.8634567260742188, 0.89013671875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 6.0, 6.0, 6.0, 6.0, 4.0, 5.0, 11.0, 15.0, 11.0, 11.0, 23.0, 16.0, 26.0, 14.0, 28.0, 32.0, 23.0, 28.0, 37.0, 24.0, 34.0, 38.0, 41.0, 35.0, 1056.0, 37.0, 44.0, 46.0, 36.0, 26.0, 32.0, 20.0, 23.0, 30.0, 17.0, 30.0, 25.0, 17.0, 18.0, 14.0, 15.0, 12.0, 9.0, 3.0, 7.0, 7.0, 5.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-3.947265625, -3.82916259765625, -3.7110595703125, -3.59295654296875, -3.474853515625, -3.35675048828125, -3.2386474609375, -3.12054443359375, -3.00244140625, -2.88433837890625, -2.7662353515625, -2.64813232421875, -2.530029296875, -2.41192626953125, -2.2938232421875, -2.17572021484375, -2.0576171875, -1.93951416015625, -1.8214111328125, -1.70330810546875, -1.585205078125, -1.46710205078125, -1.3489990234375, -1.23089599609375, -1.11279296875, -0.99468994140625, -0.8765869140625, -0.75848388671875, -0.640380859375, -0.52227783203125, -0.4041748046875, -0.28607177734375, -0.16796875, -0.04986572265625, 0.0682373046875, 0.18634033203125, 0.304443359375, 0.42254638671875, 0.5406494140625, 0.65875244140625, 0.77685546875, 0.89495849609375, 1.0130615234375, 1.13116455078125, 1.249267578125, 1.36737060546875, 1.4854736328125, 1.60357666015625, 1.7216796875, 1.83978271484375, 1.9578857421875, 2.07598876953125, 2.194091796875, 2.31219482421875, 2.4302978515625, 2.54840087890625, 2.66650390625, 2.78460693359375, 2.9027099609375, 3.02081298828125, 3.138916015625, 3.25701904296875, 3.3751220703125, 3.49322509765625, 3.611328125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 9.0, 6.0, 9.0, 13.0, 23.0, 30.0, 51.0, 66.0, 124.0, 198.0, 330.0, 490.0, 734.0, 1227.0, 1997.0, 3299.0, 5399.0, 8884.0, 14799.0, 25152.0, 42918.0, 74204.0, 129930.0, 240808.0, 1223232.0, 134986.0, 77447.0, 45035.0, 26078.0, 15774.0, 9265.0, 5676.0, 3469.0, 2022.0, 1263.0, 800.0, 528.0, 295.0, 184.0, 141.0, 86.0, 51.0, 45.0, 18.0, 13.0, 9.0, 3.0, 7.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.810546875, -0.7867355346679688, -0.7629241943359375, -0.7391128540039062, -0.715301513671875, -0.6914901733398438, -0.6676788330078125, -0.6438674926757812, -0.62005615234375, -0.5962448120117188, -0.5724334716796875, -0.5486221313476562, -0.524810791015625, -0.5009994506835938, -0.4771881103515625, -0.45337677001953125, -0.4295654296875, -0.40575408935546875, -0.3819427490234375, -0.35813140869140625, -0.334320068359375, -0.31050872802734375, -0.2866973876953125, -0.26288604736328125, -0.23907470703125, -0.21526336669921875, -0.1914520263671875, -0.16764068603515625, -0.143829345703125, -0.12001800537109375, -0.0962066650390625, -0.07239532470703125, -0.048583984375, -0.02477264404296875, -0.0009613037109375, 0.02285003662109375, 0.046661376953125, 0.07047271728515625, 0.0942840576171875, 0.11809539794921875, 0.14190673828125, 0.16571807861328125, 0.1895294189453125, 0.21334075927734375, 0.237152099609375, 0.26096343994140625, 0.2847747802734375, 0.30858612060546875, 0.3323974609375, 0.35620880126953125, 0.3800201416015625, 0.40383148193359375, 0.427642822265625, 0.45145416259765625, 0.4752655029296875, 0.49907684326171875, 0.52288818359375, 0.5466995239257812, 0.5705108642578125, 0.5943222045898438, 0.618133544921875, 0.6419448852539062, 0.6657562255859375, 0.6895675659179688, 0.71337890625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 10.0, 12.0, 19.0, 18.0, 23.0, 42.0, 55.0, 56.0, 53.0, 67.0, 72.0, 85.0, 68.0, 74.0, 53.0, 62.0, 45.0, 33.0, 37.0, 20.0, 17.0, 14.0, 20.0, 7.0, 2.0, 6.0, 7.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028076171875, -0.002715975046157837, -0.002624332904815674, -0.0025326907634735107, -0.0024410486221313477, -0.0023494064807891846, -0.0022577643394470215, -0.0021661221981048584, -0.0020744800567626953, -0.0019828379154205322, -0.0018911957740783691, -0.001799553632736206, -0.001707911491394043, -0.0016162693500518799, -0.0015246272087097168, -0.0014329850673675537, -0.0013413429260253906, -0.0012497007846832275, -0.0011580586433410645, -0.0010664165019989014, -0.0009747743606567383, -0.0008831322193145752, -0.0007914900779724121, -0.000699847936630249, -0.0006082057952880859, -0.0005165636539459229, -0.00042492151260375977, -0.0003332793712615967, -0.0002416372299194336, -0.0001499950885772705, -5.835294723510742e-05, 3.3289194107055664e-05, 0.00012493133544921875, 0.00021657347679138184, 0.0003082156181335449, 0.000399857759475708, 0.0004914999008178711, 0.0005831420421600342, 0.0006747841835021973, 0.0007664263248443604, 0.0008580684661865234, 0.0009497106075286865, 0.0010413527488708496, 0.0011329948902130127, 0.0012246370315551758, 0.0013162791728973389, 0.001407921314239502, 0.001499563455581665, 0.0015912055969238281, 0.0016828477382659912, 0.0017744898796081543, 0.0018661320209503174, 0.0019577741622924805, 0.0020494163036346436, 0.0021410584449768066, 0.0022327005863189697, 0.002324342727661133, 0.002415984869003296, 0.002507627010345459, 0.002599269151687622, 0.002690911293029785, 0.0027825534343719482, 0.0028741955757141113, 0.0029658377170562744, 0.0030574798583984375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 6.0, 8.0, 9.0, 11.0, 20.0, 24.0, 27.0, 54.0, 52.0, 66.0, 92.0, 141.0, 222.0, 425.0, 1038.0, 203211.0, 840326.0, 1555.0, 460.0, 262.0, 165.0, 83.0, 86.0, 65.0, 38.0, 17.0, 24.0, 10.0, 13.0, 8.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06024169921875, -0.05842161178588867, -0.056601524353027344, -0.054781436920166016, -0.05296134948730469, -0.05114126205444336, -0.04932117462158203, -0.0475010871887207, -0.045680999755859375, -0.04386091232299805, -0.04204082489013672, -0.04022073745727539, -0.03840065002441406, -0.036580562591552734, -0.034760475158691406, -0.03294038772583008, -0.03112030029296875, -0.029300212860107422, -0.027480125427246094, -0.025660037994384766, -0.023839950561523438, -0.02201986312866211, -0.02019977569580078, -0.018379688262939453, -0.016559600830078125, -0.014739513397216797, -0.012919425964355469, -0.01109933853149414, -0.009279251098632812, -0.007459163665771484, -0.005639076232910156, -0.003818988800048828, -0.0019989013671875, -0.00017881393432617188, 0.0016412734985351562, 0.0034613609313964844, 0.0052814483642578125, 0.007101535797119141, 0.008921623229980469, 0.010741710662841797, 0.012561798095703125, 0.014381885528564453, 0.01620197296142578, 0.01802206039428711, 0.019842147827148438, 0.021662235260009766, 0.023482322692871094, 0.025302410125732422, 0.02712249755859375, 0.028942584991455078, 0.030762672424316406, 0.032582759857177734, 0.03440284729003906, 0.03622293472290039, 0.03804302215576172, 0.03986310958862305, 0.041683197021484375, 0.0435032844543457, 0.04532337188720703, 0.04714345932006836, 0.04896354675292969, 0.050783634185791016, 0.052603721618652344, 0.05442380905151367, 0.056243896484375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 11.0, 36.0, 120.0, 277.0, 344.0, 165.0, 44.0, 10.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007026367820799351, -0.0005662731127813458, -0.00042990950169041753, -0.00029354586149565876, -0.00015718222130089998, -2.0818552002310753e-05, 0.00011554505908861756, 0.0002519086701795459, 0.0003882723394781351, 0.0005246360087767243, 0.0006609996198676527, 0.000797363230958581, 0.0009337269002571702, 0.0010700905695557594, 0.0012064541224390268, 0.001342817791737616, 0.0014791814610362053, 0.0016155451303347945, 0.0017519087996333838, 0.0018882723525166512, 0.002024636138230562, 0.0021609996911138296, 0.002297363243997097, 0.002433727029711008, 0.0025700905825942755, 0.002706454135477543, 0.002842817921191454, 0.0029791814740747213, 0.0031155450269579887, 0.0032519088126719, 0.003388272365555167, 0.0035246359184384346, 0.0036609992384910583, 0.0037973627913743258, 0.003933726344257593, 0.004070090129971504, 0.004206453915685415, 0.004342817701399326, 0.00447918102145195, 0.004615544807165861, 0.004751908592879772, 0.004888272378593683, 0.005024635698646307, 0.005160999484360218, 0.005297363270074129, 0.00543372705578804, 0.005570090375840664, 0.005706454161554575, 0.005842817481607199, 0.00597918126732111, 0.0061155445873737335, 0.006251908373087645, 0.006388272158801556, 0.006524635478854179, 0.0066609992645680904, 0.0067973630502820015, 0.006933726370334625, 0.007070090156048536, 0.00720645347610116, 0.007342817261815071, 0.007479181047528982, 0.007615544833242893, 0.007751908153295517, 0.00788827147334814, 0.008024635724723339]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 3.0, 8.0, 11.0, 9.0, 19.0, 14.0, 12.0, 10.0, 18.0, 14.0, 25.0, 15.0, 29.0, 27.0, 43.0, 29.0, 30.0, 38.0, 39.0, 43.0, 44.0, 40.0, 43.0, 47.0, 32.0, 33.0, 37.0, 40.0, 27.0, 22.0, 33.0, 23.0, 22.0, 15.0, 26.0, 15.0, 14.0, 11.0, 7.0, 9.0, 8.0, 4.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013598799705505371, -0.0013212459161877632, -0.0012826118618249893, -0.0012439778074622154, -0.0012053437530994415, -0.0011667096987366676, -0.0011280756443738937, -0.0010894415900111198, -0.001050807535648346, -0.001012173481285572, -0.0009735394269227982, -0.0009349053725600243, -0.0008962713181972504, -0.0008576372638344765, -0.0008190032094717026, -0.0007803691551089287, -0.0007417351007461548, -0.0007031010463833809, -0.000664466992020607, -0.0006258329376578331, -0.0005871988832950592, -0.0005485648289322853, -0.0005099307745695114, -0.0004712967202067375, -0.0004326626658439636, -0.00039402861148118973, -0.00035539455711841583, -0.00031676050275564194, -0.00027812644839286804, -0.00023949239403009415, -0.00020085833966732025, -0.00016222428530454636, -0.00012359023094177246, -8.495617657899857e-05, -4.632212221622467e-05, -7.688067853450775e-06, 3.094598650932312e-05, 6.958004087209702e-05, 0.00010821409523487091, 0.0001468481495976448, 0.0001854822039604187, 0.0002241162583231926, 0.0002627503126859665, 0.0003013843670487404, 0.0003400184214115143, 0.0003786524757742882, 0.00041728653013706207, 0.00045592058449983597, 0.0004945546388626099, 0.0005331886932253838, 0.0005718227475881577, 0.0006104568019509315, 0.0006490908563137054, 0.0006877249106764793, 0.0007263589650392532, 0.0007649930194020271, 0.000803627073764801, 0.0008422611281275749, 0.0008808951824903488, 0.0009195292368531227, 0.0009581632912158966, 0.0009967973455786705, 0.0010354313999414444, 0.0010740654543042183, 0.0011126995086669922]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 9.0, 15.0, 17.0, 9.0, 11.0, 14.0, 21.0, 17.0, 32.0, 21.0, 32.0, 28.0, 18.0, 40.0, 40.0, 38.0, 36.0, 39.0, 32.0, 32.0, 41.0, 33.0, 38.0, 41.0, 37.0, 32.0, 27.0, 32.0, 26.0, 28.0, 21.0, 17.0, 17.0, 13.0, 17.0, 12.0, 9.0, 7.0, 8.0, 11.0, 4.0, 8.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.234375, -6.03515625, -5.8359375, -5.63671875, -5.4375, -5.23828125, -5.0390625, -4.83984375, -4.640625, -4.44140625, -4.2421875, -4.04296875, -3.84375, -3.64453125, -3.4453125, -3.24609375, -3.046875, -2.84765625, -2.6484375, -2.44921875, -2.25, -2.05078125, -1.8515625, -1.65234375, -1.453125, -1.25390625, -1.0546875, -0.85546875, -0.65625, -0.45703125, -0.2578125, -0.05859375, 0.140625, 0.33984375, 0.5390625, 0.73828125, 0.9375, 1.13671875, 1.3359375, 1.53515625, 1.734375, 1.93359375, 2.1328125, 2.33203125, 2.53125, 2.73046875, 2.9296875, 3.12890625, 3.328125, 3.52734375, 3.7265625, 3.92578125, 4.125, 4.32421875, 4.5234375, 4.72265625, 4.921875, 5.12109375, 5.3203125, 5.51953125, 5.71875, 5.91796875, 6.1171875, 6.31640625, 6.515625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 13.0, 14.0, 13.0, 34.0, 34.0, 49.0, 70.0, 102.0, 101.0, 172.0, 240.0, 344.0, 457.0, 665.0, 1062.0, 1912.0, 3571.0, 7290.0, 17513.0, 46002.0, 136100.0, 388499.0, 290937.0, 94208.0, 33127.0, 12872.0, 5707.0, 2863.0, 1537.0, 946.0, 615.0, 413.0, 288.0, 232.0, 144.0, 112.0, 99.0, 55.0, 41.0, 31.0, 19.0, 20.0, 11.0, 7.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.9921875, -7.748779296875, -7.50537109375, -7.261962890625, -7.0185546875, -6.775146484375, -6.53173828125, -6.288330078125, -6.044921875, -5.801513671875, -5.55810546875, -5.314697265625, -5.0712890625, -4.827880859375, -4.58447265625, -4.341064453125, -4.09765625, -3.854248046875, -3.61083984375, -3.367431640625, -3.1240234375, -2.880615234375, -2.63720703125, -2.393798828125, -2.150390625, -1.906982421875, -1.66357421875, -1.420166015625, -1.1767578125, -0.933349609375, -0.68994140625, -0.446533203125, -0.203125, 0.040283203125, 0.28369140625, 0.527099609375, 0.7705078125, 1.013916015625, 1.25732421875, 1.500732421875, 1.744140625, 1.987548828125, 2.23095703125, 2.474365234375, 2.7177734375, 2.961181640625, 3.20458984375, 3.447998046875, 3.69140625, 3.934814453125, 4.17822265625, 4.421630859375, 4.6650390625, 4.908447265625, 5.15185546875, 5.395263671875, 5.638671875, 5.882080078125, 6.12548828125, 6.368896484375, 6.6123046875, 6.855712890625, 7.09912109375, 7.342529296875, 7.5859375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 3.0, 6.0, 1.0, 3.0, 7.0, 12.0, 11.0, 16.0, 12.0, 18.0, 13.0, 23.0, 18.0, 27.0, 34.0, 30.0, 36.0, 58.0, 71.0, 77.0, 152.0, 1402.0, 370.0, 155.0, 91.0, 62.0, 41.0, 61.0, 28.0, 34.0, 31.0, 32.0, 22.0, 15.0, 18.0, 8.0, 9.0, 9.0, 9.0, 4.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-18.421875, -17.879638671875, -17.33740234375, -16.795166015625, -16.2529296875, -15.710693359375, -15.16845703125, -14.626220703125, -14.083984375, -13.541748046875, -12.99951171875, -12.457275390625, -11.9150390625, -11.372802734375, -10.83056640625, -10.288330078125, -9.74609375, -9.203857421875, -8.66162109375, -8.119384765625, -7.5771484375, -7.034912109375, -6.49267578125, -5.950439453125, -5.408203125, -4.865966796875, -4.32373046875, -3.781494140625, -3.2392578125, -2.697021484375, -2.15478515625, -1.612548828125, -1.0703125, -0.528076171875, 0.01416015625, 0.556396484375, 1.0986328125, 1.640869140625, 2.18310546875, 2.725341796875, 3.267578125, 3.809814453125, 4.35205078125, 4.894287109375, 5.4365234375, 5.978759765625, 6.52099609375, 7.063232421875, 7.60546875, 8.147705078125, 8.68994140625, 9.232177734375, 9.7744140625, 10.316650390625, 10.85888671875, 11.401123046875, 11.943359375, 12.485595703125, 13.02783203125, 13.570068359375, 14.1123046875, 14.654541015625, 15.19677734375, 15.739013671875, 16.28125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 4.0, 9.0, 6.0, 16.0, 17.0, 16.0, 23.0, 27.0, 32.0, 40.0, 41.0, 78.0, 118.0, 164.0, 222.0, 372.0, 667.0, 2887.0, 50415.0, 2964031.0, 119874.0, 4577.0, 837.0, 373.0, 234.0, 149.0, 118.0, 82.0, 64.0, 56.0, 33.0, 24.0, 31.0, 16.0, 9.0, 6.0, 9.0, 7.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-27.125, -26.1767578125, -25.228515625, -24.2802734375, -23.33203125, -22.3837890625, -21.435546875, -20.4873046875, -19.5390625, -18.5908203125, -17.642578125, -16.6943359375, -15.74609375, -14.7978515625, -13.849609375, -12.9013671875, -11.953125, -11.0048828125, -10.056640625, -9.1083984375, -8.16015625, -7.2119140625, -6.263671875, -5.3154296875, -4.3671875, -3.4189453125, -2.470703125, -1.5224609375, -0.57421875, 0.3740234375, 1.322265625, 2.2705078125, 3.21875, 4.1669921875, 5.115234375, 6.0634765625, 7.01171875, 7.9599609375, 8.908203125, 9.8564453125, 10.8046875, 11.7529296875, 12.701171875, 13.6494140625, 14.59765625, 15.5458984375, 16.494140625, 17.4423828125, 18.390625, 19.3388671875, 20.287109375, 21.2353515625, 22.18359375, 23.1318359375, 24.080078125, 25.0283203125, 25.9765625, 26.9248046875, 27.873046875, 28.8212890625, 29.76953125, 30.7177734375, 31.666015625, 32.6142578125, 33.5625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.0, 832.0, 128.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.935203552246094, -56.08351135253906, -50.23181915283203, -44.380123138427734, -38.5284309387207, -32.67673873901367, -26.825042724609375, -20.973350524902344, -15.121658325195312, -9.269965171813965, -3.418272018432617, 2.433422088623047, 8.285114288330078, 14.13680648803711, 19.988502502441406, 25.840194702148438, 31.69188690185547, 37.5435791015625, 43.39527130126953, 49.24696731567383, 55.09865951538086, 60.95035171508789, 66.80204772949219, 72.65373992919922, 78.50543212890625, 84.35712432861328, 90.20881652832031, 96.06051635742188, 101.91220092773438, 107.76390075683594, 113.61559295654297, 119.46728515625, 125.3189697265625, 131.17066955566406, 137.02235412597656, 142.87405395507812, 148.72573852539062, 154.5774383544922, 160.42913818359375, 166.28082275390625, 172.13250732421875, 177.9842071533203, 183.8358917236328, 189.68759155273438, 195.53927612304688, 201.39097595214844, 207.24267578125, 213.0943603515625, 218.94606018066406, 224.79776000976562, 230.64944458007812, 236.5011444091797, 242.3528289794922, 248.20452880859375, 254.05621337890625, 259.90789794921875, 265.7596130371094, 271.6112976074219, 277.4630126953125, 283.314697265625, 289.1663818359375, 295.01806640625, 300.8697814941406, 306.7214660644531, 312.5731506347656]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 3.0, 9.0, 10.0, 15.0, 12.0, 7.0, 16.0, 20.0, 25.0, 22.0, 36.0, 33.0, 23.0, 35.0, 41.0, 49.0, 32.0, 47.0, 36.0, 46.0, 54.0, 33.0, 34.0, 36.0, 30.0, 30.0, 36.0, 32.0, 26.0, 25.0, 29.0, 26.0, 27.0, 12.0, 12.0, 7.0, 7.0, 3.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.90922546386719, -37.681705474853516, -36.45418930053711, -35.22666931152344, -33.99915313720703, -32.77163314819336, -31.544113159179688, -30.31659507751465, -29.08907699584961, -27.86155891418457, -26.63404083251953, -25.40652084350586, -24.17900276184082, -22.95148468017578, -21.72396469116211, -20.49644660949707, -19.26892852783203, -18.041410446166992, -16.813892364501953, -15.586372375488281, -14.358854293823242, -13.131336212158203, -11.903817176818848, -10.676298141479492, -9.448780059814453, -8.221261978149414, -6.993742942810059, -5.766224384307861, -4.538705825805664, -3.311187267303467, -2.0836687088012695, -0.8561496734619141, 0.3713645935058594, 1.5988831520080566, 2.826401710510254, 4.053920269012451, 5.281438827514648, 6.508957386016846, 7.736475944519043, 8.963994979858398, 10.191513061523438, 11.419031143188477, 12.646550178527832, 13.874069213867188, 15.101587295532227, 16.329105377197266, 17.556625366210938, 18.784143447875977, 20.011661529541016, 21.239179611206055, 22.466697692871094, 23.694217681884766, 24.921735763549805, 26.149253845214844, 27.376773834228516, 28.604291915893555, 29.831809997558594, 31.059328079223633, 32.28684616088867, 33.514366149902344, 34.74188232421875, 35.96940231323242, 37.196922302246094, 38.4244384765625, 39.65195846557617]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 6.0, 3.0, 12.0, 15.0, 12.0, 9.0, 13.0, 25.0, 23.0, 26.0, 36.0, 22.0, 33.0, 37.0, 33.0, 46.0, 46.0, 42.0, 40.0, 37.0, 40.0, 39.0, 35.0, 47.0, 49.0, 29.0, 35.0, 30.0, 29.0, 16.0, 26.0, 16.0, 17.0, 17.0, 11.0, 15.0, 11.0, 10.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.64453125, -6.42071533203125, -6.1968994140625, -5.97308349609375, -5.749267578125, -5.52545166015625, -5.3016357421875, -5.07781982421875, -4.85400390625, -4.63018798828125, -4.4063720703125, -4.18255615234375, -3.958740234375, -3.73492431640625, -3.5111083984375, -3.28729248046875, -3.0634765625, -2.83966064453125, -2.6158447265625, -2.39202880859375, -2.168212890625, -1.94439697265625, -1.7205810546875, -1.49676513671875, -1.27294921875, -1.04913330078125, -0.8253173828125, -0.60150146484375, -0.377685546875, -0.15386962890625, 0.0699462890625, 0.29376220703125, 0.517578125, 0.74139404296875, 0.9652099609375, 1.18902587890625, 1.412841796875, 1.63665771484375, 1.8604736328125, 2.08428955078125, 2.30810546875, 2.53192138671875, 2.7557373046875, 2.97955322265625, 3.203369140625, 3.42718505859375, 3.6510009765625, 3.87481689453125, 4.0986328125, 4.32244873046875, 4.5462646484375, 4.77008056640625, 4.993896484375, 5.21771240234375, 5.4415283203125, 5.66534423828125, 5.88916015625, 6.11297607421875, 6.3367919921875, 6.56060791015625, 6.784423828125, 7.00823974609375, 7.2320556640625, 7.45587158203125, 7.6796875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 11.0, 4.0, 11.0, 14.0, 19.0, 11.0, 28.0, 39.0, 44.0, 59.0, 67.0, 105.0, 131.0, 219.0, 278.0, 395.0, 477.0, 3671.0, 4185128.0, 1776.0, 468.0, 335.0, 261.0, 192.0, 135.0, 93.0, 77.0, 47.0, 34.0, 31.0, 27.0, 26.0, 22.0, 10.0, 7.0, 9.0, 4.0, 9.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.375, -146.23046875, -141.0859375, -135.94140625, -130.796875, -125.65234375, -120.5078125, -115.36328125, -110.21875, -105.07421875, -99.9296875, -94.78515625, -89.640625, -84.49609375, -79.3515625, -74.20703125, -69.0625, -63.91796875, -58.7734375, -53.62890625, -48.484375, -43.33984375, -38.1953125, -33.05078125, -27.90625, -22.76171875, -17.6171875, -12.47265625, -7.328125, -2.18359375, 2.9609375, 8.10546875, 13.25, 18.39453125, 23.5390625, 28.68359375, 33.828125, 38.97265625, 44.1171875, 49.26171875, 54.40625, 59.55078125, 64.6953125, 69.83984375, 74.984375, 80.12890625, 85.2734375, 90.41796875, 95.5625, 100.70703125, 105.8515625, 110.99609375, 116.140625, 121.28515625, 126.4296875, 131.57421875, 136.71875, 141.86328125, 147.0078125, 152.15234375, 157.296875, 162.44140625, 167.5859375, 172.73046875, 177.875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 17.0, 14.0, 25.0, 49.0, 83.0, 121.0, 270.0, 508.0, 1006.0, 1008.0, 459.0, 226.0, 110.0, 61.0, 37.0, 33.0, 11.0, 10.0, 6.0, 3.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.046875, -14.418212890625, -13.78955078125, -13.160888671875, -12.5322265625, -11.903564453125, -11.27490234375, -10.646240234375, -10.017578125, -9.388916015625, -8.76025390625, -8.131591796875, -7.5029296875, -6.874267578125, -6.24560546875, -5.616943359375, -4.98828125, -4.359619140625, -3.73095703125, -3.102294921875, -2.4736328125, -1.844970703125, -1.21630859375, -0.587646484375, 0.041015625, 0.669677734375, 1.29833984375, 1.927001953125, 2.5556640625, 3.184326171875, 3.81298828125, 4.441650390625, 5.0703125, 5.698974609375, 6.32763671875, 6.956298828125, 7.5849609375, 8.213623046875, 8.84228515625, 9.470947265625, 10.099609375, 10.728271484375, 11.35693359375, 11.985595703125, 12.6142578125, 13.242919921875, 13.87158203125, 14.500244140625, 15.12890625, 15.757568359375, 16.38623046875, 17.014892578125, 17.6435546875, 18.272216796875, 18.90087890625, 19.529541015625, 20.158203125, 20.786865234375, 21.41552734375, 22.044189453125, 22.6728515625, 23.301513671875, 23.93017578125, 24.558837890625, 25.1875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 17.0, 19.0, 21.0, 14.0, 31.0, 37.0, 65.0, 83.0, 117.0, 479.0, 99437.0, 4092251.0, 1212.0, 172.0, 92.0, 52.0, 48.0, 36.0, 25.0, 17.0, 19.0, 16.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.0, -140.32421875, -136.6484375, -132.97265625, -129.296875, -125.62109375, -121.9453125, -118.26953125, -114.59375, -110.91796875, -107.2421875, -103.56640625, -99.890625, -96.21484375, -92.5390625, -88.86328125, -85.1875, -81.51171875, -77.8359375, -74.16015625, -70.484375, -66.80859375, -63.1328125, -59.45703125, -55.78125, -52.10546875, -48.4296875, -44.75390625, -41.078125, -37.40234375, -33.7265625, -30.05078125, -26.375, -22.69921875, -19.0234375, -15.34765625, -11.671875, -7.99609375, -4.3203125, -0.64453125, 3.03125, 6.70703125, 10.3828125, 14.05859375, 17.734375, 21.41015625, 25.0859375, 28.76171875, 32.4375, 36.11328125, 39.7890625, 43.46484375, 47.140625, 50.81640625, 54.4921875, 58.16796875, 61.84375, 65.51953125, 69.1953125, 72.87109375, 76.546875, 80.22265625, 83.8984375, 87.57421875, 91.25]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 44.0, 430.0, 460.0, 75.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.61212158203125, -81.81055450439453, -76.00898742675781, -70.20741271972656, -64.40585327148438, -58.60428237915039, -52.802711486816406, -47.00114440917969, -41.19957733154297, -35.39801025390625, -29.5964412689209, -23.794872283935547, -17.993305206298828, -12.19173812866211, -6.390167236328125, -0.5886001586914062, 5.2129669189453125, 11.014534950256348, 16.816102981567383, 22.617671966552734, 28.419239044189453, 34.22080612182617, 40.022377014160156, 45.823944091796875, 51.625511169433594, 57.42707824707031, 63.22864532470703, 69.03021240234375, 74.831787109375, 80.63334655761719, 86.43492126464844, 92.23648834228516, 98.03805541992188, 103.8396224975586, 109.64118957519531, 115.44276428222656, 121.24432373046875, 127.0458984375, 132.84747314453125, 138.64903259277344, 144.45059204101562, 150.25216674804688, 156.05372619628906, 161.8553009033203, 167.6568603515625, 173.45843505859375, 179.260009765625, 185.0615692138672, 190.86314392089844, 196.6647186279297, 202.46627807617188, 208.26785278320312, 214.0694122314453, 219.87098693847656, 225.67254638671875, 231.47412109375, 237.27569580078125, 243.0772705078125, 248.8788299560547, 254.68040466308594, 260.4819641113281, 266.2835388183594, 272.0851135253906, 277.88665771484375, 283.688232421875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 10.0, 14.0, 15.0, 18.0, 18.0, 21.0, 27.0, 24.0, 21.0, 33.0, 32.0, 46.0, 49.0, 36.0, 44.0, 51.0, 34.0, 49.0, 55.0, 44.0, 43.0, 29.0, 29.0, 32.0, 32.0, 30.0, 21.0, 24.0, 15.0, 19.0, 14.0, 19.0, 6.0, 6.0, 8.0, 6.0, 6.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-42.53916931152344, -41.313228607177734, -40.08728790283203, -38.861351013183594, -37.63541030883789, -36.40946960449219, -35.183528900146484, -33.95758819580078, -32.731651306152344, -31.50571060180664, -30.27977180480957, -29.053831100463867, -27.827892303466797, -26.601951599121094, -25.37601089477539, -24.15007209777832, -22.924131393432617, -21.698190689086914, -20.472251892089844, -19.24631118774414, -18.02037239074707, -16.794431686401367, -15.56849193572998, -14.342552185058594, -13.116612434387207, -11.89067268371582, -10.664732933044434, -9.438793182373047, -8.212852478027344, -6.986913204193115, -5.76097297668457, -4.535033226013184, -3.309093475341797, -2.08315372467041, -0.8572137355804443, 0.3687262535095215, 1.5946660041809082, 2.820605754852295, 4.04654598236084, 5.272485733032227, 6.498425483703613, 7.724365234375, 8.950304985046387, 10.176244735717773, 11.402185440063477, 12.628124237060547, 13.85406494140625, 15.080004692077637, 16.305944442749023, 17.531885147094727, 18.757823944091797, 19.9837646484375, 21.20970344543457, 22.435644149780273, 23.661582946777344, 24.887523651123047, 26.11346435546875, 27.339405059814453, 28.565343856811523, 29.791284561157227, 31.017223358154297, 32.2431640625, 33.4691047668457, 34.695045471191406, 35.920982360839844]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 7.0, 7.0, 8.0, 9.0, 14.0, 20.0, 26.0, 22.0, 23.0, 32.0, 33.0, 30.0, 28.0, 34.0, 37.0, 36.0, 48.0, 55.0, 43.0, 45.0, 41.0, 24.0, 32.0, 41.0, 38.0, 30.0, 22.0, 33.0, 27.0, 29.0, 24.0, 22.0, 17.0, 19.0, 9.0, 3.0, 2.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.51171875, -6.2928466796875, -6.073974609375, -5.8551025390625, -5.63623046875, -5.4173583984375, -5.198486328125, -4.9796142578125, -4.7607421875, -4.5418701171875, -4.322998046875, -4.1041259765625, -3.88525390625, -3.6663818359375, -3.447509765625, -3.2286376953125, -3.009765625, -2.7908935546875, -2.572021484375, -2.3531494140625, -2.13427734375, -1.9154052734375, -1.696533203125, -1.4776611328125, -1.2587890625, -1.0399169921875, -0.821044921875, -0.6021728515625, -0.38330078125, -0.1644287109375, 0.054443359375, 0.2733154296875, 0.4921875, 0.7110595703125, 0.929931640625, 1.1488037109375, 1.36767578125, 1.5865478515625, 1.805419921875, 2.0242919921875, 2.2431640625, 2.4620361328125, 2.680908203125, 2.8997802734375, 3.11865234375, 3.3375244140625, 3.556396484375, 3.7752685546875, 3.994140625, 4.2130126953125, 4.431884765625, 4.6507568359375, 4.86962890625, 5.0885009765625, 5.307373046875, 5.5262451171875, 5.7451171875, 5.9639892578125, 6.182861328125, 6.4017333984375, 6.62060546875, 6.8394775390625, 7.058349609375, 7.2772216796875, 7.49609375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 16.0, 9.0, 12.0, 20.0, 50.0, 58.0, 91.0, 170.0, 246.0, 338.0, 492.0, 718.0, 1007.0, 1479.0, 2085.0, 2942.0, 4389.0, 6360.0, 9391.0, 13893.0, 20580.0, 31233.0, 48640.0, 80304.0, 138135.0, 213606.0, 182488.0, 107490.0, 63208.0, 39778.0, 25661.0, 17148.0, 11458.0, 7689.0, 5388.0, 3657.0, 2525.0, 1803.0, 1278.0, 859.0, 628.0, 435.0, 295.0, 176.0, 126.0, 65.0, 49.0, 27.0, 15.0, 13.0, 8.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.84326171875, -0.8167190551757812, -0.7901763916015625, -0.7636337280273438, -0.737091064453125, -0.7105484008789062, -0.6840057373046875, -0.6574630737304688, -0.63092041015625, -0.6043777465820312, -0.5778350830078125, -0.5512924194335938, -0.524749755859375, -0.49820709228515625, -0.4716644287109375, -0.44512176513671875, -0.4185791015625, -0.39203643798828125, -0.3654937744140625, -0.33895111083984375, -0.312408447265625, -0.28586578369140625, -0.2593231201171875, -0.23278045654296875, -0.20623779296875, -0.17969512939453125, -0.1531524658203125, -0.12660980224609375, -0.100067138671875, -0.07352447509765625, -0.0469818115234375, -0.02043914794921875, 0.006103515625, 0.03264617919921875, 0.0591888427734375, 0.08573150634765625, 0.112274169921875, 0.13881683349609375, 0.1653594970703125, 0.19190216064453125, 0.21844482421875, 0.24498748779296875, 0.2715301513671875, 0.29807281494140625, 0.324615478515625, 0.35115814208984375, 0.3777008056640625, 0.40424346923828125, 0.4307861328125, 0.45732879638671875, 0.4838714599609375, 0.5104141235351562, 0.536956787109375, 0.5634994506835938, 0.5900421142578125, 0.6165847778320312, 0.64312744140625, 0.6696701049804688, 0.6962127685546875, 0.7227554321289062, 0.749298095703125, 0.7758407592773438, 0.8023834228515625, 0.8289260864257812, 0.85546875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 10.0, 5.0, 14.0, 11.0, 10.0, 13.0, 14.0, 18.0, 24.0, 19.0, 27.0, 26.0, 35.0, 39.0, 33.0, 40.0, 43.0, 48.0, 38.0, 1062.0, 39.0, 39.0, 38.0, 40.0, 22.0, 34.0, 29.0, 31.0, 27.0, 30.0, 31.0, 25.0, 21.0, 16.0, 10.0, 14.0, 11.0, 14.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.9454345703125, -3.816650390625, -3.6878662109375, -3.55908203125, -3.4302978515625, -3.301513671875, -3.1727294921875, -3.0439453125, -2.9151611328125, -2.786376953125, -2.6575927734375, -2.52880859375, -2.4000244140625, -2.271240234375, -2.1424560546875, -2.013671875, -1.8848876953125, -1.756103515625, -1.6273193359375, -1.49853515625, -1.3697509765625, -1.240966796875, -1.1121826171875, -0.9833984375, -0.8546142578125, -0.725830078125, -0.5970458984375, -0.46826171875, -0.3394775390625, -0.210693359375, -0.0819091796875, 0.046875, 0.1756591796875, 0.304443359375, 0.4332275390625, 0.56201171875, 0.6907958984375, 0.819580078125, 0.9483642578125, 1.0771484375, 1.2059326171875, 1.334716796875, 1.4635009765625, 1.59228515625, 1.7210693359375, 1.849853515625, 1.9786376953125, 2.107421875, 2.2362060546875, 2.364990234375, 2.4937744140625, 2.62255859375, 2.7513427734375, 2.880126953125, 3.0089111328125, 3.1376953125, 3.2664794921875, 3.395263671875, 3.5240478515625, 3.65283203125, 3.7816162109375, 3.910400390625, 4.0391845703125, 4.16796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 13.0, 25.0, 26.0, 54.0, 57.0, 100.0, 167.0, 264.0, 440.0, 700.0, 1215.0, 2009.0, 3298.0, 5706.0, 10047.0, 17603.0, 31345.0, 57347.0, 107622.0, 197239.0, 1295831.0, 166805.0, 89077.0, 48082.0, 26513.0, 14989.0, 8668.0, 4935.0, 2780.0, 1663.0, 992.0, 585.0, 361.0, 193.0, 141.0, 86.0, 49.0, 33.0, 24.0, 13.0, 9.0, 7.0, 6.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73193359375, -0.70611572265625, -0.6802978515625, -0.65447998046875, -0.628662109375, -0.60284423828125, -0.5770263671875, -0.55120849609375, -0.525390625, -0.49957275390625, -0.4737548828125, -0.44793701171875, -0.422119140625, -0.39630126953125, -0.3704833984375, -0.34466552734375, -0.31884765625, -0.29302978515625, -0.2672119140625, -0.24139404296875, -0.215576171875, -0.18975830078125, -0.1639404296875, -0.13812255859375, -0.1123046875, -0.08648681640625, -0.0606689453125, -0.03485107421875, -0.009033203125, 0.01678466796875, 0.0426025390625, 0.06842041015625, 0.09423828125, 0.12005615234375, 0.1458740234375, 0.17169189453125, 0.197509765625, 0.22332763671875, 0.2491455078125, 0.27496337890625, 0.30078125, 0.32659912109375, 0.3524169921875, 0.37823486328125, 0.404052734375, 0.42987060546875, 0.4556884765625, 0.48150634765625, 0.50732421875, 0.53314208984375, 0.5589599609375, 0.58477783203125, 0.610595703125, 0.63641357421875, 0.6622314453125, 0.68804931640625, 0.7138671875, 0.73968505859375, 0.7655029296875, 0.79132080078125, 0.817138671875, 0.84295654296875, 0.8687744140625, 0.89459228515625, 0.92041015625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 3.0, 6.0, 7.0, 12.0, 8.0, 18.0, 17.0, 29.0, 20.0, 41.0, 44.0, 44.0, 48.0, 61.0, 63.0, 64.0, 63.0, 59.0, 49.0, 53.0, 54.0, 32.0, 44.0, 24.0, 30.0, 18.0, 19.0, 13.0, 14.0, 9.0, 5.0, 8.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00217437744140625, -0.002096414566040039, -0.002018451690673828, -0.0019404888153076172, -0.0018625259399414062, -0.0017845630645751953, -0.0017066001892089844, -0.0016286373138427734, -0.0015506744384765625, -0.0014727115631103516, -0.0013947486877441406, -0.0013167858123779297, -0.0012388229370117188, -0.0011608600616455078, -0.0010828971862792969, -0.001004934310913086, -0.000926971435546875, -0.0008490085601806641, -0.0007710456848144531, -0.0006930828094482422, -0.0006151199340820312, -0.0005371570587158203, -0.0004591941833496094, -0.00038123130798339844, -0.0003032684326171875, -0.00022530555725097656, -0.00014734268188476562, -6.937980651855469e-05, 8.58306884765625e-06, 8.654594421386719e-05, 0.00016450881958007812, 0.00024247169494628906, 0.0003204345703125, 0.00039839744567871094, 0.0004763603210449219, 0.0005543231964111328, 0.0006322860717773438, 0.0007102489471435547, 0.0007882118225097656, 0.0008661746978759766, 0.0009441375732421875, 0.0010221004486083984, 0.0011000633239746094, 0.0011780261993408203, 0.0012559890747070312, 0.0013339519500732422, 0.0014119148254394531, 0.001489877700805664, 0.001567840576171875, 0.001645803451538086, 0.0017237663269042969, 0.0018017292022705078, 0.0018796920776367188, 0.0019576549530029297, 0.0020356178283691406, 0.0021135807037353516, 0.0021915435791015625, 0.0022695064544677734, 0.0023474693298339844, 0.0024254322052001953, 0.0025033950805664062, 0.002581357955932617, 0.002659320831298828, 0.002737283706665039, 0.00281524658203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 10.0, 8.0, 27.0, 21.0, 26.0, 32.0, 46.0, 51.0, 57.0, 94.0, 141.0, 168.0, 249.0, 365.0, 684.0, 2128.0, 859295.0, 182208.0, 1280.0, 562.0, 317.0, 217.0, 134.0, 105.0, 73.0, 57.0, 42.0, 33.0, 20.0, 21.0, 21.0, 10.0, 5.0, 10.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.047515869140625, -0.04615306854248047, -0.04479026794433594, -0.043427467346191406, -0.042064666748046875, -0.040701866149902344, -0.03933906555175781, -0.03797626495361328, -0.03661346435546875, -0.03525066375732422, -0.03388786315917969, -0.032525062561035156, -0.031162261962890625, -0.029799461364746094, -0.028436660766601562, -0.02707386016845703, -0.0257110595703125, -0.02434825897216797, -0.022985458374023438, -0.021622657775878906, -0.020259857177734375, -0.018897056579589844, -0.017534255981445312, -0.01617145538330078, -0.01480865478515625, -0.013445854187011719, -0.012083053588867188, -0.010720252990722656, -0.009357452392578125, -0.007994651794433594, -0.0066318511962890625, -0.005269050598144531, -0.00390625, -0.0025434494018554688, -0.0011806488037109375, 0.00018215179443359375, 0.001544952392578125, 0.0029077529907226562, 0.0042705535888671875, 0.005633354187011719, 0.00699615478515625, 0.008358955383300781, 0.009721755981445312, 0.011084556579589844, 0.012447357177734375, 0.013810157775878906, 0.015172958374023438, 0.01653575897216797, 0.0178985595703125, 0.01926136016845703, 0.020624160766601562, 0.021986961364746094, 0.023349761962890625, 0.024712562561035156, 0.026075363159179688, 0.02743816375732422, 0.02880096435546875, 0.03016376495361328, 0.03152656555175781, 0.032889366149902344, 0.034252166748046875, 0.035614967346191406, 0.03697776794433594, 0.03834056854248047, 0.039703369140625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [56.0, 955.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010350876254960895, -0.0002198097645305097, 0.00059546809643507, 0.0014107458991929889, 0.0022260239347815514, 0.0030413013882935047, 0.0038565793074667454, 0.004671857226639986, 0.005487135145813227, 0.006302413064986467, 0.007117690984159708, 0.007932968437671661, 0.008748246356844902, 0.009563524276018143, 0.010378802195191383, 0.011194080114364624, 0.012009358033537865, 0.012824635952711105, 0.013639913871884346, 0.014455191791057587, 0.015270469710230827, 0.016085747629404068, 0.01690102554857731, 0.01771630346775055, 0.01853158138692379, 0.01934685930609703, 0.02016213722527027, 0.020977415144443512, 0.021792693063616753, 0.022607970982789993, 0.023423248901963234, 0.024238526821136475, 0.025053804740309715, 0.025869082659482956, 0.026684360578656197, 0.027499638497829437, 0.028314916417002678, 0.02913019433617592, 0.02994547225534916, 0.0307607501745224, 0.03157602623105049, 0.03239130228757858, 0.03320658206939697, 0.034021858125925064, 0.034837137907743454, 0.035652413964271545, 0.036467693746089935, 0.03728296980261803, 0.03809824958443642, 0.03891352564096451, 0.0397288054227829, 0.04054408147931099, 0.04135936126112938, 0.04217463731765747, 0.04298991709947586, 0.04380519315600395, 0.04462047293782234, 0.04543574899435043, 0.04625102877616882, 0.047066304832696915, 0.047881584614515305, 0.048696860671043396, 0.049512140452861786, 0.05032741650938988, 0.05114269629120827]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 5.0, 8.0, 10.0, 17.0, 26.0, 24.0, 30.0, 29.0, 42.0, 53.0, 62.0, 46.0, 58.0, 73.0, 70.0, 65.0, 44.0, 66.0, 65.0, 50.0, 38.0, 39.0, 23.0, 28.0, 15.0, 10.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.002855837345123291, -0.0027908040210604668, -0.0027257706969976425, -0.0026607373729348183, -0.002595704048871994, -0.0025306707248091698, -0.0024656374007463455, -0.0024006040766835213, -0.002335570752620697, -0.0022705374285578728, -0.0022055041044950485, -0.0021404707804322243, -0.0020754374563694, -0.0020104041323065758, -0.0019453708082437515, -0.0018803374841809273, -0.001815304160118103, -0.0017502708360552788, -0.0016852375119924545, -0.0016202041879296303, -0.001555170863866806, -0.0014901375398039818, -0.0014251042157411575, -0.0013600708916783333, -0.001295037567615509, -0.0012300042435526848, -0.0011649709194898605, -0.0010999375954270363, -0.001034904271364212, -0.0009698709473013878, -0.0009048376232385635, -0.0008398042991757393, -0.000774770975112915, -0.0007097376510500908, -0.0006447043269872665, -0.0005796710029244423, -0.000514637678861618, -0.0004496043547987938, -0.00038457103073596954, -0.0003195377066731453, -0.00025450438261032104, -0.0001894710585474968, -0.00012443773448467255, -5.94044104218483e-05, 5.628913640975952e-06, 7.06622377038002e-05, 0.00013569556176662445, 0.0002007288858294487, 0.00026576220989227295, 0.0003307955339550972, 0.00039582885801792145, 0.0004608621820807457, 0.00052589550614357, 0.0005909288302063942, 0.0006559621542692184, 0.0007209954783320427, 0.0007860288023948669, 0.0008510621264576912, 0.0009160954505205154, 0.0009811287745833397, 0.001046162098646164, 0.0011111954227089882, 0.0011762287467718124, 0.0012412620708346367, 0.001306295394897461]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 7.0, 7.0, 8.0, 9.0, 14.0, 20.0, 26.0, 22.0, 23.0, 32.0, 33.0, 30.0, 28.0, 34.0, 37.0, 36.0, 48.0, 55.0, 43.0, 45.0, 41.0, 24.0, 32.0, 41.0, 38.0, 30.0, 22.0, 33.0, 27.0, 29.0, 24.0, 22.0, 17.0, 19.0, 9.0, 3.0, 2.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.51171875, -6.2928466796875, -6.073974609375, -5.8551025390625, -5.63623046875, -5.4173583984375, -5.198486328125, -4.9796142578125, -4.7607421875, -4.5418701171875, -4.322998046875, -4.1041259765625, -3.88525390625, -3.6663818359375, -3.447509765625, -3.2286376953125, -3.009765625, -2.7908935546875, -2.572021484375, -2.3531494140625, -2.13427734375, -1.9154052734375, -1.696533203125, -1.4776611328125, -1.2587890625, -1.0399169921875, -0.821044921875, -0.6021728515625, -0.38330078125, -0.1644287109375, 0.054443359375, 0.2733154296875, 0.4921875, 0.7110595703125, 0.929931640625, 1.1488037109375, 1.36767578125, 1.5865478515625, 1.805419921875, 2.0242919921875, 2.2431640625, 2.4620361328125, 2.680908203125, 2.8997802734375, 3.11865234375, 3.3375244140625, 3.556396484375, 3.7752685546875, 3.994140625, 4.2130126953125, 4.431884765625, 4.6507568359375, 4.86962890625, 5.0885009765625, 5.307373046875, 5.5262451171875, 5.7451171875, 5.9639892578125, 6.182861328125, 6.4017333984375, 6.62060546875, 6.8394775390625, 7.058349609375, 7.2772216796875, 7.49609375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 9.0, 6.0, 15.0, 13.0, 24.0, 30.0, 35.0, 52.0, 56.0, 89.0, 143.0, 190.0, 248.0, 380.0, 492.0, 688.0, 1013.0, 1492.0, 2581.0, 5677.0, 18922.0, 90323.0, 480420.0, 356058.0, 63536.0, 14478.0, 4762.0, 2265.0, 1287.0, 964.0, 647.0, 450.0, 357.0, 258.0, 162.0, 121.0, 87.0, 61.0, 54.0, 38.0, 18.0, 13.0, 13.0, 12.0, 7.0, 8.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9765625, -11.60107421875, -11.2255859375, -10.85009765625, -10.474609375, -10.09912109375, -9.7236328125, -9.34814453125, -8.97265625, -8.59716796875, -8.2216796875, -7.84619140625, -7.470703125, -7.09521484375, -6.7197265625, -6.34423828125, -5.96875, -5.59326171875, -5.2177734375, -4.84228515625, -4.466796875, -4.09130859375, -3.7158203125, -3.34033203125, -2.96484375, -2.58935546875, -2.2138671875, -1.83837890625, -1.462890625, -1.08740234375, -0.7119140625, -0.33642578125, 0.0390625, 0.41455078125, 0.7900390625, 1.16552734375, 1.541015625, 1.91650390625, 2.2919921875, 2.66748046875, 3.04296875, 3.41845703125, 3.7939453125, 4.16943359375, 4.544921875, 4.92041015625, 5.2958984375, 5.67138671875, 6.046875, 6.42236328125, 6.7978515625, 7.17333984375, 7.548828125, 7.92431640625, 8.2998046875, 8.67529296875, 9.05078125, 9.42626953125, 9.8017578125, 10.17724609375, 10.552734375, 10.92822265625, 11.3037109375, 11.67919921875, 12.0546875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 10.0, 7.0, 9.0, 13.0, 20.0, 15.0, 20.0, 24.0, 22.0, 31.0, 35.0, 31.0, 56.0, 56.0, 74.0, 97.0, 283.0, 1545.0, 174.0, 87.0, 48.0, 52.0, 42.0, 54.0, 38.0, 33.0, 24.0, 19.0, 20.0, 21.0, 11.0, 9.0, 9.0, 5.0, 10.0, 7.0, 2.0, 7.0, 7.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.0546875, -14.5211181640625, -13.987548828125, -13.4539794921875, -12.92041015625, -12.3868408203125, -11.853271484375, -11.3197021484375, -10.7861328125, -10.2525634765625, -9.718994140625, -9.1854248046875, -8.65185546875, -8.1182861328125, -7.584716796875, -7.0511474609375, -6.517578125, -5.9840087890625, -5.450439453125, -4.9168701171875, -4.38330078125, -3.8497314453125, -3.316162109375, -2.7825927734375, -2.2490234375, -1.7154541015625, -1.181884765625, -0.6483154296875, -0.11474609375, 0.4188232421875, 0.952392578125, 1.4859619140625, 2.01953125, 2.5531005859375, 3.086669921875, 3.6202392578125, 4.15380859375, 4.6873779296875, 5.220947265625, 5.7545166015625, 6.2880859375, 6.8216552734375, 7.355224609375, 7.8887939453125, 8.42236328125, 8.9559326171875, 9.489501953125, 10.0230712890625, 10.556640625, 11.0902099609375, 11.623779296875, 12.1573486328125, 12.69091796875, 13.2244873046875, 13.758056640625, 14.2916259765625, 14.8251953125, 15.3587646484375, 15.892333984375, 16.4259033203125, 16.95947265625, 17.4930419921875, 18.026611328125, 18.5601806640625, 19.09375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 6.0, 14.0, 9.0, 24.0, 18.0, 23.0, 43.0, 50.0, 59.0, 91.0, 151.0, 216.0, 407.0, 813.0, 3367.0, 3101719.0, 36195.0, 1228.0, 491.0, 254.0, 145.0, 108.0, 71.0, 55.0, 29.0, 19.0, 17.0, 13.0, 13.0, 6.0, 13.0, 5.0, 3.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.75, -64.8271484375, -62.904296875, -60.9814453125, -59.05859375, -57.1357421875, -55.212890625, -53.2900390625, -51.3671875, -49.4443359375, -47.521484375, -45.5986328125, -43.67578125, -41.7529296875, -39.830078125, -37.9072265625, -35.984375, -34.0615234375, -32.138671875, -30.2158203125, -28.29296875, -26.3701171875, -24.447265625, -22.5244140625, -20.6015625, -18.6787109375, -16.755859375, -14.8330078125, -12.91015625, -10.9873046875, -9.064453125, -7.1416015625, -5.21875, -3.2958984375, -1.373046875, 0.5498046875, 2.47265625, 4.3955078125, 6.318359375, 8.2412109375, 10.1640625, 12.0869140625, 14.009765625, 15.9326171875, 17.85546875, 19.7783203125, 21.701171875, 23.6240234375, 25.546875, 27.4697265625, 29.392578125, 31.3154296875, 33.23828125, 35.1611328125, 37.083984375, 39.0068359375, 40.9296875, 42.8525390625, 44.775390625, 46.6982421875, 48.62109375, 50.5439453125, 52.466796875, 54.3896484375, 56.3125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 48.0, 734.0, 228.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-208.92311096191406, -202.90771484375, -196.89231872558594, -190.8769073486328, -184.86151123046875, -178.8461151123047, -172.83071899414062, -166.8153076171875, -160.79991149902344, -154.78451538085938, -148.7691192626953, -142.7537078857422, -136.73831176757812, -130.72291564941406, -124.70751953125, -118.6921157836914, -112.67671966552734, -106.66132354736328, -100.64591979980469, -94.63052368164062, -88.61511993408203, -82.59972381591797, -76.58432006835938, -70.56892395019531, -64.55352783203125, -58.53812789916992, -52.522727966308594, -46.50733184814453, -40.49192810058594, -34.476531982421875, -28.461132049560547, -22.44573211669922, -16.430328369140625, -10.414928436279297, -4.399529457092285, 1.6158695220947266, 7.631269454956055, 13.646669387817383, 19.662067413330078, 25.677467346191406, 31.692867279052734, 37.70826721191406, 43.72366714477539, 49.73906707763672, 55.75446319580078, 61.769866943359375, 67.78526306152344, 73.8006591796875, 79.8160629272461, 85.83145904541016, 91.84686279296875, 97.86225891113281, 103.8776626586914, 109.89305877685547, 115.90846252441406, 121.92385864257812, 127.93925476074219, 133.95465087890625, 139.9700469970703, 145.98545837402344, 152.0008544921875, 158.01625061035156, 164.03164672851562, 170.04705810546875, 176.0624542236328]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 6.0, 7.0, 10.0, 12.0, 12.0, 10.0, 18.0, 23.0, 28.0, 23.0, 25.0, 31.0, 27.0, 32.0, 39.0, 37.0, 44.0, 37.0, 58.0, 48.0, 36.0, 33.0, 37.0, 44.0, 30.0, 30.0, 33.0, 18.0, 35.0, 28.0, 26.0, 25.0, 17.0, 13.0, 13.0, 18.0, 6.0, 6.0, 6.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.710960388183594, -48.23847198486328, -46.765987396240234, -45.29350280761719, -43.821014404296875, -42.34852600097656, -40.876041412353516, -39.40355682373047, -37.931068420410156, -36.458580017089844, -34.9860954284668, -33.51361083984375, -32.04112243652344, -30.568635940551758, -29.096149444580078, -27.6236629486084, -26.15117645263672, -24.67868995666504, -23.20620346069336, -21.73371696472168, -20.26123046875, -18.78874397277832, -17.31625747680664, -15.843770980834961, -14.371284484863281, -12.898797988891602, -11.426311492919922, -9.953824996948242, -8.481338500976562, -7.008852005004883, -5.536365509033203, -4.063879013061523, -2.5913925170898438, -1.118906021118164, 0.3535804748535156, 1.8260669708251953, 3.298553466796875, 4.771039962768555, 6.243526458740234, 7.716012954711914, 9.188499450683594, 10.660985946655273, 12.133472442626953, 13.605958938598633, 15.078445434570312, 16.550931930541992, 18.023418426513672, 19.49590492248535, 20.96839141845703, 22.44087791442871, 23.91336441040039, 25.38585090637207, 26.85833740234375, 28.33082389831543, 29.80331039428711, 31.27579689025879, 32.74828338623047, 34.22077178955078, 35.69325637817383, 37.165740966796875, 38.63822937011719, 40.1107177734375, 41.58320236206055, 43.055686950683594, 44.528175354003906]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 1.0, 3.0, 8.0, 11.0, 10.0, 16.0, 13.0, 18.0, 23.0, 18.0, 31.0, 33.0, 39.0, 41.0, 44.0, 51.0, 50.0, 43.0, 46.0, 36.0, 36.0, 58.0, 41.0, 42.0, 33.0, 44.0, 38.0, 27.0, 20.0, 31.0, 15.0, 23.0, 12.0, 15.0, 11.0, 6.0, 5.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.36328125, -7.11932373046875, -6.8753662109375, -6.63140869140625, -6.387451171875, -6.14349365234375, -5.8995361328125, -5.65557861328125, -5.41162109375, -5.16766357421875, -4.9237060546875, -4.67974853515625, -4.435791015625, -4.19183349609375, -3.9478759765625, -3.70391845703125, -3.4599609375, -3.21600341796875, -2.9720458984375, -2.72808837890625, -2.484130859375, -2.24017333984375, -1.9962158203125, -1.75225830078125, -1.50830078125, -1.26434326171875, -1.0203857421875, -0.77642822265625, -0.532470703125, -0.28851318359375, -0.0445556640625, 0.19940185546875, 0.443359375, 0.68731689453125, 0.9312744140625, 1.17523193359375, 1.419189453125, 1.66314697265625, 1.9071044921875, 2.15106201171875, 2.39501953125, 2.63897705078125, 2.8829345703125, 3.12689208984375, 3.370849609375, 3.61480712890625, 3.8587646484375, 4.10272216796875, 4.3466796875, 4.59063720703125, 4.8345947265625, 5.07855224609375, 5.322509765625, 5.56646728515625, 5.8104248046875, 6.05438232421875, 6.29833984375, 6.54229736328125, 6.7862548828125, 7.03021240234375, 7.274169921875, 7.51812744140625, 7.7620849609375, 8.00604248046875, 8.25]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 7.0, 11.0, 8.0, 18.0, 21.0, 30.0, 32.0, 62.0, 56.0, 86.0, 145.0, 188.0, 264.0, 463.0, 852.0, 2251.0, 7867.0, 59855.0, 1161659.0, 2705491.0, 230804.0, 17412.0, 3745.0, 1320.0, 580.0, 297.0, 210.0, 124.0, 96.0, 83.0, 67.0, 39.0, 36.0, 26.0, 16.0, 19.0, 19.0, 4.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.90625, -15.362060546875, -14.81787109375, -14.273681640625, -13.7294921875, -13.185302734375, -12.64111328125, -12.096923828125, -11.552734375, -11.008544921875, -10.46435546875, -9.920166015625, -9.3759765625, -8.831787109375, -8.28759765625, -7.743408203125, -7.19921875, -6.655029296875, -6.11083984375, -5.566650390625, -5.0224609375, -4.478271484375, -3.93408203125, -3.389892578125, -2.845703125, -2.301513671875, -1.75732421875, -1.213134765625, -0.6689453125, -0.124755859375, 0.41943359375, 0.963623046875, 1.5078125, 2.052001953125, 2.59619140625, 3.140380859375, 3.6845703125, 4.228759765625, 4.77294921875, 5.317138671875, 5.861328125, 6.405517578125, 6.94970703125, 7.493896484375, 8.0380859375, 8.582275390625, 9.12646484375, 9.670654296875, 10.21484375, 10.759033203125, 11.30322265625, 11.847412109375, 12.3916015625, 12.935791015625, 13.47998046875, 14.024169921875, 14.568359375, 15.112548828125, 15.65673828125, 16.200927734375, 16.7451171875, 17.289306640625, 17.83349609375, 18.377685546875, 18.921875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 18.0, 13.0, 17.0, 17.0, 28.0, 42.0, 68.0, 76.0, 123.0, 155.0, 228.0, 322.0, 481.0, 637.0, 553.0, 360.0, 218.0, 199.0, 130.0, 84.0, 63.0, 70.0, 48.0, 35.0, 26.0, 15.0, 11.0, 6.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.7265625, -14.33544921875, -13.9443359375, -13.55322265625, -13.162109375, -12.77099609375, -12.3798828125, -11.98876953125, -11.59765625, -11.20654296875, -10.8154296875, -10.42431640625, -10.033203125, -9.64208984375, -9.2509765625, -8.85986328125, -8.46875, -8.07763671875, -7.6865234375, -7.29541015625, -6.904296875, -6.51318359375, -6.1220703125, -5.73095703125, -5.33984375, -4.94873046875, -4.5576171875, -4.16650390625, -3.775390625, -3.38427734375, -2.9931640625, -2.60205078125, -2.2109375, -1.81982421875, -1.4287109375, -1.03759765625, -0.646484375, -0.25537109375, 0.1357421875, 0.52685546875, 0.91796875, 1.30908203125, 1.7001953125, 2.09130859375, 2.482421875, 2.87353515625, 3.2646484375, 3.65576171875, 4.046875, 4.43798828125, 4.8291015625, 5.22021484375, 5.611328125, 6.00244140625, 6.3935546875, 6.78466796875, 7.17578125, 7.56689453125, 7.9580078125, 8.34912109375, 8.740234375, 9.13134765625, 9.5224609375, 9.91357421875, 10.3046875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 4.0, 4.0, 13.0, 18.0, 45.0, 51.0, 107.0, 208.0, 473.0, 1244.0, 5797.0, 468210.0, 3691047.0, 23814.0, 2018.0, 649.0, 249.0, 139.0, 75.0, 42.0, 28.0, 18.0, 11.0, 7.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.96875, -37.72021484375, -36.4716796875, -35.22314453125, -33.974609375, -32.72607421875, -31.4775390625, -30.22900390625, -28.98046875, -27.73193359375, -26.4833984375, -25.23486328125, -23.986328125, -22.73779296875, -21.4892578125, -20.24072265625, -18.9921875, -17.74365234375, -16.4951171875, -15.24658203125, -13.998046875, -12.74951171875, -11.5009765625, -10.25244140625, -9.00390625, -7.75537109375, -6.5068359375, -5.25830078125, -4.009765625, -2.76123046875, -1.5126953125, -0.26416015625, 0.984375, 2.23291015625, 3.4814453125, 4.72998046875, 5.978515625, 7.22705078125, 8.4755859375, 9.72412109375, 10.97265625, 12.22119140625, 13.4697265625, 14.71826171875, 15.966796875, 17.21533203125, 18.4638671875, 19.71240234375, 20.9609375, 22.20947265625, 23.4580078125, 24.70654296875, 25.955078125, 27.20361328125, 28.4521484375, 29.70068359375, 30.94921875, 32.19775390625, 33.4462890625, 34.69482421875, 35.943359375, 37.19189453125, 38.4404296875, 39.68896484375, 40.9375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 65.0, 925.0, 26.0, 4.0, 0.0, 0.0, 1.0], "bins": [-877.8282470703125, -862.8021240234375, -847.7760620117188, -832.75, -817.723876953125, -802.69775390625, -787.6716918945312, -772.6456298828125, -757.6195068359375, -742.5933837890625, -727.5673217773438, -712.541259765625, -697.51513671875, -682.489013671875, -667.4629516601562, -652.4368896484375, -637.4107666015625, -622.3846435546875, -607.3585815429688, -592.33251953125, -577.306396484375, -562.2802734375, -547.2542114257812, -532.2281494140625, -517.2020263671875, -502.1759338378906, -487.14984130859375, -472.1237487792969, -457.09765625, -442.0715637207031, -427.04547119140625, -412.0193786621094, -396.9932861328125, -381.9671936035156, -366.94110107421875, -351.9150085449219, -336.888916015625, -321.8628234863281, -306.83673095703125, -291.8106384277344, -276.7845458984375, -261.7584533691406, -246.73236083984375, -231.70626831054688, -216.68017578125, -201.65408325195312, -186.62799072265625, -171.60189819335938, -156.5758056640625, -141.54971313476562, -126.52362060546875, -111.49752807617188, -96.471435546875, -81.44534301757812, -66.41925048828125, -51.393157958984375, -36.36707305908203, -21.340980529785156, -6.314888000488281, 8.711204528808594, 23.73729705810547, 38.763389587402344, 53.78948211669922, 68.8155746459961, 83.84166717529297]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 7.0, 4.0, 15.0, 13.0, 12.0, 22.0, 22.0, 23.0, 22.0, 27.0, 31.0, 32.0, 45.0, 46.0, 53.0, 54.0, 38.0, 39.0, 44.0, 46.0, 40.0, 45.0, 48.0, 32.0, 35.0, 27.0, 18.0, 16.0, 13.0, 24.0, 14.0, 13.0, 13.0, 14.0, 12.0, 10.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.21849822998047, -39.870723724365234, -38.52294921875, -37.17517852783203, -35.8274040222168, -34.47962951660156, -33.13185501098633, -31.784080505371094, -30.43630599975586, -29.088531494140625, -27.740758895874023, -26.39298439025879, -25.045209884643555, -23.697437286376953, -22.34966278076172, -21.001888275146484, -19.654115676879883, -18.30634117126465, -16.958568572998047, -15.610794067382812, -14.263019561767578, -12.91524600982666, -11.567472457885742, -10.219697952270508, -8.87192440032959, -7.524150371551514, -6.1763763427734375, -4.8286027908325195, -3.4808287620544434, -2.133054733276367, -0.7852811813354492, 0.5624933242797852, 1.9102668762207031, 3.2580409049987793, 4.6058149337768555, 5.953588485717773, 7.30136251449585, 8.649136543273926, 9.996910095214844, 11.344684600830078, 12.692458152770996, 14.040231704711914, 15.388006210327148, 16.73577880859375, 18.083553314208984, 19.43132781982422, 20.779102325439453, 22.126876831054688, 23.47464942932129, 24.822423934936523, 26.170196533203125, 27.51797103881836, 28.865745544433594, 30.213520050048828, 31.56129264831543, 32.90906524658203, 34.256839752197266, 35.6046142578125, 36.952388763427734, 38.30016326904297, 39.64793395996094, 40.99570846557617, 42.343482971191406, 43.69125747680664, 45.039031982421875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 7.0, 11.0, 10.0, 8.0, 21.0, 24.0, 23.0, 23.0, 23.0, 35.0, 33.0, 35.0, 46.0, 54.0, 46.0, 46.0, 52.0, 49.0, 54.0, 49.0, 44.0, 39.0, 33.0, 37.0, 29.0, 28.0, 26.0, 27.0, 13.0, 10.0, 18.0, 7.0, 12.0, 8.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.56494140625, -6.3759765625, -6.18701171875, -5.998046875, -5.80908203125, -5.6201171875, -5.43115234375, -5.2421875, -5.05322265625, -4.8642578125, -4.67529296875, -4.486328125, -4.29736328125, -4.1083984375, -3.91943359375, -3.73046875, -3.54150390625, -3.3525390625, -3.16357421875, -2.974609375, -2.78564453125, -2.5966796875, -2.40771484375, -2.21875, -2.02978515625, -1.8408203125, -1.65185546875, -1.462890625, -1.27392578125, -1.0849609375, -0.89599609375, -0.70703125, -0.51806640625, -0.3291015625, -0.14013671875, 0.048828125, 0.23779296875, 0.4267578125, 0.61572265625, 0.8046875, 0.99365234375, 1.1826171875, 1.37158203125, 1.560546875, 1.74951171875, 1.9384765625, 2.12744140625, 2.31640625, 2.50537109375, 2.6943359375, 2.88330078125, 3.072265625, 3.26123046875, 3.4501953125, 3.63916015625, 3.828125, 4.01708984375, 4.2060546875, 4.39501953125, 4.583984375, 4.77294921875, 4.9619140625, 5.15087890625, 5.33984375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 7.0, 7.0, 9.0, 19.0, 22.0, 40.0, 42.0, 66.0, 97.0, 118.0, 189.0, 230.0, 357.0, 487.0, 640.0, 934.0, 1296.0, 1769.0, 2559.0, 3505.0, 5139.0, 7519.0, 11091.0, 17117.0, 26390.0, 42101.0, 69008.0, 118177.0, 191284.0, 203960.0, 133178.0, 77372.0, 46738.0, 29159.0, 18610.0, 12237.0, 8098.0, 5521.0, 3904.0, 2762.0, 1921.0, 1390.0, 944.0, 705.0, 525.0, 375.0, 297.0, 204.0, 131.0, 87.0, 80.0, 44.0, 35.0, 25.0, 15.0, 12.0, 10.0, 7.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.6220703125, -0.6020736694335938, -0.5820770263671875, -0.5620803833007812, -0.542083740234375, -0.5220870971679688, -0.5020904541015625, -0.48209381103515625, -0.46209716796875, -0.44210052490234375, -0.4221038818359375, -0.40210723876953125, -0.382110595703125, -0.36211395263671875, -0.3421173095703125, -0.32212066650390625, -0.3021240234375, -0.28212738037109375, -0.2621307373046875, -0.24213409423828125, -0.222137451171875, -0.20214080810546875, -0.1821441650390625, -0.16214752197265625, -0.14215087890625, -0.12215423583984375, -0.1021575927734375, -0.08216094970703125, -0.062164306640625, -0.04216766357421875, -0.0221710205078125, -0.00217437744140625, 0.017822265625, 0.03781890869140625, 0.0578155517578125, 0.07781219482421875, 0.097808837890625, 0.11780548095703125, 0.1378021240234375, 0.15779876708984375, 0.17779541015625, 0.19779205322265625, 0.2177886962890625, 0.23778533935546875, 0.257781982421875, 0.27777862548828125, 0.2977752685546875, 0.31777191162109375, 0.3377685546875, 0.35776519775390625, 0.3777618408203125, 0.39775848388671875, 0.417755126953125, 0.43775177001953125, 0.4577484130859375, 0.47774505615234375, 0.49774169921875, 0.5177383422851562, 0.5377349853515625, 0.5577316284179688, 0.577728271484375, 0.5977249145507812, 0.6177215576171875, 0.6377182006835938, 0.65771484375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 3.0, 1.0, 5.0, 8.0, 8.0, 6.0, 16.0, 18.0, 17.0, 21.0, 27.0, 27.0, 26.0, 27.0, 29.0, 32.0, 26.0, 38.0, 51.0, 56.0, 46.0, 1070.0, 54.0, 35.0, 38.0, 36.0, 26.0, 38.0, 33.0, 34.0, 33.0, 22.0, 22.0, 18.0, 14.0, 13.0, 12.0, 14.0, 5.0, 12.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.478515625, -3.371337890625, -3.26416015625, -3.156982421875, -3.0498046875, -2.942626953125, -2.83544921875, -2.728271484375, -2.62109375, -2.513916015625, -2.40673828125, -2.299560546875, -2.1923828125, -2.085205078125, -1.97802734375, -1.870849609375, -1.763671875, -1.656494140625, -1.54931640625, -1.442138671875, -1.3349609375, -1.227783203125, -1.12060546875, -1.013427734375, -0.90625, -0.799072265625, -0.69189453125, -0.584716796875, -0.4775390625, -0.370361328125, -0.26318359375, -0.156005859375, -0.048828125, 0.058349609375, 0.16552734375, 0.272705078125, 0.3798828125, 0.487060546875, 0.59423828125, 0.701416015625, 0.80859375, 0.915771484375, 1.02294921875, 1.130126953125, 1.2373046875, 1.344482421875, 1.45166015625, 1.558837890625, 1.666015625, 1.773193359375, 1.88037109375, 1.987548828125, 2.0947265625, 2.201904296875, 2.30908203125, 2.416259765625, 2.5234375, 2.630615234375, 2.73779296875, 2.844970703125, 2.9521484375, 3.059326171875, 3.16650390625, 3.273681640625, 3.380859375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 8.0, 5.0, 13.0, 22.0, 23.0, 41.0, 48.0, 97.0, 131.0, 217.0, 311.0, 473.0, 762.0, 1193.0, 1857.0, 3028.0, 4942.0, 7999.0, 13899.0, 23807.0, 40539.0, 71963.0, 126860.0, 217354.0, 1253651.0, 139914.0, 79021.0, 44535.0, 25740.0, 15314.0, 8946.0, 5442.0, 3285.0, 2077.0, 1323.0, 769.0, 559.0, 324.0, 210.0, 152.0, 97.0, 50.0, 45.0, 32.0, 17.0, 13.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.595703125, -0.57769775390625, -0.5596923828125, -0.54168701171875, -0.523681640625, -0.50567626953125, -0.4876708984375, -0.46966552734375, -0.45166015625, -0.43365478515625, -0.4156494140625, -0.39764404296875, -0.379638671875, -0.36163330078125, -0.3436279296875, -0.32562255859375, -0.3076171875, -0.28961181640625, -0.2716064453125, -0.25360107421875, -0.235595703125, -0.21759033203125, -0.1995849609375, -0.18157958984375, -0.16357421875, -0.14556884765625, -0.1275634765625, -0.10955810546875, -0.091552734375, -0.07354736328125, -0.0555419921875, -0.03753662109375, -0.01953125, -0.00152587890625, 0.0164794921875, 0.03448486328125, 0.052490234375, 0.07049560546875, 0.0885009765625, 0.10650634765625, 0.12451171875, 0.14251708984375, 0.1605224609375, 0.17852783203125, 0.196533203125, 0.21453857421875, 0.2325439453125, 0.25054931640625, 0.2685546875, 0.28656005859375, 0.3045654296875, 0.32257080078125, 0.340576171875, 0.35858154296875, 0.3765869140625, 0.39459228515625, 0.41259765625, 0.43060302734375, 0.4486083984375, 0.46661376953125, 0.484619140625, 0.50262451171875, 0.5206298828125, 0.53863525390625, 0.556640625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 8.0, 13.0, 14.0, 25.0, 22.0, 20.0, 39.0, 40.0, 50.0, 58.0, 53.0, 69.0, 70.0, 60.0, 73.0, 58.0, 58.0, 42.0, 46.0, 43.0, 24.0, 14.0, 17.0, 12.0, 14.0, 7.0, 6.0, 11.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0023441314697265625, -0.0022708475589752197, -0.002197563648223877, -0.002124279737472534, -0.0020509958267211914, -0.0019777119159698486, -0.0019044280052185059, -0.001831144094467163, -0.0017578601837158203, -0.0016845762729644775, -0.0016112923622131348, -0.001538008451461792, -0.0014647245407104492, -0.0013914406299591064, -0.0013181567192077637, -0.001244872808456421, -0.0011715888977050781, -0.0010983049869537354, -0.0010250210762023926, -0.0009517371654510498, -0.000878453254699707, -0.0008051693439483643, -0.0007318854331970215, -0.0006586015224456787, -0.0005853176116943359, -0.0005120337009429932, -0.0004387497901916504, -0.0003654658794403076, -0.00029218196868896484, -0.00021889805793762207, -0.0001456141471862793, -7.233023643493652e-05, 9.5367431640625e-07, 7.423758506774902e-05, 0.0001475214958190918, 0.00022080540657043457, 0.00029408931732177734, 0.0003673732280731201, 0.0004406571388244629, 0.0005139410495758057, 0.0005872249603271484, 0.0006605088710784912, 0.000733792781829834, 0.0008070766925811768, 0.0008803606033325195, 0.0009536445140838623, 0.001026928424835205, 0.0011002123355865479, 0.0011734962463378906, 0.0012467801570892334, 0.0013200640678405762, 0.001393347978591919, 0.0014666318893432617, 0.0015399158000946045, 0.0016131997108459473, 0.00168648362159729, 0.0017597675323486328, 0.0018330514430999756, 0.0019063353538513184, 0.001979619264602661, 0.002052903175354004, 0.0021261870861053467, 0.0021994709968566895, 0.0022727549076080322, 0.002346038818359375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 5.0, 11.0, 18.0, 23.0, 28.0, 30.0, 42.0, 49.0, 79.0, 132.0, 176.0, 300.0, 453.0, 928.0, 21364.0, 1020948.0, 2171.0, 636.0, 362.0, 213.0, 158.0, 97.0, 81.0, 66.0, 47.0, 32.0, 25.0, 13.0, 15.0, 10.0, 3.0, 6.0, 2.0, 0.0, 7.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04681396484375, -0.045317649841308594, -0.04382133483886719, -0.04232501983642578, -0.040828704833984375, -0.03933238983154297, -0.03783607482910156, -0.036339759826660156, -0.03484344482421875, -0.033347129821777344, -0.03185081481933594, -0.03035449981689453, -0.028858184814453125, -0.02736186981201172, -0.025865554809570312, -0.024369239807128906, -0.0228729248046875, -0.021376609802246094, -0.019880294799804688, -0.01838397979736328, -0.016887664794921875, -0.015391349792480469, -0.013895034790039062, -0.012398719787597656, -0.01090240478515625, -0.009406089782714844, -0.007909774780273438, -0.006413459777832031, -0.004917144775390625, -0.0034208297729492188, -0.0019245147705078125, -0.00042819976806640625, 0.001068115234375, 0.0025644302368164062, 0.0040607452392578125, 0.005557060241699219, 0.007053375244140625, 0.008549690246582031, 0.010046005249023438, 0.011542320251464844, 0.01303863525390625, 0.014534950256347656, 0.016031265258789062, 0.01752758026123047, 0.019023895263671875, 0.02052021026611328, 0.022016525268554688, 0.023512840270996094, 0.0250091552734375, 0.026505470275878906, 0.028001785278320312, 0.02949810028076172, 0.030994415283203125, 0.03249073028564453, 0.03398704528808594, 0.035483360290527344, 0.03697967529296875, 0.038475990295410156, 0.03997230529785156, 0.04146862030029297, 0.042964935302734375, 0.04446125030517578, 0.04595756530761719, 0.047453880310058594, 0.0489501953125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 752.0, 263.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011446215212345123, -0.00053387664956972, 7.686822209507227e-05, 0.0006876131519675255, 0.0012983579654246569, 0.0019091027788817883, 0.0025198478251695633, 0.003130592405796051, 0.003741337452083826, 0.004352082498371601, 0.004962827078998089, 0.005573572125285864, 0.006184317171573639, 0.006795061752200127, 0.007405806798487902, 0.008016550913453102, 0.008627296425402164, 0.009238041006028652, 0.009848786517977715, 0.010459531098604202, 0.01107027567923069, 0.011681020259857178, 0.01229176577180624, 0.012902510352432728, 0.01351325586438179, 0.014124000445008278, 0.01473474595695734, 0.015345490537583828, 0.01595623604953289, 0.016566980630159378, 0.017177725210785866, 0.017788469791412354, 0.01839921437203884, 0.01900995895266533, 0.019620703533291817, 0.020231448113918304, 0.02084219455718994, 0.02145293913781643, 0.022063683718442917, 0.022674428299069405, 0.023285172879695892, 0.02389591746032238, 0.024506662040948868, 0.025117408484220505, 0.025728153064846992, 0.02633889764547348, 0.026949642226099968, 0.027560386806726456, 0.028171133249998093, 0.02878187783062458, 0.029392622411251068, 0.030003368854522705, 0.030614113435149193, 0.03122485801577568, 0.03183560073375702, 0.032446347177028656, 0.033057089895009995, 0.03366783633828163, 0.03427857905626297, 0.03488932549953461, 0.035500068217515945, 0.03611081466078758, 0.03672155737876892, 0.03733230382204056, 0.037943050265312195]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 13.0, 15.0, 17.0, 29.0, 29.0, 35.0, 40.0, 44.0, 43.0, 52.0, 59.0, 50.0, 57.0, 62.0, 51.0, 49.0, 43.0, 50.0, 40.0, 30.0, 35.0, 27.0, 27.0, 24.0, 14.0, 19.0, 11.0, 7.0, 7.0, 1.0, 8.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.0020979642868041992, -0.002047979272902012, -0.0019979942589998245, -0.0019480092450976372, -0.0018980242311954498, -0.0018480392172932625, -0.0017980542033910751, -0.0017480691894888878, -0.0016980841755867004, -0.001648099161684513, -0.0015981141477823257, -0.0015481291338801384, -0.001498144119977951, -0.0014481591060757637, -0.0013981740921735764, -0.001348189078271389, -0.0012982040643692017, -0.0012482190504670143, -0.001198234036564827, -0.0011482490226626396, -0.0010982640087604523, -0.001048278994858265, -0.0009982939809560776, -0.0009483089670538902, -0.0008983239531517029, -0.0008483389392495155, -0.0007983539253473282, -0.0007483689114451408, -0.0006983838975429535, -0.0006483988836407661, -0.0005984138697385788, -0.0005484288558363914, -0.0004984438419342041, -0.00044845882803201675, -0.0003984738141298294, -0.00034848880022764206, -0.0002985037863254547, -0.00024851877242326736, -0.00019853375852108002, -0.00014854874461889267, -9.856373071670532e-05, -4.8578716814517975e-05, 1.4062970876693726e-06, 5.139131098985672e-05, 0.00010137632489204407, 0.00015136133879423141, 0.00020134635269641876, 0.0002513313665986061, 0.00030131638050079346, 0.0003513013944029808, 0.00040128640830516815, 0.0004512714222073555, 0.0005012564361095428, 0.0005512414500117302, 0.0006012264639139175, 0.0006512114778161049, 0.0007011964917182922, 0.0007511815056204796, 0.0008011665195226669, 0.0008511515334248543, 0.0009011365473270416, 0.000951121561229229, 0.0010011065751314163, 0.0010510915890336037, 0.001101076602935791]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 7.0, 11.0, 10.0, 8.0, 21.0, 24.0, 23.0, 23.0, 23.0, 35.0, 33.0, 35.0, 46.0, 54.0, 46.0, 46.0, 52.0, 49.0, 54.0, 49.0, 44.0, 39.0, 33.0, 37.0, 29.0, 28.0, 26.0, 27.0, 13.0, 10.0, 18.0, 7.0, 12.0, 8.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.56494140625, -6.3759765625, -6.18701171875, -5.998046875, -5.80908203125, -5.6201171875, -5.43115234375, -5.2421875, -5.05322265625, -4.8642578125, -4.67529296875, -4.486328125, -4.29736328125, -4.1083984375, -3.91943359375, -3.73046875, -3.54150390625, -3.3525390625, -3.16357421875, -2.974609375, -2.78564453125, -2.5966796875, -2.40771484375, -2.21875, -2.02978515625, -1.8408203125, -1.65185546875, -1.462890625, -1.27392578125, -1.0849609375, -0.89599609375, -0.70703125, -0.51806640625, -0.3291015625, -0.14013671875, 0.048828125, 0.23779296875, 0.4267578125, 0.61572265625, 0.8046875, 0.99365234375, 1.1826171875, 1.37158203125, 1.560546875, 1.74951171875, 1.9384765625, 2.12744140625, 2.31640625, 2.50537109375, 2.6943359375, 2.88330078125, 3.072265625, 3.26123046875, 3.4501953125, 3.63916015625, 3.828125, 4.01708984375, 4.2060546875, 4.39501953125, 4.583984375, 4.77294921875, 4.9619140625, 5.15087890625, 5.33984375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 0.0, 3.0, 5.0, 5.0, 10.0, 11.0, 23.0, 28.0, 27.0, 61.0, 82.0, 119.0, 169.0, 253.0, 374.0, 566.0, 819.0, 1424.0, 2236.0, 4419.0, 11927.0, 76621.0, 718412.0, 197393.0, 20207.0, 5856.0, 2928.0, 1537.0, 1019.0, 685.0, 449.0, 248.0, 199.0, 139.0, 103.0, 63.0, 35.0, 34.0, 13.0, 19.0, 15.0, 11.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.765625, -13.28564453125, -12.8056640625, -12.32568359375, -11.845703125, -11.36572265625, -10.8857421875, -10.40576171875, -9.92578125, -9.44580078125, -8.9658203125, -8.48583984375, -8.005859375, -7.52587890625, -7.0458984375, -6.56591796875, -6.0859375, -5.60595703125, -5.1259765625, -4.64599609375, -4.166015625, -3.68603515625, -3.2060546875, -2.72607421875, -2.24609375, -1.76611328125, -1.2861328125, -0.80615234375, -0.326171875, 0.15380859375, 0.6337890625, 1.11376953125, 1.59375, 2.07373046875, 2.5537109375, 3.03369140625, 3.513671875, 3.99365234375, 4.4736328125, 4.95361328125, 5.43359375, 5.91357421875, 6.3935546875, 6.87353515625, 7.353515625, 7.83349609375, 8.3134765625, 8.79345703125, 9.2734375, 9.75341796875, 10.2333984375, 10.71337890625, 11.193359375, 11.67333984375, 12.1533203125, 12.63330078125, 13.11328125, 13.59326171875, 14.0732421875, 14.55322265625, 15.033203125, 15.51318359375, 15.9931640625, 16.47314453125, 16.953125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 7.0, 3.0, 7.0, 10.0, 12.0, 13.0, 19.0, 21.0, 25.0, 23.0, 42.0, 41.0, 30.0, 52.0, 57.0, 83.0, 215.0, 1654.0, 246.0, 89.0, 63.0, 51.0, 48.0, 37.0, 39.0, 20.0, 26.0, 25.0, 12.0, 12.0, 13.0, 9.0, 8.0, 4.0, 11.0, 5.0, 8.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.03125, -13.556640625, -13.08203125, -12.607421875, -12.1328125, -11.658203125, -11.18359375, -10.708984375, -10.234375, -9.759765625, -9.28515625, -8.810546875, -8.3359375, -7.861328125, -7.38671875, -6.912109375, -6.4375, -5.962890625, -5.48828125, -5.013671875, -4.5390625, -4.064453125, -3.58984375, -3.115234375, -2.640625, -2.166015625, -1.69140625, -1.216796875, -0.7421875, -0.267578125, 0.20703125, 0.681640625, 1.15625, 1.630859375, 2.10546875, 2.580078125, 3.0546875, 3.529296875, 4.00390625, 4.478515625, 4.953125, 5.427734375, 5.90234375, 6.376953125, 6.8515625, 7.326171875, 7.80078125, 8.275390625, 8.75, 9.224609375, 9.69921875, 10.173828125, 10.6484375, 11.123046875, 11.59765625, 12.072265625, 12.546875, 13.021484375, 13.49609375, 13.970703125, 14.4453125, 14.919921875, 15.39453125, 15.869140625, 16.34375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 6.0, 10.0, 13.0, 11.0, 20.0, 32.0, 26.0, 38.0, 45.0, 73.0, 70.0, 119.0, 167.0, 257.0, 492.0, 1067.0, 9359.0, 3118035.0, 13236.0, 1197.0, 496.0, 252.0, 183.0, 115.0, 92.0, 71.0, 56.0, 30.0, 28.0, 30.0, 25.0, 14.0, 6.0, 3.0, 2.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.8125, -42.4658203125, -41.119140625, -39.7724609375, -38.42578125, -37.0791015625, -35.732421875, -34.3857421875, -33.0390625, -31.6923828125, -30.345703125, -28.9990234375, -27.65234375, -26.3056640625, -24.958984375, -23.6123046875, -22.265625, -20.9189453125, -19.572265625, -18.2255859375, -16.87890625, -15.5322265625, -14.185546875, -12.8388671875, -11.4921875, -10.1455078125, -8.798828125, -7.4521484375, -6.10546875, -4.7587890625, -3.412109375, -2.0654296875, -0.71875, 0.6279296875, 1.974609375, 3.3212890625, 4.66796875, 6.0146484375, 7.361328125, 8.7080078125, 10.0546875, 11.4013671875, 12.748046875, 14.0947265625, 15.44140625, 16.7880859375, 18.134765625, 19.4814453125, 20.828125, 22.1748046875, 23.521484375, 24.8681640625, 26.21484375, 27.5615234375, 28.908203125, 30.2548828125, 31.6015625, 32.9482421875, 34.294921875, 35.6416015625, 36.98828125, 38.3349609375, 39.681640625, 41.0283203125, 42.375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 20.0, 77.0, 179.0, 333.0, 257.0, 88.0, 39.0, 10.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.76789093017578, -79.79903411865234, -77.8301773071289, -75.86132049560547, -73.89246368408203, -71.9236068725586, -69.95475006103516, -67.98589324951172, -66.01703643798828, -64.04817962646484, -62.079322814941406, -60.11046600341797, -58.14160919189453, -56.172752380371094, -54.203895568847656, -52.23503875732422, -50.26618194580078, -48.297325134277344, -46.328468322753906, -44.35961151123047, -42.39075469970703, -40.421897888183594, -38.453041076660156, -36.48418426513672, -34.51533126831055, -32.54647445678711, -30.577617645263672, -28.608760833740234, -26.639904022216797, -24.67104721069336, -22.702190399169922, -20.733333587646484, -18.764476776123047, -16.79561996459961, -14.826763153076172, -12.857906341552734, -10.889049530029297, -8.920193672180176, -6.951336860656738, -4.982480049133301, -3.0136232376098633, -1.0447665452957153, 0.9240901470184326, 2.892946720123291, 4.8618035316467285, 6.830659866333008, 8.799516677856445, 10.768373489379883, 12.73723030090332, 14.706087112426758, 16.674943923950195, 18.643800735473633, 20.61265754699707, 22.581512451171875, 24.550369262695312, 26.51922607421875, 28.488082885742188, 30.456939697265625, 32.42579650878906, 34.3946533203125, 36.36351013183594, 38.332366943359375, 40.30122375488281, 42.27008056640625, 44.23893737792969]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 6.0, 7.0, 6.0, 10.0, 12.0, 14.0, 12.0, 22.0, 21.0, 37.0, 30.0, 35.0, 36.0, 36.0, 34.0, 58.0, 54.0, 48.0, 46.0, 46.0, 46.0, 37.0, 41.0, 45.0, 36.0, 34.0, 36.0, 23.0, 15.0, 18.0, 18.0, 18.0, 19.0, 13.0, 9.0, 2.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.32217788696289, -34.93650817871094, -33.55084228515625, -32.1651725769043, -30.779502868652344, -29.393835067749023, -28.008167266845703, -26.62249755859375, -25.23682975769043, -23.85116195678711, -22.465492248535156, -21.079824447631836, -19.694156646728516, -18.308486938476562, -16.922819137573242, -15.537150382995605, -14.151481628417969, -12.765812873840332, -11.380144119262695, -9.994476318359375, -8.608807563781738, -7.223138809204102, -5.837471008300781, -4.4518022537231445, -3.066133499145508, -1.6804649829864502, -0.2947964668273926, 1.090871810913086, 2.4765405654907227, 3.8622093200683594, 5.24787712097168, 6.633545875549316, 8.019218444824219, 9.404887199401855, 10.790555953979492, 12.176223754882812, 13.56189250946045, 14.947561264038086, 16.333229064941406, 17.71889877319336, 19.10456657409668, 20.490234375, 21.875904083251953, 23.261571884155273, 24.647239685058594, 26.032909393310547, 27.418577194213867, 28.804244995117188, 30.18991470336914, 31.57558250427246, 32.96125030517578, 34.346920013427734, 35.73258972167969, 37.118255615234375, 38.50392532348633, 39.88959503173828, 41.27526092529297, 42.66093063354492, 44.04659652709961, 45.43226623535156, 46.817935943603516, 48.20360565185547, 49.589271545410156, 50.97494125366211, 52.36061096191406]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 8.0, 6.0, 7.0, 13.0, 20.0, 21.0, 14.0, 25.0, 37.0, 27.0, 39.0, 46.0, 52.0, 52.0, 56.0, 55.0, 50.0, 48.0, 52.0, 52.0, 37.0, 40.0, 43.0, 33.0, 23.0, 33.0, 25.0, 18.0, 15.0, 9.0, 7.0, 10.0, 6.0, 7.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-8.4453125, -8.23016357421875, -8.0150146484375, -7.79986572265625, -7.584716796875, -7.36956787109375, -7.1544189453125, -6.93927001953125, -6.72412109375, -6.50897216796875, -6.2938232421875, -6.07867431640625, -5.863525390625, -5.64837646484375, -5.4332275390625, -5.21807861328125, -5.0029296875, -4.78778076171875, -4.5726318359375, -4.35748291015625, -4.142333984375, -3.92718505859375, -3.7120361328125, -3.49688720703125, -3.28173828125, -3.06658935546875, -2.8514404296875, -2.63629150390625, -2.421142578125, -2.20599365234375, -1.9908447265625, -1.77569580078125, -1.560546875, -1.34539794921875, -1.1302490234375, -0.91510009765625, -0.699951171875, -0.48480224609375, -0.2696533203125, -0.05450439453125, 0.16064453125, 0.37579345703125, 0.5909423828125, 0.80609130859375, 1.021240234375, 1.23638916015625, 1.4515380859375, 1.66668701171875, 1.8818359375, 2.09698486328125, 2.3121337890625, 2.52728271484375, 2.742431640625, 2.95758056640625, 3.1727294921875, 3.38787841796875, 3.60302734375, 3.81817626953125, 4.0333251953125, 4.24847412109375, 4.463623046875, 4.67877197265625, 4.8939208984375, 5.10906982421875, 5.32421875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 2.0, 5.0, 10.0, 11.0, 14.0, 18.0, 25.0, 36.0, 40.0, 60.0, 61.0, 107.0, 166.0, 196.0, 319.0, 512.0, 774.0, 1377.0, 2452.0, 4824.0, 10949.0, 38124.0, 260956.0, 1456664.0, 1921304.0, 407484.0, 60104.0, 14695.0, 6000.0, 2836.0, 1574.0, 913.0, 556.0, 351.0, 231.0, 152.0, 105.0, 81.0, 45.0, 41.0, 21.0, 14.0, 32.0, 14.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-9.5, -9.2215576171875, -8.943115234375, -8.6646728515625, -8.38623046875, -8.1077880859375, -7.829345703125, -7.5509033203125, -7.2724609375, -6.9940185546875, -6.715576171875, -6.4371337890625, -6.15869140625, -5.8802490234375, -5.601806640625, -5.3233642578125, -5.044921875, -4.7664794921875, -4.488037109375, -4.2095947265625, -3.93115234375, -3.6527099609375, -3.374267578125, -3.0958251953125, -2.8173828125, -2.5389404296875, -2.260498046875, -1.9820556640625, -1.70361328125, -1.4251708984375, -1.146728515625, -0.8682861328125, -0.58984375, -0.3114013671875, -0.032958984375, 0.2454833984375, 0.52392578125, 0.8023681640625, 1.080810546875, 1.3592529296875, 1.6376953125, 1.9161376953125, 2.194580078125, 2.4730224609375, 2.75146484375, 3.0299072265625, 3.308349609375, 3.5867919921875, 3.865234375, 4.1436767578125, 4.422119140625, 4.7005615234375, 4.97900390625, 5.2574462890625, 5.535888671875, 5.8143310546875, 6.0927734375, 6.3712158203125, 6.649658203125, 6.9281005859375, 7.20654296875, 7.4849853515625, 7.763427734375, 8.0418701171875, 8.3203125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 9.0, 19.0, 86.0, 247.0, 625.0, 1685.0, 956.0, 328.0, 94.0, 19.0, 13.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.34619140625, -31.2548828125, -30.16357421875, -29.072265625, -27.98095703125, -26.8896484375, -25.79833984375, -24.70703125, -23.61572265625, -22.5244140625, -21.43310546875, -20.341796875, -19.25048828125, -18.1591796875, -17.06787109375, -15.9765625, -14.88525390625, -13.7939453125, -12.70263671875, -11.611328125, -10.52001953125, -9.4287109375, -8.33740234375, -7.24609375, -6.15478515625, -5.0634765625, -3.97216796875, -2.880859375, -1.78955078125, -0.6982421875, 0.39306640625, 1.484375, 2.57568359375, 3.6669921875, 4.75830078125, 5.849609375, 6.94091796875, 8.0322265625, 9.12353515625, 10.21484375, 11.30615234375, 12.3974609375, 13.48876953125, 14.580078125, 15.67138671875, 16.7626953125, 17.85400390625, 18.9453125, 20.03662109375, 21.1279296875, 22.21923828125, 23.310546875, 24.40185546875, 25.4931640625, 26.58447265625, 27.67578125, 28.76708984375, 29.8583984375, 30.94970703125, 32.041015625, 33.13232421875, 34.2236328125, 35.31494140625, 36.40625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 12.0, 28.0, 56.0, 175.0, 565.0, 1972.0, 73297.0, 4111303.0, 5234.0, 1072.0, 318.0, 126.0, 50.0, 21.0, 12.0, 5.0, 7.0, 5.0, 1.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.0625, -53.30078125, -51.5390625, -49.77734375, -48.015625, -46.25390625, -44.4921875, -42.73046875, -40.96875, -39.20703125, -37.4453125, -35.68359375, -33.921875, -32.16015625, -30.3984375, -28.63671875, -26.875, -25.11328125, -23.3515625, -21.58984375, -19.828125, -18.06640625, -16.3046875, -14.54296875, -12.78125, -11.01953125, -9.2578125, -7.49609375, -5.734375, -3.97265625, -2.2109375, -0.44921875, 1.3125, 3.07421875, 4.8359375, 6.59765625, 8.359375, 10.12109375, 11.8828125, 13.64453125, 15.40625, 17.16796875, 18.9296875, 20.69140625, 22.453125, 24.21484375, 25.9765625, 27.73828125, 29.5, 31.26171875, 33.0234375, 34.78515625, 36.546875, 38.30859375, 40.0703125, 41.83203125, 43.59375, 45.35546875, 47.1171875, 48.87890625, 50.640625, 52.40234375, 54.1640625, 55.92578125, 57.6875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 37.0, 278.0, 505.0, 174.0, 14.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.3079833984375, -119.59233093261719, -114.8766860961914, -110.16104125976562, -105.44538879394531, -100.729736328125, -96.01409149169922, -91.29844665527344, -86.58279418945312, -81.86714172363281, -77.15149688720703, -72.43585205078125, -67.72019958496094, -63.00455093383789, -58.288902282714844, -53.5732536315918, -48.85760498046875, -44.1419563293457, -39.426307678222656, -34.71065902709961, -29.995010375976562, -25.279361724853516, -20.56371307373047, -15.848064422607422, -11.132415771484375, -6.416767120361328, -1.7011184692382812, 3.0145301818847656, 7.7301788330078125, 12.44582748413086, 17.161476135253906, 21.877124786376953, 26.592758178710938, 31.308406829833984, 36.02405548095703, 40.73970413208008, 45.455352783203125, 50.17100143432617, 54.88665008544922, 59.602298736572266, 64.31794738769531, 69.03359985351562, 73.7492446899414, 78.46488952636719, 83.1805419921875, 87.89619445800781, 92.6118392944336, 97.32748413085938, 102.04313659667969, 106.7587890625, 111.47443389892578, 116.19007873535156, 120.90573120117188, 125.62138366699219, 130.3370361328125, 135.05267333984375, 139.76832580566406, 144.48397827148438, 149.19961547851562, 153.91526794433594, 158.63092041015625, 163.34657287597656, 168.06222534179688, 172.77786254882812, 177.49351501464844]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 4.0, 6.0, 5.0, 6.0, 7.0, 19.0, 19.0, 13.0, 24.0, 26.0, 26.0, 28.0, 29.0, 47.0, 41.0, 51.0, 37.0, 42.0, 39.0, 57.0, 42.0, 42.0, 44.0, 46.0, 41.0, 24.0, 39.0, 29.0, 28.0, 20.0, 18.0, 9.0, 16.0, 12.0, 8.0, 16.0, 8.0, 10.0, 3.0, 5.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.028053283691406, -37.715789794921875, -36.403526306152344, -35.09126281738281, -33.77899932861328, -32.46673583984375, -31.154470443725586, -29.842205047607422, -28.52994155883789, -27.21767807006836, -25.905414581298828, -24.593151092529297, -23.280885696411133, -21.9686222076416, -20.65635871887207, -19.344093322753906, -18.031831741333008, -16.719568252563477, -15.407303810119629, -14.095040321350098, -12.78277587890625, -11.470512390136719, -10.158248901367188, -8.84598445892334, -7.533720970153809, -6.221457004547119, -4.90919303894043, -3.5969295501708984, -2.284665584564209, -0.9724016189575195, 0.3398618698120117, 1.6521263122558594, 2.9643898010253906, 4.27665376663208, 5.5889177322387695, 6.901181221008301, 8.213445663452148, 9.52570915222168, 10.837972640991211, 12.150237083435059, 13.46250057220459, 14.774764060974121, 16.08702850341797, 17.3992919921875, 18.71155548095703, 20.023818969726562, 21.336082458496094, 22.648347854614258, 23.96061134338379, 25.27287483215332, 26.58513832092285, 27.897403717041016, 29.209667205810547, 30.521930694580078, 31.83419418334961, 33.14645767211914, 34.45872116088867, 35.7709846496582, 37.083248138427734, 38.395511627197266, 39.7077751159668, 41.020042419433594, 42.332305908203125, 43.644569396972656, 44.95683288574219]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 0.0, 4.0, 6.0, 2.0, 3.0, 10.0, 4.0, 8.0, 9.0, 11.0, 8.0, 13.0, 17.0, 14.0, 15.0, 30.0, 29.0, 27.0, 33.0, 24.0, 43.0, 29.0, 30.0, 41.0, 33.0, 40.0, 48.0, 47.0, 43.0, 48.0, 39.0, 36.0, 34.0, 32.0, 35.0, 23.0, 24.0, 25.0, 10.0, 14.0, 10.0, 9.0, 6.0, 6.0, 4.0, 8.0, 2.0, 4.0, 3.0, 7.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-3.8359375, -3.70758056640625, -3.5792236328125, -3.45086669921875, -3.322509765625, -3.19415283203125, -3.0657958984375, -2.93743896484375, -2.80908203125, -2.68072509765625, -2.5523681640625, -2.42401123046875, -2.295654296875, -2.16729736328125, -2.0389404296875, -1.91058349609375, -1.7822265625, -1.65386962890625, -1.5255126953125, -1.39715576171875, -1.268798828125, -1.14044189453125, -1.0120849609375, -0.88372802734375, -0.75537109375, -0.62701416015625, -0.4986572265625, -0.37030029296875, -0.241943359375, -0.11358642578125, 0.0147705078125, 0.14312744140625, 0.271484375, 0.39984130859375, 0.5281982421875, 0.65655517578125, 0.784912109375, 0.91326904296875, 1.0416259765625, 1.16998291015625, 1.29833984375, 1.42669677734375, 1.5550537109375, 1.68341064453125, 1.811767578125, 1.94012451171875, 2.0684814453125, 2.19683837890625, 2.3251953125, 2.45355224609375, 2.5819091796875, 2.71026611328125, 2.838623046875, 2.96697998046875, 3.0953369140625, 3.22369384765625, 3.35205078125, 3.48040771484375, 3.6087646484375, 3.73712158203125, 3.865478515625, 3.99383544921875, 4.1221923828125, 4.25054931640625, 4.37890625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 17.0, 18.0, 12.0, 34.0, 47.0, 88.0, 114.0, 157.0, 199.0, 313.0, 403.0, 595.0, 883.0, 1269.0, 1951.0, 2957.0, 4450.0, 6854.0, 10989.0, 17409.0, 29387.0, 52234.0, 97966.0, 185731.0, 255804.0, 169070.0, 89091.0, 47916.0, 26940.0, 16506.0, 10110.0, 6404.0, 4039.0, 2824.0, 1875.0, 1231.0, 834.0, 591.0, 349.0, 259.0, 174.0, 136.0, 115.0, 73.0, 49.0, 30.0, 24.0, 15.0, 12.0, 11.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.58935546875, -0.5699844360351562, -0.5506134033203125, -0.5312423706054688, -0.511871337890625, -0.49250030517578125, -0.4731292724609375, -0.45375823974609375, -0.43438720703125, -0.41501617431640625, -0.3956451416015625, -0.37627410888671875, -0.356903076171875, -0.33753204345703125, -0.3181610107421875, -0.29878997802734375, -0.2794189453125, -0.26004791259765625, -0.2406768798828125, -0.22130584716796875, -0.201934814453125, -0.18256378173828125, -0.1631927490234375, -0.14382171630859375, -0.12445068359375, -0.10507965087890625, -0.0857086181640625, -0.06633758544921875, -0.046966552734375, -0.02759552001953125, -0.0082244873046875, 0.01114654541015625, 0.030517578125, 0.04988861083984375, 0.0692596435546875, 0.08863067626953125, 0.108001708984375, 0.12737274169921875, 0.1467437744140625, 0.16611480712890625, 0.18548583984375, 0.20485687255859375, 0.2242279052734375, 0.24359893798828125, 0.262969970703125, 0.28234100341796875, 0.3017120361328125, 0.32108306884765625, 0.3404541015625, 0.35982513427734375, 0.3791961669921875, 0.39856719970703125, 0.417938232421875, 0.43730926513671875, 0.4566802978515625, 0.47605133056640625, 0.49542236328125, 0.5147933959960938, 0.5341644287109375, 0.5535354614257812, 0.572906494140625, 0.5922775268554688, 0.6116485595703125, 0.6310195922851562, 0.650390625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 6.0, 10.0, 11.0, 14.0, 22.0, 18.0, 23.0, 29.0, 28.0, 35.0, 29.0, 33.0, 31.0, 31.0, 40.0, 35.0, 41.0, 40.0, 1072.0, 41.0, 34.0, 39.0, 31.0, 35.0, 31.0, 22.0, 26.0, 22.0, 27.0, 21.0, 16.0, 16.0, 13.0, 15.0, 10.0, 15.0, 11.0, 9.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.859375, -2.778076171875, -2.69677734375, -2.615478515625, -2.5341796875, -2.452880859375, -2.37158203125, -2.290283203125, -2.208984375, -2.127685546875, -2.04638671875, -1.965087890625, -1.8837890625, -1.802490234375, -1.72119140625, -1.639892578125, -1.55859375, -1.477294921875, -1.39599609375, -1.314697265625, -1.2333984375, -1.152099609375, -1.07080078125, -0.989501953125, -0.908203125, -0.826904296875, -0.74560546875, -0.664306640625, -0.5830078125, -0.501708984375, -0.42041015625, -0.339111328125, -0.2578125, -0.176513671875, -0.09521484375, -0.013916015625, 0.0673828125, 0.148681640625, 0.22998046875, 0.311279296875, 0.392578125, 0.473876953125, 0.55517578125, 0.636474609375, 0.7177734375, 0.799072265625, 0.88037109375, 0.961669921875, 1.04296875, 1.124267578125, 1.20556640625, 1.286865234375, 1.3681640625, 1.449462890625, 1.53076171875, 1.612060546875, 1.693359375, 1.774658203125, 1.85595703125, 1.937255859375, 2.0185546875, 2.099853515625, 2.18115234375, 2.262451171875, 2.34375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 6.0, 10.0, 21.0, 20.0, 37.0, 62.0, 90.0, 128.0, 225.0, 348.0, 599.0, 958.0, 1519.0, 2646.0, 4361.0, 7299.0, 12503.0, 21733.0, 37855.0, 69330.0, 127592.0, 230837.0, 1267561.0, 139119.0, 74551.0, 41511.0, 23384.0, 13296.0, 7764.0, 4641.0, 2717.0, 1701.0, 1027.0, 642.0, 345.0, 251.0, 162.0, 85.0, 73.0, 43.0, 28.0, 18.0, 9.0, 9.0, 11.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5283203125, -0.5113143920898438, -0.4943084716796875, -0.47730255126953125, -0.460296630859375, -0.44329071044921875, -0.4262847900390625, -0.40927886962890625, -0.39227294921875, -0.37526702880859375, -0.3582611083984375, -0.34125518798828125, -0.324249267578125, -0.30724334716796875, -0.2902374267578125, -0.27323150634765625, -0.2562255859375, -0.23921966552734375, -0.2222137451171875, -0.20520782470703125, -0.188201904296875, -0.17119598388671875, -0.1541900634765625, -0.13718414306640625, -0.12017822265625, -0.10317230224609375, -0.0861663818359375, -0.06916046142578125, -0.052154541015625, -0.03514862060546875, -0.0181427001953125, -0.00113677978515625, 0.015869140625, 0.03287506103515625, 0.0498809814453125, 0.06688690185546875, 0.083892822265625, 0.10089874267578125, 0.1179046630859375, 0.13491058349609375, 0.15191650390625, 0.16892242431640625, 0.1859283447265625, 0.20293426513671875, 0.219940185546875, 0.23694610595703125, 0.2539520263671875, 0.27095794677734375, 0.2879638671875, 0.30496978759765625, 0.3219757080078125, 0.33898162841796875, 0.355987548828125, 0.37299346923828125, 0.3899993896484375, 0.40700531005859375, 0.42401123046875, 0.44101715087890625, 0.4580230712890625, 0.47502899169921875, 0.492034912109375, 0.5090408325195312, 0.5260467529296875, 0.5430526733398438, 0.56005859375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 9.0, 4.0, 8.0, 12.0, 15.0, 24.0, 20.0, 43.0, 37.0, 63.0, 54.0, 68.0, 66.0, 85.0, 77.0, 85.0, 67.0, 51.0, 40.0, 41.0, 36.0, 28.0, 10.0, 10.0, 12.0, 5.0, 6.0, 6.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015535354614257812, -0.00149555504322052, -0.0014375746250152588, -0.0013795942068099976, -0.0013216137886047363, -0.001263633370399475, -0.0012056529521942139, -0.0011476725339889526, -0.0010896921157836914, -0.0010317116975784302, -0.0009737312793731689, -0.0009157508611679077, -0.0008577704429626465, -0.0007997900247573853, -0.000741809606552124, -0.0006838291883468628, -0.0006258487701416016, -0.0005678683519363403, -0.0005098879337310791, -0.00045190751552581787, -0.00039392709732055664, -0.0003359466791152954, -0.0002779662609100342, -0.00021998584270477295, -0.00016200542449951172, -0.00010402500629425049, -4.604458808898926e-05, 1.1935830116271973e-05, 6.99162483215332e-05, 0.00012789666652679443, 0.00018587708473205566, 0.0002438575029373169, 0.0003018379211425781, 0.00035981833934783936, 0.0004177987575531006, 0.0004757791757583618, 0.000533759593963623, 0.0005917400121688843, 0.0006497204303741455, 0.0007077008485794067, 0.000765681266784668, 0.0008236616849899292, 0.0008816421031951904, 0.0009396225214004517, 0.0009976029396057129, 0.0010555833578109741, 0.0011135637760162354, 0.0011715441942214966, 0.0012295246124267578, 0.001287505030632019, 0.0013454854488372803, 0.0014034658670425415, 0.0014614462852478027, 0.001519426703453064, 0.0015774071216583252, 0.0016353875398635864, 0.0016933679580688477, 0.0017513483762741089, 0.0018093287944793701, 0.0018673092126846313, 0.0019252896308898926, 0.001983270049095154, 0.002041250467300415, 0.0020992308855056763, 0.0021572113037109375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 9.0, 8.0, 6.0, 18.0, 18.0, 25.0, 36.0, 39.0, 45.0, 76.0, 88.0, 129.0, 190.0, 321.0, 483.0, 950.0, 8580.0, 1032903.0, 2423.0, 791.0, 427.0, 288.0, 175.0, 132.0, 90.0, 67.0, 65.0, 35.0, 26.0, 26.0, 15.0, 18.0, 6.0, 6.0, 8.0, 6.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03228759765625, -0.031258583068847656, -0.030229568481445312, -0.02920055389404297, -0.028171539306640625, -0.02714252471923828, -0.026113510131835938, -0.025084495544433594, -0.02405548095703125, -0.023026466369628906, -0.021997451782226562, -0.02096843719482422, -0.019939422607421875, -0.01891040802001953, -0.017881393432617188, -0.016852378845214844, -0.0158233642578125, -0.014794349670410156, -0.013765335083007812, -0.012736320495605469, -0.011707305908203125, -0.010678291320800781, -0.009649276733398438, -0.008620262145996094, -0.00759124755859375, -0.006562232971191406, -0.0055332183837890625, -0.004504203796386719, -0.003475189208984375, -0.0024461746215820312, -0.0014171600341796875, -0.00038814544677734375, 0.000640869140625, 0.0016698837280273438, 0.0026988983154296875, 0.0037279129028320312, 0.004756927490234375, 0.005785942077636719, 0.0068149566650390625, 0.007843971252441406, 0.00887298583984375, 0.009902000427246094, 0.010931015014648438, 0.011960029602050781, 0.012989044189453125, 0.014018058776855469, 0.015047073364257812, 0.016076087951660156, 0.0171051025390625, 0.018134117126464844, 0.019163131713867188, 0.02019214630126953, 0.021221160888671875, 0.02225017547607422, 0.023279190063476562, 0.024308204650878906, 0.02533721923828125, 0.026366233825683594, 0.027395248413085938, 0.02842426300048828, 0.029453277587890625, 0.03048229217529297, 0.03151130676269531, 0.032540321350097656, 0.0335693359375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 861.0, 139.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003612068947404623, -0.0033659166656434536, -0.003119764616712928, -0.002873612567782402, -0.0026274602860212326, -0.002381308004260063, -0.0021351559553295374, -0.0018890037899836898, -0.0016428516246378422, -0.0013966994592919946, -0.001150547293946147, -0.0009043951286002994, -0.0006582429632544518, -0.00041209079790860415, -0.00016593863256275654, 8.021353278309107e-05, 0.0003263656981289387, 0.0005725178634747863, 0.0008186700288206339, 0.0010648221941664815, 0.001310974359512329, 0.0015571265248581767, 0.0018032786902040243, 0.00204943073913455, 0.0022955830208957195, 0.002541735302656889, 0.0027878873515874147, 0.0030340394005179405, 0.00328019168227911, 0.0035263439640402794, 0.003772496012970805, 0.004018648061901331, 0.004264800809323788, 0.004510953091084957, 0.0047571053728461266, 0.005003257188946009, 0.005249409470707178, 0.0054955617524683475, 0.00574171356856823, 0.005987865850329399, 0.0062340181320905685, 0.006480170413851738, 0.006726322695612907, 0.0069724745117127895, 0.007218626793473959, 0.007464779075235128, 0.0077109308913350105, 0.00795708317309618, 0.00820323545485735, 0.008449387736618519, 0.008695540018379688, 0.008941692300140858, 0.009187843650579453, 0.009433995932340622, 0.009680148214101791, 0.00992630049586296, 0.01017245277762413, 0.0104186050593853, 0.010664757341146469, 0.010910909622907639, 0.011157061904668808, 0.011403213255107403, 0.011649365536868572, 0.011895517818629742, 0.012141670100390911]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 9.0, 4.0, 8.0, 2.0, 7.0, 10.0, 6.0, 14.0, 24.0, 21.0, 21.0, 27.0, 23.0, 37.0, 32.0, 42.0, 39.0, 40.0, 44.0, 42.0, 45.0, 39.0, 41.0, 43.0, 40.0, 36.0, 27.0, 36.0, 36.0, 30.0, 25.0, 26.0, 27.0, 21.0, 15.0, 14.0, 10.0, 8.0, 6.0, 11.0, 2.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008364319801330566, -0.0008103298023343086, -0.0007842276245355606, -0.0007581254467368126, -0.0007320232689380646, -0.0007059210911393166, -0.0006798189133405685, -0.0006537167355418205, -0.0006276145577430725, -0.0006015123799443245, -0.0005754102021455765, -0.0005493080243468285, -0.0005232058465480804, -0.0004971036687493324, -0.0004710014909505844, -0.0004448993131518364, -0.0004187971353530884, -0.00039269495755434036, -0.00036659277975559235, -0.00034049060195684433, -0.0003143884241580963, -0.0002882862463593483, -0.0002621840685606003, -0.00023608189076185226, -0.00020997971296310425, -0.00018387753516435623, -0.00015777535736560822, -0.0001316731795668602, -0.00010557100176811218, -7.946882396936417e-05, -5.336664617061615e-05, -2.7264468371868134e-05, -1.1622905731201172e-06, 2.49398872256279e-05, 5.1042065024375916e-05, 7.714424282312393e-05, 0.00010324642062187195, 0.00012934859842061996, 0.00015545077621936798, 0.000181552954018116, 0.00020765513181686401, 0.00023375730961561203, 0.00025985948741436005, 0.00028596166521310806, 0.0003120638430118561, 0.0003381660208106041, 0.0003642681986093521, 0.00039037037640810013, 0.00041647255420684814, 0.00044257473200559616, 0.0004686769098043442, 0.0004947790876030922, 0.0005208812654018402, 0.0005469834432005882, 0.0005730856209993362, 0.0005991877987980843, 0.0006252899765968323, 0.0006513921543955803, 0.0006774943321943283, 0.0007035965099930763, 0.0007296986877918243, 0.0007558008655905724, 0.0007819030433893204, 0.0008080052211880684, 0.0008341073989868164]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 0.0, 4.0, 6.0, 2.0, 3.0, 10.0, 4.0, 8.0, 9.0, 11.0, 8.0, 13.0, 17.0, 14.0, 15.0, 30.0, 29.0, 27.0, 33.0, 24.0, 43.0, 29.0, 31.0, 40.0, 33.0, 40.0, 48.0, 47.0, 43.0, 48.0, 40.0, 35.0, 34.0, 33.0, 34.0, 23.0, 24.0, 25.0, 10.0, 14.0, 10.0, 9.0, 6.0, 6.0, 4.0, 8.0, 2.0, 4.0, 3.0, 7.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-3.8359375, -3.70758056640625, -3.5792236328125, -3.45086669921875, -3.322509765625, -3.19415283203125, -3.0657958984375, -2.93743896484375, -2.80908203125, -2.68072509765625, -2.5523681640625, -2.42401123046875, -2.295654296875, -2.16729736328125, -2.0389404296875, -1.91058349609375, -1.7822265625, -1.65386962890625, -1.5255126953125, -1.39715576171875, -1.268798828125, -1.14044189453125, -1.0120849609375, -0.88372802734375, -0.75537109375, -0.62701416015625, -0.4986572265625, -0.37030029296875, -0.241943359375, -0.11358642578125, 0.0147705078125, 0.14312744140625, 0.271484375, 0.39984130859375, 0.5281982421875, 0.65655517578125, 0.784912109375, 0.91326904296875, 1.0416259765625, 1.16998291015625, 1.29833984375, 1.42669677734375, 1.5550537109375, 1.68341064453125, 1.811767578125, 1.94012451171875, 2.0684814453125, 2.19683837890625, 2.3251953125, 2.45355224609375, 2.5819091796875, 2.71026611328125, 2.838623046875, 2.96697998046875, 3.0953369140625, 3.22369384765625, 3.35205078125, 3.48040771484375, 3.6087646484375, 3.73712158203125, 3.865478515625, 3.99383544921875, 4.1221923828125, 4.25054931640625, 4.37890625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 9.0, 15.0, 11.0, 12.0, 21.0, 25.0, 25.0, 42.0, 44.0, 58.0, 101.0, 102.0, 179.0, 222.0, 306.0, 427.0, 703.0, 1200.0, 2338.0, 5273.0, 14022.0, 53856.0, 323901.0, 524177.0, 87237.0, 20479.0, 6793.0, 2878.0, 1470.0, 836.0, 494.0, 361.0, 246.0, 181.0, 123.0, 101.0, 67.0, 47.0, 34.0, 28.0, 21.0, 15.0, 11.0, 9.0, 8.0, 7.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-6.90625, -6.67718505859375, -6.4481201171875, -6.21905517578125, -5.989990234375, -5.76092529296875, -5.5318603515625, -5.30279541015625, -5.07373046875, -4.84466552734375, -4.6156005859375, -4.38653564453125, -4.157470703125, -3.92840576171875, -3.6993408203125, -3.47027587890625, -3.2412109375, -3.01214599609375, -2.7830810546875, -2.55401611328125, -2.324951171875, -2.09588623046875, -1.8668212890625, -1.63775634765625, -1.40869140625, -1.17962646484375, -0.9505615234375, -0.72149658203125, -0.492431640625, -0.26336669921875, -0.0343017578125, 0.19476318359375, 0.423828125, 0.65289306640625, 0.8819580078125, 1.11102294921875, 1.340087890625, 1.56915283203125, 1.7982177734375, 2.02728271484375, 2.25634765625, 2.48541259765625, 2.7144775390625, 2.94354248046875, 3.172607421875, 3.40167236328125, 3.6307373046875, 3.85980224609375, 4.0888671875, 4.31793212890625, 4.5469970703125, 4.77606201171875, 5.005126953125, 5.23419189453125, 5.4632568359375, 5.69232177734375, 5.92138671875, 6.15045166015625, 6.3795166015625, 6.60858154296875, 6.837646484375, 7.06671142578125, 7.2957763671875, 7.52484130859375, 7.75390625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 11.0, 8.0, 9.0, 15.0, 19.0, 16.0, 17.0, 26.0, 27.0, 44.0, 51.0, 49.0, 85.0, 116.0, 448.0, 1597.0, 111.0, 73.0, 48.0, 47.0, 38.0, 45.0, 23.0, 23.0, 29.0, 14.0, 10.0, 4.0, 9.0, 5.0, 9.0, 6.0, 2.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.40625, -9.991455078125, -9.57666015625, -9.161865234375, -8.7470703125, -8.332275390625, -7.91748046875, -7.502685546875, -7.087890625, -6.673095703125, -6.25830078125, -5.843505859375, -5.4287109375, -5.013916015625, -4.59912109375, -4.184326171875, -3.76953125, -3.354736328125, -2.93994140625, -2.525146484375, -2.1103515625, -1.695556640625, -1.28076171875, -0.865966796875, -0.451171875, -0.036376953125, 0.37841796875, 0.793212890625, 1.2080078125, 1.622802734375, 2.03759765625, 2.452392578125, 2.8671875, 3.281982421875, 3.69677734375, 4.111572265625, 4.5263671875, 4.941162109375, 5.35595703125, 5.770751953125, 6.185546875, 6.600341796875, 7.01513671875, 7.429931640625, 7.8447265625, 8.259521484375, 8.67431640625, 9.089111328125, 9.50390625, 9.918701171875, 10.33349609375, 10.748291015625, 11.1630859375, 11.577880859375, 11.99267578125, 12.407470703125, 12.822265625, 13.237060546875, 13.65185546875, 14.066650390625, 14.4814453125, 14.896240234375, 15.31103515625, 15.725830078125, 16.140625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 8.0, 9.0, 3.0, 9.0, 11.0, 7.0, 20.0, 21.0, 31.0, 56.0, 87.0, 129.0, 226.0, 455.0, 1288.0, 416160.0, 2724655.0, 1413.0, 469.0, 274.0, 119.0, 85.0, 55.0, 25.0, 24.0, 18.0, 14.0, 8.0, 4.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-47.71875, -46.46435546875, -45.2099609375, -43.95556640625, -42.701171875, -41.44677734375, -40.1923828125, -38.93798828125, -37.68359375, -36.42919921875, -35.1748046875, -33.92041015625, -32.666015625, -31.41162109375, -30.1572265625, -28.90283203125, -27.6484375, -26.39404296875, -25.1396484375, -23.88525390625, -22.630859375, -21.37646484375, -20.1220703125, -18.86767578125, -17.61328125, -16.35888671875, -15.1044921875, -13.85009765625, -12.595703125, -11.34130859375, -10.0869140625, -8.83251953125, -7.578125, -6.32373046875, -5.0693359375, -3.81494140625, -2.560546875, -1.30615234375, -0.0517578125, 1.20263671875, 2.45703125, 3.71142578125, 4.9658203125, 6.22021484375, 7.474609375, 8.72900390625, 9.9833984375, 11.23779296875, 12.4921875, 13.74658203125, 15.0009765625, 16.25537109375, 17.509765625, 18.76416015625, 20.0185546875, 21.27294921875, 22.52734375, 23.78173828125, 25.0361328125, 26.29052734375, 27.544921875, 28.79931640625, 30.0537109375, 31.30810546875, 32.5625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [4.0, 9.0, 19.0, 78.0, 153.0, 246.0, 259.0, 139.0, 70.0, 23.0, 8.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.243184566497803, -3.504897117614746, -2.7666096687316895, -2.028322458267212, -1.2900350093841553, -0.5517475605010986, 0.1865396499633789, 0.9248270988464355, 1.6631145477294922, 2.401401996612549, 3.1396894454956055, 3.877976655960083, 4.616264343261719, 5.354551315307617, 6.092838764190674, 6.8311262130737305, 7.569413661956787, 8.307701110839844, 9.045988082885742, 9.784276008605957, 10.522562980651855, 11.26085090637207, 11.999137878417969, 12.737424850463867, 13.475712776184082, 14.21399974822998, 14.952287673950195, 15.690574645996094, 16.428861618041992, 17.167150497436523, 17.905437469482422, 18.64372444152832, 19.38201332092285, 20.12030029296875, 20.85858726501465, 21.59687614440918, 22.335163116455078, 23.073450088500977, 23.811737060546875, 24.550025939941406, 25.288312911987305, 26.026599884033203, 26.7648868560791, 27.503175735473633, 28.24146270751953, 28.97974967956543, 29.718036651611328, 30.45632553100586, 31.194610595703125, 31.932897567749023, 32.67118453979492, 33.40947341918945, 34.14775848388672, 34.88604736328125, 35.62433624267578, 36.36262130737305, 37.10091018676758, 37.83919906616211, 38.577484130859375, 39.315773010253906, 40.05405807495117, 40.7923469543457, 41.530635833740234, 42.2689208984375, 43.00720977783203]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 2.0, 4.0, 2.0, 6.0, 6.0, 9.0, 6.0, 3.0, 13.0, 11.0, 8.0, 14.0, 21.0, 15.0, 22.0, 23.0, 26.0, 33.0, 30.0, 30.0, 40.0, 43.0, 46.0, 40.0, 33.0, 43.0, 31.0, 40.0, 30.0, 35.0, 30.0, 46.0, 27.0, 25.0, 21.0, 28.0, 20.0, 16.0, 26.0, 22.0, 13.0, 14.0, 11.0, 11.0, 8.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-23.05164337158203, -22.2810001373291, -21.510358810424805, -20.739715576171875, -19.969074249267578, -19.19843101501465, -18.42778778076172, -17.657146453857422, -16.886503219604492, -16.115859985351562, -15.345218658447266, -14.574575424194336, -13.803933143615723, -13.03329086303711, -12.26264762878418, -11.492005348205566, -10.721363067626953, -9.95072078704834, -9.180078506469727, -8.409435272216797, -7.638792991638184, -6.86815071105957, -6.097507953643799, -5.326865196228027, -4.556222915649414, -3.7855803966522217, -3.0149378776550293, -2.244295358657837, -1.4736528396606445, -0.7030103206634521, 0.06763219833374023, 0.8382749557495117, 1.608917236328125, 2.3795597553253174, 3.1502022743225098, 3.920844793319702, 4.6914873123168945, 5.462129592895508, 6.232772350311279, 7.003415107727051, 7.774057388305664, 8.544699668884277, 9.31534194946289, 10.08598518371582, 10.856627464294434, 11.627269744873047, 12.397912979125977, 13.16855525970459, 13.939197540283203, 14.709839820861816, 15.48048210144043, 16.25112533569336, 17.021766662597656, 17.792409896850586, 18.563053131103516, 19.333694458007812, 20.104337692260742, 20.874980926513672, 21.64562225341797, 22.4162654876709, 23.186908721923828, 23.957550048828125, 24.728193283081055, 25.498836517333984, 26.26947784423828]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 7.0, 5.0, 10.0, 7.0, 10.0, 8.0, 17.0, 27.0, 19.0, 22.0, 27.0, 32.0, 33.0, 37.0, 33.0, 34.0, 60.0, 37.0, 38.0, 61.0, 49.0, 51.0, 45.0, 42.0, 35.0, 36.0, 42.0, 28.0, 21.0, 26.0, 16.0, 13.0, 10.0, 14.0, 13.0, 4.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.30859375, -5.1435546875, -4.978515625, -4.8134765625, -4.6484375, -4.4833984375, -4.318359375, -4.1533203125, -3.98828125, -3.8232421875, -3.658203125, -3.4931640625, -3.328125, -3.1630859375, -2.998046875, -2.8330078125, -2.66796875, -2.5029296875, -2.337890625, -2.1728515625, -2.0078125, -1.8427734375, -1.677734375, -1.5126953125, -1.34765625, -1.1826171875, -1.017578125, -0.8525390625, -0.6875, -0.5224609375, -0.357421875, -0.1923828125, -0.02734375, 0.1376953125, 0.302734375, 0.4677734375, 0.6328125, 0.7978515625, 0.962890625, 1.1279296875, 1.29296875, 1.4580078125, 1.623046875, 1.7880859375, 1.953125, 2.1181640625, 2.283203125, 2.4482421875, 2.61328125, 2.7783203125, 2.943359375, 3.1083984375, 3.2734375, 3.4384765625, 3.603515625, 3.7685546875, 3.93359375, 4.0986328125, 4.263671875, 4.4287109375, 4.59375, 4.7587890625, 4.923828125, 5.0888671875, 5.25390625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 6.0, 9.0, 8.0, 17.0, 20.0, 26.0, 44.0, 32.0, 53.0, 76.0, 90.0, 107.0, 135.0, 210.0, 256.0, 385.0, 618.0, 1189.0, 3628.0, 46896.0, 3683444.0, 445041.0, 7740.0, 1744.0, 771.0, 491.0, 302.0, 207.0, 147.0, 145.0, 95.0, 79.0, 55.0, 35.0, 39.0, 30.0, 16.0, 23.0, 21.0, 9.0, 10.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.40625, -30.446044921875, -29.48583984375, -28.525634765625, -27.5654296875, -26.605224609375, -25.64501953125, -24.684814453125, -23.724609375, -22.764404296875, -21.80419921875, -20.843994140625, -19.8837890625, -18.923583984375, -17.96337890625, -17.003173828125, -16.04296875, -15.082763671875, -14.12255859375, -13.162353515625, -12.2021484375, -11.241943359375, -10.28173828125, -9.321533203125, -8.361328125, -7.401123046875, -6.44091796875, -5.480712890625, -4.5205078125, -3.560302734375, -2.60009765625, -1.639892578125, -0.6796875, 0.280517578125, 1.24072265625, 2.200927734375, 3.1611328125, 4.121337890625, 5.08154296875, 6.041748046875, 7.001953125, 7.962158203125, 8.92236328125, 9.882568359375, 10.8427734375, 11.802978515625, 12.76318359375, 13.723388671875, 14.68359375, 15.643798828125, 16.60400390625, 17.564208984375, 18.5244140625, 19.484619140625, 20.44482421875, 21.405029296875, 22.365234375, 23.325439453125, 24.28564453125, 25.245849609375, 26.2060546875, 27.166259765625, 28.12646484375, 29.086669921875, 30.046875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 10.0, 7.0, 14.0, 13.0, 27.0, 35.0, 43.0, 58.0, 112.0, 170.0, 245.0, 378.0, 514.0, 592.0, 523.0, 431.0, 279.0, 195.0, 144.0, 77.0, 57.0, 40.0, 31.0, 17.0, 15.0, 9.0, 8.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.3671875, -9.0804443359375, -8.793701171875, -8.5069580078125, -8.22021484375, -7.9334716796875, -7.646728515625, -7.3599853515625, -7.0732421875, -6.7864990234375, -6.499755859375, -6.2130126953125, -5.92626953125, -5.6395263671875, -5.352783203125, -5.0660400390625, -4.779296875, -4.4925537109375, -4.205810546875, -3.9190673828125, -3.63232421875, -3.3455810546875, -3.058837890625, -2.7720947265625, -2.4853515625, -2.1986083984375, -1.911865234375, -1.6251220703125, -1.33837890625, -1.0516357421875, -0.764892578125, -0.4781494140625, -0.19140625, 0.0953369140625, 0.382080078125, 0.6688232421875, 0.95556640625, 1.2423095703125, 1.529052734375, 1.8157958984375, 2.1025390625, 2.3892822265625, 2.676025390625, 2.9627685546875, 3.24951171875, 3.5362548828125, 3.822998046875, 4.1097412109375, 4.396484375, 4.6832275390625, 4.969970703125, 5.2567138671875, 5.54345703125, 5.8302001953125, 6.116943359375, 6.4036865234375, 6.6904296875, 6.9771728515625, 7.263916015625, 7.5506591796875, 7.83740234375, 8.1241455078125, 8.410888671875, 8.6976318359375, 8.984375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 23.0, 12.0, 36.0, 52.0, 106.0, 274.0, 777.0, 2414.0, 11196.0, 105131.0, 2777698.0, 1233180.0, 53430.0, 7227.0, 1681.0, 582.0, 212.0, 103.0, 56.0, 24.0, 17.0, 10.0, 10.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0625, -10.61767578125, -10.1728515625, -9.72802734375, -9.283203125, -8.83837890625, -8.3935546875, -7.94873046875, -7.50390625, -7.05908203125, -6.6142578125, -6.16943359375, -5.724609375, -5.27978515625, -4.8349609375, -4.39013671875, -3.9453125, -3.50048828125, -3.0556640625, -2.61083984375, -2.166015625, -1.72119140625, -1.2763671875, -0.83154296875, -0.38671875, 0.05810546875, 0.5029296875, 0.94775390625, 1.392578125, 1.83740234375, 2.2822265625, 2.72705078125, 3.171875, 3.61669921875, 4.0615234375, 4.50634765625, 4.951171875, 5.39599609375, 5.8408203125, 6.28564453125, 6.73046875, 7.17529296875, 7.6201171875, 8.06494140625, 8.509765625, 8.95458984375, 9.3994140625, 9.84423828125, 10.2890625, 10.73388671875, 11.1787109375, 11.62353515625, 12.068359375, 12.51318359375, 12.9580078125, 13.40283203125, 13.84765625, 14.29248046875, 14.7373046875, 15.18212890625, 15.626953125, 16.07177734375, 16.5166015625, 16.96142578125, 17.40625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 9.0, 11.0, 20.0, 38.0, 80.0, 93.0, 148.0, 170.0, 134.0, 132.0, 74.0, 45.0, 19.0, 10.0, 8.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.44524383544922, -54.77109909057617, -52.096954345703125, -49.422813415527344, -46.7486686706543, -44.07452392578125, -41.4003791809082, -38.726234436035156, -36.052093505859375, -33.37794876098633, -30.703805923461914, -28.029661178588867, -25.355518341064453, -22.681373596191406, -20.00722885131836, -17.333086013793945, -14.658939361572266, -11.984795570373535, -9.310651779174805, -6.636507034301758, -3.9623632431030273, -1.2882194519042969, 1.38592529296875, 4.060068130493164, 6.734212875366211, 9.408356666564941, 12.082500457763672, 14.756645202636719, 17.430789947509766, 20.10493278503418, 22.779077529907227, 25.45322036743164, 28.127365112304688, 30.801509857177734, 33.47565460205078, 36.14979553222656, 38.82394027709961, 41.498085021972656, 44.1722297668457, 46.84637451171875, 49.52051544189453, 52.19466018676758, 54.868804931640625, 57.542945861816406, 60.21709060668945, 62.8912353515625, 65.56538391113281, 68.2395248413086, 70.91366577148438, 73.58780670166016, 76.26195526123047, 78.93609619140625, 81.61024475097656, 84.28438568115234, 86.95852661132812, 89.63267517089844, 92.30682373046875, 94.98096466064453, 97.65511322021484, 100.32925415039062, 103.00340270996094, 105.67754364013672, 108.3516845703125, 111.02583312988281, 113.6999740600586]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 6.0, 8.0, 8.0, 9.0, 15.0, 11.0, 17.0, 23.0, 24.0, 27.0, 28.0, 25.0, 29.0, 24.0, 42.0, 36.0, 38.0, 52.0, 37.0, 26.0, 48.0, 47.0, 30.0, 29.0, 41.0, 38.0, 32.0, 36.0, 35.0, 20.0, 19.0, 21.0, 18.0, 11.0, 18.0, 13.0, 7.0, 13.0, 8.0, 9.0, 4.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.084197998046875, -26.1844482421875, -25.284700393676758, -24.384950637817383, -23.48520278930664, -22.585453033447266, -21.68570327758789, -20.785953521728516, -19.886205673217773, -18.9864559173584, -18.086708068847656, -17.18695831298828, -16.287208557128906, -15.387460708618164, -14.487710952758789, -13.58796215057373, -12.688213348388672, -11.788464546203613, -10.888715744018555, -9.98896598815918, -9.089217185974121, -8.189468383789062, -7.289719104766846, -6.389969825744629, -5.49022102355957, -4.590472221374512, -3.690722942352295, -2.7909739017486572, -1.8912248611450195, -0.9914760589599609, -0.09172677993774414, 0.8080224990844727, 1.7077693939208984, 2.607518434524536, 3.507267475128174, 4.407016754150391, 5.306765556335449, 6.206514358520508, 7.106263637542725, 8.006012916564941, 8.90576171875, 9.805510520935059, 10.705259323120117, 11.605009078979492, 12.50475788116455, 13.40450668334961, 14.304256439208984, 15.204005241394043, 16.1037540435791, 17.003503799438477, 17.90325164794922, 18.803001403808594, 19.70275115966797, 20.60249900817871, 21.502248764038086, 22.401996612548828, 23.301746368408203, 24.201496124267578, 25.10124397277832, 26.000993728637695, 26.900741577148438, 27.800491333007812, 28.700241088867188, 29.599990844726562, 30.499738693237305]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 10.0, 9.0, 15.0, 11.0, 20.0, 18.0, 16.0, 22.0, 32.0, 20.0, 24.0, 29.0, 30.0, 31.0, 34.0, 43.0, 42.0, 35.0, 47.0, 33.0, 37.0, 31.0, 39.0, 40.0, 33.0, 30.0, 25.0, 31.0, 25.0, 26.0, 17.0, 15.0, 24.0, 14.0, 10.0, 8.0, 12.0, 6.0, 11.0, 10.0, 4.0, 4.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-42.59375, -41.2333984375, -39.873046875, -38.5126953125, -37.15234375, -35.7919921875, -34.431640625, -33.0712890625, -31.7109375, -30.3505859375, -28.990234375, -27.6298828125, -26.26953125, -24.9091796875, -23.548828125, -22.1884765625, -20.828125, -19.4677734375, -18.107421875, -16.7470703125, -15.38671875, -14.0263671875, -12.666015625, -11.3056640625, -9.9453125, -8.5849609375, -7.224609375, -5.8642578125, -4.50390625, -3.1435546875, -1.783203125, -0.4228515625, 0.9375, 2.2978515625, 3.658203125, 5.0185546875, 6.37890625, 7.7392578125, 9.099609375, 10.4599609375, 11.8203125, 13.1806640625, 14.541015625, 15.9013671875, 17.26171875, 18.6220703125, 19.982421875, 21.3427734375, 22.703125, 24.0634765625, 25.423828125, 26.7841796875, 28.14453125, 29.5048828125, 30.865234375, 32.2255859375, 33.5859375, 34.9462890625, 36.306640625, 37.6669921875, 39.02734375, 40.3876953125, 41.748046875, 43.1083984375, 44.46875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 12.0, 3.0, 15.0, 14.0, 21.0, 36.0, 46.0, 66.0, 92.0, 137.0, 163.0, 270.0, 365.0, 564.0, 745.0, 1106.0, 1590.0, 2315.0, 3508.0, 5365.0, 8277.0, 12489.0, 20248.0, 31952.0, 51580.0, 81918.0, 126912.0, 174760.0, 174876.0, 126072.0, 82268.0, 51296.0, 32045.0, 19996.0, 12728.0, 8158.0, 5377.0, 3475.0, 2378.0, 1586.0, 1075.0, 785.0, 574.0, 367.0, 270.0, 197.0, 136.0, 100.0, 61.0, 59.0, 30.0, 24.0, 19.0, 18.0, 3.0, 9.0, 4.0, 4.0, 4.0, 2.0], "bins": [-4.2265625, -4.094482421875, -3.96240234375, -3.830322265625, -3.6982421875, -3.566162109375, -3.43408203125, -3.302001953125, -3.169921875, -3.037841796875, -2.90576171875, -2.773681640625, -2.6416015625, -2.509521484375, -2.37744140625, -2.245361328125, -2.11328125, -1.981201171875, -1.84912109375, -1.717041015625, -1.5849609375, -1.452880859375, -1.32080078125, -1.188720703125, -1.056640625, -0.924560546875, -0.79248046875, -0.660400390625, -0.5283203125, -0.396240234375, -0.26416015625, -0.132080078125, 0.0, 0.132080078125, 0.26416015625, 0.396240234375, 0.5283203125, 0.660400390625, 0.79248046875, 0.924560546875, 1.056640625, 1.188720703125, 1.32080078125, 1.452880859375, 1.5849609375, 1.717041015625, 1.84912109375, 1.981201171875, 2.11328125, 2.245361328125, 2.37744140625, 2.509521484375, 2.6416015625, 2.773681640625, 2.90576171875, 3.037841796875, 3.169921875, 3.302001953125, 3.43408203125, 3.566162109375, 3.6982421875, 3.830322265625, 3.96240234375, 4.094482421875, 4.2265625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 1.0, 2.0, 5.0, 4.0, 11.0, 7.0, 8.0, 14.0, 12.0, 21.0, 18.0, 27.0, 32.0, 31.0, 37.0, 37.0, 36.0, 39.0, 41.0, 51.0, 42.0, 1067.0, 41.0, 47.0, 49.0, 35.0, 48.0, 32.0, 38.0, 37.0, 23.0, 18.0, 26.0, 17.0, 19.0, 11.0, 11.0, 8.0, 7.0, 7.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.8125, -23.7919921875, -22.771484375, -21.7509765625, -20.73046875, -19.7099609375, -18.689453125, -17.6689453125, -16.6484375, -15.6279296875, -14.607421875, -13.5869140625, -12.56640625, -11.5458984375, -10.525390625, -9.5048828125, -8.484375, -7.4638671875, -6.443359375, -5.4228515625, -4.40234375, -3.3818359375, -2.361328125, -1.3408203125, -0.3203125, 0.7001953125, 1.720703125, 2.7412109375, 3.76171875, 4.7822265625, 5.802734375, 6.8232421875, 7.84375, 8.8642578125, 9.884765625, 10.9052734375, 11.92578125, 12.9462890625, 13.966796875, 14.9873046875, 16.0078125, 17.0283203125, 18.048828125, 19.0693359375, 20.08984375, 21.1103515625, 22.130859375, 23.1513671875, 24.171875, 25.1923828125, 26.212890625, 27.2333984375, 28.25390625, 29.2744140625, 30.294921875, 31.3154296875, 32.3359375, 33.3564453125, 34.376953125, 35.3974609375, 36.41796875, 37.4384765625, 38.458984375, 39.4794921875, 40.5]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 12.0, 13.0, 28.0, 23.0, 43.0, 66.0, 103.0, 143.0, 219.0, 323.0, 557.0, 878.0, 1367.0, 2179.0, 3615.0, 6280.0, 10174.0, 18275.0, 32544.0, 60119.0, 111510.0, 191309.0, 1279580.0, 167332.0, 93223.0, 50677.0, 27796.0, 15730.0, 9076.0, 5335.0, 3170.0, 2030.0, 1201.0, 823.0, 487.0, 290.0, 200.0, 133.0, 89.0, 58.0, 39.0, 32.0, 15.0, 14.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.7578125, -5.585205078125, -5.41259765625, -5.239990234375, -5.0673828125, -4.894775390625, -4.72216796875, -4.549560546875, -4.376953125, -4.204345703125, -4.03173828125, -3.859130859375, -3.6865234375, -3.513916015625, -3.34130859375, -3.168701171875, -2.99609375, -2.823486328125, -2.65087890625, -2.478271484375, -2.3056640625, -2.133056640625, -1.96044921875, -1.787841796875, -1.615234375, -1.442626953125, -1.27001953125, -1.097412109375, -0.9248046875, -0.752197265625, -0.57958984375, -0.406982421875, -0.234375, -0.061767578125, 0.11083984375, 0.283447265625, 0.4560546875, 0.628662109375, 0.80126953125, 0.973876953125, 1.146484375, 1.319091796875, 1.49169921875, 1.664306640625, 1.8369140625, 2.009521484375, 2.18212890625, 2.354736328125, 2.52734375, 2.699951171875, 2.87255859375, 3.045166015625, 3.2177734375, 3.390380859375, 3.56298828125, 3.735595703125, 3.908203125, 4.080810546875, 4.25341796875, 4.426025390625, 4.5986328125, 4.771240234375, 4.94384765625, 5.116455078125, 5.2890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 5.0, 8.0, 5.0, 10.0, 3.0, 8.0, 11.0, 12.0, 7.0, 22.0, 15.0, 24.0, 24.0, 43.0, 37.0, 61.0, 74.0, 93.0, 79.0, 76.0, 66.0, 52.0, 44.0, 41.0, 36.0, 27.0, 15.0, 18.0, 10.0, 9.0, 15.0, 13.0, 3.0, 7.0, 2.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.06610107421875, -0.06407356262207031, -0.062046051025390625, -0.06001853942871094, -0.05799102783203125, -0.05596351623535156, -0.053936004638671875, -0.05190849304199219, -0.0498809814453125, -0.04785346984863281, -0.045825958251953125, -0.04379844665527344, -0.04177093505859375, -0.03974342346191406, -0.037715911865234375, -0.03568840026855469, -0.033660888671875, -0.03163337707519531, -0.029605865478515625, -0.027578353881835938, -0.02555084228515625, -0.023523330688476562, -0.021495819091796875, -0.019468307495117188, -0.0174407958984375, -0.015413284301757812, -0.013385772705078125, -0.011358261108398438, -0.00933074951171875, -0.0073032379150390625, -0.005275726318359375, -0.0032482147216796875, -0.001220703125, 0.0008068084716796875, 0.002834320068359375, 0.0048618316650390625, 0.00688934326171875, 0.008916854858398438, 0.010944366455078125, 0.012971878051757812, 0.0149993896484375, 0.017026901245117188, 0.019054412841796875, 0.021081924438476562, 0.02310943603515625, 0.025136947631835938, 0.027164459228515625, 0.029191970825195312, 0.031219482421875, 0.03324699401855469, 0.035274505615234375, 0.03730201721191406, 0.03932952880859375, 0.04135704040527344, 0.043384552001953125, 0.04541206359863281, 0.0474395751953125, 0.04946708679199219, 0.051494598388671875, 0.05352210998535156, 0.05554962158203125, 0.05757713317871094, 0.059604644775390625, 0.06163215637207031, 0.06365966796875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 7.0, 5.0, 6.0, 4.0, 12.0, 17.0, 9.0, 17.0, 21.0, 26.0, 31.0, 28.0, 46.0, 53.0, 74.0, 80.0, 96.0, 132.0, 164.0, 244.0, 326.0, 556.0, 1035.0, 2121.0, 5079.0, 13413.0, 40509.0, 142992.0, 513543.0, 234296.0, 60817.0, 19499.0, 6974.0, 2861.0, 1247.0, 655.0, 380.0, 271.0, 172.0, 150.0, 113.0, 91.0, 74.0, 58.0, 54.0, 43.0, 37.0, 36.0, 19.0, 15.0, 13.0, 9.0, 3.0, 12.0, 9.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.36376953125, -0.3522834777832031, -0.34079742431640625, -0.3293113708496094, -0.3178253173828125, -0.3063392639160156, -0.29485321044921875, -0.2833671569824219, -0.271881103515625, -0.2603950500488281, -0.24890899658203125, -0.23742294311523438, -0.2259368896484375, -0.21445083618164062, -0.20296478271484375, -0.19147872924804688, -0.17999267578125, -0.16850662231445312, -0.15702056884765625, -0.14553451538085938, -0.1340484619140625, -0.12256240844726562, -0.11107635498046875, -0.09959030151367188, -0.088104248046875, -0.07661819458007812, -0.06513214111328125, -0.053646087646484375, -0.0421600341796875, -0.030673980712890625, -0.01918792724609375, -0.007701873779296875, 0.0037841796875, 0.015270233154296875, 0.02675628662109375, 0.038242340087890625, 0.0497283935546875, 0.061214447021484375, 0.07270050048828125, 0.08418655395507812, 0.095672607421875, 0.10715866088867188, 0.11864471435546875, 0.13013076782226562, 0.1416168212890625, 0.15310287475585938, 0.16458892822265625, 0.17607498168945312, 0.18756103515625, 0.19904708862304688, 0.21053314208984375, 0.22201919555664062, 0.2335052490234375, 0.24499130249023438, 0.25647735595703125, 0.2679634094238281, 0.279449462890625, 0.2909355163574219, 0.30242156982421875, 0.3139076232910156, 0.3253936767578125, 0.3368797302246094, 0.34836578369140625, 0.3598518371582031, 0.371337890625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 13.0, 20.0, 14.0, 31.0, 72.0, 112.0, 174.0, 165.0, 141.0, 92.0, 62.0, 37.0, 14.0, 14.0, 10.0, 13.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07205367088317871, -0.06828658282756805, -0.0645194947719574, -0.06075240299105644, -0.056985314935445786, -0.05321822315454483, -0.049451135098934174, -0.04568404704332352, -0.04191695898771286, -0.0381498709321022, -0.03438277915120125, -0.03061569109559059, -0.026848603039979935, -0.02308151312172413, -0.019314423203468323, -0.015547335147857666, -0.01178024336695671, -0.00801315438002348, -0.004246064927428961, -0.00047897547483444214, 0.003288113512098789, 0.007055202499032021, 0.010822292417287827, 0.014589380472898483, 0.01835647039115429, 0.022123560309410095, 0.025890648365020752, 0.029657738283276558, 0.033424828201532364, 0.03719191625714302, 0.040959008038043976, 0.04472609609365463, 0.04849318414926529, 0.052260272204875946, 0.0560273639857769, 0.05979445204138756, 0.06356154382228851, 0.06732863187789917, 0.07109571993350983, 0.07486280798912048, 0.07862989604473114, 0.0823969841003418, 0.08616407215595245, 0.08993116021156311, 0.09369825571775436, 0.09746534377336502, 0.10123243182897568, 0.10499951988458633, 0.10876661539077759, 0.11253370344638824, 0.1163007915019989, 0.12006787955760956, 0.12383497506380081, 0.12760205566883087, 0.13136914372444153, 0.13513624668121338, 0.13890331983566284, 0.1426704078912735, 0.14643749594688416, 0.1502045840024948, 0.15397167205810547, 0.15773876011371613, 0.16150584816932678, 0.16527295112609863, 0.1690400391817093]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 7.0, 5.0, 3.0, 4.0, 5.0, 7.0, 12.0, 10.0, 11.0, 13.0, 14.0, 16.0, 19.0, 27.0, 23.0, 27.0, 29.0, 28.0, 43.0, 31.0, 41.0, 52.0, 29.0, 39.0, 45.0, 48.0, 33.0, 45.0, 36.0, 32.0, 34.0, 24.0, 23.0, 20.0, 24.0, 23.0, 25.0, 20.0, 15.0, 14.0, 10.0, 6.0, 7.0, 3.0, 5.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.03513616323471069, -0.03407980874180794, -0.03302345424890518, -0.03196709603071213, -0.030910741537809372, -0.029854387044906616, -0.02879803068935871, -0.027741674333810806, -0.02668531984090805, -0.025628965348005295, -0.02457260899245739, -0.023516252636909485, -0.02245989814400673, -0.021403543651103973, -0.02034718729555607, -0.019290830940008163, -0.018234476447105408, -0.017178121954202652, -0.016121765598654747, -0.015065410174429417, -0.014009054750204086, -0.012952699325978756, -0.011896343901753426, -0.010839988477528095, -0.009783633053302765, -0.008727277629077435, -0.007670922204852104, -0.006614566780626774, -0.0055582113564014435, -0.004501855932176113, -0.0034455005079507828, -0.0023891450837254524, -0.001332789659500122, -0.0002764342352747917, 0.0007799211889505386, 0.001836276613175869, 0.0028926320374011993, 0.00394898746162653, 0.00500534288585186, 0.00606169831007719, 0.007118053734302521, 0.008174409158527851, 0.009230764582753181, 0.010287120006978512, 0.011343475431203842, 0.012399830855429173, 0.013456186279654503, 0.014512541703879833, 0.015568897128105164, 0.01662525162100792, 0.017681607976555824, 0.01873796433210373, 0.019794318825006485, 0.02085067331790924, 0.021907029673457146, 0.02296338602900505, 0.024019740521907806, 0.025076095014810562, 0.026132451370358467, 0.027188807725906372, 0.028245162218809128, 0.029301516711711884, 0.03035787306725979, 0.031414229422807693, 0.03247058391571045]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 7.0, 10.0, 10.0, 15.0, 10.0, 19.0, 20.0, 16.0, 20.0, 31.0, 23.0, 24.0, 30.0, 26.0, 34.0, 35.0, 42.0, 42.0, 34.0, 49.0, 31.0, 36.0, 34.0, 38.0, 39.0, 34.0, 33.0, 20.0, 34.0, 25.0, 25.0, 13.0, 20.0, 23.0, 13.0, 11.0, 7.0, 13.0, 6.0, 10.0, 10.0, 5.0, 4.0, 4.0, 2.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-42.5625, -41.20361328125, -39.8447265625, -38.48583984375, -37.126953125, -35.76806640625, -34.4091796875, -33.05029296875, -31.69140625, -30.33251953125, -28.9736328125, -27.61474609375, -26.255859375, -24.89697265625, -23.5380859375, -22.17919921875, -20.8203125, -19.46142578125, -18.1025390625, -16.74365234375, -15.384765625, -14.02587890625, -12.6669921875, -11.30810546875, -9.94921875, -8.59033203125, -7.2314453125, -5.87255859375, -4.513671875, -3.15478515625, -1.7958984375, -0.43701171875, 0.921875, 2.28076171875, 3.6396484375, 4.99853515625, 6.357421875, 7.71630859375, 9.0751953125, 10.43408203125, 11.79296875, 13.15185546875, 14.5107421875, 15.86962890625, 17.228515625, 18.58740234375, 19.9462890625, 21.30517578125, 22.6640625, 24.02294921875, 25.3818359375, 26.74072265625, 28.099609375, 29.45849609375, 30.8173828125, 32.17626953125, 33.53515625, 34.89404296875, 36.2529296875, 37.61181640625, 38.970703125, 40.32958984375, 41.6884765625, 43.04736328125, 44.40625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 4.0, 11.0, 14.0, 13.0, 15.0, 17.0, 36.0, 38.0, 59.0, 83.0, 101.0, 189.0, 305.0, 539.0, 892.0, 1645.0, 2976.0, 6207.0, 16346.0, 60693.0, 306090.0, 501120.0, 108559.0, 25467.0, 8656.0, 3762.0, 1906.0, 1052.0, 652.0, 382.0, 225.0, 145.0, 112.0, 54.0, 45.0, 39.0, 31.0, 16.0, 11.0, 13.0, 9.0, 11.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.5234375, -11.1539306640625, -10.784423828125, -10.4149169921875, -10.04541015625, -9.6759033203125, -9.306396484375, -8.9368896484375, -8.5673828125, -8.1978759765625, -7.828369140625, -7.4588623046875, -7.08935546875, -6.7198486328125, -6.350341796875, -5.9808349609375, -5.611328125, -5.2418212890625, -4.872314453125, -4.5028076171875, -4.13330078125, -3.7637939453125, -3.394287109375, -3.0247802734375, -2.6552734375, -2.2857666015625, -1.916259765625, -1.5467529296875, -1.17724609375, -0.8077392578125, -0.438232421875, -0.0687255859375, 0.30078125, 0.6702880859375, 1.039794921875, 1.4093017578125, 1.77880859375, 2.1483154296875, 2.517822265625, 2.8873291015625, 3.2568359375, 3.6263427734375, 3.995849609375, 4.3653564453125, 4.73486328125, 5.1043701171875, 5.473876953125, 5.8433837890625, 6.212890625, 6.5823974609375, 6.951904296875, 7.3214111328125, 7.69091796875, 8.0604248046875, 8.429931640625, 8.7994384765625, 9.1689453125, 9.5384521484375, 9.907958984375, 10.2774658203125, 10.64697265625, 11.0164794921875, 11.385986328125, 11.7554931640625, 12.125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 8.0, 17.0, 9.0, 25.0, 32.0, 37.0, 54.0, 67.0, 94.0, 81.0, 1971.0, 275.0, 78.0, 80.0, 59.0, 44.0, 39.0, 32.0, 14.0, 15.0, 9.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.875, -143.7626953125, -139.650390625, -135.5380859375, -131.42578125, -127.3134765625, -123.201171875, -119.0888671875, -114.9765625, -110.8642578125, -106.751953125, -102.6396484375, -98.52734375, -94.4150390625, -90.302734375, -86.1904296875, -82.078125, -77.9658203125, -73.853515625, -69.7412109375, -65.62890625, -61.5166015625, -57.404296875, -53.2919921875, -49.1796875, -45.0673828125, -40.955078125, -36.8427734375, -32.73046875, -28.6181640625, -24.505859375, -20.3935546875, -16.28125, -12.1689453125, -8.056640625, -3.9443359375, 0.16796875, 4.2802734375, 8.392578125, 12.5048828125, 16.6171875, 20.7294921875, 24.841796875, 28.9541015625, 33.06640625, 37.1787109375, 41.291015625, 45.4033203125, 49.515625, 53.6279296875, 57.740234375, 61.8525390625, 65.96484375, 70.0771484375, 74.189453125, 78.3017578125, 82.4140625, 86.5263671875, 90.638671875, 94.7509765625, 98.86328125, 102.9755859375, 107.087890625, 111.2001953125, 115.3125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 16.0, 12.0, 20.0, 24.0, 46.0, 78.0, 112.0, 254.0, 500.0, 1309.0, 4723.0, 149646.0, 2966920.0, 18150.0, 2321.0, 790.0, 343.0, 191.0, 93.0, 52.0, 36.0, 26.0, 14.0, 11.0, 5.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.40625, -30.4013671875, -29.396484375, -28.3916015625, -27.38671875, -26.3818359375, -25.376953125, -24.3720703125, -23.3671875, -22.3623046875, -21.357421875, -20.3525390625, -19.34765625, -18.3427734375, -17.337890625, -16.3330078125, -15.328125, -14.3232421875, -13.318359375, -12.3134765625, -11.30859375, -10.3037109375, -9.298828125, -8.2939453125, -7.2890625, -6.2841796875, -5.279296875, -4.2744140625, -3.26953125, -2.2646484375, -1.259765625, -0.2548828125, 0.75, 1.7548828125, 2.759765625, 3.7646484375, 4.76953125, 5.7744140625, 6.779296875, 7.7841796875, 8.7890625, 9.7939453125, 10.798828125, 11.8037109375, 12.80859375, 13.8134765625, 14.818359375, 15.8232421875, 16.828125, 17.8330078125, 18.837890625, 19.8427734375, 20.84765625, 21.8525390625, 22.857421875, 23.8623046875, 24.8671875, 25.8720703125, 26.876953125, 27.8818359375, 28.88671875, 29.8916015625, 30.896484375, 31.9013671875, 32.90625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 11.0, 24.0, 68.0, 167.0, 347.0, 225.0, 93.0, 26.0, 19.0, 8.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.62771606445312, -86.21513366699219, -78.80254364013672, -71.38995361328125, -63.97737121582031, -56.56478500366211, -49.152198791503906, -41.7396125793457, -34.3270263671875, -26.914440155029297, -19.501853942871094, -12.08926773071289, -4.6766815185546875, 2.7359046936035156, 10.148490905761719, 17.561077117919922, 24.973663330078125, 32.38624954223633, 39.79883575439453, 47.211421966552734, 54.62400817871094, 62.03659439086914, 69.44918060302734, 76.86177062988281, 84.27435302734375, 91.68693542480469, 99.09952545166016, 106.51211547851562, 113.92469787597656, 121.3372802734375, 128.7498779296875, 136.16246032714844, 143.57504272460938, 150.9876251220703, 158.40020751953125, 165.81280517578125, 173.2253875732422, 180.63796997070312, 188.05056762695312, 195.46315002441406, 202.875732421875, 210.28831481933594, 217.70089721679688, 225.11349487304688, 232.5260772705078, 239.93865966796875, 247.35125732421875, 254.7638397216797, 262.1764221191406, 269.5890197753906, 277.0015869140625, 284.4141845703125, 291.8267822265625, 299.2393493652344, 306.6519470214844, 314.06451416015625, 321.47711181640625, 328.88970947265625, 336.3022766113281, 343.7148742675781, 351.12744140625, 358.5400390625, 365.95263671875, 373.3652038574219, 380.7778015136719]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 12.0, 12.0, 19.0, 15.0, 25.0, 35.0, 29.0, 34.0, 48.0, 53.0, 53.0, 55.0, 51.0, 49.0, 43.0, 46.0, 61.0, 41.0, 42.0, 61.0, 34.0, 25.0, 19.0, 19.0, 22.0, 21.0, 8.0, 9.0, 12.0, 10.0, 3.0, 8.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-114.47296142578125, -111.21401977539062, -107.955078125, -104.69613647460938, -101.43719482421875, -98.17825317382812, -94.9193115234375, -91.66036987304688, -88.40142822265625, -85.14248657226562, -81.883544921875, -78.62460327148438, -75.36566162109375, -72.10671997070312, -68.8477783203125, -65.58883666992188, -62.32990264892578, -59.070960998535156, -55.81201934814453, -52.553077697753906, -49.29413604736328, -46.035194396972656, -42.7762565612793, -39.51731491088867, -36.25837326049805, -32.99943161010742, -29.740489959716797, -26.481550216674805, -23.22260856628418, -19.963666915893555, -16.704727172851562, -13.445785522460938, -10.186843872070312, -6.927902698516846, -3.668961524963379, -0.4100208282470703, 2.8489208221435547, 6.10786247253418, 9.366802215576172, 12.625743865966797, 15.884685516357422, 19.143627166748047, 22.402568817138672, 25.661508560180664, 28.92045021057129, 32.17938995361328, 35.438331604003906, 38.69727325439453, 41.956214904785156, 45.21515655517578, 48.474098205566406, 51.73303985595703, 54.991981506347656, 58.25092315673828, 61.50986099243164, 64.768798828125, 68.02774047851562, 71.28668212890625, 74.54562377929688, 77.8045654296875, 81.06350708007812, 84.32244873046875, 87.58139038085938, 90.84033203125, 94.09927368164062]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 8.0, 11.0, 15.0, 19.0, 28.0, 37.0, 65.0, 92.0, 131.0, 141.0, 191.0, 285.0, 343.0, 465.0, 624.0, 905.0, 1040176.0, 1711.0, 904.0, 612.0, 418.0, 344.0, 272.0, 213.0, 138.0, 121.0, 81.0, 50.0, 48.0, 22.0, 30.0, 18.0, 15.0, 10.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.43365478515625, -26.28952980041504, -25.145404815673828, -24.00128173828125, -22.85715675354004, -21.713031768798828, -20.568906784057617, -19.424781799316406, -18.280658721923828, -17.136533737182617, -15.992409706115723, -14.848284721374512, -13.704160690307617, -12.560035705566406, -11.415910720825195, -10.2717866897583, -9.127660751342773, -7.983536243438721, -6.839411735534668, -5.695286750793457, -4.551162242889404, -3.4070377349853516, -2.2629127502441406, -1.118788719177246, 0.025336265563964844, 1.1694608926773071, 2.3135855197906494, 3.4577102661132812, 4.601834774017334, 5.745959281921387, 6.890084266662598, 8.034208297729492, 9.178333282470703, 10.322458267211914, 11.466582298278809, 12.61070728302002, 13.754831314086914, 14.898956298828125, 16.043081283569336, 17.187206268310547, 18.331329345703125, 19.475454330444336, 20.619579315185547, 21.763702392578125, 22.907827377319336, 24.051952362060547, 25.196077346801758, 26.34020233154297, 27.48432731628418, 28.62845230102539, 29.7725772857666, 30.916702270507812, 32.06082534790039, 33.20494842529297, 34.34907531738281, 35.49319839477539, 36.637325286865234, 37.78144836425781, 38.925575256347656, 40.069698333740234, 41.21382522583008, 42.357948303222656, 43.5020751953125, 44.64619827270508, 45.790321350097656]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 7.0, 6.0, 6.0, 4.0, 6.0, 8.0, 10.0, 18.0, 31.0, 57.0, 153.0, 10681.0, 51451892.0, 170.0, 48.0, 18.0, 14.0, 6.0, 7.0, 3.0, 8.0, 5.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2576.9765625, -2478.245849609375, -2379.51513671875, -2280.784423828125, -2182.0537109375, -2083.322998046875, -1984.59228515625, -1885.861572265625, -1787.130859375, -1688.400146484375, -1589.66943359375, -1490.938720703125, -1392.2080078125, -1293.477294921875, -1194.74658203125, -1096.015869140625, -997.2850341796875, -898.5543212890625, -799.8236083984375, -701.0928955078125, -602.3621826171875, -503.6314392089844, -404.90069580078125, -306.16998291015625, -207.43927001953125, -108.70854949951172, -9.977828979492188, 88.75289916992188, 187.48361206054688, 286.2143249511719, 384.945068359375, 483.67578125, 582.406494140625, 681.13720703125, 779.867919921875, 878.5986328125, 977.329345703125, 1076.06005859375, 1174.790771484375, 1273.521484375, 1372.252197265625, 1470.98291015625, 1569.713623046875, 1668.4443359375, 1767.175048828125, 1865.90576171875, 1964.636474609375, 2063.3671875, 2162.09814453125, 2260.828857421875, 2359.5595703125, 2458.290283203125, 2557.02099609375, 2655.751708984375, 2754.482421875, 2853.213134765625, 2951.94384765625, 3050.674560546875, 3149.4052734375, 3248.135986328125, 3346.86669921875, 3445.597412109375, 3544.328125, 3643.058837890625, 3741.78955078125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 11.0, 7.0, 7.0, 22.0, 38.0, 42.0, 63.0, 92.0, 121.0, 151.0, 202.0, 296.0, 379.0, 493.0, 833.0, 1177.0, 1647.0, 2427.0, 3529.0, 5489.0, 8623.0, 13538.0, 22836.0, 38799.0, 68611.0, 129379.0, 244227.0, 442904.0, 2928465.0, 1457480.0, 414743.0, 226887.0, 119603.0, 64500.0, 35892.0, 21091.0, 12758.0, 8105.0, 5143.0, 3307.0, 2320.0, 1588.0, 1052.0, 706.0, 546.0, 346.0, 290.0, 201.0, 130.0, 88.0, 74.0, 60.0, 34.0, 28.0, 23.0, 19.0, 10.0, 8.0, 5.0], "bins": [-2.091796875, -2.0301666259765625, -1.968536376953125, -1.9069061279296875, -1.84527587890625, -1.7836456298828125, -1.722015380859375, -1.6603851318359375, -1.5987548828125, -1.5371246337890625, -1.475494384765625, -1.4138641357421875, -1.35223388671875, -1.2906036376953125, -1.228973388671875, -1.1673431396484375, -1.105712890625, -1.0440826416015625, -0.982452392578125, -0.9208221435546875, -0.85919189453125, -0.7975616455078125, -0.735931396484375, -0.6743011474609375, -0.6126708984375, -0.5510406494140625, -0.489410400390625, -0.4277801513671875, -0.36614990234375, -0.3045196533203125, -0.242889404296875, -0.1812591552734375, -0.11962890625, -0.0579986572265625, 0.003631591796875, 0.0652618408203125, 0.12689208984375, 0.1885223388671875, 0.250152587890625, 0.3117828369140625, 0.3734130859375, 0.4350433349609375, 0.496673583984375, 0.5583038330078125, 0.61993408203125, 0.6815643310546875, 0.743194580078125, 0.8048248291015625, 0.866455078125, 0.9280853271484375, 0.989715576171875, 1.0513458251953125, 1.11297607421875, 1.1746063232421875, 1.236236572265625, 1.2978668212890625, 1.3594970703125, 1.4211273193359375, 1.482757568359375, 1.5443878173828125, 1.60601806640625, 1.6676483154296875, 1.729278564453125, 1.7909088134765625, 1.8525390625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 9.0, 10.0, 6.0, 10.0, 15.0, 7.0, 17.0, 21.0, 14.0, 23.0, 36.0, 32.0, 34.0, 31.0, 33.0, 44.0, 37.0, 46.0, 129.0, 759.0, 244.0, 43.0, 33.0, 39.0, 45.0, 37.0, 32.0, 20.0, 25.0, 22.0, 26.0, 18.0, 20.0, 29.0, 11.0, 8.0, 13.0, 6.0, 4.0, 6.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.2890625, -8.966552734375, -8.64404296875, -8.321533203125, -7.9990234375, -7.676513671875, -7.35400390625, -7.031494140625, -6.708984375, -6.386474609375, -6.06396484375, -5.741455078125, -5.4189453125, -5.096435546875, -4.77392578125, -4.451416015625, -4.12890625, -3.806396484375, -3.48388671875, -3.161376953125, -2.8388671875, -2.516357421875, -2.19384765625, -1.871337890625, -1.548828125, -1.226318359375, -0.90380859375, -0.581298828125, -0.2587890625, 0.063720703125, 0.38623046875, 0.708740234375, 1.03125, 1.353759765625, 1.67626953125, 1.998779296875, 2.3212890625, 2.643798828125, 2.96630859375, 3.288818359375, 3.611328125, 3.933837890625, 4.25634765625, 4.578857421875, 4.9013671875, 5.223876953125, 5.54638671875, 5.868896484375, 6.19140625, 6.513916015625, 6.83642578125, 7.158935546875, 7.4814453125, 7.803955078125, 8.12646484375, 8.448974609375, 8.771484375, 9.093994140625, 9.41650390625, 9.739013671875, 10.0615234375, 10.384033203125, 10.70654296875, 11.029052734375, 11.3515625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 10.0, 10.0, 32.0, 33.0, 42.0, 73.0, 108.0, 167.0, 223.0, 294.0, 451.0, 638.0, 1065.0, 1621.0, 2474.0, 3801.0, 5940.0, 9829.0, 15979.0, 27510.0, 47915.0, 84866.0, 156282.0, 298747.0, 587823.0, 3764142.0, 606279.0, 308329.0, 160117.0, 86595.0, 48067.0, 28051.0, 16457.0, 10107.0, 6183.0, 3929.0, 2487.0, 1591.0, 1032.0, 715.0, 454.0, 325.0, 218.0, 128.0, 96.0, 68.0, 30.0, 24.0, 18.0, 25.0, 15.0, 10.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0], "bins": [-2.296875, -2.22161865234375, -2.1463623046875, -2.07110595703125, -1.995849609375, -1.92059326171875, -1.8453369140625, -1.77008056640625, -1.69482421875, -1.61956787109375, -1.5443115234375, -1.46905517578125, -1.393798828125, -1.31854248046875, -1.2432861328125, -1.16802978515625, -1.0927734375, -1.01751708984375, -0.9422607421875, -0.86700439453125, -0.791748046875, -0.71649169921875, -0.6412353515625, -0.56597900390625, -0.49072265625, -0.41546630859375, -0.3402099609375, -0.26495361328125, -0.189697265625, -0.11444091796875, -0.0391845703125, 0.03607177734375, 0.111328125, 0.18658447265625, 0.2618408203125, 0.33709716796875, 0.412353515625, 0.48760986328125, 0.5628662109375, 0.63812255859375, 0.71337890625, 0.78863525390625, 0.8638916015625, 0.93914794921875, 1.014404296875, 1.08966064453125, 1.1649169921875, 1.24017333984375, 1.3154296875, 1.39068603515625, 1.4659423828125, 1.54119873046875, 1.616455078125, 1.69171142578125, 1.7669677734375, 1.84222412109375, 1.91748046875, 1.99273681640625, 2.0679931640625, 2.14324951171875, 2.218505859375, 2.29376220703125, 2.3690185546875, 2.44427490234375, 2.51953125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 4.0, 2.0, 14.0, 13.0, 22.0, 17.0, 19.0, 12.0, 20.0, 28.0, 20.0, 37.0, 29.0, 30.0, 36.0, 31.0, 39.0, 36.0, 101.0, 681.0, 338.0, 57.0, 41.0, 42.0, 40.0, 47.0, 39.0, 23.0, 23.0, 25.0, 19.0, 21.0, 26.0, 12.0, 13.0, 11.0, 12.0, 8.0, 6.0, 9.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.90625, -7.666259765625, -7.42626953125, -7.186279296875, -6.9462890625, -6.706298828125, -6.46630859375, -6.226318359375, -5.986328125, -5.746337890625, -5.50634765625, -5.266357421875, -5.0263671875, -4.786376953125, -4.54638671875, -4.306396484375, -4.06640625, -3.826416015625, -3.58642578125, -3.346435546875, -3.1064453125, -2.866455078125, -2.62646484375, -2.386474609375, -2.146484375, -1.906494140625, -1.66650390625, -1.426513671875, -1.1865234375, -0.946533203125, -0.70654296875, -0.466552734375, -0.2265625, 0.013427734375, 0.25341796875, 0.493408203125, 0.7333984375, 0.973388671875, 1.21337890625, 1.453369140625, 1.693359375, 1.933349609375, 2.17333984375, 2.413330078125, 2.6533203125, 2.893310546875, 3.13330078125, 3.373291015625, 3.61328125, 3.853271484375, 4.09326171875, 4.333251953125, 4.5732421875, 4.813232421875, 5.05322265625, 5.293212890625, 5.533203125, 5.773193359375, 6.01318359375, 6.253173828125, 6.4931640625, 6.733154296875, 6.97314453125, 7.213134765625, 7.453125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 1.0, 5.0, 7.0, 13.0, 24.0, 26.0, 32.0, 50.0, 71.0, 72.0, 105.0, 136.0, 192.0, 289.0, 312.0, 452.0, 706.0, 965.0, 1557.0, 2628.0, 4359.0, 8559.0, 19359.0, 62235.0, 5495867.0, 595629.0, 58679.0, 18992.0, 8323.0, 4279.0, 2475.0, 1561.0, 1012.0, 672.0, 460.0, 353.0, 259.0, 159.0, 140.0, 100.0, 84.0, 61.0, 42.0, 39.0, 27.0, 21.0, 12.0, 14.0, 12.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-10.609375, -10.2877197265625, -9.966064453125, -9.6444091796875, -9.32275390625, -9.0010986328125, -8.679443359375, -8.3577880859375, -8.0361328125, -7.7144775390625, -7.392822265625, -7.0711669921875, -6.74951171875, -6.4278564453125, -6.106201171875, -5.7845458984375, -5.462890625, -5.1412353515625, -4.819580078125, -4.4979248046875, -4.17626953125, -3.8546142578125, -3.532958984375, -3.2113037109375, -2.8896484375, -2.5679931640625, -2.246337890625, -1.9246826171875, -1.60302734375, -1.2813720703125, -0.959716796875, -0.6380615234375, -0.31640625, 0.0052490234375, 0.326904296875, 0.6485595703125, 0.97021484375, 1.2918701171875, 1.613525390625, 1.9351806640625, 2.2568359375, 2.5784912109375, 2.900146484375, 3.2218017578125, 3.54345703125, 3.8651123046875, 4.186767578125, 4.5084228515625, 4.830078125, 5.1517333984375, 5.473388671875, 5.7950439453125, 6.11669921875, 6.4383544921875, 6.760009765625, 7.0816650390625, 7.4033203125, 7.7249755859375, 8.046630859375, 8.3682861328125, 8.68994140625, 9.0115966796875, 9.333251953125, 9.6549072265625, 9.9765625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 5.0, 6.0, 4.0, 5.0, 9.0, 12.0, 10.0, 9.0, 23.0, 16.0, 20.0, 18.0, 21.0, 19.0, 25.0, 31.0, 44.0, 32.0, 32.0, 38.0, 51.0, 74.0, 141.0, 505.0, 394.0, 75.0, 40.0, 30.0, 32.0, 36.0, 26.0, 31.0, 19.0, 18.0, 20.0, 19.0, 12.0, 23.0, 9.0, 16.0, 15.0, 17.0, 10.0, 7.0, 2.0, 9.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.0703125, -4.90692138671875, -4.7435302734375, -4.58013916015625, -4.416748046875, -4.25335693359375, -4.0899658203125, -3.92657470703125, -3.76318359375, -3.59979248046875, -3.4364013671875, -3.27301025390625, -3.109619140625, -2.94622802734375, -2.7828369140625, -2.61944580078125, -2.4560546875, -2.29266357421875, -2.1292724609375, -1.96588134765625, -1.802490234375, -1.63909912109375, -1.4757080078125, -1.31231689453125, -1.14892578125, -0.98553466796875, -0.8221435546875, -0.65875244140625, -0.495361328125, -0.33197021484375, -0.1685791015625, -0.00518798828125, 0.158203125, 0.32159423828125, 0.4849853515625, 0.64837646484375, 0.811767578125, 0.97515869140625, 1.1385498046875, 1.30194091796875, 1.46533203125, 1.62872314453125, 1.7921142578125, 1.95550537109375, 2.118896484375, 2.28228759765625, 2.4456787109375, 2.60906982421875, 2.7724609375, 2.93585205078125, 3.0992431640625, 3.26263427734375, 3.426025390625, 3.58941650390625, 3.7528076171875, 3.91619873046875, 4.07958984375, 4.24298095703125, 4.4063720703125, 4.56976318359375, 4.733154296875, 4.89654541015625, 5.0599365234375, 5.22332763671875, 5.38671875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 5.0, 10.0, 9.0, 37.0, 80.0, 176.0, 309.0, 233.0, 98.0, 23.0, 11.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.99706268310547, -43.09306335449219, -42.189064025878906, -41.285064697265625, -40.381065368652344, -39.47706604003906, -38.57306671142578, -37.669071197509766, -36.765071868896484, -35.8610725402832, -34.95707321166992, -34.05307388305664, -33.14907455444336, -32.245079040527344, -31.34107780456543, -30.43707847595215, -29.533079147338867, -28.629079818725586, -27.725080490112305, -26.821083068847656, -25.917083740234375, -25.013084411621094, -24.109085083007812, -23.20508575439453, -22.30108642578125, -21.39708709716797, -20.493087768554688, -19.589088439941406, -18.685091018676758, -17.781091690063477, -16.877092361450195, -15.973093032836914, -15.069096565246582, -14.1650972366333, -13.261098861694336, -12.357099533081055, -11.453100204467773, -10.549101829528809, -9.645102500915527, -8.741104125976562, -7.837104797363281, -6.933105945587158, -6.029107093811035, -5.125107765197754, -4.221108913421631, -3.317110061645508, -2.4131107330322266, -1.5091118812561035, -0.6051130294799805, 0.29888594150543213, 1.2028849124908447, 2.106884002685547, 3.01088285446167, 3.914881706237793, 4.818881034851074, 5.722879886627197, 6.62687873840332, 7.530877590179443, 8.434876441955566, 9.338875770568848, 10.242874145507812, 11.146873474121094, 12.050872802734375, 12.954872131347656, 13.858870506286621]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 17.0, 22.0, 24.0, 23.0, 38.0, 42.0, 39.0, 53.0, 70.0, 67.0, 61.0, 71.0, 77.0, 71.0, 73.0, 55.0, 48.0, 25.0, 28.0, 17.0, 14.0, 12.0, 14.0, 8.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.263928413391113, -14.757878303527832, -14.25182819366455, -13.74577808380127, -13.239728927612305, -12.733678817749023, -12.227628707885742, -11.721578598022461, -11.21552848815918, -10.709478378295898, -10.203428268432617, -9.697378158569336, -9.191328048706055, -8.685277938842773, -8.179228782653809, -7.673178672790527, -7.167128562927246, -6.661078453063965, -6.155028343200684, -5.6489787101745605, -5.142928600311279, -4.636878490447998, -4.130828857421875, -3.6247787475585938, -3.1187286376953125, -2.6126785278320312, -2.106628656387329, -1.6005786657333374, -1.0945286750793457, -0.5884785652160645, -0.0824286937713623, 0.42362117767333984, 0.9296722412109375, 1.4357222318649292, 1.941772222518921, 2.447822093963623, 2.9538722038269043, 3.4599223136901855, 3.9659721851348877, 4.47202205657959, 4.978072166442871, 5.484122276306152, 5.990172386169434, 6.496222019195557, 7.002272129058838, 7.508322238922119, 8.014371871948242, 8.520421981811523, 9.026472091674805, 9.532522201538086, 10.038572311401367, 10.544622421264648, 11.05067253112793, 11.556722640991211, 12.062771797180176, 12.568821907043457, 13.074872016906738, 13.58092212677002, 14.0869722366333, 14.593022346496582, 15.099071502685547, 15.605121612548828, 16.11117172241211, 16.61722183227539, 17.123271942138672]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 8.0, 8.0, 14.0, 10.0, 22.0, 34.0, 43.0, 51.0, 76.0, 112.0, 158.0, 208.0, 315.0, 482.0, 732.0, 1237.0, 1983.0, 3272.0, 6075.0, 12140.0, 29409.0, 105581.0, 3804638.0, 153821.0, 38835.0, 16019.0, 7727.0, 4329.0, 2527.0, 1543.0, 939.0, 611.0, 402.0, 282.0, 177.0, 130.0, 89.0, 69.0, 33.0, 42.0, 18.0, 22.0, 10.0, 16.0, 7.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.2049560546875, -0.19803237915039062, -0.19110870361328125, -0.18418502807617188, -0.1772613525390625, -0.17033767700195312, -0.16341400146484375, -0.15649032592773438, -0.149566650390625, -0.14264297485351562, -0.13571929931640625, -0.12879562377929688, -0.1218719482421875, -0.11494827270507812, -0.10802459716796875, -0.10110092163085938, -0.09417724609375, -0.08725357055664062, -0.08032989501953125, -0.07340621948242188, -0.0664825439453125, -0.059558868408203125, -0.05263519287109375, -0.045711517333984375, -0.038787841796875, -0.031864166259765625, -0.02494049072265625, -0.018016815185546875, -0.0110931396484375, -0.004169464111328125, 0.00275421142578125, 0.009677886962890625, 0.0166015625, 0.023525238037109375, 0.03044891357421875, 0.037372589111328125, 0.0442962646484375, 0.051219940185546875, 0.05814361572265625, 0.06506729125976562, 0.071990966796875, 0.07891464233398438, 0.08583831787109375, 0.09276199340820312, 0.0996856689453125, 0.10660934448242188, 0.11353302001953125, 0.12045669555664062, 0.12738037109375, 0.13430404663085938, 0.14122772216796875, 0.14815139770507812, 0.1550750732421875, 0.16199874877929688, 0.16892242431640625, 0.17584609985351562, 0.182769775390625, 0.18969345092773438, 0.19661712646484375, 0.20354080200195312, 0.2104644775390625, 0.21738815307617188, 0.22431182861328125, 0.23123550415039062, 0.2381591796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 1.0, 3.0, 8.0, 5.0, 10.0, 15.0, 19.0, 20.0, 44.0, 751.0, 19.0, 20.0, 17.0, 6.0, 8.0, 3.0, 7.0, 3.0, 5.0, 3.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06097412109375, -0.05882549285888672, -0.05667686462402344, -0.054528236389160156, -0.052379608154296875, -0.050230979919433594, -0.04808235168457031, -0.04593372344970703, -0.04378509521484375, -0.04163646697998047, -0.03948783874511719, -0.037339210510253906, -0.035190582275390625, -0.033041954040527344, -0.030893325805664062, -0.02874469757080078, -0.0265960693359375, -0.02444744110107422, -0.022298812866210938, -0.020150184631347656, -0.018001556396484375, -0.015852928161621094, -0.013704299926757812, -0.011555671691894531, -0.00940704345703125, -0.007258415222167969, -0.0051097869873046875, -0.0029611587524414062, -0.000812530517578125, 0.0013360977172851562, 0.0034847259521484375, 0.005633354187011719, 0.007781982421875, 0.009930610656738281, 0.012079238891601562, 0.014227867126464844, 0.016376495361328125, 0.018525123596191406, 0.020673751831054688, 0.02282238006591797, 0.02497100830078125, 0.02711963653564453, 0.029268264770507812, 0.031416893005371094, 0.033565521240234375, 0.035714149475097656, 0.03786277770996094, 0.04001140594482422, 0.0421600341796875, 0.04430866241455078, 0.04645729064941406, 0.048605918884277344, 0.050754547119140625, 0.052903175354003906, 0.05505180358886719, 0.05720043182373047, 0.05934906005859375, 0.06149768829345703, 0.06364631652832031, 0.0657949447631836, 0.06794357299804688, 0.07009220123291016, 0.07224082946777344, 0.07438945770263672, 0.0765380859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 3.0, 11.0, 10.0, 12.0, 28.0, 31.0, 52.0, 76.0, 145.0, 272.0, 430.0, 894.0, 1901.0, 4254.0, 10652.0, 30840.0, 106418.0, 517918.0, 2725018.0, 622595.0, 119964.0, 33609.0, 11176.0, 4300.0, 1873.0, 865.0, 380.0, 232.0, 118.0, 66.0, 49.0, 30.0, 18.0, 21.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.223876953125, -0.21757888793945312, -0.21128082275390625, -0.20498275756835938, -0.1986846923828125, -0.19238662719726562, -0.18608856201171875, -0.17979049682617188, -0.173492431640625, -0.16719436645507812, -0.16089630126953125, -0.15459823608398438, -0.1483001708984375, -0.14200210571289062, -0.13570404052734375, -0.12940597534179688, -0.12310791015625, -0.11680984497070312, -0.11051177978515625, -0.10421371459960938, -0.0979156494140625, -0.09161758422851562, -0.08531951904296875, -0.07902145385742188, -0.072723388671875, -0.06642532348632812, -0.06012725830078125, -0.053829193115234375, -0.0475311279296875, -0.041233062744140625, -0.03493499755859375, -0.028636932373046875, -0.0223388671875, -0.016040802001953125, -0.00974273681640625, -0.003444671630859375, 0.0028533935546875, 0.009151458740234375, 0.01544952392578125, 0.021747589111328125, 0.028045654296875, 0.034343719482421875, 0.04064178466796875, 0.046939849853515625, 0.0532379150390625, 0.059535980224609375, 0.06583404541015625, 0.07213211059570312, 0.07843017578125, 0.08472824096679688, 0.09102630615234375, 0.09732437133789062, 0.1036224365234375, 0.10992050170898438, 0.11621856689453125, 0.12251663208007812, 0.128814697265625, 0.13511276245117188, 0.14141082763671875, 0.14770889282226562, 0.1540069580078125, 0.16030502319335938, 0.16660308837890625, 0.17290115356445312, 0.17919921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 4.0, 7.0, 7.0, 7.0, 9.0, 18.0, 30.0, 28.0, 42.0, 44.0, 89.0, 85.0, 127.0, 205.0, 287.0, 476.0, 777.0, 656.0, 367.0, 235.0, 172.0, 97.0, 69.0, 45.0, 55.0, 32.0, 23.0, 22.0, 16.0, 11.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0823974609375, -0.08009052276611328, -0.07778358459472656, -0.07547664642333984, -0.07316970825195312, -0.0708627700805664, -0.06855583190917969, -0.06624889373779297, -0.06394195556640625, -0.06163501739501953, -0.05932807922363281, -0.057021141052246094, -0.054714202880859375, -0.052407264709472656, -0.05010032653808594, -0.04779338836669922, -0.0454864501953125, -0.04317951202392578, -0.04087257385253906, -0.038565635681152344, -0.036258697509765625, -0.033951759338378906, -0.03164482116699219, -0.02933788299560547, -0.02703094482421875, -0.02472400665283203, -0.022417068481445312, -0.020110130310058594, -0.017803192138671875, -0.015496253967285156, -0.013189315795898438, -0.010882377624511719, -0.008575439453125, -0.006268501281738281, -0.0039615631103515625, -0.0016546249389648438, 0.000652313232421875, 0.0029592514038085938, 0.0052661895751953125, 0.007573127746582031, 0.00988006591796875, 0.012187004089355469, 0.014493942260742188, 0.016800880432128906, 0.019107818603515625, 0.021414756774902344, 0.023721694946289062, 0.02602863311767578, 0.0283355712890625, 0.03064250946044922, 0.03294944763183594, 0.035256385803222656, 0.037563323974609375, 0.039870262145996094, 0.04217720031738281, 0.04448413848876953, 0.04679107666015625, 0.04909801483154297, 0.05140495300292969, 0.053711891174316406, 0.056018829345703125, 0.058325767517089844, 0.06063270568847656, 0.06293964385986328, 0.06524658203125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 14.0, 28.0, 37.0, 79.0, 143.0, 207.0, 226.0, 145.0, 58.0, 39.0, 15.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7778091430664062, -0.7519026398658752, -0.7259961366653442, -0.700089693069458, -0.674183189868927, -0.648276686668396, -0.622370183467865, -0.596463680267334, -0.5705572366714478, -0.5446507334709167, -0.5187442302703857, -0.4928377568721771, -0.4669312834739685, -0.4410247802734375, -0.4151182770729065, -0.3892117738723755, -0.3633052706718445, -0.3373987674713135, -0.31149229407310486, -0.28558579087257385, -0.25967931747436523, -0.23377281427383423, -0.20786631107330322, -0.1819598227739334, -0.1560533344745636, -0.1301468461751938, -0.10424035042524338, -0.07833385467529297, -0.05242736637592316, -0.026520878076553345, -0.0006143748760223389, 0.025292113423347473, 0.05119854211807251, 0.07710503041744232, 0.10301152616739273, 0.12891802191734314, 0.15482451021671295, 0.18073099851608276, 0.20663750171661377, 0.23254399001598358, 0.2584504783153534, 0.2843569815158844, 0.310263454914093, 0.336169958114624, 0.36207646131515503, 0.38798293471336365, 0.41388943791389465, 0.43979591131210327, 0.4657024145126343, 0.4916089177131653, 0.5175154209136963, 0.5434218645095825, 0.5693283677101135, 0.5952348709106445, 0.6211413741111755, 0.6470478773117065, 0.6729543209075928, 0.6988608241081238, 0.7247673273086548, 0.750673770904541, 0.776580274105072, 0.802486777305603, 0.828393280506134, 0.854299783706665, 0.880206286907196]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 9.0, 8.0, 19.0, 20.0, 22.0, 30.0, 36.0, 35.0, 47.0, 54.0, 61.0, 59.0, 67.0, 78.0, 70.0, 60.0, 61.0, 56.0, 56.0, 26.0, 30.0, 20.0, 21.0, 13.0, 12.0, 8.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38632452487945557, -0.37400761246681213, -0.3616907000541687, -0.34937378764152527, -0.33705687522888184, -0.3247399628162384, -0.31242305040359497, -0.30010613799095154, -0.2877892255783081, -0.2754723131656647, -0.26315540075302124, -0.2508384883403778, -0.23852157592773438, -0.22620466351509094, -0.2138877511024475, -0.20157083868980408, -0.18925391137599945, -0.17693699896335602, -0.16462008655071259, -0.15230317413806915, -0.13998626172542572, -0.1276693493127823, -0.11535242944955826, -0.10303551703691483, -0.09071860462427139, -0.07840169221162796, -0.06608477979898453, -0.053767863661050797, -0.041450951248407364, -0.02913403883576393, -0.0168171226978302, -0.004500210285186768, 0.007816702127456665, 0.020133614540100098, 0.03245052695274353, 0.04476744309067726, 0.057084355503320694, 0.06940126419067383, 0.08171818405389786, 0.09403509646654129, 0.10635200887918472, 0.11866892129182816, 0.13098584115505219, 0.14330275356769562, 0.15561966598033905, 0.16793657839298248, 0.18025349080562592, 0.19257040321826935, 0.20488731563091278, 0.2172042280435562, 0.22952114045619965, 0.24183805286884308, 0.2541549801826477, 0.26647189259529114, 0.27878880500793457, 0.291105717420578, 0.30342262983322144, 0.31573954224586487, 0.3280564546585083, 0.34037336707115173, 0.35269027948379517, 0.3650071918964386, 0.37732410430908203, 0.38964101672172546, 0.4019579291343689]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 8.0, 13.0, 5.0, 17.0, 17.0, 34.0, 44.0, 63.0, 79.0, 128.0, 180.0, 261.0, 422.0, 617.0, 890.0, 1479.0, 2346.0, 3811.0, 6338.0, 12112.0, 25601.0, 226965.0, 699391.0, 33924.0, 14625.0, 7580.0, 4351.0, 2621.0, 1639.0, 967.0, 688.0, 408.0, 286.0, 192.0, 125.0, 97.0, 66.0, 45.0, 36.0, 19.0, 25.0, 13.0, 8.0, 3.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.31787109375, -0.3079795837402344, -0.29808807373046875, -0.2881965637207031, -0.2783050537109375, -0.2684135437011719, -0.25852203369140625, -0.24863052368164062, -0.238739013671875, -0.22884750366210938, -0.21895599365234375, -0.20906448364257812, -0.1991729736328125, -0.18928146362304688, -0.17938995361328125, -0.16949844360351562, -0.15960693359375, -0.14971542358398438, -0.13982391357421875, -0.12993240356445312, -0.1200408935546875, -0.11014938354492188, -0.10025787353515625, -0.09036636352539062, -0.080474853515625, -0.07058334350585938, -0.06069183349609375, -0.050800323486328125, -0.0409088134765625, -0.031017303466796875, -0.02112579345703125, -0.011234283447265625, -0.0013427734375, 0.008548736572265625, 0.01844024658203125, 0.028331756591796875, 0.0382232666015625, 0.048114776611328125, 0.05800628662109375, 0.06789779663085938, 0.077789306640625, 0.08768081665039062, 0.09757232666015625, 0.10746383666992188, 0.1173553466796875, 0.12724685668945312, 0.13713836669921875, 0.14702987670898438, 0.15692138671875, 0.16681289672851562, 0.17670440673828125, 0.18659591674804688, 0.1964874267578125, 0.20637893676757812, 0.21627044677734375, 0.22616195678710938, 0.236053466796875, 0.24594497680664062, 0.25583648681640625, 0.2657279968261719, 0.2756195068359375, 0.2855110168457031, 0.29540252685546875, 0.3052940368652344, 0.315185546875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 12.0, 13.0, 19.0, 26.0, 181.0, 426.0, 184.0, 31.0, 15.0, 8.0, 8.0, 9.0, 2.0, 3.0, 7.0, 4.0, 5.0, 2.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0614013671875, -0.05939292907714844, -0.057384490966796875, -0.05537605285644531, -0.05336761474609375, -0.05135917663574219, -0.049350738525390625, -0.04734230041503906, -0.0453338623046875, -0.04332542419433594, -0.041316986083984375, -0.03930854797363281, -0.03730010986328125, -0.03529167175292969, -0.033283233642578125, -0.03127479553222656, -0.029266357421875, -0.027257919311523438, -0.025249481201171875, -0.023241043090820312, -0.02123260498046875, -0.019224166870117188, -0.017215728759765625, -0.015207290649414062, -0.0131988525390625, -0.011190414428710938, -0.009181976318359375, -0.0071735382080078125, -0.00516510009765625, -0.0031566619873046875, -0.001148223876953125, 0.0008602142333984375, 0.00286865234375, 0.0048770904541015625, 0.006885528564453125, 0.008893966674804688, 0.01090240478515625, 0.012910842895507812, 0.014919281005859375, 0.016927719116210938, 0.0189361572265625, 0.020944595336914062, 0.022953033447265625, 0.024961471557617188, 0.02696990966796875, 0.028978347778320312, 0.030986785888671875, 0.03299522399902344, 0.035003662109375, 0.03701210021972656, 0.039020538330078125, 0.04102897644042969, 0.04303741455078125, 0.04504585266113281, 0.047054290771484375, 0.04906272888183594, 0.0510711669921875, 0.05307960510253906, 0.055088043212890625, 0.05709648132324219, 0.05910491943359375, 0.06111335754394531, 0.06312179565429688, 0.06513023376464844, 0.067138671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 11.0, 13.0, 11.0, 19.0, 26.0, 36.0, 51.0, 86.0, 141.0, 211.0, 306.0, 557.0, 1038.0, 2093.0, 5188.0, 14830.0, 52014.0, 218862.0, 507783.0, 180027.0, 43579.0, 12728.0, 4606.0, 1982.0, 945.0, 527.0, 304.0, 165.0, 131.0, 97.0, 41.0, 45.0, 24.0, 21.0, 12.0, 5.0, 5.0, 9.0, 6.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.3056640625, -0.2967872619628906, -0.28791046142578125, -0.2790336608886719, -0.2701568603515625, -0.2612800598144531, -0.25240325927734375, -0.24352645874023438, -0.234649658203125, -0.22577285766601562, -0.21689605712890625, -0.20801925659179688, -0.1991424560546875, -0.19026565551757812, -0.18138885498046875, -0.17251205444335938, -0.16363525390625, -0.15475845336914062, -0.14588165283203125, -0.13700485229492188, -0.1281280517578125, -0.11925125122070312, -0.11037445068359375, -0.10149765014648438, -0.092620849609375, -0.08374404907226562, -0.07486724853515625, -0.06599044799804688, -0.0571136474609375, -0.048236846923828125, -0.03936004638671875, -0.030483245849609375, -0.0216064453125, -0.012729644775390625, -0.00385284423828125, 0.005023956298828125, 0.0139007568359375, 0.022777557373046875, 0.03165435791015625, 0.040531158447265625, 0.049407958984375, 0.058284759521484375, 0.06716156005859375, 0.07603836059570312, 0.0849151611328125, 0.09379196166992188, 0.10266876220703125, 0.11154556274414062, 0.12042236328125, 0.12929916381835938, 0.13817596435546875, 0.14705276489257812, 0.1559295654296875, 0.16480636596679688, 0.17368316650390625, 0.18255996704101562, 0.191436767578125, 0.20031356811523438, 0.20919036865234375, 0.21806716918945312, 0.2269439697265625, 0.23582077026367188, 0.24469757080078125, 0.2535743713378906, 0.262451171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 12.0, 11.0, 11.0, 14.0, 21.0, 25.0, 21.0, 28.0, 29.0, 31.0, 34.0, 41.0, 51.0, 46.0, 41.0, 48.0, 46.0, 52.0, 50.0, 45.0, 47.0, 27.0, 42.0, 34.0, 37.0, 34.0, 19.0, 23.0, 13.0, 15.0, 13.0, 8.0, 2.0, 9.0, 7.0, 6.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.253173828125, -0.24493789672851562, -0.23670196533203125, -0.22846603393554688, -0.2202301025390625, -0.21199417114257812, -0.20375823974609375, -0.19552230834960938, -0.187286376953125, -0.17905044555664062, -0.17081451416015625, -0.16257858276367188, -0.1543426513671875, -0.14610671997070312, -0.13787078857421875, -0.12963485717773438, -0.12139892578125, -0.11316299438476562, -0.10492706298828125, -0.09669113159179688, -0.0884552001953125, -0.08021926879882812, -0.07198333740234375, -0.06374740600585938, -0.055511474609375, -0.047275543212890625, -0.03903961181640625, -0.030803680419921875, -0.0225677490234375, -0.014331817626953125, -0.00609588623046875, 0.002140045166015625, 0.0103759765625, 0.018611907958984375, 0.02684783935546875, 0.035083770751953125, 0.0433197021484375, 0.051555633544921875, 0.05979156494140625, 0.06802749633789062, 0.076263427734375, 0.08449935913085938, 0.09273529052734375, 0.10097122192382812, 0.1092071533203125, 0.11744308471679688, 0.12567901611328125, 0.13391494750976562, 0.14215087890625, 0.15038681030273438, 0.15862274169921875, 0.16685867309570312, 0.1750946044921875, 0.18333053588867188, 0.19156646728515625, 0.19980239868164062, 0.208038330078125, 0.21627426147460938, 0.22451019287109375, 0.23274612426757812, 0.2409820556640625, 0.24921798706054688, 0.25745391845703125, 0.2656898498535156, 0.27392578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 4.0, 5.0, 11.0, 10.0, 18.0, 24.0, 52.0, 62.0, 98.0, 176.0, 272.0, 529.0, 1157.0, 2838.0, 8840.0, 60830.0, 877939.0, 80101.0, 9944.0, 3124.0, 1210.0, 544.0, 290.0, 151.0, 83.0, 72.0, 50.0, 44.0, 25.0, 18.0, 10.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.505828857421875, -0.48870849609375, -0.471588134765625, -0.4544677734375, -0.437347412109375, -0.42022705078125, -0.403106689453125, -0.385986328125, -0.368865966796875, -0.35174560546875, -0.334625244140625, -0.3175048828125, -0.300384521484375, -0.28326416015625, -0.266143798828125, -0.2490234375, -0.231903076171875, -0.21478271484375, -0.197662353515625, -0.1805419921875, -0.163421630859375, -0.14630126953125, -0.129180908203125, -0.112060546875, -0.094940185546875, -0.07781982421875, -0.060699462890625, -0.0435791015625, -0.026458740234375, -0.00933837890625, 0.007781982421875, 0.02490234375, 0.042022705078125, 0.05914306640625, 0.076263427734375, 0.0933837890625, 0.110504150390625, 0.12762451171875, 0.144744873046875, 0.161865234375, 0.178985595703125, 0.19610595703125, 0.213226318359375, 0.2303466796875, 0.247467041015625, 0.26458740234375, 0.281707763671875, 0.298828125, 0.315948486328125, 0.33306884765625, 0.350189208984375, 0.3673095703125, 0.384429931640625, 0.40155029296875, 0.418670654296875, 0.435791015625, 0.452911376953125, 0.47003173828125, 0.487152099609375, 0.5042724609375, 0.521392822265625, 0.53851318359375, 0.555633544921875, 0.57275390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 8.0, 4.0, 1.0, 8.0, 6.0, 11.0, 15.0, 18.0, 28.0, 35.0, 51.0, 46.0, 70.0, 59.0, 73.0, 58.0, 100.0, 75.0, 59.0, 51.0, 43.0, 33.0, 39.0, 24.0, 21.0, 7.0, 15.0, 9.0, 5.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.722574234008789e-05, -1.6555190086364746e-05, -1.58846378326416e-05, -1.5214085578918457e-05, -1.4543533325195312e-05, -1.3872981071472168e-05, -1.3202428817749023e-05, -1.2531876564025879e-05, -1.1861324310302734e-05, -1.119077205657959e-05, -1.0520219802856445e-05, -9.8496675491333e-06, -9.179115295410156e-06, -8.508563041687012e-06, -7.838010787963867e-06, -7.167458534240723e-06, -6.496906280517578e-06, -5.826354026794434e-06, -5.155801773071289e-06, -4.4852495193481445e-06, -3.814697265625e-06, -3.1441450119018555e-06, -2.473592758178711e-06, -1.8030405044555664e-06, -1.1324882507324219e-06, -4.6193599700927734e-07, 2.086162567138672e-07, 8.791685104370117e-07, 1.5497207641601562e-06, 2.2202730178833008e-06, 2.8908252716064453e-06, 3.56137752532959e-06, 4.231929779052734e-06, 4.902482032775879e-06, 5.5730342864990234e-06, 6.243586540222168e-06, 6.9141387939453125e-06, 7.584691047668457e-06, 8.255243301391602e-06, 8.925795555114746e-06, 9.59634780883789e-06, 1.0266900062561035e-05, 1.093745231628418e-05, 1.1608004570007324e-05, 1.2278556823730469e-05, 1.2949109077453613e-05, 1.3619661331176758e-05, 1.4290213584899902e-05, 1.4960765838623047e-05, 1.563131809234619e-05, 1.6301870346069336e-05, 1.697242259979248e-05, 1.7642974853515625e-05, 1.831352710723877e-05, 1.8984079360961914e-05, 1.965463161468506e-05, 2.0325183868408203e-05, 2.0995736122131348e-05, 2.1666288375854492e-05, 2.2336840629577637e-05, 2.300739288330078e-05, 2.3677945137023926e-05, 2.434849739074707e-05, 2.5019049644470215e-05, 2.568960189819336e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 7.0, 5.0, 17.0, 23.0, 25.0, 51.0, 62.0, 91.0, 113.0, 201.0, 291.0, 410.0, 741.0, 1351.0, 2493.0, 4686.0, 10600.0, 26936.0, 82704.0, 312472.0, 426013.0, 116963.0, 35916.0, 13589.0, 6000.0, 2900.0, 1555.0, 845.0, 516.0, 305.0, 207.0, 128.0, 97.0, 73.0, 47.0, 30.0, 22.0, 16.0, 13.0, 5.0, 5.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.23828125, -0.23109054565429688, -0.22389984130859375, -0.21670913696289062, -0.2095184326171875, -0.20232772827148438, -0.19513702392578125, -0.18794631958007812, -0.180755615234375, -0.17356491088867188, -0.16637420654296875, -0.15918350219726562, -0.1519927978515625, -0.14480209350585938, -0.13761138916015625, -0.13042068481445312, -0.12322998046875, -0.11603927612304688, -0.10884857177734375, -0.10165786743164062, -0.0944671630859375, -0.08727645874023438, -0.08008575439453125, -0.07289505004882812, -0.065704345703125, -0.058513641357421875, -0.05132293701171875, -0.044132232666015625, -0.0369415283203125, -0.029750823974609375, -0.02256011962890625, -0.015369415283203125, -0.0081787109375, -0.000988006591796875, 0.00620269775390625, 0.013393402099609375, 0.0205841064453125, 0.027774810791015625, 0.03496551513671875, 0.042156219482421875, 0.049346923828125, 0.056537628173828125, 0.06372833251953125, 0.07091903686523438, 0.0781097412109375, 0.08530044555664062, 0.09249114990234375, 0.09968185424804688, 0.10687255859375, 0.11406326293945312, 0.12125396728515625, 0.12844467163085938, 0.1356353759765625, 0.14282608032226562, 0.15001678466796875, 0.15720748901367188, 0.164398193359375, 0.17158889770507812, 0.17877960205078125, 0.18597030639648438, 0.1931610107421875, 0.20035171508789062, 0.20754241943359375, 0.21473312377929688, 0.221923828125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 5.0, 3.0, 8.0, 12.0, 16.0, 15.0, 26.0, 35.0, 28.0, 38.0, 49.0, 44.0, 62.0, 77.0, 71.0, 69.0, 56.0, 50.0, 58.0, 47.0, 48.0, 30.0, 27.0, 20.0, 35.0, 12.0, 10.0, 7.0, 9.0, 4.0, 6.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.204833984375, -0.19755172729492188, -0.19026947021484375, -0.18298721313476562, -0.1757049560546875, -0.16842269897460938, -0.16114044189453125, -0.15385818481445312, -0.146575927734375, -0.13929367065429688, -0.13201141357421875, -0.12472915649414062, -0.1174468994140625, -0.11016464233398438, -0.10288238525390625, -0.09560012817382812, -0.08831787109375, -0.08103561401367188, -0.07375335693359375, -0.06647109985351562, -0.0591888427734375, -0.051906585693359375, -0.04462432861328125, -0.037342071533203125, -0.030059814453125, -0.022777557373046875, -0.01549530029296875, -0.008213043212890625, -0.0009307861328125, 0.006351470947265625, 0.01363372802734375, 0.020915985107421875, 0.0281982421875, 0.035480499267578125, 0.04276275634765625, 0.050045013427734375, 0.0573272705078125, 0.06460952758789062, 0.07189178466796875, 0.07917404174804688, 0.086456298828125, 0.09373855590820312, 0.10102081298828125, 0.10830307006835938, 0.1155853271484375, 0.12286758422851562, 0.13014984130859375, 0.13743209838867188, 0.14471435546875, 0.15199661254882812, 0.15927886962890625, 0.16656112670898438, 0.1738433837890625, 0.18112564086914062, 0.18840789794921875, 0.19569015502929688, 0.202972412109375, 0.21025466918945312, 0.21753692626953125, 0.22481918334960938, 0.2321014404296875, 0.23938369750976562, 0.24666595458984375, 0.2539482116699219, 0.26123046875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 18.0, 25.0, 83.0, 195.0, 336.0, 200.0, 74.0, 25.0, 13.0, 6.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.972434043884277, -4.819847106933594, -4.667260646820068, -4.514673709869385, -4.362086772918701, -4.209499835968018, -4.056913375854492, -3.9043264389038086, -3.751739501953125, -3.5991528034210205, -3.446565866470337, -3.2939791679382324, -3.141392230987549, -2.9888055324554443, -2.83621883392334, -2.6836318969726562, -2.5310451984405518, -2.3784584999084473, -2.2258715629577637, -2.073284864425659, -1.9206979274749756, -1.768111228942871, -1.615524411201477, -1.462937593460083, -1.310350775718689, -1.157763957977295, -1.0051771402359009, -0.8525903820991516, -0.7000035643577576, -0.5474167466163635, -0.39482998847961426, -0.24224317073822021, -0.08965635299682617, 0.06293044984340668, 0.21551725268363953, 0.3681040406227112, 0.5206908583641052, 0.6732776761054993, 0.8258644342422485, 0.9784512519836426, 1.1310380697250366, 1.2836248874664307, 1.4362117052078247, 1.5887985229492188, 1.7413852214813232, 1.8939721584320068, 2.0465588569641113, 2.199145793914795, 2.3517324924468994, 2.504319190979004, 2.6569061279296875, 2.809492826461792, 2.9620797634124756, 3.11466646194458, 3.2672533988952637, 3.419840097427368, 3.5724267959594727, 3.725013494491577, 3.8776004314422607, 4.030187129974365, 4.182774066925049, 4.335361003875732, 4.487947463989258, 4.640534400939941, 4.793121337890625]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 5.0, 7.0, 8.0, 17.0, 23.0, 32.0, 60.0, 93.0, 153.0, 168.0, 145.0, 96.0, 52.0, 43.0, 24.0, 12.0, 10.0, 5.0, 9.0, 3.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.309418201446533, -5.1514363288879395, -4.993454933166504, -4.83547306060791, -4.677491188049316, -4.519509315490723, -4.361527442932129, -4.203546047210693, -4.0455641746521, -3.887582302093506, -3.729600667953491, -3.5716190338134766, -3.413637161254883, -3.255655288696289, -3.0976736545562744, -2.9396920204162598, -2.781710147857666, -2.6237282752990723, -2.4657466411590576, -2.307765007019043, -2.149783134460449, -1.991801381111145, -1.8338196277618408, -1.6758378744125366, -1.5178561210632324, -1.3598743677139282, -1.201892614364624, -1.0439108610153198, -0.8859291076660156, -0.7279473543167114, -0.5699656009674072, -0.411983847618103, -0.25400257110595703, -0.09602081775665283, 0.06196093559265137, 0.21994268894195557, 0.37792444229125977, 0.535906195640564, 0.6938879489898682, 0.8518697023391724, 1.0098514556884766, 1.1678332090377808, 1.325814962387085, 1.4837967157363892, 1.6417784690856934, 1.7997602224349976, 1.9577419757843018, 2.1157236099243164, 2.27370548248291, 2.431687355041504, 2.5896689891815186, 2.747650623321533, 2.905632495880127, 3.0636143684387207, 3.2215960025787354, 3.37957763671875, 3.5375595092773438, 3.6955413818359375, 3.853523015975952, 4.011504650115967, 4.1694865226745605, 4.327468395233154, 4.48544979095459, 4.643431663513184, 4.801413536071777]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 13.0, 8.0, 9.0, 7.0, 13.0, 21.0, 34.0, 82.0, 260.0, 1243.0, 9365.0, 654588.0, 3512291.0, 13534.0, 2011.0, 478.0, 156.0, 60.0, 28.0, 18.0, 14.0, 8.0, 11.0, 5.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7890625, -1.729522705078125, -1.66998291015625, -1.610443115234375, -1.5509033203125, -1.491363525390625, -1.43182373046875, -1.372283935546875, -1.312744140625, -1.253204345703125, -1.19366455078125, -1.134124755859375, -1.0745849609375, -1.015045166015625, -0.95550537109375, -0.895965576171875, -0.83642578125, -0.776885986328125, -0.71734619140625, -0.657806396484375, -0.5982666015625, -0.538726806640625, -0.47918701171875, -0.419647216796875, -0.360107421875, -0.300567626953125, -0.24102783203125, -0.181488037109375, -0.1219482421875, -0.062408447265625, -0.00286865234375, 0.056671142578125, 0.1162109375, 0.175750732421875, 0.23529052734375, 0.294830322265625, 0.3543701171875, 0.413909912109375, 0.47344970703125, 0.532989501953125, 0.592529296875, 0.652069091796875, 0.71160888671875, 0.771148681640625, 0.8306884765625, 0.890228271484375, 0.94976806640625, 1.009307861328125, 1.06884765625, 1.128387451171875, 1.18792724609375, 1.247467041015625, 1.3070068359375, 1.366546630859375, 1.42608642578125, 1.485626220703125, 1.545166015625, 1.604705810546875, 1.66424560546875, 1.723785400390625, 1.7833251953125, 1.842864990234375, 1.90240478515625, 1.961944580078125, 2.021484375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 5.0, 8.0, 8.0, 16.0, 13.0, 10.0, 29.0, 58.0, 108.0, 169.0, 191.0, 150.0, 61.0, 55.0, 16.0, 11.0, 5.0, 5.0, 13.0, 12.0, 6.0, 3.0, 2.0, 4.0, 6.0, 3.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.034820556640625, -0.033509254455566406, -0.03219795227050781, -0.03088665008544922, -0.029575347900390625, -0.02826404571533203, -0.026952743530273438, -0.025641441345214844, -0.02433013916015625, -0.023018836975097656, -0.021707534790039062, -0.02039623260498047, -0.019084930419921875, -0.01777362823486328, -0.016462326049804688, -0.015151023864746094, -0.0138397216796875, -0.012528419494628906, -0.011217117309570312, -0.009905815124511719, -0.008594512939453125, -0.007283210754394531, -0.0059719085693359375, -0.004660606384277344, -0.00334930419921875, -0.0020380020141601562, -0.0007266998291015625, 0.0005846023559570312, 0.001895904541015625, 0.0032072067260742188, 0.0045185089111328125, 0.005829811096191406, 0.00714111328125, 0.008452415466308594, 0.009763717651367188, 0.011075019836425781, 0.012386322021484375, 0.013697624206542969, 0.015008926391601562, 0.016320228576660156, 0.01763153076171875, 0.018942832946777344, 0.020254135131835938, 0.02156543731689453, 0.022876739501953125, 0.02418804168701172, 0.025499343872070312, 0.026810646057128906, 0.0281219482421875, 0.029433250427246094, 0.030744552612304688, 0.03205585479736328, 0.033367156982421875, 0.03467845916748047, 0.03598976135253906, 0.037301063537597656, 0.03861236572265625, 0.039923667907714844, 0.04123497009277344, 0.04254627227783203, 0.043857574462890625, 0.04516887664794922, 0.04648017883300781, 0.047791481018066406, 0.049102783203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 7.0, 7.0, 12.0, 7.0, 18.0, 33.0, 33.0, 72.0, 81.0, 130.0, 180.0, 306.0, 601.0, 1145.0, 2458.0, 6579.0, 21231.0, 97273.0, 1304138.0, 2593578.0, 127856.0, 25318.0, 7466.0, 2806.0, 1278.0, 670.0, 354.0, 216.0, 132.0, 104.0, 56.0, 40.0, 27.0, 20.0, 12.0, 10.0, 12.0, 6.0, 4.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.441650390625, -0.4259223937988281, -0.41019439697265625, -0.3944664001464844, -0.3787384033203125, -0.3630104064941406, -0.34728240966796875, -0.3315544128417969, -0.315826416015625, -0.3000984191894531, -0.28437042236328125, -0.2686424255371094, -0.2529144287109375, -0.23718643188476562, -0.22145843505859375, -0.20573043823242188, -0.19000244140625, -0.17427444458007812, -0.15854644775390625, -0.14281845092773438, -0.1270904541015625, -0.11136245727539062, -0.09563446044921875, -0.07990646362304688, -0.064178466796875, -0.048450469970703125, -0.03272247314453125, -0.016994476318359375, -0.0012664794921875, 0.014461517333984375, 0.03018951416015625, 0.045917510986328125, 0.0616455078125, 0.07737350463867188, 0.09310150146484375, 0.10882949829101562, 0.1245574951171875, 0.14028549194335938, 0.15601348876953125, 0.17174148559570312, 0.187469482421875, 0.20319747924804688, 0.21892547607421875, 0.23465347290039062, 0.2503814697265625, 0.2661094665527344, 0.28183746337890625, 0.2975654602050781, 0.31329345703125, 0.3290214538574219, 0.34474945068359375, 0.3604774475097656, 0.3762054443359375, 0.3919334411621094, 0.40766143798828125, 0.4233894348144531, 0.439117431640625, 0.4548454284667969, 0.47057342529296875, 0.4863014221191406, 0.5020294189453125, 0.5177574157714844, 0.5334854125976562, 0.5492134094238281, 0.56494140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 7.0, 13.0, 24.0, 15.0, 29.0, 39.0, 67.0, 97.0, 173.0, 337.0, 856.0, 1486.0, 475.0, 191.0, 92.0, 69.0, 23.0, 29.0, 14.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06597900390625, -0.06301498413085938, -0.06005096435546875, -0.057086944580078125, -0.0541229248046875, -0.051158905029296875, -0.04819488525390625, -0.045230865478515625, -0.042266845703125, -0.039302825927734375, -0.03633880615234375, -0.033374786376953125, -0.0304107666015625, -0.027446746826171875, -0.02448272705078125, -0.021518707275390625, -0.0185546875, -0.015590667724609375, -0.01262664794921875, -0.009662628173828125, -0.0066986083984375, -0.003734588623046875, -0.00077056884765625, 0.002193450927734375, 0.005157470703125, 0.008121490478515625, 0.01108551025390625, 0.014049530029296875, 0.0170135498046875, 0.019977569580078125, 0.02294158935546875, 0.025905609130859375, 0.02886962890625, 0.031833648681640625, 0.03479766845703125, 0.037761688232421875, 0.0407257080078125, 0.043689727783203125, 0.04665374755859375, 0.049617767333984375, 0.052581787109375, 0.055545806884765625, 0.05850982666015625, 0.061473846435546875, 0.0644378662109375, 0.06740188598632812, 0.07036590576171875, 0.07332992553710938, 0.0762939453125, 0.07925796508789062, 0.08222198486328125, 0.08518600463867188, 0.0881500244140625, 0.09111404418945312, 0.09407806396484375, 0.09704208374023438, 0.100006103515625, 0.10297012329101562, 0.10593414306640625, 0.10889816284179688, 0.1118621826171875, 0.11482620239257812, 0.11779022216796875, 0.12075424194335938, 0.12371826171875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 10.0, 9.0, 20.0, 57.0, 162.0, 391.0, 267.0, 58.0, 16.0, 9.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6056296825408936, -1.5581352710723877, -1.5106408596038818, -1.463146448135376, -1.4156520366668701, -1.3681575059890747, -1.3206630945205688, -1.273168683052063, -1.2256742715835571, -1.1781798601150513, -1.1306854486465454, -1.0831910371780396, -1.0356965065002441, -0.9882021546363831, -0.9407076835632324, -0.8932132720947266, -0.8457188606262207, -0.7982244491577148, -0.750730037689209, -0.7032355666160583, -0.6557411551475525, -0.6082467436790466, -0.560752272605896, -0.5132578611373901, -0.4657634496688843, -0.4182690382003784, -0.37077459692955017, -0.3232801556587219, -0.27578574419021606, -0.228291317820549, -0.18079689145088196, -0.1333024501800537, -0.08580803871154785, -0.0383136123418808, 0.009180814027786255, 0.05667524039745331, 0.10416966676712036, 0.15166409313678741, 0.19915851950645447, 0.24665296077728271, 0.2941473722457886, 0.34164178371429443, 0.3891362249851227, 0.4366306662559509, 0.4841250777244568, 0.5316194891929626, 0.5791139602661133, 0.6266083717346191, 0.674102783203125, 0.7215971946716309, 0.7690916061401367, 0.8165860772132874, 0.8640804886817932, 0.9115749001502991, 0.9590693712234497, 1.0065637826919556, 1.0540581941604614, 1.1015526056289673, 1.1490470170974731, 1.196541428565979, 1.2440359592437744, 1.2915303707122803, 1.3390247821807861, 1.386519193649292, 1.4340136051177979]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 14.0, 14.0, 19.0, 17.0, 18.0, 33.0, 32.0, 50.0, 52.0, 68.0, 74.0, 82.0, 82.0, 69.0, 64.0, 74.0, 59.0, 40.0, 38.0, 22.0, 15.0, 21.0, 18.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6058225631713867, -0.5881983637809753, -0.5705742239952087, -0.5529500246047974, -0.5353258848190308, -0.5177016854286194, -0.5000775456428528, -0.4824533462524414, -0.4648291766643524, -0.4472050070762634, -0.42958083748817444, -0.41195666790008545, -0.3943324685096741, -0.37670832872390747, -0.3590841293334961, -0.3414599597454071, -0.3238357901573181, -0.3062116205692291, -0.28858745098114014, -0.27096328139305115, -0.25333911180496216, -0.23571492731571198, -0.2180907428264618, -0.2004665732383728, -0.1828424036502838, -0.16521823406219482, -0.14759406447410583, -0.12996987998485565, -0.11234571039676666, -0.09472154080867767, -0.07709736377000809, -0.0594731867313385, -0.04184907674789429, -0.024224903434515, -0.006600730121135712, 0.011023443192243576, 0.028647616505622864, 0.04627178609371185, 0.06389596313238144, 0.08152014017105103, 0.09914430975914001, 0.116768479347229, 0.134392648935318, 0.15201683342456818, 0.16964100301265717, 0.18726517260074615, 0.20488935708999634, 0.22251352667808533, 0.24013769626617432, 0.2577618658542633, 0.2753860354423523, 0.2930102050304413, 0.3106343746185303, 0.32825857400894165, 0.34588274359703064, 0.36350691318511963, 0.3811310827732086, 0.3987552523612976, 0.4163794219493866, 0.4340035915374756, 0.45162779092788696, 0.46925193071365356, 0.48687613010406494, 0.5045002698898315, 0.5221244692802429]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 13.0, 12.0, 10.0, 19.0, 16.0, 31.0, 41.0, 60.0, 108.0, 200.0, 432.0, 1133.0, 3974.0, 21125.0, 364981.0, 620383.0, 28594.0, 4945.0, 1377.0, 502.0, 192.0, 120.0, 51.0, 41.0, 40.0, 29.0, 21.0, 13.0, 8.0, 7.0, 13.0, 8.0, 10.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8408203125, -0.814605712890625, -0.78839111328125, -0.762176513671875, -0.7359619140625, -0.709747314453125, -0.68353271484375, -0.657318115234375, -0.631103515625, -0.604888916015625, -0.57867431640625, -0.552459716796875, -0.5262451171875, -0.500030517578125, -0.47381591796875, -0.447601318359375, -0.42138671875, -0.395172119140625, -0.36895751953125, -0.342742919921875, -0.3165283203125, -0.290313720703125, -0.26409912109375, -0.237884521484375, -0.211669921875, -0.185455322265625, -0.15924072265625, -0.133026123046875, -0.1068115234375, -0.080596923828125, -0.05438232421875, -0.028167724609375, -0.001953125, 0.024261474609375, 0.05047607421875, 0.076690673828125, 0.1029052734375, 0.129119873046875, 0.15533447265625, 0.181549072265625, 0.207763671875, 0.233978271484375, 0.26019287109375, 0.286407470703125, 0.3126220703125, 0.338836669921875, 0.36505126953125, 0.391265869140625, 0.41748046875, 0.443695068359375, 0.46990966796875, 0.496124267578125, 0.5223388671875, 0.548553466796875, 0.57476806640625, 0.600982666015625, 0.627197265625, 0.653411865234375, 0.67962646484375, 0.705841064453125, 0.7320556640625, 0.758270263671875, 0.78448486328125, 0.810699462890625, 0.8369140625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 15.0, 28.0, 49.0, 76.0, 136.0, 203.0, 194.0, 117.0, 81.0, 37.0, 20.0, 13.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.1181640625, -0.11569547653198242, -0.11322689056396484, -0.11075830459594727, -0.10828971862792969, -0.10582113265991211, -0.10335254669189453, -0.10088396072387695, -0.09841537475585938, -0.0959467887878418, -0.09347820281982422, -0.09100961685180664, -0.08854103088378906, -0.08607244491577148, -0.0836038589477539, -0.08113527297973633, -0.07866668701171875, -0.07619810104370117, -0.0737295150756836, -0.07126092910766602, -0.06879234313964844, -0.06632375717163086, -0.06385517120361328, -0.0613865852355957, -0.058917999267578125, -0.05644941329956055, -0.05398082733154297, -0.05151224136352539, -0.04904365539550781, -0.046575069427490234, -0.044106483459472656, -0.04163789749145508, -0.0391693115234375, -0.03670072555541992, -0.034232139587402344, -0.031763553619384766, -0.029294967651367188, -0.02682638168334961, -0.02435779571533203, -0.021889209747314453, -0.019420623779296875, -0.016952037811279297, -0.014483451843261719, -0.01201486587524414, -0.009546279907226562, -0.007077693939208984, -0.004609107971191406, -0.002140522003173828, 0.00032806396484375, 0.002796649932861328, 0.005265235900878906, 0.007733821868896484, 0.010202407836914062, 0.01267099380493164, 0.015139579772949219, 0.017608165740966797, 0.020076751708984375, 0.022545337677001953, 0.02501392364501953, 0.02748250961303711, 0.029951095581054688, 0.032419681549072266, 0.034888267517089844, 0.03735685348510742, 0.039825439453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 10.0, 6.0, 6.0, 7.0, 12.0, 30.0, 87.0, 472.0, 7848.0, 791643.0, 244937.0, 2999.0, 312.0, 76.0, 25.0, 15.0, 3.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.1943359375, -1.1529541015625, -1.111572265625, -1.0701904296875, -1.02880859375, -0.9874267578125, -0.946044921875, -0.9046630859375, -0.86328125, -0.8218994140625, -0.780517578125, -0.7391357421875, -0.69775390625, -0.6563720703125, -0.614990234375, -0.5736083984375, -0.5322265625, -0.4908447265625, -0.449462890625, -0.4080810546875, -0.36669921875, -0.3253173828125, -0.283935546875, -0.2425537109375, -0.201171875, -0.1597900390625, -0.118408203125, -0.0770263671875, -0.03564453125, 0.0057373046875, 0.047119140625, 0.0885009765625, 0.1298828125, 0.1712646484375, 0.212646484375, 0.2540283203125, 0.29541015625, 0.3367919921875, 0.378173828125, 0.4195556640625, 0.4609375, 0.5023193359375, 0.543701171875, 0.5850830078125, 0.62646484375, 0.6678466796875, 0.709228515625, 0.7506103515625, 0.7919921875, 0.8333740234375, 0.874755859375, 0.9161376953125, 0.95751953125, 0.9989013671875, 1.040283203125, 1.0816650390625, 1.123046875, 1.1644287109375, 1.205810546875, 1.2471923828125, 1.28857421875, 1.3299560546875, 1.371337890625, 1.4127197265625, 1.4541015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 5.0, 7.0, 8.0, 15.0, 11.0, 12.0, 19.0, 22.0, 20.0, 20.0, 32.0, 33.0, 33.0, 33.0, 40.0, 42.0, 33.0, 36.0, 51.0, 46.0, 46.0, 39.0, 34.0, 47.0, 34.0, 33.0, 36.0, 33.0, 26.0, 22.0, 17.0, 21.0, 10.0, 15.0, 13.0, 10.0, 13.0, 6.0, 5.0, 10.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1451416015625, -0.14005470275878906, -0.13496780395507812, -0.1298809051513672, -0.12479400634765625, -0.11970710754394531, -0.11462020874023438, -0.10953330993652344, -0.1044464111328125, -0.09935951232910156, -0.09427261352539062, -0.08918571472167969, -0.08409881591796875, -0.07901191711425781, -0.07392501831054688, -0.06883811950683594, -0.063751220703125, -0.05866432189941406, -0.053577423095703125, -0.04849052429199219, -0.04340362548828125, -0.03831672668457031, -0.033229827880859375, -0.028142929077148438, -0.0230560302734375, -0.017969131469726562, -0.012882232666015625, -0.0077953338623046875, -0.00270843505859375, 0.0023784637451171875, 0.007465362548828125, 0.012552261352539062, 0.01763916015625, 0.022726058959960938, 0.027812957763671875, 0.03289985656738281, 0.03798675537109375, 0.04307365417480469, 0.048160552978515625, 0.05324745178222656, 0.0583343505859375, 0.06342124938964844, 0.06850814819335938, 0.07359504699707031, 0.07868194580078125, 0.08376884460449219, 0.08885574340820312, 0.09394264221191406, 0.099029541015625, 0.10411643981933594, 0.10920333862304688, 0.11429023742675781, 0.11937713623046875, 0.12446403503417969, 0.12955093383789062, 0.13463783264160156, 0.1397247314453125, 0.14481163024902344, 0.14989852905273438, 0.1549854278564453, 0.16007232666015625, 0.1651592254638672, 0.17024612426757812, 0.17533302307128906, 0.180419921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 15.0, 34.0, 127.0, 1855.0, 1044700.0, 1604.0, 119.0, 42.0, 19.0, 11.0, 8.0, 3.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.16796875, -6.84906005859375, -6.5301513671875, -6.21124267578125, -5.892333984375, -5.57342529296875, -5.2545166015625, -4.93560791015625, -4.61669921875, -4.29779052734375, -3.9788818359375, -3.65997314453125, -3.341064453125, -3.02215576171875, -2.7032470703125, -2.38433837890625, -2.0654296875, -1.74652099609375, -1.4276123046875, -1.10870361328125, -0.789794921875, -0.47088623046875, -0.1519775390625, 0.16693115234375, 0.48583984375, 0.80474853515625, 1.1236572265625, 1.44256591796875, 1.761474609375, 2.08038330078125, 2.3992919921875, 2.71820068359375, 3.037109375, 3.35601806640625, 3.6749267578125, 3.99383544921875, 4.312744140625, 4.63165283203125, 4.9505615234375, 5.26947021484375, 5.58837890625, 5.90728759765625, 6.2261962890625, 6.54510498046875, 6.864013671875, 7.18292236328125, 7.5018310546875, 7.82073974609375, 8.1396484375, 8.45855712890625, 8.7774658203125, 9.09637451171875, 9.415283203125, 9.73419189453125, 10.0531005859375, 10.37200927734375, 10.69091796875, 11.00982666015625, 11.3287353515625, 11.64764404296875, 11.966552734375, 12.28546142578125, 12.6043701171875, 12.92327880859375, 13.2421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 8.0, 10.0, 19.0, 27.0, 22.0, 36.0, 55.0, 65.0, 121.0, 129.0, 147.0, 89.0, 87.0, 53.0, 32.0, 27.0, 18.0, 12.0, 10.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.064508438110352e-05, -7.841922342777252e-05, -7.619336247444153e-05, -7.396750152111053e-05, -7.174164056777954e-05, -6.951577961444855e-05, -6.728991866111755e-05, -6.506405770778656e-05, -6.283819675445557e-05, -6.061233580112457e-05, -5.838647484779358e-05, -5.6160613894462585e-05, -5.393475294113159e-05, -5.17088919878006e-05, -4.9483031034469604e-05, -4.725717008113861e-05, -4.503130912780762e-05, -4.2805448174476624e-05, -4.057958722114563e-05, -3.8353726267814636e-05, -3.612786531448364e-05, -3.390200436115265e-05, -3.1676143407821655e-05, -2.945028245449066e-05, -2.7224421501159668e-05, -2.4998560547828674e-05, -2.277269959449768e-05, -2.0546838641166687e-05, -1.8320977687835693e-05, -1.60951167345047e-05, -1.3869255781173706e-05, -1.1643394827842712e-05, -9.417533874511719e-06, -7.191672921180725e-06, -4.9658119678497314e-06, -2.739951014518738e-06, -5.140900611877441e-07, 1.7117708921432495e-06, 3.937631845474243e-06, 6.163492798805237e-06, 8.38935375213623e-06, 1.0615214705467224e-05, 1.2841075658798218e-05, 1.5066936612129211e-05, 1.7292797565460205e-05, 1.95186585187912e-05, 2.1744519472122192e-05, 2.3970380425453186e-05, 2.619624137878418e-05, 2.8422102332115173e-05, 3.064796328544617e-05, 3.287382423877716e-05, 3.5099685192108154e-05, 3.732554614543915e-05, 3.955140709877014e-05, 4.1777268052101135e-05, 4.400312900543213e-05, 4.622898995876312e-05, 4.8454850912094116e-05, 5.068071186542511e-05, 5.2906572818756104e-05, 5.51324337720871e-05, 5.735829472541809e-05, 5.9584155678749084e-05, 6.181001663208008e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 11.0, 12.0, 13.0, 24.0, 39.0, 77.0, 84.0, 173.0, 240.0, 567.0, 1027.0, 2899.0, 9040.0, 47778.0, 896184.0, 73264.0, 11442.0, 3223.0, 1214.0, 539.0, 289.0, 164.0, 92.0, 40.0, 44.0, 27.0, 16.0, 10.0, 6.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.775390625, -1.7281494140625, -1.680908203125, -1.6336669921875, -1.58642578125, -1.5391845703125, -1.491943359375, -1.4447021484375, -1.3974609375, -1.3502197265625, -1.302978515625, -1.2557373046875, -1.20849609375, -1.1612548828125, -1.114013671875, -1.0667724609375, -1.01953125, -0.9722900390625, -0.925048828125, -0.8778076171875, -0.83056640625, -0.7833251953125, -0.736083984375, -0.6888427734375, -0.6416015625, -0.5943603515625, -0.547119140625, -0.4998779296875, -0.45263671875, -0.4053955078125, -0.358154296875, -0.3109130859375, -0.263671875, -0.2164306640625, -0.169189453125, -0.1219482421875, -0.07470703125, -0.0274658203125, 0.019775390625, 0.0670166015625, 0.1142578125, 0.1614990234375, 0.208740234375, 0.2559814453125, 0.30322265625, 0.3504638671875, 0.397705078125, 0.4449462890625, 0.4921875, 0.5394287109375, 0.586669921875, 0.6339111328125, 0.68115234375, 0.7283935546875, 0.775634765625, 0.8228759765625, 0.8701171875, 0.9173583984375, 0.964599609375, 1.0118408203125, 1.05908203125, 1.1063232421875, 1.153564453125, 1.2008056640625, 1.248046875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 4.0, 6.0, 10.0, 13.0, 13.0, 30.0, 44.0, 105.0, 213.0, 252.0, 135.0, 51.0, 28.0, 22.0, 8.0, 14.0, 14.0, 10.0, 3.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.9831161499023438, -0.9535369873046875, -0.9239578247070312, -0.894378662109375, -0.8647994995117188, -0.8352203369140625, -0.8056411743164062, -0.77606201171875, -0.7464828491210938, -0.7169036865234375, -0.6873245239257812, -0.657745361328125, -0.6281661987304688, -0.5985870361328125, -0.5690078735351562, -0.5394287109375, -0.5098495483398438, -0.4802703857421875, -0.45069122314453125, -0.421112060546875, -0.39153289794921875, -0.3619537353515625, -0.33237457275390625, -0.30279541015625, -0.27321624755859375, -0.2436370849609375, -0.21405792236328125, -0.184478759765625, -0.15489959716796875, -0.1253204345703125, -0.09574127197265625, -0.066162109375, -0.03658294677734375, -0.0070037841796875, 0.02257537841796875, 0.052154541015625, 0.08173370361328125, 0.1113128662109375, 0.14089202880859375, 0.17047119140625, 0.20005035400390625, 0.2296295166015625, 0.25920867919921875, 0.288787841796875, 0.31836700439453125, 0.3479461669921875, 0.37752532958984375, 0.4071044921875, 0.43668365478515625, 0.4662628173828125, 0.49584197998046875, 0.525421142578125, 0.5550003051757812, 0.5845794677734375, 0.6141586303710938, 0.64373779296875, 0.6733169555664062, 0.7028961181640625, 0.7324752807617188, 0.762054443359375, 0.7916336059570312, 0.8212127685546875, 0.8507919311523438, 0.88037109375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 12.0, 16.0, 28.0, 78.0, 168.0, 213.0, 242.0, 108.0, 60.0, 31.0, 16.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.424810886383057, -5.306727409362793, -5.188643932342529, -5.070559978485107, -4.952476501464844, -4.83439302444458, -4.716309547424316, -4.598226070404053, -4.480142593383789, -4.362059116363525, -4.243975639343262, -4.12589168548584, -4.007808208465576, -3.8897247314453125, -3.771641254425049, -3.653557777404785, -3.5354738235473633, -3.4173903465270996, -3.299306631088257, -3.181223154067993, -3.0631394386291504, -2.9450559616088867, -2.826972484588623, -2.7088890075683594, -2.5908052921295166, -2.472721815109253, -2.35463809967041, -2.2365546226501465, -2.118471145629883, -2.00038743019104, -1.8823039531707764, -1.7642203569412231, -1.646136999130249, -1.5280534029006958, -1.4099698066711426, -1.291886329650879, -1.1738027334213257, -1.0557191371917725, -0.937635600566864, -0.8195520639419556, -0.7014684677124023, -0.5833848714828491, -0.4653013348579407, -0.34721776843070984, -0.229134202003479, -0.11105060577392578, 0.007032930850982666, 0.1251164674758911, 0.24320006370544434, 0.36128363013267517, 0.479367196559906, 0.5974507331848145, 0.7155343294143677, 0.8336179256439209, 0.9517014622688293, 1.0697849988937378, 1.187868595123291, 1.3059521913528442, 1.4240357875823975, 1.5421192646026611, 1.6602028608322144, 1.7782864570617676, 1.8963699340820312, 2.014453411102295, 2.1325371265411377]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 7.0, 16.0, 23.0, 34.0, 36.0, 42.0, 61.0, 64.0, 79.0, 81.0, 85.0, 86.0, 70.0, 63.0, 45.0, 49.0, 40.0, 27.0, 19.0, 19.0, 9.0, 10.0, 2.0, 3.0, 7.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.428568124771118, -2.3419911861419678, -2.2554140090942383, -2.168837070465088, -2.0822601318359375, -1.995682954788208, -1.9091060161590576, -1.8225289583206177, -1.7359519004821777, -1.6493748426437378, -1.5627977848052979, -1.4762208461761475, -1.3896437883377075, -1.3030667304992676, -1.2164897918701172, -1.1299127340316772, -1.0433356761932373, -0.9567586183547974, -0.8701816201210022, -0.783604621887207, -0.6970275640487671, -0.6104505062103271, -0.523873507976532, -0.4372965097427368, -0.3507194519042969, -0.2641424238681793, -0.17756539583206177, -0.09098836779594421, -0.00441133975982666, 0.0821656882762909, 0.16874271631240845, 0.2553197145462036, 0.34189653396606445, 0.428473562002182, 0.5150505900382996, 0.6016275882720947, 0.6882046461105347, 0.7747817039489746, 0.8613587021827698, 0.9479357004165649, 1.0345127582550049, 1.1210898160934448, 1.2076668739318848, 1.2942438125610352, 1.380820870399475, 1.467397928237915, 1.5539748668670654, 1.6405519247055054, 1.7271289825439453, 1.8137060403823853, 1.9002830982208252, 1.9868600368499756, 2.073437213897705, 2.1600141525268555, 2.246591091156006, 2.3331680297851562, 2.4197452068328857, 2.506322145462036, 2.5928993225097656, 2.679476261138916, 2.7660531997680664, 2.852630376815796, 2.9392073154449463, 3.025784492492676, 3.112361431121826]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 6.0, 7.0, 13.0, 19.0, 22.0, 35.0, 47.0, 59.0, 66.0, 101.0, 115.0, 191.0, 276.0, 535.0, 906.0, 1633.0, 3404.0, 9100.0, 33407.0, 747845.0, 3329821.0, 46385.0, 11405.0, 4423.0, 1922.0, 1040.0, 573.0, 338.0, 215.0, 126.0, 69.0, 48.0, 31.0, 24.0, 19.0, 14.0, 8.0, 9.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 5.0, 0.0, 4.0, 1.0], "bins": [-1.12109375, -1.09002685546875, -1.0589599609375, -1.02789306640625, -0.996826171875, -0.96575927734375, -0.9346923828125, -0.90362548828125, -0.87255859375, -0.84149169921875, -0.8104248046875, -0.77935791015625, -0.748291015625, -0.71722412109375, -0.6861572265625, -0.65509033203125, -0.6240234375, -0.59295654296875, -0.5618896484375, -0.53082275390625, -0.499755859375, -0.46868896484375, -0.4376220703125, -0.40655517578125, -0.37548828125, -0.34442138671875, -0.3133544921875, -0.28228759765625, -0.251220703125, -0.22015380859375, -0.1890869140625, -0.15802001953125, -0.126953125, -0.09588623046875, -0.0648193359375, -0.03375244140625, -0.002685546875, 0.02838134765625, 0.0594482421875, 0.09051513671875, 0.12158203125, 0.15264892578125, 0.1837158203125, 0.21478271484375, 0.245849609375, 0.27691650390625, 0.3079833984375, 0.33905029296875, 0.3701171875, 0.40118408203125, 0.4322509765625, 0.46331787109375, 0.494384765625, 0.52545166015625, 0.5565185546875, 0.58758544921875, 0.61865234375, 0.64971923828125, 0.6807861328125, 0.71185302734375, 0.742919921875, 0.77398681640625, 0.8050537109375, 0.83612060546875, 0.8671875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 10.0, 6.0, 7.0, 13.0, 11.0, 29.0, 33.0, 56.0, 59.0, 102.0, 121.0, 114.0, 102.0, 84.0, 58.0, 46.0, 42.0, 23.0, 21.0, 18.0, 11.0, 5.0, 8.0, 7.0, 7.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054595947265625, -0.05306053161621094, -0.051525115966796875, -0.04998970031738281, -0.04845428466796875, -0.04691886901855469, -0.045383453369140625, -0.04384803771972656, -0.0423126220703125, -0.04077720642089844, -0.039241790771484375, -0.03770637512207031, -0.03617095947265625, -0.03463554382324219, -0.033100128173828125, -0.03156471252441406, -0.030029296875, -0.028493881225585938, -0.026958465576171875, -0.025423049926757812, -0.02388763427734375, -0.022352218627929688, -0.020816802978515625, -0.019281387329101562, -0.0177459716796875, -0.016210556030273438, -0.014675140380859375, -0.013139724731445312, -0.01160430908203125, -0.010068893432617188, -0.008533477783203125, -0.0069980621337890625, -0.005462646484375, -0.0039272308349609375, -0.002391815185546875, -0.0008563995361328125, 0.00067901611328125, 0.0022144317626953125, 0.003749847412109375, 0.0052852630615234375, 0.0068206787109375, 0.008356094360351562, 0.009891510009765625, 0.011426925659179688, 0.01296234130859375, 0.014497756958007812, 0.016033172607421875, 0.017568588256835938, 0.01910400390625, 0.020639419555664062, 0.022174835205078125, 0.023710250854492188, 0.02524566650390625, 0.026781082153320312, 0.028316497802734375, 0.029851913452148438, 0.0313873291015625, 0.03292274475097656, 0.034458160400390625, 0.03599357604980469, 0.03752899169921875, 0.03906440734863281, 0.040599822998046875, 0.04213523864746094, 0.043670654296875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 1.0, 5.0, 12.0, 11.0, 8.0, 19.0, 11.0, 26.0, 28.0, 57.0, 125.0, 313.0, 1183.0, 8582.0, 253006.0, 3894634.0, 32441.0, 2819.0, 550.0, 192.0, 76.0, 41.0, 44.0, 19.0, 11.0, 14.0, 14.0, 7.0, 7.0, 4.0, 2.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.875, -1.8246612548828125, -1.774322509765625, -1.7239837646484375, -1.67364501953125, -1.6233062744140625, -1.572967529296875, -1.5226287841796875, -1.4722900390625, -1.4219512939453125, -1.371612548828125, -1.3212738037109375, -1.27093505859375, -1.2205963134765625, -1.170257568359375, -1.1199188232421875, -1.069580078125, -1.0192413330078125, -0.968902587890625, -0.9185638427734375, -0.86822509765625, -0.8178863525390625, -0.767547607421875, -0.7172088623046875, -0.6668701171875, -0.6165313720703125, -0.566192626953125, -0.5158538818359375, -0.46551513671875, -0.4151763916015625, -0.364837646484375, -0.3144989013671875, -0.26416015625, -0.2138214111328125, -0.163482666015625, -0.1131439208984375, -0.06280517578125, -0.0124664306640625, 0.037872314453125, 0.0882110595703125, 0.1385498046875, 0.1888885498046875, 0.239227294921875, 0.2895660400390625, 0.33990478515625, 0.3902435302734375, 0.440582275390625, 0.4909210205078125, 0.541259765625, 0.5915985107421875, 0.641937255859375, 0.6922760009765625, 0.74261474609375, 0.7929534912109375, 0.843292236328125, 0.8936309814453125, 0.9439697265625, 0.9943084716796875, 1.044647216796875, 1.0949859619140625, 1.14532470703125, 1.1956634521484375, 1.246002197265625, 1.2963409423828125, 1.3466796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 3.0, 8.0, 13.0, 18.0, 18.0, 24.0, 42.0, 53.0, 92.0, 131.0, 254.0, 661.0, 1392.0, 633.0, 294.0, 168.0, 71.0, 62.0, 32.0, 22.0, 18.0, 13.0, 8.0, 9.0, 5.0, 1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07427978515625, -0.07125282287597656, -0.06822586059570312, -0.06519889831542969, -0.06217193603515625, -0.05914497375488281, -0.056118011474609375, -0.05309104919433594, -0.0500640869140625, -0.04703712463378906, -0.044010162353515625, -0.04098320007324219, -0.03795623779296875, -0.03492927551269531, -0.031902313232421875, -0.028875350952148438, -0.025848388671875, -0.022821426391601562, -0.019794464111328125, -0.016767501831054688, -0.01374053955078125, -0.010713577270507812, -0.007686614990234375, -0.0046596527099609375, -0.0016326904296875, 0.0013942718505859375, 0.004421234130859375, 0.0074481964111328125, 0.01047515869140625, 0.013502120971679688, 0.016529083251953125, 0.019556045532226562, 0.0225830078125, 0.025609970092773438, 0.028636932373046875, 0.03166389465332031, 0.03469085693359375, 0.03771781921386719, 0.040744781494140625, 0.04377174377441406, 0.0467987060546875, 0.04982566833496094, 0.052852630615234375, 0.05587959289550781, 0.05890655517578125, 0.06193351745605469, 0.06496047973632812, 0.06798744201660156, 0.071014404296875, 0.07404136657714844, 0.07706832885742188, 0.08009529113769531, 0.08312225341796875, 0.08614921569824219, 0.08917617797851562, 0.09220314025878906, 0.0952301025390625, 0.09825706481933594, 0.10128402709960938, 0.10431098937988281, 0.10733795166015625, 0.11036491394042969, 0.11339187622070312, 0.11641883850097656, 0.11944580078125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 18.0, 245.0, 529.0, 147.0, 43.0, 8.0, 8.0, 3.0, 1.0], "bins": [-4.585784435272217, -4.505848407745361, -4.425912380218506, -4.34597635269165, -4.266040802001953, -4.186104774475098, -4.106168746948242, -4.026232719421387, -3.9462966918945312, -3.866360664367676, -3.7864246368408203, -3.706488847732544, -3.6265528202056885, -3.546616792678833, -3.4666810035705566, -3.386744976043701, -3.3068089485168457, -3.2268729209899902, -3.1469368934631348, -3.0670011043548584, -2.987065076828003, -2.9071290493011475, -2.827193260192871, -2.7472572326660156, -2.66732120513916, -2.5873851776123047, -2.507449150085449, -2.427513360977173, -2.3475773334503174, -2.267641305923462, -2.1877055168151855, -2.10776948928833, -2.0278334617614746, -1.9478974342346191, -1.8679615259170532, -1.7880256175994873, -1.7080895900726318, -1.6281535625457764, -1.5482176542282104, -1.4682817459106445, -1.388345718383789, -1.3084096908569336, -1.2284737825393677, -1.1485378742218018, -1.0686018466949463, -0.9886658787727356, -0.9087299108505249, -0.8287939429283142, -0.7488580346107483, -0.6689220666885376, -0.5889860987663269, -0.5090501308441162, -0.4291141629219055, -0.3491781949996948, -0.26924222707748413, -0.18930625915527344, -0.10937029123306274, -0.02943432331085205, 0.05050164461135864, 0.13043761253356934, 0.21037358045578003, 0.2903095483779907, 0.3702455163002014, 0.4501814842224121, 0.5301174521446228]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 13.0, 17.0, 20.0, 50.0, 61.0, 78.0, 83.0, 105.0, 134.0, 90.0, 81.0, 79.0, 55.0, 48.0, 32.0, 18.0, 12.0, 9.0, 6.0, 1.0, 1.0, 3.0, 2.0], "bins": [-1.3663687705993652, -1.3385528326034546, -1.310736894607544, -1.2829209566116333, -1.2551050186157227, -1.2272891998291016, -1.1994731426239014, -1.1716573238372803, -1.1438413858413696, -1.116025447845459, -1.0882095098495483, -1.0603935718536377, -1.032577633857727, -1.0047616958618164, -0.9769458174705505, -0.9491298794746399, -0.9213139414787292, -0.8934980034828186, -0.865682065486908, -0.8378661870956421, -0.8100502490997314, -0.7822343111038208, -0.7544183731079102, -0.7266024351119995, -0.6987864971160889, -0.6709705591201782, -0.6431546211242676, -0.6153386831283569, -0.5875228047370911, -0.5597068667411804, -0.5318909287452698, -0.5040749907493591, -0.47625917196273804, -0.4484432339668274, -0.42062732577323914, -0.3928113877773285, -0.36499547958374023, -0.3371795415878296, -0.30936360359191895, -0.2815476655960083, -0.25373175740242004, -0.2259158343076706, -0.19809991121292114, -0.1702839732170105, -0.14246805012226105, -0.1146521270275116, -0.08683618903160095, -0.0590202659368515, -0.03120434284210205, -0.0033884160220623016, 0.024427510797977448, 0.052243441343307495, 0.08005936443805695, 0.1078752875328064, 0.13569122552871704, 0.1635071486234665, 0.19132307171821594, 0.2191389948129654, 0.24695491790771484, 0.2747708559036255, 0.30258679389953613, 0.3304027020931244, 0.35821864008903503, 0.3860345482826233, 0.41385048627853394]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 12.0, 13.0, 17.0, 19.0, 20.0, 30.0, 43.0, 38.0, 50.0, 49.0, 56.0, 61.0, 604.0, 201236.0, 844680.0, 1182.0, 87.0, 48.0, 39.0, 41.0, 39.0, 26.0, 24.0, 32.0, 22.0, 13.0, 13.0, 7.0, 9.0, 10.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.6328125, -2.54534912109375, -2.4578857421875, -2.37042236328125, -2.282958984375, -2.19549560546875, -2.1080322265625, -2.02056884765625, -1.93310546875, -1.84564208984375, -1.7581787109375, -1.67071533203125, -1.583251953125, -1.49578857421875, -1.4083251953125, -1.32086181640625, -1.2333984375, -1.14593505859375, -1.0584716796875, -0.97100830078125, -0.883544921875, -0.79608154296875, -0.7086181640625, -0.62115478515625, -0.53369140625, -0.44622802734375, -0.3587646484375, -0.27130126953125, -0.183837890625, -0.09637451171875, -0.0089111328125, 0.07855224609375, 0.166015625, 0.25347900390625, 0.3409423828125, 0.42840576171875, 0.515869140625, 0.60333251953125, 0.6907958984375, 0.77825927734375, 0.86572265625, 0.95318603515625, 1.0406494140625, 1.12811279296875, 1.215576171875, 1.30303955078125, 1.3905029296875, 1.47796630859375, 1.5654296875, 1.65289306640625, 1.7403564453125, 1.82781982421875, 1.915283203125, 2.00274658203125, 2.0902099609375, 2.17767333984375, 2.26513671875, 2.35260009765625, 2.4400634765625, 2.52752685546875, 2.614990234375, 2.70245361328125, 2.7899169921875, 2.87738037109375, 2.96484375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 16.0, 74.0, 257.0, 356.0, 224.0, 62.0, 17.0, 4.0, 1.0, 2.0], "bins": [-0.36865234375, -0.3622255325317383, -0.35579872131347656, -0.34937191009521484, -0.3429450988769531, -0.3365182876586914, -0.3300914764404297, -0.32366466522216797, -0.31723785400390625, -0.31081104278564453, -0.3043842315673828, -0.2979574203491211, -0.2915306091308594, -0.28510379791259766, -0.27867698669433594, -0.2722501754760742, -0.2658233642578125, -0.2593965530395508, -0.25296974182128906, -0.24654293060302734, -0.24011611938476562, -0.2336893081665039, -0.2272624969482422, -0.22083568572998047, -0.21440887451171875, -0.20798206329345703, -0.2015552520751953, -0.1951284408569336, -0.18870162963867188, -0.18227481842041016, -0.17584800720214844, -0.16942119598388672, -0.162994384765625, -0.15656757354736328, -0.15014076232910156, -0.14371395111083984, -0.13728713989257812, -0.1308603286743164, -0.12443351745605469, -0.11800670623779297, -0.11157989501953125, -0.10515308380126953, -0.09872627258300781, -0.0922994613647461, -0.08587265014648438, -0.07944583892822266, -0.07301902770996094, -0.06659221649169922, -0.0601654052734375, -0.05373859405517578, -0.04731178283691406, -0.040884971618652344, -0.034458160400390625, -0.028031349182128906, -0.021604537963867188, -0.015177726745605469, -0.00875091552734375, -0.0023241043090820312, 0.0041027069091796875, 0.010529518127441406, 0.016956329345703125, 0.023383140563964844, 0.029809951782226562, 0.03623676300048828, 0.04266357421875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 8.0, 15.0, 21.0, 27.0, 34.0, 54.0, 101.0, 163.0, 307.0, 705.0, 1779.0, 5795.0, 24837.0, 165652.0, 622193.0, 189517.0, 27701.0, 6169.0, 1923.0, 748.0, 370.0, 180.0, 90.0, 50.0, 34.0, 23.0, 15.0, 13.0, 4.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.79296875, -0.7706527709960938, -0.7483367919921875, -0.7260208129882812, -0.703704833984375, -0.6813888549804688, -0.6590728759765625, -0.6367568969726562, -0.61444091796875, -0.5921249389648438, -0.5698089599609375, -0.5474929809570312, -0.525177001953125, -0.5028610229492188, -0.4805450439453125, -0.45822906494140625, -0.4359130859375, -0.41359710693359375, -0.3912811279296875, -0.36896514892578125, -0.346649169921875, -0.32433319091796875, -0.3020172119140625, -0.27970123291015625, -0.25738525390625, -0.23506927490234375, -0.2127532958984375, -0.19043731689453125, -0.168121337890625, -0.14580535888671875, -0.1234893798828125, -0.10117340087890625, -0.078857421875, -0.05654144287109375, -0.0342254638671875, -0.01190948486328125, 0.010406494140625, 0.03272247314453125, 0.0550384521484375, 0.07735443115234375, 0.09967041015625, 0.12198638916015625, 0.1443023681640625, 0.16661834716796875, 0.188934326171875, 0.21125030517578125, 0.2335662841796875, 0.25588226318359375, 0.2781982421875, 0.30051422119140625, 0.3228302001953125, 0.34514617919921875, 0.367462158203125, 0.38977813720703125, 0.4120941162109375, 0.43441009521484375, 0.45672607421875, 0.47904205322265625, 0.5013580322265625, 0.5236740112304688, 0.545989990234375, 0.5683059692382812, 0.5906219482421875, 0.6129379272460938, 0.63525390625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 11.0, 7.0, 6.0, 11.0, 12.0, 19.0, 13.0, 19.0, 20.0, 26.0, 36.0, 49.0, 40.0, 42.0, 37.0, 45.0, 51.0, 45.0, 61.0, 51.0, 59.0, 41.0, 48.0, 31.0, 38.0, 31.0, 26.0, 23.0, 20.0, 16.0, 15.0, 9.0, 9.0, 7.0, 4.0, 3.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.314697265625, -0.3054008483886719, -0.29610443115234375, -0.2868080139160156, -0.2775115966796875, -0.2682151794433594, -0.25891876220703125, -0.24962234497070312, -0.240325927734375, -0.23102951049804688, -0.22173309326171875, -0.21243667602539062, -0.2031402587890625, -0.19384384155273438, -0.18454742431640625, -0.17525100708007812, -0.16595458984375, -0.15665817260742188, -0.14736175537109375, -0.13806533813476562, -0.1287689208984375, -0.11947250366210938, -0.11017608642578125, -0.10087966918945312, -0.091583251953125, -0.08228683471679688, -0.07299041748046875, -0.06369400024414062, -0.0543975830078125, -0.045101165771484375, -0.03580474853515625, -0.026508331298828125, -0.0172119140625, -0.007915496826171875, 0.00138092041015625, 0.010677337646484375, 0.0199737548828125, 0.029270172119140625, 0.03856658935546875, 0.047863006591796875, 0.057159423828125, 0.06645584106445312, 0.07575225830078125, 0.08504867553710938, 0.0943450927734375, 0.10364151000976562, 0.11293792724609375, 0.12223434448242188, 0.13153076171875, 0.14082717895507812, 0.15012359619140625, 0.15942001342773438, 0.1687164306640625, 0.17801284790039062, 0.18730926513671875, 0.19660568237304688, 0.205902099609375, 0.21519851684570312, 0.22449493408203125, 0.23379135131835938, 0.2430877685546875, 0.2523841857910156, 0.26168060302734375, 0.2709770202636719, 0.2802734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 6.0, 6.0, 10.0, 5.0, 19.0, 18.0, 30.0, 44.0, 60.0, 84.0, 146.0, 176.0, 323.0, 573.0, 1032.0, 2257.0, 5781.0, 18391.0, 83155.0, 412102.0, 411744.0, 83603.0, 18371.0, 5731.0, 2377.0, 1087.0, 550.0, 281.0, 174.0, 134.0, 96.0, 46.0, 36.0, 28.0, 19.0, 12.0, 9.0, 13.0, 5.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.556640625, -0.5419921875, -0.52734375, -0.5126953125, -0.498046875, -0.4833984375, -0.46875, -0.4541015625, -0.439453125, -0.4248046875, -0.41015625, -0.3955078125, -0.380859375, -0.3662109375, -0.3515625, -0.3369140625, -0.322265625, -0.3076171875, -0.29296875, -0.2783203125, -0.263671875, -0.2490234375, -0.234375, -0.2197265625, -0.205078125, -0.1904296875, -0.17578125, -0.1611328125, -0.146484375, -0.1318359375, -0.1171875, -0.1025390625, -0.087890625, -0.0732421875, -0.05859375, -0.0439453125, -0.029296875, -0.0146484375, 0.0, 0.0146484375, 0.029296875, 0.0439453125, 0.05859375, 0.0732421875, 0.087890625, 0.1025390625, 0.1171875, 0.1318359375, 0.146484375, 0.1611328125, 0.17578125, 0.1904296875, 0.205078125, 0.2197265625, 0.234375, 0.2490234375, 0.263671875, 0.2783203125, 0.29296875, 0.3076171875, 0.322265625, 0.3369140625, 0.3515625, 0.3662109375, 0.380859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 6.0, 2.0, 4.0, 9.0, 9.0, 13.0, 18.0, 36.0, 39.0, 60.0, 108.0, 109.0, 149.0, 123.0, 88.0, 78.0, 50.0, 31.0, 16.0, 14.0, 12.0, 10.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010305643081665039, -0.00010038074105978012, -9.770505130290985e-05, -9.502936154603958e-05, -9.235367178916931e-05, -8.967798203229904e-05, -8.700229227542877e-05, -8.43266025185585e-05, -8.165091276168823e-05, -7.897522300481796e-05, -7.629953324794769e-05, -7.362384349107742e-05, -7.094815373420715e-05, -6.827246397733688e-05, -6.559677422046661e-05, -6.292108446359634e-05, -6.0245394706726074e-05, -5.7569704949855804e-05, -5.4894015192985535e-05, -5.2218325436115265e-05, -4.9542635679244995e-05, -4.6866945922374725e-05, -4.4191256165504456e-05, -4.1515566408634186e-05, -3.8839876651763916e-05, -3.6164186894893646e-05, -3.3488497138023376e-05, -3.081280738115311e-05, -2.8137117624282837e-05, -2.5461427867412567e-05, -2.2785738110542297e-05, -2.0110048353672028e-05, -1.7434358596801758e-05, -1.4758668839931488e-05, -1.2082979083061218e-05, -9.407289326190948e-06, -6.731599569320679e-06, -4.055909812450409e-06, -1.3802200555801392e-06, 1.2954697012901306e-06, 3.9711594581604e-06, 6.64684921503067e-06, 9.32253897190094e-06, 1.199822872877121e-05, 1.467391848564148e-05, 1.734960824251175e-05, 2.002529799938202e-05, 2.270098775625229e-05, 2.537667751312256e-05, 2.805236726999283e-05, 3.07280570268631e-05, 3.340374678373337e-05, 3.607943654060364e-05, 3.875512629747391e-05, 4.143081605434418e-05, 4.410650581121445e-05, 4.678219556808472e-05, 4.9457885324954987e-05, 5.2133575081825256e-05, 5.4809264838695526e-05, 5.7484954595565796e-05, 6.0160644352436066e-05, 6.283633410930634e-05, 6.55120238661766e-05, 6.818771362304688e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 10.0, 15.0, 13.0, 26.0, 46.0, 69.0, 124.0, 221.0, 379.0, 956.0, 2553.0, 9792.0, 91500.0, 837106.0, 91716.0, 9581.0, 2611.0, 918.0, 391.0, 216.0, 115.0, 71.0, 50.0, 23.0, 21.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.125, -1.0923919677734375, -1.059783935546875, -1.0271759033203125, -0.99456787109375, -0.9619598388671875, -0.929351806640625, -0.8967437744140625, -0.8641357421875, -0.8315277099609375, -0.798919677734375, -0.7663116455078125, -0.73370361328125, -0.7010955810546875, -0.668487548828125, -0.6358795166015625, -0.603271484375, -0.5706634521484375, -0.538055419921875, -0.5054473876953125, -0.47283935546875, -0.4402313232421875, -0.407623291015625, -0.3750152587890625, -0.3424072265625, -0.3097991943359375, -0.277191162109375, -0.2445831298828125, -0.21197509765625, -0.1793670654296875, -0.146759033203125, -0.1141510009765625, -0.08154296875, -0.0489349365234375, -0.016326904296875, 0.0162811279296875, 0.04888916015625, 0.0814971923828125, 0.114105224609375, 0.1467132568359375, 0.1793212890625, 0.2119293212890625, 0.244537353515625, 0.2771453857421875, 0.30975341796875, 0.3423614501953125, 0.374969482421875, 0.4075775146484375, 0.440185546875, 0.4727935791015625, 0.505401611328125, 0.5380096435546875, 0.57061767578125, 0.6032257080078125, 0.635833740234375, 0.6684417724609375, 0.7010498046875, 0.7336578369140625, 0.766265869140625, 0.7988739013671875, 0.83148193359375, 0.8640899658203125, 0.896697998046875, 0.9293060302734375, 0.9619140625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 12.0, 13.0, 35.0, 77.0, 128.0, 187.0, 192.0, 149.0, 91.0, 53.0, 27.0, 15.0, 9.0, 5.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.6266517639160156, -0.6107254028320312, -0.5947990417480469, -0.5788726806640625, -0.5629463195800781, -0.5470199584960938, -0.5310935974121094, -0.515167236328125, -0.4992408752441406, -0.48331451416015625, -0.4673881530761719, -0.4514617919921875, -0.4355354309082031, -0.41960906982421875, -0.4036827087402344, -0.38775634765625, -0.3718299865722656, -0.35590362548828125, -0.3399772644042969, -0.3240509033203125, -0.3081245422363281, -0.29219818115234375, -0.2762718200683594, -0.260345458984375, -0.24441909790039062, -0.22849273681640625, -0.21256637573242188, -0.1966400146484375, -0.18071365356445312, -0.16478729248046875, -0.14886093139648438, -0.1329345703125, -0.11700820922851562, -0.10108184814453125, -0.08515548706054688, -0.0692291259765625, -0.053302764892578125, -0.03737640380859375, -0.021450042724609375, -0.005523681640625, 0.010402679443359375, 0.02632904052734375, 0.042255401611328125, 0.0581817626953125, 0.07410812377929688, 0.09003448486328125, 0.10596084594726562, 0.12188720703125, 0.13781356811523438, 0.15373992919921875, 0.16966629028320312, 0.1855926513671875, 0.20151901245117188, 0.21744537353515625, 0.23337173461914062, 0.249298095703125, 0.2652244567871094, 0.28115081787109375, 0.2970771789550781, 0.3130035400390625, 0.3289299011230469, 0.34485626220703125, 0.3607826232910156, 0.376708984375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 19.0, 68.0, 250.0, 356.0, 190.0, 79.0, 23.0, 7.0, 9.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.066506385803223, -3.8166847229003906, -3.5668630599975586, -3.3170413970947266, -3.0672199726104736, -2.8173983097076416, -2.5675766468048096, -2.3177552223205566, -2.0679335594177246, -1.8181118965148926, -1.56829035282135, -1.318468689918518, -1.0686471462249756, -0.8188254833221436, -0.5690038204193115, -0.31918227672576904, -0.06936049461364746, 0.180461123585701, 0.43028274178504944, 0.6801043748855591, 0.9299259781837463, 1.1797475814819336, 1.4295692443847656, 1.679390788078308, 1.9292124509811401, 2.1790339946746826, 2.4288556575775146, 2.6786773204803467, 2.9284989833831787, 3.1783204078674316, 3.4281420707702637, 3.6779637336730957, 3.9277853965759277, 4.17760705947876, 4.427428722381592, 4.677250385284424, 4.927072048187256, 5.17689323425293, 5.426714897155762, 5.676536560058594, 5.926358222961426, 6.176179885864258, 6.42600154876709, 6.675823211669922, 6.925644874572754, 7.175466537475586, 7.425288200378418, 7.675109386444092, 7.924931526184082, 8.174753189086914, 8.424574851989746, 8.674396514892578, 8.92421817779541, 9.174039840698242, 9.423861503601074, 9.673683166503906, 9.923503875732422, 10.173325538635254, 10.423147201538086, 10.672968864440918, 10.92279052734375, 11.172612190246582, 11.422433853149414, 11.672255516052246, 11.922077178955078]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 4.0, 1.0, 2.0, 7.0, 8.0, 11.0, 14.0, 21.0, 28.0, 23.0, 38.0, 29.0, 44.0, 40.0, 44.0, 45.0, 53.0, 66.0, 59.0, 59.0, 53.0, 51.0, 51.0, 43.0, 33.0, 38.0, 25.0, 27.0, 15.0, 25.0, 17.0, 8.0, 7.0, 9.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.217620849609375, -2.146178960800171, -2.074737071990967, -2.003295421600342, -1.9318535327911377, -1.8604116439819336, -1.7889697551727295, -1.7175278663635254, -1.6460860967636108, -1.5746442079544067, -1.5032024383544922, -1.431760549545288, -1.360318660736084, -1.2888768911361694, -1.2174350023269653, -1.1459932327270508, -1.0745513439178467, -1.0031094551086426, -0.931667685508728, -0.8602257966995239, -0.7887839674949646, -0.7173421382904053, -0.6459002494812012, -0.5744584202766418, -0.5030165910720825, -0.4315747618675232, -0.3601329028606415, -0.28869104385375977, -0.21724921464920044, -0.1458073854446411, -0.0743655264377594, -0.0029236674308776855, 0.06851816177368164, 0.13996000587940216, 0.21140184998512268, 0.2828437089920044, 0.3542855381965637, 0.42572736740112305, 0.49716922640800476, 0.5686110854148865, 0.6400529146194458, 0.7114947438240051, 0.7829365730285645, 0.8543784618377686, 0.9258202910423279, 0.9972621202468872, 1.0687040090560913, 1.1401457786560059, 1.21158766746521, 1.283029556274414, 1.3544713258743286, 1.4259132146835327, 1.4973549842834473, 1.5687968730926514, 1.6402387619018555, 1.7116806507110596, 1.7831224203109741, 1.8545643091201782, 1.9260060787200928, 1.9974479675292969, 2.068889856338501, 2.140331745147705, 2.21177339553833, 2.283215284347534, 2.3546571731567383]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 7.0, 9.0, 14.0, 22.0, 32.0, 60.0, 82.0, 120.0, 226.0, 474.0, 14112.0, 4177800.0, 1107.0, 139.0, 62.0, 14.0, 7.0, 3.0, 3.0], "bins": [-14.96875, -14.70281982421875, -14.4368896484375, -14.17095947265625, -13.905029296875, -13.63909912109375, -13.3731689453125, -13.10723876953125, -12.84130859375, -12.57537841796875, -12.3094482421875, -12.04351806640625, -11.777587890625, -11.51165771484375, -11.2457275390625, -10.97979736328125, -10.7138671875, -10.44793701171875, -10.1820068359375, -9.91607666015625, -9.650146484375, -9.38421630859375, -9.1182861328125, -8.85235595703125, -8.58642578125, -8.32049560546875, -8.0545654296875, -7.78863525390625, -7.522705078125, -7.25677490234375, -6.9908447265625, -6.72491455078125, -6.458984375, -6.19305419921875, -5.9271240234375, -5.66119384765625, -5.395263671875, -5.12933349609375, -4.8634033203125, -4.59747314453125, -4.33154296875, -4.06561279296875, -3.7996826171875, -3.53375244140625, -3.267822265625, -3.00189208984375, -2.7359619140625, -2.47003173828125, -2.2041015625, -1.93817138671875, -1.6722412109375, -1.40631103515625, -1.140380859375, -0.87445068359375, -0.6085205078125, -0.34259033203125, -0.07666015625, 0.18927001953125, 0.4552001953125, 0.72113037109375, 0.987060546875, 1.25299072265625, 1.5189208984375, 1.78485107421875, 2.05078125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 9.0, 28.0, 63.0, 154.0, 210.0, 235.0, 156.0, 85.0, 50.0, 8.0, 8.0, 1.0, 4.0], "bins": [-0.373046875, -0.3663954734802246, -0.3597440719604492, -0.35309267044067383, -0.34644126892089844, -0.33978986740112305, -0.33313846588134766, -0.32648706436157227, -0.3198356628417969, -0.3131842613220215, -0.3065328598022461, -0.2998814582824707, -0.2932300567626953, -0.2865786552429199, -0.27992725372314453, -0.27327585220336914, -0.26662445068359375, -0.25997304916381836, -0.25332164764404297, -0.24667024612426758, -0.2400188446044922, -0.2333674430847168, -0.2267160415649414, -0.22006464004516602, -0.21341323852539062, -0.20676183700561523, -0.20011043548583984, -0.19345903396606445, -0.18680763244628906, -0.18015623092651367, -0.17350482940673828, -0.1668534278869629, -0.1602020263671875, -0.1535506248474121, -0.14689922332763672, -0.14024782180786133, -0.13359642028808594, -0.12694501876831055, -0.12029361724853516, -0.11364221572875977, -0.10699081420898438, -0.10033941268920898, -0.0936880111694336, -0.0870366096496582, -0.08038520812988281, -0.07373380661010742, -0.06708240509033203, -0.06043100357055664, -0.05377960205078125, -0.04712820053100586, -0.04047679901123047, -0.03382539749145508, -0.027173995971679688, -0.020522594451904297, -0.013871192932128906, -0.007219791412353516, -0.000568389892578125, 0.006083011627197266, 0.012734413146972656, 0.019385814666748047, 0.026037216186523438, 0.03268861770629883, 0.03934001922607422, 0.04599142074584961, 0.052642822265625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 9.0, 6.0, 15.0, 14.0, 28.0, 49.0, 42.0, 64.0, 120.0, 171.0, 272.0, 1264.0, 202102.0, 3986110.0, 2882.0, 483.0, 216.0, 149.0, 95.0, 58.0, 40.0, 36.0, 15.0, 15.0, 9.0, 6.0, 11.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.859375, -8.658538818359375, -8.45770263671875, -8.256866455078125, -8.0560302734375, -7.855194091796875, -7.65435791015625, -7.453521728515625, -7.252685546875, -7.051849365234375, -6.85101318359375, -6.650177001953125, -6.4493408203125, -6.248504638671875, -6.04766845703125, -5.846832275390625, -5.64599609375, -5.445159912109375, -5.24432373046875, -5.043487548828125, -4.8426513671875, -4.641815185546875, -4.44097900390625, -4.240142822265625, -4.039306640625, -3.838470458984375, -3.63763427734375, -3.436798095703125, -3.2359619140625, -3.035125732421875, -2.83428955078125, -2.633453369140625, -2.4326171875, -2.231781005859375, -2.03094482421875, -1.830108642578125, -1.6292724609375, -1.428436279296875, -1.22760009765625, -1.026763916015625, -0.825927734375, -0.625091552734375, -0.42425537109375, -0.223419189453125, -0.0225830078125, 0.178253173828125, 0.37908935546875, 0.579925537109375, 0.78076171875, 0.981597900390625, 1.18243408203125, 1.383270263671875, 1.5841064453125, 1.784942626953125, 1.98577880859375, 2.186614990234375, 2.387451171875, 2.588287353515625, 2.78912353515625, 2.989959716796875, 3.1907958984375, 3.391632080078125, 3.59246826171875, 3.793304443359375, 3.994140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 5.0, 58.0, 217.0, 2496.0, 1014.0, 168.0, 65.0, 23.0, 17.0, 8.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57568359375, -0.556396484375, -0.537109375, -0.517822265625, -0.49853515625, -0.479248046875, -0.4599609375, -0.440673828125, -0.42138671875, -0.402099609375, -0.3828125, -0.363525390625, -0.34423828125, -0.324951171875, -0.3056640625, -0.286376953125, -0.26708984375, -0.247802734375, -0.228515625, -0.209228515625, -0.18994140625, -0.170654296875, -0.1513671875, -0.132080078125, -0.11279296875, -0.093505859375, -0.07421875, -0.054931640625, -0.03564453125, -0.016357421875, 0.0029296875, 0.022216796875, 0.04150390625, 0.060791015625, 0.080078125, 0.099365234375, 0.11865234375, 0.137939453125, 0.1572265625, 0.176513671875, 0.19580078125, 0.215087890625, 0.234375, 0.253662109375, 0.27294921875, 0.292236328125, 0.3115234375, 0.330810546875, 0.35009765625, 0.369384765625, 0.388671875, 0.407958984375, 0.42724609375, 0.446533203125, 0.4658203125, 0.485107421875, 0.50439453125, 0.523681640625, 0.54296875, 0.562255859375, 0.58154296875, 0.600830078125, 0.6201171875, 0.639404296875, 0.65869140625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 12.0, 24.0, 86.0, 252.0, 373.0, 178.0, 42.0, 13.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1140847206115723, -2.952277660369873, -2.790470600128174, -2.6286633014678955, -2.4668562412261963, -2.305049180984497, -2.1432418823242188, -1.9814348220825195, -1.8196277618408203, -1.657820701599121, -1.4960135221481323, -1.3342063426971436, -1.1723992824554443, -1.0105922222137451, -0.8487850427627563, -0.6869778633117676, -0.5251708030700684, -0.36336368322372437, -0.20155656337738037, -0.03974944353103638, 0.12205767631530762, 0.2838647961616516, 0.4456719160079956, 0.6074790954589844, 0.7692861557006836, 0.9310932755470276, 1.0929003953933716, 1.2547075748443604, 1.4165146350860596, 1.5783216953277588, 1.7401288747787476, 1.9019360542297363, 2.0637435913085938, 2.225550651550293, 2.387357711791992, 2.5491650104522705, 2.7109720706939697, 2.872779130935669, 3.0345864295959473, 3.1963934898376465, 3.3582005500793457, 3.520007610321045, 3.681814670562744, 3.8436219692230225, 4.005429267883301, 4.167236328125, 4.329043388366699, 4.490850448608398, 4.652657508850098, 4.814464569091797, 4.976271629333496, 5.138078689575195, 5.2998857498168945, 5.461693286895752, 5.623500347137451, 5.78530740737915, 5.94711446762085, 6.108921527862549, 6.270728588104248, 6.432535648345947, 6.594343185424805, 6.756150245666504, 6.917957305908203, 7.079764366149902, 7.241571426391602]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 17.0, 24.0, 16.0, 31.0, 35.0, 42.0, 54.0, 64.0, 62.0, 75.0, 72.0, 74.0, 64.0, 66.0, 49.0, 51.0, 47.0, 45.0, 26.0, 21.0, 16.0, 12.0, 10.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.380401849746704, -1.3349392414093018, -1.2894765138626099, -1.2440139055252075, -1.1985511779785156, -1.1530885696411133, -1.107625961303711, -1.062163233757019, -1.0167005062103271, -0.97123783826828, -0.9257751703262329, -0.8803125619888306, -0.8348498344421387, -0.7893872261047363, -0.7439245581626892, -0.6984618902206421, -0.6529992818832397, -0.6075366139411926, -0.5620739459991455, -0.5166113376617432, -0.47114863991737366, -0.42568597197532654, -0.3802233338356018, -0.3347606658935547, -0.28929799795150757, -0.24383533000946045, -0.19837267696857452, -0.1529100239276886, -0.10744735598564148, -0.06198468804359436, -0.01652204990386963, 0.02894061803817749, 0.07440328598022461, 0.11986594647169113, 0.16532860696315765, 0.21079126000404358, 0.2562539279460907, 0.3017165958881378, 0.34717923402786255, 0.39264190196990967, 0.4381045699119568, 0.4835672378540039, 0.529029905796051, 0.5744925737380981, 0.6199551820755005, 0.6654179096221924, 0.7108805179595947, 0.7563431859016418, 0.801805853843689, 0.8472685217857361, 0.8927311897277832, 0.9381937980651855, 0.9836565256118774, 1.0291191339492798, 1.0745818614959717, 1.120044469833374, 1.1655070781707764, 1.2109696865081787, 1.2564324140548706, 1.301895022392273, 1.3473577499389648, 1.3928203582763672, 1.4382829666137695, 1.4837456941604614, 1.5292084217071533]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 6.0, 12.0, 4.0, 13.0, 31.0, 26.0, 39.0, 58.0, 105.0, 206.0, 694.0, 4768.0, 166775.0, 854547.0, 18932.0, 1585.0, 359.0, 118.0, 71.0, 51.0, 35.0, 40.0, 29.0, 11.0, 9.0, 4.0, 8.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.8203125, -2.72705078125, -2.6337890625, -2.54052734375, -2.447265625, -2.35400390625, -2.2607421875, -2.16748046875, -2.07421875, -1.98095703125, -1.8876953125, -1.79443359375, -1.701171875, -1.60791015625, -1.5146484375, -1.42138671875, -1.328125, -1.23486328125, -1.1416015625, -1.04833984375, -0.955078125, -0.86181640625, -0.7685546875, -0.67529296875, -0.58203125, -0.48876953125, -0.3955078125, -0.30224609375, -0.208984375, -0.11572265625, -0.0224609375, 0.07080078125, 0.1640625, 0.25732421875, 0.3505859375, 0.44384765625, 0.537109375, 0.63037109375, 0.7236328125, 0.81689453125, 0.91015625, 1.00341796875, 1.0966796875, 1.18994140625, 1.283203125, 1.37646484375, 1.4697265625, 1.56298828125, 1.65625, 1.74951171875, 1.8427734375, 1.93603515625, 2.029296875, 2.12255859375, 2.2158203125, 2.30908203125, 2.40234375, 2.49560546875, 2.5888671875, 2.68212890625, 2.775390625, 2.86865234375, 2.9619140625, 3.05517578125, 3.1484375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 19.0, 66.0, 108.0, 186.0, 205.0, 212.0, 111.0, 65.0, 24.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39599609375, -0.3876628875732422, -0.3793296813964844, -0.37099647521972656, -0.36266326904296875, -0.35433006286621094, -0.3459968566894531, -0.3376636505126953, -0.3293304443359375, -0.3209972381591797, -0.3126640319824219, -0.30433082580566406, -0.29599761962890625, -0.28766441345214844, -0.2793312072753906, -0.2709980010986328, -0.262664794921875, -0.2543315887451172, -0.24599838256835938, -0.23766517639160156, -0.22933197021484375, -0.22099876403808594, -0.21266555786132812, -0.2043323516845703, -0.1959991455078125, -0.1876659393310547, -0.17933273315429688, -0.17099952697753906, -0.16266632080078125, -0.15433311462402344, -0.14599990844726562, -0.1376667022705078, -0.12933349609375, -0.12100028991699219, -0.11266708374023438, -0.10433387756347656, -0.09600067138671875, -0.08766746520996094, -0.07933425903320312, -0.07100105285644531, -0.0626678466796875, -0.05433464050292969, -0.046001434326171875, -0.03766822814941406, -0.02933502197265625, -0.021001815795898438, -0.012668609619140625, -0.0043354034423828125, 0.003997802734375, 0.012331008911132812, 0.020664215087890625, 0.028997421264648438, 0.03733062744140625, 0.04566383361816406, 0.053997039794921875, 0.06233024597167969, 0.0706634521484375, 0.07899665832519531, 0.08732986450195312, 0.09566307067871094, 0.10399627685546875, 0.11232948303222656, 0.12066268920898438, 0.1289958953857422, 0.1373291015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 9.0, 10.0, 6.0, 11.0, 17.0, 20.0, 31.0, 23.0, 47.0, 41.0, 79.0, 141.0, 190.0, 323.0, 527.0, 1109.0, 2520.0, 7633.0, 31246.0, 171401.0, 564230.0, 216419.0, 38059.0, 8921.0, 2869.0, 1172.0, 567.0, 321.0, 213.0, 108.0, 79.0, 58.0, 46.0, 26.0, 21.0, 23.0, 13.0, 16.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.837890625, -0.81292724609375, -0.7879638671875, -0.76300048828125, -0.738037109375, -0.71307373046875, -0.6881103515625, -0.66314697265625, -0.63818359375, -0.61322021484375, -0.5882568359375, -0.56329345703125, -0.538330078125, -0.51336669921875, -0.4884033203125, -0.46343994140625, -0.4384765625, -0.41351318359375, -0.3885498046875, -0.36358642578125, -0.338623046875, -0.31365966796875, -0.2886962890625, -0.26373291015625, -0.23876953125, -0.21380615234375, -0.1888427734375, -0.16387939453125, -0.138916015625, -0.11395263671875, -0.0889892578125, -0.06402587890625, -0.0390625, -0.01409912109375, 0.0108642578125, 0.03582763671875, 0.060791015625, 0.08575439453125, 0.1107177734375, 0.13568115234375, 0.16064453125, 0.18560791015625, 0.2105712890625, 0.23553466796875, 0.260498046875, 0.28546142578125, 0.3104248046875, 0.33538818359375, 0.3603515625, 0.38531494140625, 0.4102783203125, 0.43524169921875, 0.460205078125, 0.48516845703125, 0.5101318359375, 0.53509521484375, 0.56005859375, 0.58502197265625, 0.6099853515625, 0.63494873046875, 0.659912109375, 0.68487548828125, 0.7098388671875, 0.73480224609375, 0.759765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 3.0, 8.0, 8.0, 9.0, 10.0, 12.0, 11.0, 6.0, 28.0, 30.0, 40.0, 32.0, 40.0, 48.0, 63.0, 36.0, 52.0, 38.0, 59.0, 52.0, 49.0, 49.0, 41.0, 32.0, 38.0, 34.0, 26.0, 15.0, 24.0, 22.0, 14.0, 12.0, 9.0, 12.0, 5.0, 4.0, 6.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.4345703125, -0.422210693359375, -0.40985107421875, -0.397491455078125, -0.3851318359375, -0.372772216796875, -0.36041259765625, -0.348052978515625, -0.335693359375, -0.323333740234375, -0.31097412109375, -0.298614501953125, -0.2862548828125, -0.273895263671875, -0.26153564453125, -0.249176025390625, -0.23681640625, -0.224456787109375, -0.21209716796875, -0.199737548828125, -0.1873779296875, -0.175018310546875, -0.16265869140625, -0.150299072265625, -0.137939453125, -0.125579833984375, -0.11322021484375, -0.100860595703125, -0.0885009765625, -0.076141357421875, -0.06378173828125, -0.051422119140625, -0.0390625, -0.026702880859375, -0.01434326171875, -0.001983642578125, 0.0103759765625, 0.022735595703125, 0.03509521484375, 0.047454833984375, 0.059814453125, 0.072174072265625, 0.08453369140625, 0.096893310546875, 0.1092529296875, 0.121612548828125, 0.13397216796875, 0.146331787109375, 0.15869140625, 0.171051025390625, 0.18341064453125, 0.195770263671875, 0.2081298828125, 0.220489501953125, 0.23284912109375, 0.245208740234375, 0.257568359375, 0.269927978515625, 0.28228759765625, 0.294647216796875, 0.3070068359375, 0.319366455078125, 0.33172607421875, 0.344085693359375, 0.3564453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 4.0, 1.0, 5.0, 4.0, 10.0, 10.0, 18.0, 38.0, 33.0, 68.0, 118.0, 237.0, 493.0, 1407.0, 7410.0, 116903.0, 886979.0, 29389.0, 3751.0, 903.0, 341.0, 164.0, 104.0, 63.0, 33.0, 26.0, 14.0, 8.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6416015625, -1.5951080322265625, -1.548614501953125, -1.5021209716796875, -1.45562744140625, -1.4091339111328125, -1.362640380859375, -1.3161468505859375, -1.2696533203125, -1.2231597900390625, -1.176666259765625, -1.1301727294921875, -1.08367919921875, -1.0371856689453125, -0.990692138671875, -0.9441986083984375, -0.897705078125, -0.8512115478515625, -0.804718017578125, -0.7582244873046875, -0.71173095703125, -0.6652374267578125, -0.618743896484375, -0.5722503662109375, -0.5257568359375, -0.4792633056640625, -0.432769775390625, -0.3862762451171875, -0.33978271484375, -0.2932891845703125, -0.246795654296875, -0.2003021240234375, -0.15380859375, -0.1073150634765625, -0.060821533203125, -0.0143280029296875, 0.03216552734375, 0.0786590576171875, 0.125152587890625, 0.1716461181640625, 0.2181396484375, 0.2646331787109375, 0.311126708984375, 0.3576202392578125, 0.40411376953125, 0.4506072998046875, 0.497100830078125, 0.5435943603515625, 0.590087890625, 0.6365814208984375, 0.683074951171875, 0.7295684814453125, 0.77606201171875, 0.8225555419921875, 0.869049072265625, 0.9155426025390625, 0.9620361328125, 1.0085296630859375, 1.055023193359375, 1.1015167236328125, 1.14801025390625, 1.1945037841796875, 1.240997314453125, 1.2874908447265625, 1.333984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 13.0, 15.0, 29.0, 33.0, 44.0, 102.0, 161.0, 191.0, 164.0, 116.0, 59.0, 23.0, 17.0, 11.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012600421905517578, -0.00012107379734516144, -0.0001161433756351471, -0.00011121295392513275, -0.00010628253221511841, -0.00010135211050510406, -9.642168879508972e-05, -9.149126708507538e-05, -8.656084537506104e-05, -8.163042366504669e-05, -7.670000195503235e-05, -7.1769580245018e-05, -6.683915853500366e-05, -6.190873682498932e-05, -5.6978315114974976e-05, -5.204789340496063e-05, -4.711747169494629e-05, -4.2187049984931946e-05, -3.72566282749176e-05, -3.232620656490326e-05, -2.7395784854888916e-05, -2.2465363144874573e-05, -1.753494143486023e-05, -1.2604519724845886e-05, -7.674098014831543e-06, -2.7436763048171997e-06, 2.1867454051971436e-06, 7.117167115211487e-06, 1.204758882522583e-05, 1.6978010535240173e-05, 2.1908432245254517e-05, 2.683885395526886e-05, 3.17692756652832e-05, 3.6699697375297546e-05, 4.163011908531189e-05, 4.656054079532623e-05, 5.1490962505340576e-05, 5.642138421535492e-05, 6.135180592536926e-05, 6.62822276353836e-05, 7.121264934539795e-05, 7.614307105541229e-05, 8.107349276542664e-05, 8.600391447544098e-05, 9.093433618545532e-05, 9.586475789546967e-05, 0.00010079517960548401, 0.00010572560131549835, 0.0001106560230255127, 0.00011558644473552704, 0.00012051686644554138, 0.00012544728815555573, 0.00013037770986557007, 0.0001353081315755844, 0.00014023855328559875, 0.0001451689749956131, 0.00015009939670562744, 0.00015502981841564178, 0.00015996024012565613, 0.00016489066183567047, 0.00016982108354568481, 0.00017475150525569916, 0.0001796819269657135, 0.00018461234867572784, 0.0001895427703857422]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 8.0, 10.0, 23.0, 34.0, 49.0, 68.0, 151.0, 320.0, 806.0, 2764.0, 13564.0, 212739.0, 772559.0, 37612.0, 5510.0, 1411.0, 478.0, 187.0, 91.0, 57.0, 28.0, 18.0, 7.0, 12.0, 14.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.421875, -1.3846893310546875, -1.347503662109375, -1.3103179931640625, -1.27313232421875, -1.2359466552734375, -1.198760986328125, -1.1615753173828125, -1.1243896484375, -1.0872039794921875, -1.050018310546875, -1.0128326416015625, -0.97564697265625, -0.9384613037109375, -0.901275634765625, -0.8640899658203125, -0.826904296875, -0.7897186279296875, -0.752532958984375, -0.7153472900390625, -0.67816162109375, -0.6409759521484375, -0.603790283203125, -0.5666046142578125, -0.5294189453125, -0.4922332763671875, -0.455047607421875, -0.4178619384765625, -0.38067626953125, -0.3434906005859375, -0.306304931640625, -0.2691192626953125, -0.23193359375, -0.1947479248046875, -0.157562255859375, -0.1203765869140625, -0.08319091796875, -0.0460052490234375, -0.008819580078125, 0.0283660888671875, 0.0655517578125, 0.1027374267578125, 0.139923095703125, 0.1771087646484375, 0.21429443359375, 0.2514801025390625, 0.288665771484375, 0.3258514404296875, 0.363037109375, 0.4002227783203125, 0.437408447265625, 0.4745941162109375, 0.51177978515625, 0.5489654541015625, 0.586151123046875, 0.6233367919921875, 0.6605224609375, 0.6977081298828125, 0.734893798828125, 0.7720794677734375, 0.80926513671875, 0.8464508056640625, 0.883636474609375, 0.9208221435546875, 0.9580078125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 9.0, 0.0, 3.0, 2.0, 2.0, 6.0, 6.0, 10.0, 18.0, 46.0, 58.0, 86.0, 149.0, 157.0, 143.0, 107.0, 65.0, 51.0, 29.0, 16.0, 11.0, 7.0, 3.0, 4.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.65234375, -0.6367225646972656, -0.6211013793945312, -0.6054801940917969, -0.5898590087890625, -0.5742378234863281, -0.5586166381835938, -0.5429954528808594, -0.527374267578125, -0.5117530822753906, -0.49613189697265625, -0.4805107116699219, -0.4648895263671875, -0.4492683410644531, -0.43364715576171875, -0.4180259704589844, -0.40240478515625, -0.3867835998535156, -0.37116241455078125, -0.3555412292480469, -0.3399200439453125, -0.3242988586425781, -0.30867767333984375, -0.2930564880371094, -0.277435302734375, -0.2618141174316406, -0.24619293212890625, -0.23057174682617188, -0.2149505615234375, -0.19932937622070312, -0.18370819091796875, -0.16808700561523438, -0.1524658203125, -0.13684463500976562, -0.12122344970703125, -0.10560226440429688, -0.0899810791015625, -0.07435989379882812, -0.05873870849609375, -0.043117523193359375, -0.027496337890625, -0.011875152587890625, 0.00374603271484375, 0.019367218017578125, 0.0349884033203125, 0.050609588623046875, 0.06623077392578125, 0.08185195922851562, 0.09747314453125, 0.11309432983398438, 0.12871551513671875, 0.14433670043945312, 0.1599578857421875, 0.17557907104492188, 0.19120025634765625, 0.20682144165039062, 0.222442626953125, 0.23806381225585938, 0.25368499755859375, 0.2693061828613281, 0.2849273681640625, 0.3005485534667969, 0.31616973876953125, 0.3317909240722656, 0.347412109375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 8.0, 166.0, 696.0, 125.0, 16.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.394973754882812, -12.669388771057129, -11.943802833557129, -11.218217849731445, -10.492631912231445, -9.767046928405762, -9.041461944580078, -8.315876007080078, -7.5902910232543945, -6.864705562591553, -6.139120101928711, -5.413535118103027, -4.6879496574401855, -3.9623641967773438, -3.23677921295166, -2.5111937522888184, -1.7856082916259766, -1.0600229501724243, -0.33443760871887207, 0.3911476135253906, 1.1167330741882324, 1.8423185348510742, 2.567903518676758, 3.2934889793395996, 4.019074440002441, 4.744659900665283, 5.470245361328125, 6.195830345153809, 6.92141580581665, 7.647001266479492, 8.372586250305176, 9.09817123413086, 9.82375717163086, 10.549342155456543, 11.274928092956543, 12.000513076782227, 12.726099014282227, 13.45168399810791, 14.177268981933594, 14.902854919433594, 15.628439903259277, 16.35402488708496, 17.07961082458496, 17.805194854736328, 18.530780792236328, 19.256366729736328, 19.981952667236328, 20.707536697387695, 21.433122634887695, 22.158708572387695, 22.884292602539062, 23.609878540039062, 24.335464477539062, 25.061050415039062, 25.78663444519043, 26.51222038269043, 27.237804412841797, 27.963390350341797, 28.688974380493164, 29.414560317993164, 30.140146255493164, 30.86573028564453, 31.59131622314453, 32.31690216064453, 33.04248809814453]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 16.0, 20.0, 17.0, 28.0, 34.0, 45.0, 58.0, 57.0, 59.0, 65.0, 76.0, 87.0, 76.0, 74.0, 53.0, 49.0, 48.0, 35.0, 33.0, 23.0, 16.0, 11.0, 5.0, 9.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.332628011703491, -3.1939985752105713, -3.0553689002990723, -2.9167394638061523, -2.7781097888946533, -2.6394803524017334, -2.5008506774902344, -2.3622212409973145, -2.2235918045043945, -2.0849623680114746, -1.9463326930999756, -1.8077032566070557, -1.6690735816955566, -1.5304441452026367, -1.3918145895004272, -1.2531850337982178, -1.1145553588867188, -0.9759258031845093, -0.8372962474822998, -0.6986667513847351, -0.5600371956825256, -0.42140763998031616, -0.28277814388275146, -0.144148588180542, -0.0055190324783325195, 0.13311050832271576, 0.27174004912376404, 0.4103695750236511, 0.5489991307258606, 0.6876286864280701, 0.8262581825256348, 0.9648877382278442, 1.1035170555114746, 1.242146611213684, 1.3807761669158936, 1.5194056034088135, 1.6580352783203125, 1.7966647148132324, 1.935294270515442, 2.0739238262176514, 2.2125535011291504, 2.3511829376220703, 2.4898126125335693, 2.6284420490264893, 2.7670717239379883, 2.905701160430908, 3.044330596923828, 3.182960271835327, 3.321589708328247, 3.460219144821167, 3.598848819732666, 3.737478256225586, 3.876107931137085, 4.014737606048584, 4.153367042541504, 4.291996479034424, 4.430625915527344, 4.569255352020264, 4.707884788513184, 4.846514701843262, 4.985144138336182, 5.123773574829102, 5.2624030113220215, 5.401032447814941, 5.5396623611450195]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 9.0, 12.0, 12.0, 13.0, 22.0, 20.0, 20.0, 20.0, 40.0, 30.0, 31.0, 43.0, 66.0, 83.0, 130.0, 291.0, 831.0, 3318.0, 26825.0, 3333543.0, 804908.0, 20220.0, 2728.0, 622.0, 219.0, 102.0, 50.0, 20.0, 13.0, 11.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.46875, -3.38189697265625, -3.2950439453125, -3.20819091796875, -3.121337890625, -3.03448486328125, -2.9476318359375, -2.86077880859375, -2.77392578125, -2.68707275390625, -2.6002197265625, -2.51336669921875, -2.426513671875, -2.33966064453125, -2.2528076171875, -2.16595458984375, -2.0791015625, -1.99224853515625, -1.9053955078125, -1.81854248046875, -1.731689453125, -1.64483642578125, -1.5579833984375, -1.47113037109375, -1.38427734375, -1.29742431640625, -1.2105712890625, -1.12371826171875, -1.036865234375, -0.95001220703125, -0.8631591796875, -0.77630615234375, -0.689453125, -0.60260009765625, -0.5157470703125, -0.42889404296875, -0.342041015625, -0.25518798828125, -0.1683349609375, -0.08148193359375, 0.00537109375, 0.09222412109375, 0.1790771484375, 0.26593017578125, 0.352783203125, 0.43963623046875, 0.5264892578125, 0.61334228515625, 0.7001953125, 0.78704833984375, 0.8739013671875, 0.96075439453125, 1.047607421875, 1.13446044921875, 1.2213134765625, 1.30816650390625, 1.39501953125, 1.48187255859375, 1.5687255859375, 1.65557861328125, 1.742431640625, 1.82928466796875, 1.9161376953125, 2.00299072265625, 2.08984375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 9.0, 18.0, 38.0, 51.0, 77.0, 118.0, 153.0, 136.0, 122.0, 111.0, 77.0, 42.0, 23.0, 16.0, 12.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.33642578125, -0.32973575592041016, -0.3230457305908203, -0.31635570526123047, -0.3096656799316406, -0.3029756546020508, -0.29628562927246094, -0.2895956039428711, -0.28290557861328125, -0.2762155532836914, -0.26952552795410156, -0.2628355026245117, -0.2561454772949219, -0.24945545196533203, -0.2427654266357422, -0.23607540130615234, -0.2293853759765625, -0.22269535064697266, -0.2160053253173828, -0.20931529998779297, -0.20262527465820312, -0.19593524932861328, -0.18924522399902344, -0.1825551986694336, -0.17586517333984375, -0.1691751480102539, -0.16248512268066406, -0.15579509735107422, -0.14910507202148438, -0.14241504669189453, -0.1357250213623047, -0.12903499603271484, -0.122344970703125, -0.11565494537353516, -0.10896492004394531, -0.10227489471435547, -0.09558486938476562, -0.08889484405517578, -0.08220481872558594, -0.0755147933959961, -0.06882476806640625, -0.062134742736816406, -0.05544471740722656, -0.04875469207763672, -0.042064666748046875, -0.03537464141845703, -0.028684616088867188, -0.021994590759277344, -0.0153045654296875, -0.008614540100097656, -0.0019245147705078125, 0.004765510559082031, 0.011455535888671875, 0.01814556121826172, 0.024835586547851562, 0.031525611877441406, 0.03821563720703125, 0.044905662536621094, 0.05159568786621094, 0.05828571319580078, 0.06497573852539062, 0.07166576385498047, 0.07835578918457031, 0.08504581451416016, 0.09173583984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 16.0, 20.0, 17.0, 28.0, 70.0, 100.0, 212.0, 599.0, 2686.0, 4050738.0, 137639.0, 1523.0, 335.0, 124.0, 69.0, 40.0, 28.0, 18.0, 8.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.828125, -13.54522705078125, -13.2623291015625, -12.97943115234375, -12.696533203125, -12.41363525390625, -12.1307373046875, -11.84783935546875, -11.56494140625, -11.28204345703125, -10.9991455078125, -10.71624755859375, -10.433349609375, -10.15045166015625, -9.8675537109375, -9.58465576171875, -9.3017578125, -9.01885986328125, -8.7359619140625, -8.45306396484375, -8.170166015625, -7.88726806640625, -7.6043701171875, -7.32147216796875, -7.03857421875, -6.75567626953125, -6.4727783203125, -6.18988037109375, -5.906982421875, -5.62408447265625, -5.3411865234375, -5.05828857421875, -4.775390625, -4.49249267578125, -4.2095947265625, -3.92669677734375, -3.643798828125, -3.36090087890625, -3.0780029296875, -2.79510498046875, -2.51220703125, -2.22930908203125, -1.9464111328125, -1.66351318359375, -1.380615234375, -1.09771728515625, -0.8148193359375, -0.53192138671875, -0.2490234375, 0.03387451171875, 0.3167724609375, 0.59967041015625, 0.882568359375, 1.16546630859375, 1.4483642578125, 1.73126220703125, 2.01416015625, 2.29705810546875, 2.5799560546875, 2.86285400390625, 3.145751953125, 3.42864990234375, 3.7115478515625, 3.99444580078125, 4.27734375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 10.0, 28.0, 65.0, 268.0, 2330.0, 1071.0, 191.0, 71.0, 24.0, 8.0, 7.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2294921875, -1.2062339782714844, -1.1829757690429688, -1.1597175598144531, -1.1364593505859375, -1.1132011413574219, -1.0899429321289062, -1.0666847229003906, -1.043426513671875, -1.0201683044433594, -0.9969100952148438, -0.9736518859863281, -0.9503936767578125, -0.9271354675292969, -0.9038772583007812, -0.8806190490722656, -0.85736083984375, -0.8341026306152344, -0.8108444213867188, -0.7875862121582031, -0.7643280029296875, -0.7410697937011719, -0.7178115844726562, -0.6945533752441406, -0.671295166015625, -0.6480369567871094, -0.6247787475585938, -0.6015205383300781, -0.5782623291015625, -0.5550041198730469, -0.5317459106445312, -0.5084877014160156, -0.4852294921875, -0.4619712829589844, -0.43871307373046875, -0.4154548645019531, -0.3921966552734375, -0.3689384460449219, -0.34568023681640625, -0.3224220275878906, -0.299163818359375, -0.2759056091308594, -0.25264739990234375, -0.22938919067382812, -0.2061309814453125, -0.18287277221679688, -0.15961456298828125, -0.13635635375976562, -0.11309814453125, -0.08983993530273438, -0.06658172607421875, -0.043323516845703125, -0.0200653076171875, 0.003192901611328125, 0.02645111083984375, 0.049709320068359375, 0.072967529296875, 0.09622573852539062, 0.11948394775390625, 0.14274215698242188, 0.1660003662109375, 0.18925857543945312, 0.21251678466796875, 0.23577499389648438, 0.259033203125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 13.0, 28.0, 74.0, 208.0, 366.0, 196.0, 58.0, 28.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.702433586120605, -8.515105247497559, -8.327775955200195, -8.140447616577148, -7.953118324279785, -7.765789985656738, -7.578461170196533, -7.391132354736328, -7.203803539276123, -7.016474723815918, -6.829145908355713, -6.641817092895508, -6.454488754272461, -6.267159938812256, -6.079831123352051, -5.892502307891846, -5.705173492431641, -5.5178446769714355, -5.3305158615112305, -5.143187046051025, -4.95585823059082, -4.768529891967773, -4.581201076507568, -4.393872261047363, -4.206543445587158, -4.019214630126953, -3.831885814666748, -3.644557237625122, -3.457228422164917, -3.269899606704712, -3.082571029663086, -2.895242214202881, -2.707913637161255, -2.52058482170105, -2.333256244659424, -2.1459274291992188, -1.9585986137390137, -1.7712697982788086, -1.583941102027893, -1.3966124057769775, -1.2092835903167725, -1.0219547748565674, -0.8346260786056519, -0.6472973227500916, -0.45996856689453125, -0.27263981103897095, -0.08531105518341064, 0.10201764106750488, 0.28934645652770996, 0.47667521238327026, 0.6640039682388306, 0.8513327240943909, 1.0386614799499512, 1.2259902954101562, 1.4133189916610718, 1.6006476879119873, 1.7879765033721924, 1.9753053188323975, 2.1626338958740234, 2.3499627113342285, 2.5372915267944336, 2.7246203422546387, 2.9119491577148438, 3.0992777347564697, 3.286606550216675]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 11.0, 26.0, 33.0, 47.0, 54.0, 87.0, 95.0, 101.0, 102.0, 98.0, 96.0, 73.0, 60.0, 39.0, 32.0, 11.0, 8.0, 11.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0964064598083496, -3.000277519226074, -2.9041483402252197, -2.8080193996429443, -2.71189022064209, -2.6157612800598145, -2.519632339477539, -2.4235033988952637, -2.327374219894409, -2.231245279312134, -2.1351161003112793, -2.038987159729004, -1.942858099937439, -1.846729040145874, -1.7506000995635986, -1.6544710397720337, -1.5583419799804688, -1.4622129201889038, -1.3660838603973389, -1.2699549198150635, -1.1738258600234985, -1.0776968002319336, -0.9815678000450134, -0.8854387998580933, -0.7893097400665283, -0.6931806802749634, -0.5970516800880432, -0.500922679901123, -0.4047936201095581, -0.30866459012031555, -0.212535560131073, -0.11640655994415283, -0.020277738571166992, 0.07585129141807556, 0.17198032140731812, 0.26810935139656067, 0.3642383813858032, 0.4603674113750458, 0.5564964413642883, 0.6526254415512085, 0.7487545013427734, 0.8448835611343384, 0.9410125613212585, 1.0371415615081787, 1.1332706212997437, 1.2293996810913086, 1.325528621673584, 1.421657681465149, 1.5177867412567139, 1.6139158010482788, 1.7100448608398438, 1.8061738014221191, 1.902302861213684, 1.998431921005249, 2.0945608615875244, 2.190690040588379, 2.2868189811706543, 2.3829479217529297, 2.479077100753784, 2.5752060413360596, 2.671335220336914, 2.7674641609191895, 2.863593101501465, 2.9597220420837402, 3.0558512210845947]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 11.0, 6.0, 7.0, 14.0, 28.0, 33.0, 38.0, 76.0, 106.0, 187.0, 356.0, 872.0, 2785.0, 15452.0, 193535.0, 761857.0, 62793.0, 7264.0, 1764.0, 621.0, 282.0, 158.0, 99.0, 65.0, 44.0, 24.0, 18.0, 14.0, 11.0, 11.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.54296875, -2.468841552734375, -2.39471435546875, -2.320587158203125, -2.2464599609375, -2.172332763671875, -2.09820556640625, -2.024078369140625, -1.949951171875, -1.875823974609375, -1.80169677734375, -1.727569580078125, -1.6534423828125, -1.579315185546875, -1.50518798828125, -1.431060791015625, -1.35693359375, -1.282806396484375, -1.20867919921875, -1.134552001953125, -1.0604248046875, -0.986297607421875, -0.91217041015625, -0.838043212890625, -0.763916015625, -0.689788818359375, -0.61566162109375, -0.541534423828125, -0.4674072265625, -0.393280029296875, -0.31915283203125, -0.245025634765625, -0.1708984375, -0.096771240234375, -0.02264404296875, 0.051483154296875, 0.1256103515625, 0.199737548828125, 0.27386474609375, 0.347991943359375, 0.422119140625, 0.496246337890625, 0.57037353515625, 0.644500732421875, 0.7186279296875, 0.792755126953125, 0.86688232421875, 0.941009521484375, 1.01513671875, 1.089263916015625, 1.16339111328125, 1.237518310546875, 1.3116455078125, 1.385772705078125, 1.45989990234375, 1.534027099609375, 1.608154296875, 1.682281494140625, 1.75640869140625, 1.830535888671875, 1.9046630859375, 1.978790283203125, 2.05291748046875, 2.127044677734375, 2.201171875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 10.0, 16.0, 30.0, 46.0, 73.0, 87.0, 96.0, 136.0, 130.0, 105.0, 83.0, 71.0, 43.0, 28.0, 21.0, 10.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.38037109375, -0.3719196319580078, -0.3634681701660156, -0.35501670837402344, -0.34656524658203125, -0.33811378479003906, -0.3296623229980469, -0.3212108612060547, -0.3127593994140625, -0.3043079376220703, -0.2958564758300781, -0.28740501403808594, -0.27895355224609375, -0.27050209045410156, -0.2620506286621094, -0.2535991668701172, -0.245147705078125, -0.2366962432861328, -0.22824478149414062, -0.21979331970214844, -0.21134185791015625, -0.20289039611816406, -0.19443893432617188, -0.1859874725341797, -0.1775360107421875, -0.1690845489501953, -0.16063308715820312, -0.15218162536621094, -0.14373016357421875, -0.13527870178222656, -0.12682723999023438, -0.11837577819824219, -0.10992431640625, -0.10147285461425781, -0.09302139282226562, -0.08456993103027344, -0.07611846923828125, -0.06766700744628906, -0.059215545654296875, -0.05076408386230469, -0.0423126220703125, -0.03386116027832031, -0.025409698486328125, -0.016958236694335938, -0.00850677490234375, -5.53131103515625e-05, 0.008396148681640625, 0.016847610473632812, 0.025299072265625, 0.03375053405761719, 0.042201995849609375, 0.05065345764160156, 0.05910491943359375, 0.06755638122558594, 0.07600784301757812, 0.08445930480957031, 0.0929107666015625, 0.10136222839355469, 0.10981369018554688, 0.11826515197753906, 0.12671661376953125, 0.13516807556152344, 0.14361953735351562, 0.1520709991455078, 0.1605224609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 6.0, 6.0, 10.0, 17.0, 19.0, 23.0, 47.0, 61.0, 103.0, 194.0, 325.0, 692.0, 1595.0, 3844.0, 11491.0, 50529.0, 337455.0, 523778.0, 91606.0, 17647.0, 5247.0, 1954.0, 845.0, 403.0, 225.0, 143.0, 84.0, 57.0, 26.0, 34.0, 19.0, 14.0, 12.0, 4.0, 10.0, 4.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1435546875, -1.10906982421875, -1.0745849609375, -1.04010009765625, -1.005615234375, -0.97113037109375, -0.9366455078125, -0.90216064453125, -0.86767578125, -0.83319091796875, -0.7987060546875, -0.76422119140625, -0.729736328125, -0.69525146484375, -0.6607666015625, -0.62628173828125, -0.591796875, -0.55731201171875, -0.5228271484375, -0.48834228515625, -0.453857421875, -0.41937255859375, -0.3848876953125, -0.35040283203125, -0.31591796875, -0.28143310546875, -0.2469482421875, -0.21246337890625, -0.177978515625, -0.14349365234375, -0.1090087890625, -0.07452392578125, -0.0400390625, -0.00555419921875, 0.0289306640625, 0.06341552734375, 0.097900390625, 0.13238525390625, 0.1668701171875, 0.20135498046875, 0.23583984375, 0.27032470703125, 0.3048095703125, 0.33929443359375, 0.373779296875, 0.40826416015625, 0.4427490234375, 0.47723388671875, 0.51171875, 0.54620361328125, 0.5806884765625, 0.61517333984375, 0.649658203125, 0.68414306640625, 0.7186279296875, 0.75311279296875, 0.78759765625, 0.82208251953125, 0.8565673828125, 0.89105224609375, 0.925537109375, 0.96002197265625, 0.9945068359375, 1.02899169921875, 1.0634765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 3.0, 9.0, 13.0, 12.0, 15.0, 16.0, 14.0, 19.0, 30.0, 43.0, 37.0, 34.0, 49.0, 46.0, 54.0, 40.0, 48.0, 69.0, 48.0, 52.0, 43.0, 38.0, 36.0, 40.0, 34.0, 28.0, 19.0, 22.0, 14.0, 16.0, 10.0, 15.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.60498046875, -0.5870590209960938, -0.5691375732421875, -0.5512161254882812, -0.533294677734375, -0.5153732299804688, -0.4974517822265625, -0.47953033447265625, -0.46160888671875, -0.44368743896484375, -0.4257659912109375, -0.40784454345703125, -0.389923095703125, -0.37200164794921875, -0.3540802001953125, -0.33615875244140625, -0.3182373046875, -0.30031585693359375, -0.2823944091796875, -0.26447296142578125, -0.246551513671875, -0.22863006591796875, -0.2107086181640625, -0.19278717041015625, -0.17486572265625, -0.15694427490234375, -0.1390228271484375, -0.12110137939453125, -0.103179931640625, -0.08525848388671875, -0.0673370361328125, -0.04941558837890625, -0.031494140625, -0.01357269287109375, 0.0043487548828125, 0.02227020263671875, 0.040191650390625, 0.05811309814453125, 0.0760345458984375, 0.09395599365234375, 0.11187744140625, 0.12979888916015625, 0.1477203369140625, 0.16564178466796875, 0.183563232421875, 0.20148468017578125, 0.2194061279296875, 0.23732757568359375, 0.2552490234375, 0.27317047119140625, 0.2910919189453125, 0.30901336669921875, 0.326934814453125, 0.34485626220703125, 0.3627777099609375, 0.38069915771484375, 0.39862060546875, 0.41654205322265625, 0.4344635009765625, 0.45238494873046875, 0.470306396484375, 0.48822784423828125, 0.5061492919921875, 0.5240707397460938, 0.5419921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 10.0, 7.0, 15.0, 14.0, 19.0, 40.0, 50.0, 111.0, 193.0, 404.0, 772.0, 1910.0, 5636.0, 25856.0, 371294.0, 590955.0, 39818.0, 7196.0, 2318.0, 966.0, 447.0, 189.0, 119.0, 71.0, 50.0, 29.0, 16.0, 21.0, 9.0, 5.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8662109375, -0.8400421142578125, -0.813873291015625, -0.7877044677734375, -0.76153564453125, -0.7353668212890625, -0.709197998046875, -0.6830291748046875, -0.6568603515625, -0.6306915283203125, -0.604522705078125, -0.5783538818359375, -0.55218505859375, -0.5260162353515625, -0.499847412109375, -0.4736785888671875, -0.447509765625, -0.4213409423828125, -0.395172119140625, -0.3690032958984375, -0.34283447265625, -0.3166656494140625, -0.290496826171875, -0.2643280029296875, -0.2381591796875, -0.2119903564453125, -0.185821533203125, -0.1596527099609375, -0.13348388671875, -0.1073150634765625, -0.081146240234375, -0.0549774169921875, -0.02880859375, -0.0026397705078125, 0.023529052734375, 0.0496978759765625, 0.07586669921875, 0.1020355224609375, 0.128204345703125, 0.1543731689453125, 0.1805419921875, 0.2067108154296875, 0.232879638671875, 0.2590484619140625, 0.28521728515625, 0.3113861083984375, 0.337554931640625, 0.3637237548828125, 0.389892578125, 0.4160614013671875, 0.442230224609375, 0.4683990478515625, 0.49456787109375, 0.5207366943359375, 0.546905517578125, 0.5730743408203125, 0.5992431640625, 0.6254119873046875, 0.651580810546875, 0.6777496337890625, 0.70391845703125, 0.7300872802734375, 0.756256103515625, 0.7824249267578125, 0.80859375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 13.0, 19.0, 24.0, 28.0, 57.0, 73.0, 97.0, 120.0, 130.0, 124.0, 82.0, 57.0, 50.0, 30.0, 19.0, 14.0, 10.0, 9.0, 9.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00012421607971191406, -0.00012098532170057297, -0.00011775456368923187, -0.00011452380567789078, -0.00011129304766654968, -0.00010806228965520859, -0.00010483153164386749, -0.0001016007736325264, -9.83700156211853e-05, -9.513925760984421e-05, -9.190849959850311e-05, -8.867774158716202e-05, -8.544698357582092e-05, -8.221622556447983e-05, -7.898546755313873e-05, -7.575470954179764e-05, -7.252395153045654e-05, -6.929319351911545e-05, -6.606243550777435e-05, -6.283167749643326e-05, -5.960091948509216e-05, -5.637016147375107e-05, -5.313940346240997e-05, -4.990864545106888e-05, -4.667788743972778e-05, -4.344712942838669e-05, -4.021637141704559e-05, -3.69856134057045e-05, -3.37548553943634e-05, -3.052409738302231e-05, -2.7293339371681213e-05, -2.406258136034012e-05, -2.0831823348999023e-05, -1.760106533765793e-05, -1.4370307326316833e-05, -1.1139549314975739e-05, -7.908791303634644e-06, -4.678033292293549e-06, -1.4472752809524536e-06, 1.7834827303886414e-06, 5.014240741729736e-06, 8.244998753070831e-06, 1.1475756764411926e-05, 1.4706514775753021e-05, 1.7937272787094116e-05, 2.116803079843521e-05, 2.4398788809776306e-05, 2.76295468211174e-05, 3.0860304832458496e-05, 3.409106284379959e-05, 3.7321820855140686e-05, 4.055257886648178e-05, 4.3783336877822876e-05, 4.701409488916397e-05, 5.0244852900505066e-05, 5.347561091184616e-05, 5.6706368923187256e-05, 5.993712693452835e-05, 6.316788494586945e-05, 6.639864295721054e-05, 6.962940096855164e-05, 7.286015897989273e-05, 7.609091699123383e-05, 7.932167500257492e-05, 8.255243301391602e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 10.0, 7.0, 22.0, 23.0, 59.0, 72.0, 126.0, 258.0, 509.0, 1002.0, 2267.0, 5979.0, 20589.0, 217102.0, 721806.0, 60927.0, 10816.0, 3737.0, 1551.0, 781.0, 384.0, 177.0, 108.0, 72.0, 43.0, 33.0, 20.0, 13.0, 8.0, 7.0, 4.0, 5.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.896484375, -0.8710708618164062, -0.8456573486328125, -0.8202438354492188, -0.794830322265625, -0.7694168090820312, -0.7440032958984375, -0.7185897827148438, -0.69317626953125, -0.6677627563476562, -0.6423492431640625, -0.6169357299804688, -0.591522216796875, -0.5661087036132812, -0.5406951904296875, -0.5152816772460938, -0.4898681640625, -0.46445465087890625, -0.4390411376953125, -0.41362762451171875, -0.388214111328125, -0.36280059814453125, -0.3373870849609375, -0.31197357177734375, -0.28656005859375, -0.26114654541015625, -0.2357330322265625, -0.21031951904296875, -0.184906005859375, -0.15949249267578125, -0.1340789794921875, -0.10866546630859375, -0.083251953125, -0.05783843994140625, -0.0324249267578125, -0.00701141357421875, 0.018402099609375, 0.04381561279296875, 0.0692291259765625, 0.09464263916015625, 0.12005615234375, 0.14546966552734375, 0.1708831787109375, 0.19629669189453125, 0.221710205078125, 0.24712371826171875, 0.2725372314453125, 0.29795074462890625, 0.3233642578125, 0.34877777099609375, 0.3741912841796875, 0.39960479736328125, 0.425018310546875, 0.45043182373046875, 0.4758453369140625, 0.5012588500976562, 0.52667236328125, 0.5520858764648438, 0.5774993896484375, 0.6029129028320312, 0.628326416015625, 0.6537399291992188, 0.6791534423828125, 0.7045669555664062, 0.72998046875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 12.0, 7.0, 12.0, 12.0, 36.0, 66.0, 73.0, 125.0, 142.0, 158.0, 124.0, 87.0, 54.0, 37.0, 17.0, 11.0, 11.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.6201171875, -0.6034126281738281, -0.5867080688476562, -0.5700035095214844, -0.5532989501953125, -0.5365943908691406, -0.5198898315429688, -0.5031852722167969, -0.486480712890625, -0.4697761535644531, -0.45307159423828125, -0.4363670349121094, -0.4196624755859375, -0.4029579162597656, -0.38625335693359375, -0.3695487976074219, -0.35284423828125, -0.3361396789550781, -0.31943511962890625, -0.3027305603027344, -0.2860260009765625, -0.2693214416503906, -0.25261688232421875, -0.23591232299804688, -0.219207763671875, -0.20250320434570312, -0.18579864501953125, -0.16909408569335938, -0.1523895263671875, -0.13568496704101562, -0.11898040771484375, -0.10227584838867188, -0.0855712890625, -0.06886672973632812, -0.05216217041015625, -0.035457611083984375, -0.0187530517578125, -0.002048492431640625, 0.01465606689453125, 0.031360626220703125, 0.048065185546875, 0.06476974487304688, 0.08147430419921875, 0.09817886352539062, 0.1148834228515625, 0.13158798217773438, 0.14829254150390625, 0.16499710083007812, 0.18170166015625, 0.19840621948242188, 0.21511077880859375, 0.23181533813476562, 0.2485198974609375, 0.2652244567871094, 0.28192901611328125, 0.2986335754394531, 0.315338134765625, 0.3320426940917969, 0.34874725341796875, 0.3654518127441406, 0.3821563720703125, 0.3988609313964844, 0.41556549072265625, 0.4322700500488281, 0.448974609375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 73.0, 343.0, 463.0, 103.0, 17.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.177642822265625, -25.555749893188477, -24.93385887145996, -24.311965942382812, -23.690074920654297, -23.06818199157715, -22.4462890625, -21.824398040771484, -21.202505111694336, -20.580612182617188, -19.958721160888672, -19.336828231811523, -18.714935302734375, -18.09304428100586, -17.47115135192871, -16.849258422851562, -16.227367401123047, -15.605475425720215, -14.983583450317383, -14.361690521240234, -13.739798545837402, -13.11790657043457, -12.496013641357422, -11.87412166595459, -11.252229690551758, -10.630337715148926, -10.008445739746094, -9.386552810668945, -8.764660835266113, -8.142768859863281, -7.520876407623291, -6.898983955383301, -6.277091026306152, -5.65519905090332, -5.03330659866333, -4.41141414642334, -3.789522171020508, -3.1676299571990967, -2.5457377433776855, -1.9238452911376953, -1.3019533157348633, -0.6800611019134521, -0.058168888092041016, 0.5637233257293701, 1.1856155395507812, 1.8075077533721924, 2.4293999671936035, 3.0512924194335938, 3.673184394836426, 4.295076370239258, 4.916968822479248, 5.538861274719238, 6.16075325012207, 6.782645225524902, 7.404537677764893, 8.026430130004883, 8.648322105407715, 9.270214080810547, 9.892107009887695, 10.513998985290527, 11.13589096069336, 11.757782936096191, 12.379674911499023, 13.001567840576172, 13.623459815979004]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 9.0, 10.0, 14.0, 15.0, 26.0, 13.0, 28.0, 23.0, 30.0, 34.0, 36.0, 50.0, 50.0, 57.0, 55.0, 38.0, 50.0, 61.0, 41.0, 46.0, 43.0, 29.0, 37.0, 27.0, 22.0, 28.0, 21.0, 15.0, 14.0, 21.0, 11.0, 11.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1218209266662598, -3.0180411338806152, -2.91426157951355, -2.8104817867279053, -2.70670223236084, -2.6029224395751953, -2.49914288520813, -2.3953630924224854, -2.29158353805542, -2.1878037452697754, -2.08402419090271, -1.980244517326355, -1.87646484375, -1.7726850509643555, -1.66890549659729, -1.5651257038116455, -1.4613460302352905, -1.3575663566589355, -1.2537866830825806, -1.1500070095062256, -1.0462273359298706, -0.9424476027488708, -0.8386679291725159, -0.7348882555961609, -0.6311085820198059, -0.5273289084434509, -0.42354923486709595, -0.3197695314884186, -0.2159898579120636, -0.11221015453338623, -0.00843048095703125, 0.09534919261932373, 0.1991288661956787, 0.3029085397720337, 0.40668821334838867, 0.5104678869247437, 0.6142475605010986, 0.7180272936820984, 0.8218069672584534, 0.9255866408348083, 1.0293662548065186, 1.1331459283828735, 1.2369256019592285, 1.3407052755355835, 1.4444849491119385, 1.548264741897583, 1.6520442962646484, 1.755824089050293, 1.859603762626648, 1.963383436203003, 2.0671632289886475, 2.170942783355713, 2.2747225761413574, 2.378502130508423, 2.4822819232940674, 2.586061477661133, 2.6898412704467773, 2.793621063232422, 2.8974006175994873, 3.001180410385132, 3.1049599647521973, 3.208739757537842, 3.3125193119049072, 3.4162991046905518, 3.520078659057617]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 4.0, 7.0, 13.0, 8.0, 12.0, 17.0, 16.0, 23.0, 31.0, 33.0, 48.0, 71.0, 85.0, 126.0, 191.0, 301.0, 586.0, 1353.0, 4204.0, 18399.0, 178563.0, 3909916.0, 64907.0, 10893.0, 2754.0, 924.0, 415.0, 171.0, 109.0, 38.0, 21.0, 16.0, 7.0, 4.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.974609375, -2.89697265625, -2.8193359375, -2.74169921875, -2.6640625, -2.58642578125, -2.5087890625, -2.43115234375, -2.353515625, -2.27587890625, -2.1982421875, -2.12060546875, -2.04296875, -1.96533203125, -1.8876953125, -1.81005859375, -1.732421875, -1.65478515625, -1.5771484375, -1.49951171875, -1.421875, -1.34423828125, -1.2666015625, -1.18896484375, -1.111328125, -1.03369140625, -0.9560546875, -0.87841796875, -0.80078125, -0.72314453125, -0.6455078125, -0.56787109375, -0.490234375, -0.41259765625, -0.3349609375, -0.25732421875, -0.1796875, -0.10205078125, -0.0244140625, 0.05322265625, 0.130859375, 0.20849609375, 0.2861328125, 0.36376953125, 0.44140625, 0.51904296875, 0.5966796875, 0.67431640625, 0.751953125, 0.82958984375, 0.9072265625, 0.98486328125, 1.0625, 1.14013671875, 1.2177734375, 1.29541015625, 1.373046875, 1.45068359375, 1.5283203125, 1.60595703125, 1.68359375, 1.76123046875, 1.8388671875, 1.91650390625, 1.994140625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 9.0, 13.0, 20.0, 36.0, 46.0, 73.0, 102.0, 94.0, 135.0, 120.0, 102.0, 87.0, 65.0, 36.0, 30.0, 13.0, 10.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.402099609375, -0.3930950164794922, -0.3840904235839844, -0.37508583068847656, -0.36608123779296875, -0.35707664489746094, -0.3480720520019531, -0.3390674591064453, -0.3300628662109375, -0.3210582733154297, -0.3120536804199219, -0.30304908752441406, -0.29404449462890625, -0.28503990173339844, -0.2760353088378906, -0.2670307159423828, -0.258026123046875, -0.2490215301513672, -0.24001693725585938, -0.23101234436035156, -0.22200775146484375, -0.21300315856933594, -0.20399856567382812, -0.1949939727783203, -0.1859893798828125, -0.1769847869873047, -0.16798019409179688, -0.15897560119628906, -0.14997100830078125, -0.14096641540527344, -0.13196182250976562, -0.12295722961425781, -0.11395263671875, -0.10494804382324219, -0.09594345092773438, -0.08693885803222656, -0.07793426513671875, -0.06892967224121094, -0.059925079345703125, -0.05092048645019531, -0.0419158935546875, -0.03291130065917969, -0.023906707763671875, -0.014902114868164062, -0.00589752197265625, 0.0031070709228515625, 0.012111663818359375, 0.021116256713867188, 0.030120849609375, 0.03912544250488281, 0.048130035400390625, 0.05713462829589844, 0.06613922119140625, 0.07514381408691406, 0.08414840698242188, 0.09315299987792969, 0.1021575927734375, 0.11116218566894531, 0.12016677856445312, 0.12917137145996094, 0.13817596435546875, 0.14718055725097656, 0.15618515014648438, 0.1651897430419922, 0.1741943359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 21.0, 12.0, 23.0, 40.0, 52.0, 68.0, 124.0, 184.0, 401.0, 2177.0, 125713.0, 4058237.0, 6094.0, 636.0, 203.0, 106.0, 62.0, 38.0, 34.0, 21.0, 13.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.754241943359375, -7.57879638671875, -7.403350830078125, -7.2279052734375, -7.052459716796875, -6.87701416015625, -6.701568603515625, -6.526123046875, -6.350677490234375, -6.17523193359375, -5.999786376953125, -5.8243408203125, -5.648895263671875, -5.47344970703125, -5.298004150390625, -5.12255859375, -4.947113037109375, -4.77166748046875, -4.596221923828125, -4.4207763671875, -4.245330810546875, -4.06988525390625, -3.894439697265625, -3.718994140625, -3.543548583984375, -3.36810302734375, -3.192657470703125, -3.0172119140625, -2.841766357421875, -2.66632080078125, -2.490875244140625, -2.3154296875, -2.139984130859375, -1.96453857421875, -1.789093017578125, -1.6136474609375, -1.438201904296875, -1.26275634765625, -1.087310791015625, -0.911865234375, -0.736419677734375, -0.56097412109375, -0.385528564453125, -0.2100830078125, -0.034637451171875, 0.14080810546875, 0.316253662109375, 0.49169921875, 0.667144775390625, 0.84259033203125, 1.018035888671875, 1.1934814453125, 1.368927001953125, 1.54437255859375, 1.719818115234375, 1.895263671875, 2.070709228515625, 2.24615478515625, 2.421600341796875, 2.5970458984375, 2.772491455078125, 2.94793701171875, 3.123382568359375, 3.298828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 17.0, 52.0, 176.0, 2418.0, 1230.0, 141.0, 29.0, 10.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.7275390625, -1.6942520141601562, -1.6609649658203125, -1.6276779174804688, -1.594390869140625, -1.5611038208007812, -1.5278167724609375, -1.4945297241210938, -1.46124267578125, -1.4279556274414062, -1.3946685791015625, -1.3613815307617188, -1.328094482421875, -1.2948074340820312, -1.2615203857421875, -1.2282333374023438, -1.1949462890625, -1.1616592407226562, -1.1283721923828125, -1.0950851440429688, -1.061798095703125, -1.0285110473632812, -0.9952239990234375, -0.9619369506835938, -0.92864990234375, -0.8953628540039062, -0.8620758056640625, -0.8287887573242188, -0.795501708984375, -0.7622146606445312, -0.7289276123046875, -0.6956405639648438, -0.662353515625, -0.6290664672851562, -0.5957794189453125, -0.5624923706054688, -0.529205322265625, -0.49591827392578125, -0.4626312255859375, -0.42934417724609375, -0.39605712890625, -0.36277008056640625, -0.3294830322265625, -0.29619598388671875, -0.262908935546875, -0.22962188720703125, -0.1963348388671875, -0.16304779052734375, -0.1297607421875, -0.09647369384765625, -0.0631866455078125, -0.02989959716796875, 0.003387451171875, 0.03667449951171875, 0.0699615478515625, 0.10324859619140625, 0.13653564453125, 0.16982269287109375, 0.2031097412109375, 0.23639678955078125, 0.269683837890625, 0.30297088623046875, 0.3362579345703125, 0.36954498291015625, 0.40283203125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 14.0, 22.0, 65.0, 185.0, 290.0, 253.0, 104.0, 37.0, 11.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.470098972320557, -5.325133323669434, -5.180168151855469, -5.035202503204346, -4.890236854553223, -4.745271682739258, -4.600306034088135, -4.455340385437012, -4.310375213623047, -4.165409564971924, -4.020444393157959, -3.875478744506836, -3.730513095855713, -3.585547685623169, -3.440582275390625, -3.295616626739502, -3.150650978088379, -3.005685567855835, -2.860719919204712, -2.715754508972168, -2.570788860321045, -2.425823450088501, -2.280858039855957, -2.135892391204834, -1.99092698097229, -1.8459614515304565, -1.700995922088623, -1.556030511856079, -1.4110649824142456, -1.266099452972412, -1.1211340427398682, -0.9761685132980347, -0.8312032222747803, -0.6862376928329468, -0.5412722229957581, -0.39630672335624695, -0.25134122371673584, -0.10637569427490234, 0.03858977556228638, 0.1835552453994751, 0.3285207748413086, 0.4734862744808197, 0.6184517741203308, 0.7634172439575195, 0.908382773399353, 1.0533483028411865, 1.1983137130737305, 1.343279242515564, 1.4882447719573975, 1.633210301399231, 1.7781758308410645, 1.9231412410736084, 2.0681066513061523, 2.2130722999572754, 2.3580377101898193, 2.5030031204223633, 2.6479687690734863, 2.7929341793060303, 2.9378998279571533, 3.0828652381896973, 3.2278308868408203, 3.3727962970733643, 3.517761707305908, 3.6627273559570312, 3.807692766189575]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 5.0, 7.0, 16.0, 22.0, 32.0, 35.0, 50.0, 53.0, 84.0, 66.0, 90.0, 80.0, 88.0, 64.0, 64.0, 59.0, 40.0, 45.0, 31.0, 26.0, 11.0, 10.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3638198375701904, -2.2956786155700684, -2.2275376319885254, -2.1593964099884033, -2.0912551879882812, -2.0231142044067383, -1.9549729824066162, -1.8868317604064941, -1.8186906576156616, -1.750549554824829, -1.682408332824707, -1.6142672300338745, -1.546126127243042, -1.47798490524292, -1.4098438024520874, -1.3417026996612549, -1.2735614776611328, -1.2054203748703003, -1.1372791528701782, -1.0691380500793457, -1.0009968280792236, -0.9328557252883911, -0.8647146224975586, -0.7965734601020813, -0.728432297706604, -0.6602911353111267, -0.5921499729156494, -0.5240088701248169, -0.4558677077293396, -0.3877265453338623, -0.3195854127407074, -0.2514442801475525, -0.1833028793334961, -0.11516173183917999, -0.04702058434486389, 0.02112056314945221, 0.08926171064376831, 0.1574028730392456, 0.2255440056324005, 0.2936851382255554, 0.3618263006210327, 0.42996746301651, 0.4981085956096649, 0.5662497282028198, 0.6343908905982971, 0.7025320529937744, 0.7706731557846069, 0.8388143181800842, 0.9069554805755615, 0.9750966429710388, 1.0432378053665161, 1.1113789081573486, 1.1795201301574707, 1.2476612329483032, 1.3158023357391357, 1.3839435577392578, 1.4520846605300903, 1.5202257633209229, 1.588366985321045, 1.6565080881118774, 1.72464919090271, 1.792790412902832, 1.8609315156936646, 1.929072618484497, 1.9972138404846191]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 20.0, 34.0, 49.0, 73.0, 159.0, 310.0, 736.0, 2375.0, 16470.0, 560255.0, 450631.0, 13928.0, 2172.0, 717.0, 286.0, 146.0, 77.0, 37.0, 24.0, 17.0, 4.0, 3.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.6666259765625, -2.559814453125, -2.4530029296875, -2.34619140625, -2.2393798828125, -2.132568359375, -2.0257568359375, -1.9189453125, -1.8121337890625, -1.705322265625, -1.5985107421875, -1.49169921875, -1.3848876953125, -1.278076171875, -1.1712646484375, -1.064453125, -0.9576416015625, -0.850830078125, -0.7440185546875, -0.63720703125, -0.5303955078125, -0.423583984375, -0.3167724609375, -0.2099609375, -0.1031494140625, 0.003662109375, 0.1104736328125, 0.21728515625, 0.3240966796875, 0.430908203125, 0.5377197265625, 0.64453125, 0.7513427734375, 0.858154296875, 0.9649658203125, 1.07177734375, 1.1785888671875, 1.285400390625, 1.3922119140625, 1.4990234375, 1.6058349609375, 1.712646484375, 1.8194580078125, 1.92626953125, 2.0330810546875, 2.139892578125, 2.2467041015625, 2.353515625, 2.4603271484375, 2.567138671875, 2.6739501953125, 2.78076171875, 2.8875732421875, 2.994384765625, 3.1011962890625, 3.2080078125, 3.3148193359375, 3.421630859375, 3.5284423828125, 3.63525390625, 3.7420654296875, 3.848876953125, 3.9556884765625, 4.0625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 13.0, 13.0, 23.0, 51.0, 51.0, 73.0, 73.0, 95.0, 110.0, 107.0, 102.0, 78.0, 61.0, 40.0, 38.0, 25.0, 18.0, 7.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.40673828125, -0.3970069885253906, -0.38727569580078125, -0.3775444030761719, -0.3678131103515625, -0.3580818176269531, -0.34835052490234375, -0.3386192321777344, -0.328887939453125, -0.3191566467285156, -0.30942535400390625, -0.2996940612792969, -0.2899627685546875, -0.2802314758300781, -0.27050018310546875, -0.2607688903808594, -0.25103759765625, -0.24130630493164062, -0.23157501220703125, -0.22184371948242188, -0.2121124267578125, -0.20238113403320312, -0.19264984130859375, -0.18291854858398438, -0.173187255859375, -0.16345596313476562, -0.15372467041015625, -0.14399337768554688, -0.1342620849609375, -0.12453079223632812, -0.11479949951171875, -0.10506820678710938, -0.0953369140625, -0.08560562133789062, -0.07587432861328125, -0.06614303588867188, -0.0564117431640625, -0.046680450439453125, -0.03694915771484375, -0.027217864990234375, -0.017486572265625, -0.007755279541015625, 0.00197601318359375, 0.011707305908203125, 0.0214385986328125, 0.031169891357421875, 0.04090118408203125, 0.050632476806640625, 0.06036376953125, 0.07009506225585938, 0.07982635498046875, 0.08955764770507812, 0.0992889404296875, 0.10902023315429688, 0.11875152587890625, 0.12848281860351562, 0.138214111328125, 0.14794540405273438, 0.15767669677734375, 0.16740798950195312, 0.1771392822265625, 0.18687057495117188, 0.19660186767578125, 0.20633316040039062, 0.216064453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 5.0, 17.0, 14.0, 30.0, 58.0, 85.0, 174.0, 339.0, 879.0, 2375.0, 8723.0, 63852.0, 743702.0, 205061.0, 17218.0, 3721.0, 1271.0, 521.0, 229.0, 106.0, 68.0, 29.0, 22.0, 9.0, 10.0, 9.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.220703125, -2.156707763671875, -2.09271240234375, -2.028717041015625, -1.9647216796875, -1.900726318359375, -1.83673095703125, -1.772735595703125, -1.708740234375, -1.644744873046875, -1.58074951171875, -1.516754150390625, -1.4527587890625, -1.388763427734375, -1.32476806640625, -1.260772705078125, -1.19677734375, -1.132781982421875, -1.06878662109375, -1.004791259765625, -0.9407958984375, -0.876800537109375, -0.81280517578125, -0.748809814453125, -0.684814453125, -0.620819091796875, -0.55682373046875, -0.492828369140625, -0.4288330078125, -0.364837646484375, -0.30084228515625, -0.236846923828125, -0.1728515625, -0.108856201171875, -0.04486083984375, 0.019134521484375, 0.0831298828125, 0.147125244140625, 0.21112060546875, 0.275115966796875, 0.339111328125, 0.403106689453125, 0.46710205078125, 0.531097412109375, 0.5950927734375, 0.659088134765625, 0.72308349609375, 0.787078857421875, 0.85107421875, 0.915069580078125, 0.97906494140625, 1.043060302734375, 1.1070556640625, 1.171051025390625, 1.23504638671875, 1.299041748046875, 1.363037109375, 1.427032470703125, 1.49102783203125, 1.555023193359375, 1.6190185546875, 1.683013916015625, 1.74700927734375, 1.811004638671875, 1.875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 7.0, 7.0, 8.0, 9.0, 22.0, 28.0, 31.0, 37.0, 41.0, 53.0, 68.0, 71.0, 59.0, 72.0, 83.0, 80.0, 69.0, 47.0, 50.0, 37.0, 30.0, 20.0, 22.0, 19.0, 11.0, 4.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.240234375, -1.2054824829101562, -1.1707305908203125, -1.1359786987304688, -1.101226806640625, -1.0664749145507812, -1.0317230224609375, -0.9969711303710938, -0.96221923828125, -0.9274673461914062, -0.8927154541015625, -0.8579635620117188, -0.823211669921875, -0.7884597778320312, -0.7537078857421875, -0.7189559936523438, -0.6842041015625, -0.6494522094726562, -0.6147003173828125, -0.5799484252929688, -0.545196533203125, -0.5104446411132812, -0.4756927490234375, -0.44094085693359375, -0.40618896484375, -0.37143707275390625, -0.3366851806640625, -0.30193328857421875, -0.267181396484375, -0.23242950439453125, -0.1976776123046875, -0.16292572021484375, -0.128173828125, -0.09342193603515625, -0.0586700439453125, -0.02391815185546875, 0.010833740234375, 0.04558563232421875, 0.0803375244140625, 0.11508941650390625, 0.14984130859375, 0.18459320068359375, 0.2193450927734375, 0.25409698486328125, 0.288848876953125, 0.32360076904296875, 0.3583526611328125, 0.39310455322265625, 0.4278564453125, 0.46260833740234375, 0.4973602294921875, 0.5321121215820312, 0.566864013671875, 0.6016159057617188, 0.6363677978515625, 0.6711196899414062, 0.70587158203125, 0.7406234741210938, 0.7753753662109375, 0.8101272583007812, 0.844879150390625, 0.8796310424804688, 0.9143829345703125, 0.9491348266601562, 0.98388671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 1.0, 3.0, 7.0, 11.0, 8.0, 14.0, 13.0, 16.0, 35.0, 41.0, 47.0, 84.0, 160.0, 252.0, 415.0, 729.0, 1386.0, 2867.0, 7451.0, 23423.0, 106552.0, 497975.0, 323975.0, 58314.0, 14798.0, 5224.0, 2198.0, 1033.0, 563.0, 338.0, 189.0, 134.0, 97.0, 53.0, 40.0, 24.0, 23.0, 17.0, 12.0, 7.0, 10.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.6044921875, -0.587615966796875, -0.57073974609375, -0.553863525390625, -0.5369873046875, -0.520111083984375, -0.50323486328125, -0.486358642578125, -0.469482421875, -0.452606201171875, -0.43572998046875, -0.418853759765625, -0.4019775390625, -0.385101318359375, -0.36822509765625, -0.351348876953125, -0.33447265625, -0.317596435546875, -0.30072021484375, -0.283843994140625, -0.2669677734375, -0.250091552734375, -0.23321533203125, -0.216339111328125, -0.199462890625, -0.182586669921875, -0.16571044921875, -0.148834228515625, -0.1319580078125, -0.115081787109375, -0.09820556640625, -0.081329345703125, -0.064453125, -0.047576904296875, -0.03070068359375, -0.013824462890625, 0.0030517578125, 0.019927978515625, 0.03680419921875, 0.053680419921875, 0.070556640625, 0.087432861328125, 0.10430908203125, 0.121185302734375, 0.1380615234375, 0.154937744140625, 0.17181396484375, 0.188690185546875, 0.20556640625, 0.222442626953125, 0.23931884765625, 0.256195068359375, 0.2730712890625, 0.289947509765625, 0.30682373046875, 0.323699951171875, 0.340576171875, 0.357452392578125, 0.37432861328125, 0.391204833984375, 0.4080810546875, 0.424957275390625, 0.44183349609375, 0.458709716796875, 0.4755859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 7.0, 6.0, 5.0, 15.0, 12.0, 26.0, 26.0, 46.0, 47.0, 70.0, 91.0, 117.0, 127.0, 125.0, 83.0, 48.0, 44.0, 39.0, 23.0, 23.0, 6.0, 4.0, 7.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00017011165618896484, -0.00016617868095636368, -0.0001622457057237625, -0.00015831273049116135, -0.00015437975525856018, -0.00015044678002595901, -0.00014651380479335785, -0.00014258082956075668, -0.00013864785432815552, -0.00013471487909555435, -0.00013078190386295319, -0.00012684892863035202, -0.00012291595339775085, -0.00011898297816514969, -0.00011505000293254852, -0.00011111702769994736, -0.00010718405246734619, -0.00010325107723474503, -9.931810200214386e-05, -9.53851267695427e-05, -9.145215153694153e-05, -8.751917630434036e-05, -8.35862010717392e-05, -7.965322583913803e-05, -7.572025060653687e-05, -7.17872753739357e-05, -6.785430014133453e-05, -6.392132490873337e-05, -5.99883496761322e-05, -5.6055374443531036e-05, -5.212239921092987e-05, -4.8189423978328705e-05, -4.425644874572754e-05, -4.032347351312637e-05, -3.639049828052521e-05, -3.245752304792404e-05, -2.8524547815322876e-05, -2.459157258272171e-05, -2.0658597350120544e-05, -1.672562211751938e-05, -1.2792646884918213e-05, -8.859671652317047e-06, -4.926696419715881e-06, -9.937211871147156e-07, 2.93925404548645e-06, 6.872229278087616e-06, 1.0805204510688782e-05, 1.4738179743289948e-05, 1.8671154975891113e-05, 2.260413020849228e-05, 2.6537105441093445e-05, 3.047008067369461e-05, 3.4403055906295776e-05, 3.833603113889694e-05, 4.226900637149811e-05, 4.6201981604099274e-05, 5.013495683670044e-05, 5.4067932069301605e-05, 5.800090730190277e-05, 6.193388253450394e-05, 6.58668577671051e-05, 6.979983299970627e-05, 7.373280823230743e-05, 7.76657834649086e-05, 8.159875869750977e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 3.0, 13.0, 18.0, 40.0, 81.0, 122.0, 259.0, 428.0, 1019.0, 2616.0, 8315.0, 36580.0, 275942.0, 596525.0, 101745.0, 17181.0, 4627.0, 1637.0, 646.0, 327.0, 143.0, 89.0, 55.0, 38.0, 25.0, 16.0, 9.0, 11.0, 13.0, 1.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.70654296875, -0.6865081787109375, -0.666473388671875, -0.6464385986328125, -0.62640380859375, -0.6063690185546875, -0.586334228515625, -0.5662994384765625, -0.5462646484375, -0.5262298583984375, -0.506195068359375, -0.4861602783203125, -0.46612548828125, -0.4460906982421875, -0.426055908203125, -0.4060211181640625, -0.385986328125, -0.3659515380859375, -0.345916748046875, -0.3258819580078125, -0.30584716796875, -0.2858123779296875, -0.265777587890625, -0.2457427978515625, -0.2257080078125, -0.2056732177734375, -0.185638427734375, -0.1656036376953125, -0.14556884765625, -0.1255340576171875, -0.105499267578125, -0.0854644775390625, -0.0654296875, -0.0453948974609375, -0.025360107421875, -0.0053253173828125, 0.01470947265625, 0.0347442626953125, 0.054779052734375, 0.0748138427734375, 0.0948486328125, 0.1148834228515625, 0.134918212890625, 0.1549530029296875, 0.17498779296875, 0.1950225830078125, 0.215057373046875, 0.2350921630859375, 0.255126953125, 0.2751617431640625, 0.295196533203125, 0.3152313232421875, 0.33526611328125, 0.3553009033203125, 0.375335693359375, 0.3953704833984375, 0.4154052734375, 0.4354400634765625, 0.455474853515625, 0.4755096435546875, 0.49554443359375, 0.5155792236328125, 0.535614013671875, 0.5556488037109375, 0.57568359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 12.0, 10.0, 14.0, 26.0, 23.0, 34.0, 68.0, 73.0, 119.0, 120.0, 111.0, 92.0, 79.0, 63.0, 41.0, 32.0, 24.0, 8.0, 14.0, 6.0, 10.0, 4.0, 3.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.57470703125, -0.5596199035644531, -0.5445327758789062, -0.5294456481933594, -0.5143585205078125, -0.4992713928222656, -0.48418426513671875, -0.4690971374511719, -0.454010009765625, -0.4389228820800781, -0.42383575439453125, -0.4087486267089844, -0.3936614990234375, -0.3785743713378906, -0.36348724365234375, -0.3484001159667969, -0.33331298828125, -0.3182258605957031, -0.30313873291015625, -0.2880516052246094, -0.2729644775390625, -0.2578773498535156, -0.24279022216796875, -0.22770309448242188, -0.212615966796875, -0.19752883911132812, -0.18244171142578125, -0.16735458374023438, -0.1522674560546875, -0.13718032836914062, -0.12209320068359375, -0.10700607299804688, -0.0919189453125, -0.07683181762695312, -0.06174468994140625, -0.046657562255859375, -0.0315704345703125, -0.016483306884765625, -0.00139617919921875, 0.013690948486328125, 0.028778076171875, 0.043865203857421875, 0.05895233154296875, 0.07403945922851562, 0.0891265869140625, 0.10421371459960938, 0.11930084228515625, 0.13438796997070312, 0.14947509765625, 0.16456222534179688, 0.17964935302734375, 0.19473648071289062, 0.2098236083984375, 0.22491073608398438, 0.23999786376953125, 0.2550849914550781, 0.270172119140625, 0.2852592468261719, 0.30034637451171875, 0.3154335021972656, 0.3305206298828125, 0.3456077575683594, 0.36069488525390625, 0.3757820129394531, 0.390869140625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 19.0, 16.0, 46.0, 86.0, 135.0, 204.0, 183.0, 126.0, 62.0, 52.0, 29.0, 23.0, 4.0, 4.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.175352096557617, -11.8909912109375, -11.6066312789917, -11.322270393371582, -11.037910461425781, -10.753549575805664, -10.469188690185547, -10.184828758239746, -9.900467872619629, -9.616106986999512, -9.331747055053711, -9.047386169433594, -8.763026237487793, -8.478665351867676, -8.194305419921875, -7.909944534301758, -7.625584125518799, -7.34122371673584, -7.056863307952881, -6.772502899169922, -6.488142013549805, -6.203781604766846, -5.919421195983887, -5.635060787200928, -5.350700378417969, -5.06633996963501, -4.781979560852051, -4.497618675231934, -4.213258266448975, -3.9288978576660156, -3.6445374488830566, -3.3601770401000977, -3.0758161544799805, -2.7914557456970215, -2.5070950984954834, -2.2227346897125244, -1.9383741617202759, -1.6540136337280273, -1.3696532249450684, -1.0852926969528198, -0.8009321689605713, -0.5165716409683228, -0.232211172580719, 0.052149295806884766, 0.3365098237991333, 0.6208703517913818, 0.9052307605743408, 1.1895912885665894, 1.473951816558838, 1.7583123445510864, 2.042672872543335, 2.327033281326294, 2.611393928527832, 2.895754337310791, 3.18011474609375, 3.464475154876709, 3.748835802078247, 4.033196449279785, 4.317556858062744, 4.601917266845703, 4.886277675628662, 5.170638084411621, 5.454998970031738, 5.739359378814697, 6.023719787597656]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 10.0, 6.0, 8.0, 15.0, 11.0, 20.0, 15.0, 18.0, 24.0, 27.0, 46.0, 42.0, 42.0, 39.0, 53.0, 60.0, 48.0, 50.0, 40.0, 61.0, 47.0, 40.0, 40.0, 34.0, 32.0, 30.0, 24.0, 20.0, 12.0, 21.0, 12.0, 12.0, 10.0, 3.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-4.770001411437988, -4.629631042480469, -4.489260673522949, -4.34889030456543, -4.20851993560791, -4.068149566650391, -3.92777943611145, -3.7874090671539307, -3.647038698196411, -3.5066683292388916, -3.366297960281372, -3.2259275913238525, -3.085557460784912, -2.9451870918273926, -2.804816722869873, -2.6644463539123535, -2.524075984954834, -2.3837056159973145, -2.243335247039795, -2.1029648780822754, -1.9625946283340454, -1.8222242593765259, -1.681854009628296, -1.5414836406707764, -1.4011132717132568, -1.2607429027557373, -1.1203725337982178, -0.9800022840499878, -0.8396319150924683, -0.6992615461349487, -0.558891236782074, -0.4185209274291992, -0.2781505584716797, -0.13778021931648254, 0.0025901198387145996, 0.14296045899391174, 0.2833307981491089, 0.4237011671066284, 0.5640714764595032, 0.7044417858123779, 0.8448121547698975, 0.985182523727417, 1.1255528926849365, 1.2659231424331665, 1.406293511390686, 1.5466638803482056, 1.6870341300964355, 1.827404499053955, 1.9677748680114746, 2.108145236968994, 2.2485156059265137, 2.388885974884033, 2.5292563438415527, 2.6696267127990723, 2.8099968433380127, 2.9503672122955322, 3.0907375812530518, 3.2311079502105713, 3.371478319168091, 3.5118486881256104, 3.652218818664551, 3.7925891876220703, 3.93295955657959, 4.073329925537109, 4.213700294494629]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 5.0, 4.0, 4.0, 2.0, 10.0, 11.0, 12.0, 15.0, 18.0, 21.0, 20.0, 30.0, 36.0, 52.0, 47.0, 49.0, 79.0, 98.0, 143.0, 160.0, 232.0, 384.0, 710.0, 1235.0, 2823.0, 7460.0, 24687.0, 135258.0, 3723051.0, 245676.0, 35410.0, 10100.0, 3564.0, 1433.0, 695.0, 340.0, 172.0, 92.0, 60.0, 33.0, 21.0, 10.0, 10.0, 3.0, 3.0, 0.0, 1.0, 3.0], "bins": [-2.91796875, -2.8525543212890625, -2.787139892578125, -2.7217254638671875, -2.65631103515625, -2.5908966064453125, -2.525482177734375, -2.4600677490234375, -2.3946533203125, -2.3292388916015625, -2.263824462890625, -2.1984100341796875, -2.13299560546875, -2.0675811767578125, -2.002166748046875, -1.9367523193359375, -1.871337890625, -1.8059234619140625, -1.740509033203125, -1.6750946044921875, -1.60968017578125, -1.5442657470703125, -1.478851318359375, -1.4134368896484375, -1.3480224609375, -1.2826080322265625, -1.217193603515625, -1.1517791748046875, -1.08636474609375, -1.0209503173828125, -0.955535888671875, -0.8901214599609375, -0.82470703125, -0.7592926025390625, -0.693878173828125, -0.6284637451171875, -0.56304931640625, -0.4976348876953125, -0.432220458984375, -0.3668060302734375, -0.3013916015625, -0.2359771728515625, -0.170562744140625, -0.1051483154296875, -0.03973388671875, 0.0256805419921875, 0.091094970703125, 0.1565093994140625, 0.221923828125, 0.2873382568359375, 0.352752685546875, 0.4181671142578125, 0.48358154296875, 0.5489959716796875, 0.614410400390625, 0.6798248291015625, 0.7452392578125, 0.8106536865234375, 0.876068115234375, 0.9414825439453125, 1.00689697265625, 1.0723114013671875, 1.137725830078125, 1.2031402587890625, 1.2685546875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 11.0, 20.0, 25.0, 34.0, 52.0, 68.0, 64.0, 100.0, 109.0, 102.0, 109.0, 86.0, 64.0, 50.0, 40.0, 30.0, 13.0, 2.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4345703125, -0.42444419860839844, -0.4143180847167969, -0.4041919708251953, -0.39406585693359375, -0.3839397430419922, -0.3738136291503906, -0.36368751525878906, -0.3535614013671875, -0.34343528747558594, -0.3333091735839844, -0.3231830596923828, -0.31305694580078125, -0.3029308319091797, -0.2928047180175781, -0.28267860412597656, -0.272552490234375, -0.26242637634277344, -0.2523002624511719, -0.2421741485595703, -0.23204803466796875, -0.2219219207763672, -0.21179580688476562, -0.20166969299316406, -0.1915435791015625, -0.18141746520996094, -0.17129135131835938, -0.1611652374267578, -0.15103912353515625, -0.1409130096435547, -0.13078689575195312, -0.12066078186035156, -0.11053466796875, -0.10040855407714844, -0.09028244018554688, -0.08015632629394531, -0.07003021240234375, -0.05990409851074219, -0.049777984619140625, -0.03965187072753906, -0.0295257568359375, -0.019399642944335938, -0.009273529052734375, 0.0008525848388671875, 0.01097869873046875, 0.021104812622070312, 0.031230926513671875, 0.04135704040527344, 0.051483154296875, 0.06160926818847656, 0.07173538208007812, 0.08186149597167969, 0.09198760986328125, 0.10211372375488281, 0.11223983764648438, 0.12236595153808594, 0.1324920654296875, 0.14261817932128906, 0.15274429321289062, 0.1628704071044922, 0.17299652099609375, 0.1831226348876953, 0.19324874877929688, 0.20337486267089844, 0.2135009765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 6.0, 7.0, 13.0, 31.0, 78.0, 146.0, 294.0, 1088.0, 9091.0, 4153450.0, 27882.0, 1546.0, 381.0, 146.0, 67.0, 30.0, 16.0, 11.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.265625, -11.9117431640625, -11.557861328125, -11.2039794921875, -10.85009765625, -10.4962158203125, -10.142333984375, -9.7884521484375, -9.4345703125, -9.0806884765625, -8.726806640625, -8.3729248046875, -8.01904296875, -7.6651611328125, -7.311279296875, -6.9573974609375, -6.603515625, -6.2496337890625, -5.895751953125, -5.5418701171875, -5.18798828125, -4.8341064453125, -4.480224609375, -4.1263427734375, -3.7724609375, -3.4185791015625, -3.064697265625, -2.7108154296875, -2.35693359375, -2.0030517578125, -1.649169921875, -1.2952880859375, -0.94140625, -0.5875244140625, -0.233642578125, 0.1202392578125, 0.47412109375, 0.8280029296875, 1.181884765625, 1.5357666015625, 1.8896484375, 2.2435302734375, 2.597412109375, 2.9512939453125, 3.30517578125, 3.6590576171875, 4.012939453125, 4.3668212890625, 4.720703125, 5.0745849609375, 5.428466796875, 5.7823486328125, 6.13623046875, 6.4901123046875, 6.843994140625, 7.1978759765625, 7.5517578125, 7.9056396484375, 8.259521484375, 8.6134033203125, 8.96728515625, 9.3211669921875, 9.675048828125, 10.0289306640625, 10.3828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 7.0, 9.0, 9.0, 11.0, 20.0, 42.0, 197.0, 2614.0, 1006.0, 111.0, 31.0, 11.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.32421875, -2.255523681640625, -2.18682861328125, -2.118133544921875, -2.0494384765625, -1.980743408203125, -1.91204833984375, -1.843353271484375, -1.774658203125, -1.705963134765625, -1.63726806640625, -1.568572998046875, -1.4998779296875, -1.431182861328125, -1.36248779296875, -1.293792724609375, -1.22509765625, -1.156402587890625, -1.08770751953125, -1.019012451171875, -0.9503173828125, -0.881622314453125, -0.81292724609375, -0.744232177734375, -0.675537109375, -0.606842041015625, -0.53814697265625, -0.469451904296875, -0.4007568359375, -0.332061767578125, -0.26336669921875, -0.194671630859375, -0.1259765625, -0.057281494140625, 0.01141357421875, 0.080108642578125, 0.1488037109375, 0.217498779296875, 0.28619384765625, 0.354888916015625, 0.423583984375, 0.492279052734375, 0.56097412109375, 0.629669189453125, 0.6983642578125, 0.767059326171875, 0.83575439453125, 0.904449462890625, 0.97314453125, 1.041839599609375, 1.11053466796875, 1.179229736328125, 1.2479248046875, 1.316619873046875, 1.38531494140625, 1.454010009765625, 1.522705078125, 1.591400146484375, 1.66009521484375, 1.728790283203125, 1.7974853515625, 1.866180419921875, 1.93487548828125, 2.003570556640625, 2.072265625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 12.0, 47.0, 208.0, 500.0, 188.0, 36.0, 11.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.29140281677246, -23.809968948364258, -23.328535079956055, -22.84710121154785, -22.36566734313965, -21.884233474731445, -21.402799606323242, -20.92136573791504, -20.439931869506836, -19.958498001098633, -19.47706413269043, -18.995630264282227, -18.514196395874023, -18.03276252746582, -17.551328659057617, -17.069894790649414, -16.58846092224121, -16.107027053833008, -15.625593185424805, -15.144159317016602, -14.662725448608398, -14.181291580200195, -13.699857711791992, -13.218423843383789, -12.736989974975586, -12.255556106567383, -11.77412223815918, -11.292688369750977, -10.811254501342773, -10.32982063293457, -9.848386764526367, -9.366952896118164, -8.885518074035645, -8.404084205627441, -7.922650337219238, -7.441216468811035, -6.959782600402832, -6.478348731994629, -5.996914863586426, -5.515480995178223, -5.0340471267700195, -4.552613258361816, -4.071179389953613, -3.58974552154541, -3.108311653137207, -2.626877784729004, -2.145443916320801, -1.6640100479125977, -1.1825761795043945, -0.7011423110961914, -0.21970844268798828, 0.26172542572021484, 0.743159294128418, 1.224593162536621, 1.7060270309448242, 2.1874608993530273, 2.6688947677612305, 3.1503286361694336, 3.6317625045776367, 4.11319637298584, 4.594630241394043, 5.076064109802246, 5.557497978210449, 6.038931846618652, 6.5203657150268555]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 0.0, 6.0, 7.0, 10.0, 13.0, 35.0, 48.0, 72.0, 82.0, 94.0, 100.0, 100.0, 93.0, 77.0, 84.0, 61.0, 39.0, 22.0, 24.0, 13.0, 14.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.191410064697266, -4.041649341583252, -3.8918888568878174, -3.7421281337738037, -3.592367649078369, -3.4426069259643555, -3.292846202850342, -3.1430857181549072, -2.9933252334594727, -2.843564510345459, -2.6938040256500244, -2.5440433025360107, -2.394282817840576, -2.2445220947265625, -2.094761371612549, -1.9450008869171143, -1.7952401638031006, -1.6454795598983765, -1.4957189559936523, -1.3459582328796387, -1.196197748184204, -1.0464370250701904, -0.8966764211654663, -0.7469158172607422, -0.5971552133560181, -0.44739460945129395, -0.29763397574424744, -0.14787334203720093, 0.0018872618675231934, 0.15164786577224731, 0.3014085292816162, 0.45116913318634033, 0.6009297370910645, 0.7506903409957886, 0.9004509449005127, 1.0502116680145264, 1.199972152709961, 1.3497328758239746, 1.4994934797286987, 1.6492540836334229, 1.799014687538147, 1.948775291442871, 2.0985360145568848, 2.2482964992523193, 2.398057222366333, 2.5478177070617676, 2.6975784301757812, 2.847339153289795, 2.9970996379852295, 3.146860361099243, 3.2966208457946777, 3.4463815689086914, 3.596142053604126, 3.7459027767181396, 3.895663261413574, 4.045423984527588, 4.195184707641602, 4.344945430755615, 4.494706153869629, 4.644466400146484, 4.794227123260498, 4.943987846374512, 5.093748569488525, 5.243509292602539, 5.3932695388793945]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 7.0, 8.0, 6.0, 6.0, 11.0, 8.0, 11.0, 22.0, 28.0, 47.0, 62.0, 92.0, 132.0, 196.0, 303.0, 522.0, 980.0, 2213.0, 6578.0, 26310.0, 168298.0, 633333.0, 171528.0, 26481.0, 6655.0, 2334.0, 1025.0, 496.0, 265.0, 194.0, 113.0, 88.0, 44.0, 39.0, 34.0, 19.0, 10.0, 12.0, 9.0, 6.0, 12.0, 5.0, 2.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.87109375, -1.81524658203125, -1.7593994140625, -1.70355224609375, -1.647705078125, -1.59185791015625, -1.5360107421875, -1.48016357421875, -1.42431640625, -1.36846923828125, -1.3126220703125, -1.25677490234375, -1.200927734375, -1.14508056640625, -1.0892333984375, -1.03338623046875, -0.9775390625, -0.92169189453125, -0.8658447265625, -0.80999755859375, -0.754150390625, -0.69830322265625, -0.6424560546875, -0.58660888671875, -0.53076171875, -0.47491455078125, -0.4190673828125, -0.36322021484375, -0.307373046875, -0.25152587890625, -0.1956787109375, -0.13983154296875, -0.083984375, -0.02813720703125, 0.0277099609375, 0.08355712890625, 0.139404296875, 0.19525146484375, 0.2510986328125, 0.30694580078125, 0.36279296875, 0.41864013671875, 0.4744873046875, 0.53033447265625, 0.586181640625, 0.64202880859375, 0.6978759765625, 0.75372314453125, 0.8095703125, 0.86541748046875, 0.9212646484375, 0.97711181640625, 1.032958984375, 1.08880615234375, 1.1446533203125, 1.20050048828125, 1.25634765625, 1.31219482421875, 1.3680419921875, 1.42388916015625, 1.479736328125, 1.53558349609375, 1.5914306640625, 1.64727783203125, 1.703125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 8.0, 6.0, 15.0, 23.0, 17.0, 51.0, 69.0, 79.0, 102.0, 85.0, 115.0, 90.0, 94.0, 82.0, 53.0, 41.0, 29.0, 17.0, 9.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.44677734375, -0.4356727600097656, -0.42456817626953125, -0.4134635925292969, -0.4023590087890625, -0.3912544250488281, -0.38014984130859375, -0.3690452575683594, -0.357940673828125, -0.3468360900878906, -0.33573150634765625, -0.3246269226074219, -0.3135223388671875, -0.3024177551269531, -0.29131317138671875, -0.2802085876464844, -0.26910400390625, -0.2579994201660156, -0.24689483642578125, -0.23579025268554688, -0.2246856689453125, -0.21358108520507812, -0.20247650146484375, -0.19137191772460938, -0.180267333984375, -0.16916275024414062, -0.15805816650390625, -0.14695358276367188, -0.1358489990234375, -0.12474441528320312, -0.11363983154296875, -0.10253524780273438, -0.0914306640625, -0.08032608032226562, -0.06922149658203125, -0.058116912841796875, -0.0470123291015625, -0.035907745361328125, -0.02480316162109375, -0.013698577880859375, -0.002593994140625, 0.008510589599609375, 0.01961517333984375, 0.030719757080078125, 0.0418243408203125, 0.052928924560546875, 0.06403350830078125, 0.07513809204101562, 0.08624267578125, 0.09734725952148438, 0.10845184326171875, 0.11955642700195312, 0.1306610107421875, 0.14176559448242188, 0.15287017822265625, 0.16397476196289062, 0.175079345703125, 0.18618392944335938, 0.19728851318359375, 0.20839309692382812, 0.2194976806640625, 0.23060226440429688, 0.24170684814453125, 0.2528114318847656, 0.263916015625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 13.0, 20.0, 36.0, 39.0, 74.0, 133.0, 269.0, 669.0, 1708.0, 6191.0, 29036.0, 173133.0, 571332.0, 219030.0, 36180.0, 7260.0, 2006.0, 745.0, 297.0, 144.0, 67.0, 44.0, 23.0, 26.0, 10.0, 14.0, 12.0, 2.0, 8.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.091796875, -1.0560760498046875, -1.020355224609375, -0.9846343994140625, -0.94891357421875, -0.9131927490234375, -0.877471923828125, -0.8417510986328125, -0.8060302734375, -0.7703094482421875, -0.734588623046875, -0.6988677978515625, -0.66314697265625, -0.6274261474609375, -0.591705322265625, -0.5559844970703125, -0.520263671875, -0.4845428466796875, -0.448822021484375, -0.4131011962890625, -0.37738037109375, -0.3416595458984375, -0.305938720703125, -0.2702178955078125, -0.2344970703125, -0.1987762451171875, -0.163055419921875, -0.1273345947265625, -0.09161376953125, -0.0558929443359375, -0.020172119140625, 0.0155487060546875, 0.05126953125, 0.0869903564453125, 0.122711181640625, 0.1584320068359375, 0.19415283203125, 0.2298736572265625, 0.265594482421875, 0.3013153076171875, 0.3370361328125, 0.3727569580078125, 0.408477783203125, 0.4441986083984375, 0.47991943359375, 0.5156402587890625, 0.551361083984375, 0.5870819091796875, 0.622802734375, 0.6585235595703125, 0.694244384765625, 0.7299652099609375, 0.76568603515625, 0.8014068603515625, 0.837127685546875, 0.8728485107421875, 0.9085693359375, 0.9442901611328125, 0.980010986328125, 1.0157318115234375, 1.05145263671875, 1.0871734619140625, 1.122894287109375, 1.1586151123046875, 1.1943359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 3.0, 12.0, 14.0, 19.0, 9.0, 25.0, 26.0, 31.0, 36.0, 40.0, 38.0, 39.0, 35.0, 51.0, 54.0, 44.0, 61.0, 51.0, 47.0, 46.0, 34.0, 48.0, 29.0, 43.0, 23.0, 19.0, 27.0, 18.0, 20.0, 9.0, 9.0, 5.0, 9.0, 8.0, 2.0, 7.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.701171875, -0.6781005859375, -0.655029296875, -0.6319580078125, -0.60888671875, -0.5858154296875, -0.562744140625, -0.5396728515625, -0.5166015625, -0.4935302734375, -0.470458984375, -0.4473876953125, -0.42431640625, -0.4012451171875, -0.378173828125, -0.3551025390625, -0.33203125, -0.3089599609375, -0.285888671875, -0.2628173828125, -0.23974609375, -0.2166748046875, -0.193603515625, -0.1705322265625, -0.1474609375, -0.1243896484375, -0.101318359375, -0.0782470703125, -0.05517578125, -0.0321044921875, -0.009033203125, 0.0140380859375, 0.037109375, 0.0601806640625, 0.083251953125, 0.1063232421875, 0.12939453125, 0.1524658203125, 0.175537109375, 0.1986083984375, 0.2216796875, 0.2447509765625, 0.267822265625, 0.2908935546875, 0.31396484375, 0.3370361328125, 0.360107421875, 0.3831787109375, 0.40625, 0.4293212890625, 0.452392578125, 0.4754638671875, 0.49853515625, 0.5216064453125, 0.544677734375, 0.5677490234375, 0.5908203125, 0.6138916015625, 0.636962890625, 0.6600341796875, 0.68310546875, 0.7061767578125, 0.729248046875, 0.7523193359375, 0.775390625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 2.0, 12.0, 17.0, 24.0, 47.0, 78.0, 124.0, 228.0, 539.0, 1280.0, 4799.0, 30497.0, 387699.0, 564677.0, 49008.0, 6633.0, 1675.0, 614.0, 270.0, 162.0, 60.0, 41.0, 20.0, 12.0, 12.0, 10.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6875, -0.6601104736328125, -0.632720947265625, -0.6053314208984375, -0.57794189453125, -0.5505523681640625, -0.523162841796875, -0.4957733154296875, -0.4683837890625, -0.4409942626953125, -0.413604736328125, -0.3862152099609375, -0.35882568359375, -0.3314361572265625, -0.304046630859375, -0.2766571044921875, -0.249267578125, -0.2218780517578125, -0.194488525390625, -0.1670989990234375, -0.13970947265625, -0.1123199462890625, -0.084930419921875, -0.0575408935546875, -0.0301513671875, -0.0027618408203125, 0.024627685546875, 0.0520172119140625, 0.07940673828125, 0.1067962646484375, 0.134185791015625, 0.1615753173828125, 0.18896484375, 0.2163543701171875, 0.243743896484375, 0.2711334228515625, 0.29852294921875, 0.3259124755859375, 0.353302001953125, 0.3806915283203125, 0.4080810546875, 0.4354705810546875, 0.462860107421875, 0.4902496337890625, 0.51763916015625, 0.5450286865234375, 0.572418212890625, 0.5998077392578125, 0.627197265625, 0.6545867919921875, 0.681976318359375, 0.7093658447265625, 0.73675537109375, 0.7641448974609375, 0.791534423828125, 0.8189239501953125, 0.8463134765625, 0.8737030029296875, 0.901092529296875, 0.9284820556640625, 0.95587158203125, 0.9832611083984375, 1.010650634765625, 1.0380401611328125, 1.0654296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 8.0, 2.0, 20.0, 10.0, 22.0, 40.0, 62.0, 87.0, 97.0, 130.0, 152.0, 111.0, 98.0, 47.0, 42.0, 32.0, 14.0, 8.0, 7.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012421607971191406, -0.00011979788541793823, -0.0001153796911239624, -0.00011096149682998657, -0.00010654330253601074, -0.00010212510824203491, -9.770691394805908e-05, -9.328871965408325e-05, -8.887052536010742e-05, -8.445233106613159e-05, -8.003413677215576e-05, -7.561594247817993e-05, -7.11977481842041e-05, -6.677955389022827e-05, -6.236135959625244e-05, -5.794316530227661e-05, -5.352497100830078e-05, -4.910677671432495e-05, -4.468858242034912e-05, -4.027038812637329e-05, -3.585219383239746e-05, -3.143399953842163e-05, -2.70158052444458e-05, -2.259761095046997e-05, -1.817941665649414e-05, -1.376122236251831e-05, -9.34302806854248e-06, -4.92483377456665e-06, -5.066394805908203e-07, 3.91155481338501e-06, 8.32974910736084e-06, 1.274794340133667e-05, 1.71661376953125e-05, 2.158433198928833e-05, 2.600252628326416e-05, 3.042072057723999e-05, 3.483891487121582e-05, 3.925710916519165e-05, 4.367530345916748e-05, 4.809349775314331e-05, 5.251169204711914e-05, 5.692988634109497e-05, 6.13480806350708e-05, 6.576627492904663e-05, 7.018446922302246e-05, 7.460266351699829e-05, 7.902085781097412e-05, 8.343905210494995e-05, 8.785724639892578e-05, 9.227544069290161e-05, 9.669363498687744e-05, 0.00010111182928085327, 0.0001055300235748291, 0.00010994821786880493, 0.00011436641216278076, 0.00011878460645675659, 0.00012320280075073242, 0.00012762099504470825, 0.00013203918933868408, 0.0001364573836326599, 0.00014087557792663574, 0.00014529377222061157, 0.0001497119665145874, 0.00015413016080856323, 0.00015854835510253906]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 10.0, 7.0, 19.0, 15.0, 27.0, 52.0, 89.0, 215.0, 533.0, 2242.0, 12495.0, 133208.0, 756807.0, 127950.0, 11892.0, 2014.0, 558.0, 177.0, 84.0, 54.0, 34.0, 26.0, 18.0, 8.0, 6.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.503997802734375, -0.47674560546875, -0.449493408203125, -0.4222412109375, -0.394989013671875, -0.36773681640625, -0.340484619140625, -0.313232421875, -0.285980224609375, -0.25872802734375, -0.231475830078125, -0.2042236328125, -0.176971435546875, -0.14971923828125, -0.122467041015625, -0.09521484375, -0.067962646484375, -0.04071044921875, -0.013458251953125, 0.0137939453125, 0.041046142578125, 0.06829833984375, 0.095550537109375, 0.122802734375, 0.150054931640625, 0.17730712890625, 0.204559326171875, 0.2318115234375, 0.259063720703125, 0.28631591796875, 0.313568115234375, 0.3408203125, 0.368072509765625, 0.39532470703125, 0.422576904296875, 0.4498291015625, 0.477081298828125, 0.50433349609375, 0.531585693359375, 0.558837890625, 0.586090087890625, 0.61334228515625, 0.640594482421875, 0.6678466796875, 0.695098876953125, 0.72235107421875, 0.749603271484375, 0.77685546875, 0.804107666015625, 0.83135986328125, 0.858612060546875, 0.8858642578125, 0.913116455078125, 0.94036865234375, 0.967620849609375, 0.994873046875, 1.022125244140625, 1.04937744140625, 1.076629638671875, 1.1038818359375, 1.131134033203125, 1.15838623046875, 1.185638427734375, 1.212890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 11.0, 9.0, 12.0, 15.0, 20.0, 34.0, 41.0, 64.0, 52.0, 71.0, 100.0, 92.0, 77.0, 73.0, 66.0, 61.0, 52.0, 35.0, 19.0, 21.0, 17.0, 14.0, 11.0, 6.0, 6.0, 2.0, 7.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2420654296875, -0.23076820373535156, -0.21947097778320312, -0.2081737518310547, -0.19687652587890625, -0.1855792999267578, -0.17428207397460938, -0.16298484802246094, -0.1516876220703125, -0.14039039611816406, -0.12909317016601562, -0.11779594421386719, -0.10649871826171875, -0.09520149230957031, -0.08390426635742188, -0.07260704040527344, -0.061309814453125, -0.05001258850097656, -0.038715362548828125, -0.027418136596679688, -0.01612091064453125, -0.0048236846923828125, 0.006473541259765625, 0.017770767211914062, 0.0290679931640625, 0.04036521911621094, 0.051662445068359375, 0.06295967102050781, 0.07425689697265625, 0.08555412292480469, 0.09685134887695312, 0.10814857482910156, 0.11944580078125, 0.13074302673339844, 0.14204025268554688, 0.1533374786376953, 0.16463470458984375, 0.1759319305419922, 0.18722915649414062, 0.19852638244628906, 0.2098236083984375, 0.22112083435058594, 0.23241806030273438, 0.2437152862548828, 0.25501251220703125, 0.2663097381591797, 0.2776069641113281, 0.28890419006347656, 0.300201416015625, 0.31149864196777344, 0.3227958679199219, 0.3340930938720703, 0.34539031982421875, 0.3566875457763672, 0.3679847717285156, 0.37928199768066406, 0.3905792236328125, 0.40187644958496094, 0.4131736755371094, 0.4244709014892578, 0.43576812744140625, 0.4470653533935547, 0.4583625793457031, 0.46965980529785156, 0.48095703125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 25.0, 55.0, 144.0, 281.0, 241.0, 144.0, 72.0, 26.0, 8.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.50307846069336, -19.111434936523438, -18.71979331970215, -18.328149795532227, -17.936508178710938, -17.544864654541016, -17.153221130371094, -16.761579513549805, -16.369935989379883, -15.978293418884277, -15.586650848388672, -15.19500732421875, -14.803364753723145, -14.411722183227539, -14.020079612731934, -13.628437042236328, -13.236794471740723, -12.845151901245117, -12.453509330749512, -12.061866760253906, -11.670223236083984, -11.278580665588379, -10.886938095092773, -10.495295524597168, -10.103652954101562, -9.712010383605957, -9.320367813110352, -8.92872428894043, -8.537081718444824, -8.145439147949219, -7.753796577453613, -7.362154006958008, -6.9705095291137695, -6.578866958618164, -6.1872239112854, -5.795581340789795, -5.403938293457031, -5.012295722961426, -4.62065315246582, -4.229010581970215, -3.837367534637451, -3.4457247257232666, -3.054081916809082, -2.6624393463134766, -2.270796537399292, -1.8791537284851074, -1.487511157989502, -1.0958683490753174, -0.7042255401611328, -0.312582790851593, 0.07905995845794678, 0.4707026481628418, 0.8623454570770264, 1.253988265991211, 1.6456308364868164, 2.037273645401001, 2.4289164543151855, 2.82055926322937, 3.2122020721435547, 3.60384464263916, 3.9954874515533447, 4.387130260467529, 4.778772830963135, 5.170415878295898, 5.562058448791504]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 7.0, 10.0, 16.0, 14.0, 20.0, 24.0, 30.0, 27.0, 34.0, 43.0, 51.0, 49.0, 55.0, 48.0, 47.0, 71.0, 52.0, 48.0, 47.0, 49.0, 46.0, 23.0, 29.0, 24.0, 27.0, 14.0, 22.0, 14.0, 16.0, 13.0, 4.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.57539176940918, -4.432658672332764, -4.289925575256348, -4.147192478179932, -4.004459381103516, -3.8617262840270996, -3.7189931869506836, -3.5762600898742676, -3.4335269927978516, -3.2907938957214355, -3.1480607986450195, -3.0053277015686035, -2.8625946044921875, -2.7198615074157715, -2.5771284103393555, -2.4343953132629395, -2.2916624546051025, -2.1489293575286865, -2.0061962604522705, -1.8634631633758545, -1.7207300662994385, -1.5779969692230225, -1.435263991355896, -1.29253089427948, -1.149797797203064, -1.007064700126648, -0.8643316030502319, -0.7215985655784607, -0.5788654685020447, -0.43613237142562866, -0.2933993339538574, -0.1506662368774414, -0.00793313980102539, 0.13479994237422943, 0.27753302454948425, 0.4202660918235779, 0.5629991888999939, 0.7057322859764099, 0.8484653234481812, 0.9911984205245972, 1.1339315176010132, 1.2766646146774292, 1.4193977117538452, 1.5621306896209717, 1.7048637866973877, 1.8475968837738037, 1.9903299808502197, 2.1330630779266357, 2.2757961750030518, 2.4185292720794678, 2.561262369155884, 2.7039954662323, 2.846728563308716, 2.989461660385132, 3.1321945190429688, 3.2749276161193848, 3.417660713195801, 3.560393810272217, 3.703126907348633, 3.845860004425049, 3.988593101501465, 4.131326198577881, 4.274059295654297, 4.416792392730713, 4.559525489807129]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 7.0, 7.0, 13.0, 11.0, 11.0, 12.0, 15.0, 23.0, 34.0, 42.0, 56.0, 64.0, 100.0, 127.0, 175.0, 317.0, 573.0, 1106.0, 2593.0, 7793.0, 32349.0, 628880.0, 3455649.0, 47820.0, 10218.0, 3368.0, 1416.0, 651.0, 304.0, 216.0, 136.0, 74.0, 38.0, 28.0, 15.0, 7.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0], "bins": [-2.875, -2.809814453125, -2.74462890625, -2.679443359375, -2.6142578125, -2.549072265625, -2.48388671875, -2.418701171875, -2.353515625, -2.288330078125, -2.22314453125, -2.157958984375, -2.0927734375, -2.027587890625, -1.96240234375, -1.897216796875, -1.83203125, -1.766845703125, -1.70166015625, -1.636474609375, -1.5712890625, -1.506103515625, -1.44091796875, -1.375732421875, -1.310546875, -1.245361328125, -1.18017578125, -1.114990234375, -1.0498046875, -0.984619140625, -0.91943359375, -0.854248046875, -0.7890625, -0.723876953125, -0.65869140625, -0.593505859375, -0.5283203125, -0.463134765625, -0.39794921875, -0.332763671875, -0.267578125, -0.202392578125, -0.13720703125, -0.072021484375, -0.0068359375, 0.058349609375, 0.12353515625, 0.188720703125, 0.25390625, 0.319091796875, 0.38427734375, 0.449462890625, 0.5146484375, 0.579833984375, 0.64501953125, 0.710205078125, 0.775390625, 0.840576171875, 0.90576171875, 0.970947265625, 1.0361328125, 1.101318359375, 1.16650390625, 1.231689453125, 1.296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 16.0, 13.0, 30.0, 55.0, 56.0, 65.0, 96.0, 80.0, 96.0, 76.0, 91.0, 71.0, 60.0, 62.0, 45.0, 23.0, 18.0, 10.0, 7.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.42822265625, -0.41744232177734375, -0.4066619873046875, -0.39588165283203125, -0.385101318359375, -0.37432098388671875, -0.3635406494140625, -0.35276031494140625, -0.34197998046875, -0.33119964599609375, -0.3204193115234375, -0.30963897705078125, -0.298858642578125, -0.28807830810546875, -0.2772979736328125, -0.26651763916015625, -0.2557373046875, -0.24495697021484375, -0.2341766357421875, -0.22339630126953125, -0.212615966796875, -0.20183563232421875, -0.1910552978515625, -0.18027496337890625, -0.16949462890625, -0.15871429443359375, -0.1479339599609375, -0.13715362548828125, -0.126373291015625, -0.11559295654296875, -0.1048126220703125, -0.09403228759765625, -0.083251953125, -0.07247161865234375, -0.0616912841796875, -0.05091094970703125, -0.040130615234375, -0.02935028076171875, -0.0185699462890625, -0.00778961181640625, 0.00299072265625, 0.01377105712890625, 0.0245513916015625, 0.03533172607421875, 0.046112060546875, 0.05689239501953125, 0.0676727294921875, 0.07845306396484375, 0.0892333984375, 0.10001373291015625, 0.1107940673828125, 0.12157440185546875, 0.132354736328125, 0.14313507080078125, 0.1539154052734375, 0.16469573974609375, 0.17547607421875, 0.18625640869140625, 0.1970367431640625, 0.20781707763671875, 0.218597412109375, 0.22937774658203125, 0.2401580810546875, 0.25093841552734375, 0.26171875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 11.0, 5.0, 15.0, 10.0, 16.0, 24.0, 46.0, 43.0, 97.0, 125.0, 180.0, 346.0, 610.0, 1130.0, 2483.0, 6044.0, 18418.0, 74643.0, 1214298.0, 2741163.0, 98637.0, 22715.0, 7312.0, 2834.0, 1293.0, 676.0, 393.0, 229.0, 157.0, 93.0, 52.0, 53.0, 29.0, 30.0, 10.0, 20.0, 7.0, 2.0, 4.0, 4.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.23046875, -1.1908721923828125, -1.151275634765625, -1.1116790771484375, -1.07208251953125, -1.0324859619140625, -0.992889404296875, -0.9532928466796875, -0.9136962890625, -0.8740997314453125, -0.834503173828125, -0.7949066162109375, -0.75531005859375, -0.7157135009765625, -0.676116943359375, -0.6365203857421875, -0.596923828125, -0.5573272705078125, -0.517730712890625, -0.4781341552734375, -0.43853759765625, -0.3989410400390625, -0.359344482421875, -0.3197479248046875, -0.2801513671875, -0.2405548095703125, -0.200958251953125, -0.1613616943359375, -0.12176513671875, -0.0821685791015625, -0.042572021484375, -0.0029754638671875, 0.03662109375, 0.0762176513671875, 0.115814208984375, 0.1554107666015625, 0.19500732421875, 0.2346038818359375, 0.274200439453125, 0.3137969970703125, 0.3533935546875, 0.3929901123046875, 0.432586669921875, 0.4721832275390625, 0.51177978515625, 0.5513763427734375, 0.590972900390625, 0.6305694580078125, 0.670166015625, 0.7097625732421875, 0.749359130859375, 0.7889556884765625, 0.82855224609375, 0.8681488037109375, 0.907745361328125, 0.9473419189453125, 0.9869384765625, 1.0265350341796875, 1.066131591796875, 1.1057281494140625, 1.14532470703125, 1.1849212646484375, 1.224517822265625, 1.2641143798828125, 1.3037109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 5.0, 18.0, 14.0, 17.0, 32.0, 39.0, 61.0, 93.0, 191.0, 519.0, 1524.0, 816.0, 297.0, 149.0, 97.0, 52.0, 40.0, 28.0, 12.0, 10.0, 13.0, 12.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.378662109375, -0.3650016784667969, -0.35134124755859375, -0.3376808166503906, -0.3240203857421875, -0.3103599548339844, -0.29669952392578125, -0.2830390930175781, -0.269378662109375, -0.2557182312011719, -0.24205780029296875, -0.22839736938476562, -0.2147369384765625, -0.20107650756835938, -0.18741607666015625, -0.17375564575195312, -0.16009521484375, -0.14643478393554688, -0.13277435302734375, -0.11911392211914062, -0.1054534912109375, -0.09179306030273438, -0.07813262939453125, -0.06447219848632812, -0.050811767578125, -0.037151336669921875, -0.02349090576171875, -0.009830474853515625, 0.0038299560546875, 0.017490386962890625, 0.03115081787109375, 0.044811248779296875, 0.0584716796875, 0.07213211059570312, 0.08579254150390625, 0.09945297241210938, 0.1131134033203125, 0.12677383422851562, 0.14043426513671875, 0.15409469604492188, 0.167755126953125, 0.18141555786132812, 0.19507598876953125, 0.20873641967773438, 0.2223968505859375, 0.23605728149414062, 0.24971771240234375, 0.2633781433105469, 0.27703857421875, 0.2906990051269531, 0.30435943603515625, 0.3180198669433594, 0.3316802978515625, 0.3453407287597656, 0.35900115966796875, 0.3726615905761719, 0.386322021484375, 0.3999824523925781, 0.41364288330078125, 0.4273033142089844, 0.4409637451171875, 0.4546241760253906, 0.46828460693359375, 0.4819450378417969, 0.49560546875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 11.0, 19.0, 76.0, 303.0, 382.0, 163.0, 42.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4266514778137207, -2.1859872341156006, -1.9453227519989014, -1.7046585083007812, -1.4639941453933716, -1.223329782485962, -0.9826655387878418, -0.7420011758804321, -0.5013368129730225, -0.2606724798679352, -0.0200081467628479, 0.220656156539917, 0.46132051944732666, 0.7019848823547363, 0.9426491260528564, 1.1833134889602661, 1.4239778518676758, 1.6646422147750854, 1.9053065776824951, 2.1459708213806152, 2.3866353034973145, 2.6272995471954346, 2.8679637908935547, 3.108628273010254, 3.349292516708374, 3.589956760406494, 3.8306212425231934, 4.071285247802734, 4.311949729919434, 4.552614212036133, 4.793278694152832, 5.033942699432373, 5.274606704711914, 5.515271186828613, 5.755935192108154, 5.9965996742248535, 6.237264156341553, 6.477928161621094, 6.718592643737793, 6.959257125854492, 7.199921607971191, 7.440586090087891, 7.681250095367432, 7.921914577484131, 8.162578582763672, 8.403243064880371, 8.64390754699707, 8.88457202911377, 9.125236511230469, 9.365900993347168, 9.606565475463867, 9.84722900390625, 10.08789348602295, 10.328557968139648, 10.569222450256348, 10.809886932373047, 11.05055046081543, 11.291214942932129, 11.531879425048828, 11.772542953491211, 12.01320743560791, 12.25387191772461, 12.494536399841309, 12.735200881958008, 12.975865364074707]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 8.0, 11.0, 8.0, 11.0, 12.0, 22.0, 24.0, 28.0, 36.0, 49.0, 37.0, 49.0, 47.0, 50.0, 48.0, 54.0, 61.0, 54.0, 54.0, 52.0, 43.0, 45.0, 43.0, 26.0, 30.0, 28.0, 16.0, 19.0, 6.0, 8.0, 11.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4040803909301758, -1.3527841567993164, -1.301487922668457, -1.2501916885375977, -1.1988954544067383, -1.147599220275879, -1.09630286693573, -1.0450066328048706, -0.9937103986740112, -0.9424141645431519, -0.8911179304122925, -0.8398216366767883, -0.788525402545929, -0.7372291684150696, -0.6859328746795654, -0.634636640548706, -0.5833404064178467, -0.5320441722869873, -0.48074790835380554, -0.4294516444206238, -0.3781554102897644, -0.32685917615890503, -0.27556291222572327, -0.2242666482925415, -0.17297041416168213, -0.12167416512966156, -0.07037791609764099, -0.019081667065620422, 0.032214581966400146, 0.08351081609725952, 0.13480708003044128, 0.18610334396362305, 0.23739969730377197, 0.28869593143463135, 0.3399921953678131, 0.3912884593009949, 0.44258469343185425, 0.4938809275627136, 0.5451772212982178, 0.5964734554290771, 0.6477696895599365, 0.6990659236907959, 0.7503621578216553, 0.8016584515571594, 0.8529546856880188, 0.9042509198188782, 0.9555472135543823, 1.0068434476852417, 1.058139681816101, 1.1094359159469604, 1.1607321500778198, 1.2120283842086792, 1.2633247375488281, 1.3146209716796875, 1.3659172058105469, 1.4172134399414062, 1.4685096740722656, 1.519805908203125, 1.5711021423339844, 1.6223983764648438, 1.6736946105957031, 1.7249908447265625, 1.7762871980667114, 1.8275834321975708, 1.8788796663284302]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 13.0, 15.0, 13.0, 28.0, 45.0, 55.0, 91.0, 150.0, 277.0, 521.0, 1187.0, 3159.0, 12052.0, 77991.0, 585883.0, 321296.0, 34956.0, 6832.0, 2104.0, 866.0, 426.0, 216.0, 119.0, 72.0, 56.0, 33.0, 26.0, 15.0, 12.0, 10.0, 7.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7490234375, -1.6812591552734375, -1.613494873046875, -1.5457305908203125, -1.47796630859375, -1.4102020263671875, -1.342437744140625, -1.2746734619140625, -1.2069091796875, -1.1391448974609375, -1.071380615234375, -1.0036163330078125, -0.93585205078125, -0.8680877685546875, -0.800323486328125, -0.7325592041015625, -0.664794921875, -0.5970306396484375, -0.529266357421875, -0.4615020751953125, -0.39373779296875, -0.3259735107421875, -0.258209228515625, -0.1904449462890625, -0.1226806640625, -0.0549163818359375, 0.012847900390625, 0.0806121826171875, 0.14837646484375, 0.2161407470703125, 0.283905029296875, 0.3516693115234375, 0.41943359375, 0.4871978759765625, 0.554962158203125, 0.6227264404296875, 0.69049072265625, 0.7582550048828125, 0.826019287109375, 0.8937835693359375, 0.9615478515625, 1.0293121337890625, 1.097076416015625, 1.1648406982421875, 1.23260498046875, 1.3003692626953125, 1.368133544921875, 1.4358978271484375, 1.503662109375, 1.5714263916015625, 1.639190673828125, 1.7069549560546875, 1.77471923828125, 1.8424835205078125, 1.910247802734375, 1.9780120849609375, 2.0457763671875, 2.1135406494140625, 2.181304931640625, 2.2490692138671875, 2.31683349609375, 2.3845977783203125, 2.452362060546875, 2.5201263427734375, 2.587890625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 12.0, 12.0, 16.0, 25.0, 45.0, 60.0, 57.0, 79.0, 81.0, 92.0, 97.0, 77.0, 78.0, 76.0, 58.0, 43.0, 32.0, 20.0, 15.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.43359375, -0.4227867126464844, -0.41197967529296875, -0.4011726379394531, -0.3903656005859375, -0.3795585632324219, -0.36875152587890625, -0.3579444885253906, -0.347137451171875, -0.3363304138183594, -0.32552337646484375, -0.3147163391113281, -0.3039093017578125, -0.2931022644042969, -0.28229522705078125, -0.2714881896972656, -0.26068115234375, -0.24987411499023438, -0.23906707763671875, -0.22826004028320312, -0.2174530029296875, -0.20664596557617188, -0.19583892822265625, -0.18503189086914062, -0.174224853515625, -0.16341781616210938, -0.15261077880859375, -0.14180374145507812, -0.1309967041015625, -0.12018966674804688, -0.10938262939453125, -0.09857559204101562, -0.0877685546875, -0.07696151733398438, -0.06615447998046875, -0.055347442626953125, -0.0445404052734375, -0.033733367919921875, -0.02292633056640625, -0.012119293212890625, -0.001312255859375, 0.009494781494140625, 0.02030181884765625, 0.031108856201171875, 0.0419158935546875, 0.052722930908203125, 0.06352996826171875, 0.07433700561523438, 0.08514404296875, 0.09595108032226562, 0.10675811767578125, 0.11756515502929688, 0.1283721923828125, 0.13917922973632812, 0.14998626708984375, 0.16079330444335938, 0.171600341796875, 0.18240737915039062, 0.19321441650390625, 0.20402145385742188, 0.2148284912109375, 0.22563552856445312, 0.23644256591796875, 0.24724960327148438, 0.258056640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 7.0, 8.0, 5.0, 5.0, 8.0, 3.0, 6.0, 10.0, 10.0, 16.0, 38.0, 44.0, 82.0, 168.0, 283.0, 581.0, 1340.0, 3710.0, 11489.0, 44796.0, 206902.0, 510060.0, 206784.0, 44331.0, 11613.0, 3668.0, 1423.0, 545.0, 253.0, 132.0, 74.0, 50.0, 34.0, 20.0, 14.0, 15.0, 5.0, 8.0, 4.0, 6.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.98193359375, -0.9486465454101562, -0.9153594970703125, -0.8820724487304688, -0.848785400390625, -0.8154983520507812, -0.7822113037109375, -0.7489242553710938, -0.71563720703125, -0.6823501586914062, -0.6490631103515625, -0.6157760620117188, -0.582489013671875, -0.5492019653320312, -0.5159149169921875, -0.48262786865234375, -0.4493408203125, -0.41605377197265625, -0.3827667236328125, -0.34947967529296875, -0.316192626953125, -0.28290557861328125, -0.2496185302734375, -0.21633148193359375, -0.18304443359375, -0.14975738525390625, -0.1164703369140625, -0.08318328857421875, -0.049896240234375, -0.01660919189453125, 0.0166778564453125, 0.04996490478515625, 0.083251953125, 0.11653900146484375, 0.1498260498046875, 0.18311309814453125, 0.216400146484375, 0.24968719482421875, 0.2829742431640625, 0.31626129150390625, 0.34954833984375, 0.38283538818359375, 0.4161224365234375, 0.44940948486328125, 0.482696533203125, 0.5159835815429688, 0.5492706298828125, 0.5825576782226562, 0.6158447265625, 0.6491317749023438, 0.6824188232421875, 0.7157058715820312, 0.748992919921875, 0.7822799682617188, 0.8155670166015625, 0.8488540649414062, 0.88214111328125, 0.9154281616210938, 0.9487152099609375, 0.9820022583007812, 1.015289306640625, 1.0485763549804688, 1.0818634033203125, 1.1151504516601562, 1.1484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 0.0, 5.0, 2.0, 5.0, 5.0, 8.0, 5.0, 10.0, 14.0, 10.0, 17.0, 19.0, 19.0, 33.0, 28.0, 29.0, 26.0, 23.0, 43.0, 49.0, 35.0, 48.0, 47.0, 46.0, 41.0, 39.0, 46.0, 40.0, 43.0, 43.0, 33.0, 29.0, 24.0, 21.0, 17.0, 12.0, 18.0, 17.0, 8.0, 4.0, 12.0, 4.0, 8.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.814453125, -0.790679931640625, -0.76690673828125, -0.743133544921875, -0.7193603515625, -0.695587158203125, -0.67181396484375, -0.648040771484375, -0.624267578125, -0.600494384765625, -0.57672119140625, -0.552947998046875, -0.5291748046875, -0.505401611328125, -0.48162841796875, -0.457855224609375, -0.43408203125, -0.410308837890625, -0.38653564453125, -0.362762451171875, -0.3389892578125, -0.315216064453125, -0.29144287109375, -0.267669677734375, -0.243896484375, -0.220123291015625, -0.19635009765625, -0.172576904296875, -0.1488037109375, -0.125030517578125, -0.10125732421875, -0.077484130859375, -0.0537109375, -0.029937744140625, -0.00616455078125, 0.017608642578125, 0.0413818359375, 0.065155029296875, 0.08892822265625, 0.112701416015625, 0.136474609375, 0.160247802734375, 0.18402099609375, 0.207794189453125, 0.2315673828125, 0.255340576171875, 0.27911376953125, 0.302886962890625, 0.32666015625, 0.350433349609375, 0.37420654296875, 0.397979736328125, 0.4217529296875, 0.445526123046875, 0.46929931640625, 0.493072509765625, 0.516845703125, 0.540618896484375, 0.56439208984375, 0.588165283203125, 0.6119384765625, 0.635711669921875, 0.65948486328125, 0.683258056640625, 0.70703125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 1.0, 4.0, 4.0, 17.0, 21.0, 43.0, 60.0, 130.0, 277.0, 639.0, 1901.0, 8414.0, 70141.0, 717466.0, 226563.0, 17770.0, 3346.0, 941.0, 383.0, 167.0, 96.0, 59.0, 38.0, 25.0, 17.0, 4.0, 9.0, 9.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96875, -0.9381942749023438, -0.9076385498046875, -0.8770828247070312, -0.846527099609375, -0.8159713745117188, -0.7854156494140625, -0.7548599243164062, -0.72430419921875, -0.6937484741210938, -0.6631927490234375, -0.6326370239257812, -0.602081298828125, -0.5715255737304688, -0.5409698486328125, -0.5104141235351562, -0.4798583984375, -0.44930267333984375, -0.4187469482421875, -0.38819122314453125, -0.357635498046875, -0.32707977294921875, -0.2965240478515625, -0.26596832275390625, -0.23541259765625, -0.20485687255859375, -0.1743011474609375, -0.14374542236328125, -0.113189697265625, -0.08263397216796875, -0.0520782470703125, -0.02152252197265625, 0.009033203125, 0.03958892822265625, 0.0701446533203125, 0.10070037841796875, 0.131256103515625, 0.16181182861328125, 0.1923675537109375, 0.22292327880859375, 0.25347900390625, 0.28403472900390625, 0.3145904541015625, 0.34514617919921875, 0.375701904296875, 0.40625762939453125, 0.4368133544921875, 0.46736907958984375, 0.4979248046875, 0.5284805297851562, 0.5590362548828125, 0.5895919799804688, 0.620147705078125, 0.6507034301757812, 0.6812591552734375, 0.7118148803710938, 0.74237060546875, 0.7729263305664062, 0.8034820556640625, 0.8340377807617188, 0.864593505859375, 0.8951492309570312, 0.9257049560546875, 0.9562606811523438, 0.98681640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 7.0, 6.0, 6.0, 10.0, 12.0, 14.0, 31.0, 30.0, 50.0, 53.0, 73.0, 63.0, 84.0, 88.0, 92.0, 77.0, 74.0, 48.0, 50.0, 27.0, 22.0, 17.0, 14.0, 12.0, 11.0, 6.0, 5.0, 7.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00011146068572998047, -0.00010842457413673401, -0.00010538846254348755, -0.00010235235095024109, -9.931623935699463e-05, -9.628012776374817e-05, -9.324401617050171e-05, -9.020790457725525e-05, -8.717179298400879e-05, -8.413568139076233e-05, -8.109956979751587e-05, -7.806345820426941e-05, -7.502734661102295e-05, -7.199123501777649e-05, -6.895512342453003e-05, -6.591901183128357e-05, -6.288290023803711e-05, -5.984678864479065e-05, -5.681067705154419e-05, -5.377456545829773e-05, -5.073845386505127e-05, -4.770234227180481e-05, -4.466623067855835e-05, -4.163011908531189e-05, -3.859400749206543e-05, -3.555789589881897e-05, -3.252178430557251e-05, -2.948567271232605e-05, -2.644956111907959e-05, -2.341344952583313e-05, -2.037733793258667e-05, -1.734122633934021e-05, -1.430511474609375e-05, -1.126900315284729e-05, -8.23289155960083e-06, -5.19677996635437e-06, -2.16066837310791e-06, 8.754432201385498e-07, 3.91155481338501e-06, 6.94766640663147e-06, 9.98377799987793e-06, 1.301988959312439e-05, 1.605600118637085e-05, 1.909211277961731e-05, 2.212822437286377e-05, 2.516433596611023e-05, 2.820044755935669e-05, 3.123655915260315e-05, 3.427267074584961e-05, 3.730878233909607e-05, 4.034489393234253e-05, 4.338100552558899e-05, 4.641711711883545e-05, 4.945322871208191e-05, 5.248934030532837e-05, 5.552545189857483e-05, 5.856156349182129e-05, 6.159767508506775e-05, 6.463378667831421e-05, 6.766989827156067e-05, 7.070600986480713e-05, 7.374212145805359e-05, 7.677823305130005e-05, 7.981434464454651e-05, 8.285045623779297e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 8.0, 7.0, 14.0, 15.0, 30.0, 38.0, 61.0, 134.0, 238.0, 570.0, 1886.0, 9262.0, 107892.0, 785562.0, 129213.0, 10449.0, 2011.0, 632.0, 257.0, 109.0, 72.0, 39.0, 24.0, 13.0, 8.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60595703125, -0.5749282836914062, -0.5438995361328125, -0.5128707885742188, -0.481842041015625, -0.45081329345703125, -0.4197845458984375, -0.38875579833984375, -0.35772705078125, -0.32669830322265625, -0.2956695556640625, -0.26464080810546875, -0.233612060546875, -0.20258331298828125, -0.1715545654296875, -0.14052581787109375, -0.1094970703125, -0.07846832275390625, -0.0474395751953125, -0.01641082763671875, 0.014617919921875, 0.04564666748046875, 0.0766754150390625, 0.10770416259765625, 0.13873291015625, 0.16976165771484375, 0.2007904052734375, 0.23181915283203125, 0.262847900390625, 0.29387664794921875, 0.3249053955078125, 0.35593414306640625, 0.386962890625, 0.41799163818359375, 0.4490203857421875, 0.48004913330078125, 0.511077880859375, 0.5421066284179688, 0.5731353759765625, 0.6041641235351562, 0.63519287109375, 0.6662216186523438, 0.6972503662109375, 0.7282791137695312, 0.759307861328125, 0.7903366088867188, 0.8213653564453125, 0.8523941040039062, 0.8834228515625, 0.9144515991210938, 0.9454803466796875, 0.9765090942382812, 1.007537841796875, 1.0385665893554688, 1.0695953369140625, 1.1006240844726562, 1.13165283203125, 1.1626815795898438, 1.1937103271484375, 1.2247390747070312, 1.255767822265625, 1.2867965698242188, 1.3178253173828125, 1.3488540649414062, 1.3798828125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 5.0, 10.0, 14.0, 19.0, 16.0, 23.0, 24.0, 53.0, 45.0, 59.0, 90.0, 70.0, 87.0, 82.0, 65.0, 64.0, 61.0, 50.0, 52.0, 28.0, 18.0, 11.0, 15.0, 9.0, 8.0, 4.0, 6.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342529296875, -0.32982635498046875, -0.3171234130859375, -0.30442047119140625, -0.291717529296875, -0.27901458740234375, -0.2663116455078125, -0.25360870361328125, -0.24090576171875, -0.22820281982421875, -0.2154998779296875, -0.20279693603515625, -0.190093994140625, -0.17739105224609375, -0.1646881103515625, -0.15198516845703125, -0.1392822265625, -0.12657928466796875, -0.1138763427734375, -0.10117340087890625, -0.088470458984375, -0.07576751708984375, -0.0630645751953125, -0.05036163330078125, -0.03765869140625, -0.02495574951171875, -0.0122528076171875, 0.00045013427734375, 0.013153076171875, 0.02585601806640625, 0.0385589599609375, 0.05126190185546875, 0.06396484375, 0.07666778564453125, 0.0893707275390625, 0.10207366943359375, 0.114776611328125, 0.12747955322265625, 0.1401824951171875, 0.15288543701171875, 0.16558837890625, 0.17829132080078125, 0.1909942626953125, 0.20369720458984375, 0.216400146484375, 0.22910308837890625, 0.2418060302734375, 0.25450897216796875, 0.2672119140625, 0.27991485595703125, 0.2926177978515625, 0.30532073974609375, 0.318023681640625, 0.33072662353515625, 0.3434295654296875, 0.35613250732421875, 0.36883544921875, 0.38153839111328125, 0.3942413330078125, 0.40694427490234375, 0.419647216796875, 0.43235015869140625, 0.4450531005859375, 0.45775604248046875, 0.470458984375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 13.0, 36.0, 168.0, 315.0, 288.0, 115.0, 39.0, 10.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.353282928466797, -16.82286262512207, -16.29244041442871, -15.762019157409668, -15.231597900390625, -14.701176643371582, -14.170755386352539, -13.640335083007812, -13.109912872314453, -12.57949161529541, -12.049070358276367, -11.518649101257324, -10.988227844238281, -10.457806587219238, -9.927385330200195, -9.396965026855469, -8.866543769836426, -8.336122512817383, -7.80570125579834, -7.275279998779297, -6.744858741760254, -6.214437484741211, -5.684016704559326, -5.153595447540283, -4.62317419052124, -4.092752933502197, -3.5623316764831543, -3.0319106578826904, -2.5014894008636475, -1.9710681438446045, -1.4406471252441406, -0.9102258682250977, -0.3798046112060547, 0.1506165862083435, 0.6810377836227417, 1.2114589214324951, 1.741880178451538, 2.272301435470581, 2.802722454071045, 3.333143711090088, 3.863564968109131, 4.393986225128174, 4.924407482147217, 5.454828262329102, 5.9852495193481445, 6.5156707763671875, 7.0460920333862305, 7.576513290405273, 8.106934547424316, 8.63735580444336, 9.167777061462402, 9.698198318481445, 10.228619575500488, 10.759040832519531, 11.289461135864258, 11.819883346557617, 12.350303649902344, 12.880724906921387, 13.41114616394043, 13.941567420959473, 14.471988677978516, 15.002409934997559, 15.532831192016602, 16.063251495361328, 16.593673706054688]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 7.0, 9.0, 8.0, 10.0, 19.0, 15.0, 19.0, 22.0, 27.0, 36.0, 35.0, 43.0, 42.0, 44.0, 42.0, 59.0, 49.0, 39.0, 43.0, 48.0, 54.0, 54.0, 45.0, 31.0, 35.0, 20.0, 27.0, 15.0, 21.0, 17.0, 13.0, 14.0, 10.0, 6.0, 3.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.109270095825195, -4.95625114440918, -4.803232192993164, -4.650213241577148, -4.497194290161133, -4.344175338745117, -4.191156387329102, -4.038137435913086, -3.8851184844970703, -3.7320995330810547, -3.579080581665039, -3.4260616302490234, -3.273042678833008, -3.120023727416992, -2.9670047760009766, -2.813985824584961, -2.6609668731689453, -2.5079479217529297, -2.354928970336914, -2.2019100189208984, -2.048891067504883, -1.8958721160888672, -1.7428531646728516, -1.589834213256836, -1.4368152618408203, -1.2837963104248047, -1.130777359008789, -0.9777584075927734, -0.8247394561767578, -0.6717205047607422, -0.5187015533447266, -0.36568260192871094, -0.2126631736755371, -0.059644222259521484, 0.09337472915649414, 0.24639368057250977, 0.3994126319885254, 0.552431583404541, 0.7054505348205566, 0.8584694862365723, 1.011488437652588, 1.1645073890686035, 1.3175263404846191, 1.4705452919006348, 1.6235642433166504, 1.776583194732666, 1.9296021461486816, 2.0826210975646973, 2.235640048980713, 2.3886590003967285, 2.541677951812744, 2.6946969032287598, 2.8477158546447754, 3.000734806060791, 3.1537537574768066, 3.3067727088928223, 3.459791660308838, 3.6128106117248535, 3.765829563140869, 3.9188485145568848, 4.0718674659729, 4.224886417388916, 4.377905368804932, 4.530924320220947, 4.683943271636963]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 6.0, 10.0, 5.0, 8.0, 6.0, 13.0, 15.0, 19.0, 29.0, 36.0, 26.0, 49.0, 57.0, 79.0, 121.0, 172.0, 274.0, 452.0, 857.0, 1950.0, 4645.0, 12776.0, 53479.0, 3325528.0, 737903.0, 37828.0, 10382.0, 3959.0, 1663.0, 816.0, 439.0, 244.0, 163.0, 81.0, 63.0, 42.0, 25.0, 21.0, 10.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.779296875, -2.7129669189453125, -2.646636962890625, -2.5803070068359375, -2.51397705078125, -2.4476470947265625, -2.381317138671875, -2.3149871826171875, -2.2486572265625, -2.1823272705078125, -2.115997314453125, -2.0496673583984375, -1.98333740234375, -1.9170074462890625, -1.850677490234375, -1.7843475341796875, -1.718017578125, -1.6516876220703125, -1.585357666015625, -1.5190277099609375, -1.45269775390625, -1.3863677978515625, -1.320037841796875, -1.2537078857421875, -1.1873779296875, -1.1210479736328125, -1.054718017578125, -0.9883880615234375, -0.92205810546875, -0.8557281494140625, -0.789398193359375, -0.7230682373046875, -0.65673828125, -0.5904083251953125, -0.524078369140625, -0.4577484130859375, -0.39141845703125, -0.3250885009765625, -0.258758544921875, -0.1924285888671875, -0.1260986328125, -0.0597686767578125, 0.006561279296875, 0.0728912353515625, 0.13922119140625, 0.2055511474609375, 0.271881103515625, 0.3382110595703125, 0.404541015625, 0.4708709716796875, 0.537200927734375, 0.6035308837890625, 0.66986083984375, 0.7361907958984375, 0.802520751953125, 0.8688507080078125, 0.9351806640625, 1.0015106201171875, 1.067840576171875, 1.1341705322265625, 1.20050048828125, 1.2668304443359375, 1.333160400390625, 1.3994903564453125, 1.4658203125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 4.0, 9.0, 14.0, 15.0, 29.0, 38.0, 36.0, 39.0, 65.0, 64.0, 69.0, 71.0, 90.0, 81.0, 73.0, 53.0, 45.0, 50.0, 43.0, 35.0, 18.0, 13.0, 18.0, 9.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.3876953125, -0.377593994140625, -0.36749267578125, -0.357391357421875, -0.3472900390625, -0.337188720703125, -0.32708740234375, -0.316986083984375, -0.306884765625, -0.296783447265625, -0.28668212890625, -0.276580810546875, -0.2664794921875, -0.256378173828125, -0.24627685546875, -0.236175537109375, -0.22607421875, -0.215972900390625, -0.20587158203125, -0.195770263671875, -0.1856689453125, -0.175567626953125, -0.16546630859375, -0.155364990234375, -0.145263671875, -0.135162353515625, -0.12506103515625, -0.114959716796875, -0.1048583984375, -0.094757080078125, -0.08465576171875, -0.074554443359375, -0.064453125, -0.054351806640625, -0.04425048828125, -0.034149169921875, -0.0240478515625, -0.013946533203125, -0.00384521484375, 0.006256103515625, 0.016357421875, 0.026458740234375, 0.03656005859375, 0.046661376953125, 0.0567626953125, 0.066864013671875, 0.07696533203125, 0.087066650390625, 0.09716796875, 0.107269287109375, 0.11737060546875, 0.127471923828125, 0.1375732421875, 0.147674560546875, 0.15777587890625, 0.167877197265625, 0.177978515625, 0.188079833984375, 0.19818115234375, 0.208282470703125, 0.2183837890625, 0.228485107421875, 0.23858642578125, 0.248687744140625, 0.2587890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 10.0, 9.0, 10.0, 29.0, 42.0, 53.0, 97.0, 146.0, 261.0, 569.0, 1415.0, 4227.0, 17258.0, 161839.0, 3851704.0, 134432.0, 15570.0, 4133.0, 1331.0, 528.0, 274.0, 126.0, 74.0, 49.0, 35.0, 17.0, 13.0, 13.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.8515625, -2.782806396484375, -2.71405029296875, -2.645294189453125, -2.5765380859375, -2.507781982421875, -2.43902587890625, -2.370269775390625, -2.301513671875, -2.232757568359375, -2.16400146484375, -2.095245361328125, -2.0264892578125, -1.957733154296875, -1.88897705078125, -1.820220947265625, -1.75146484375, -1.682708740234375, -1.61395263671875, -1.545196533203125, -1.4764404296875, -1.407684326171875, -1.33892822265625, -1.270172119140625, -1.201416015625, -1.132659912109375, -1.06390380859375, -0.995147705078125, -0.9263916015625, -0.857635498046875, -0.78887939453125, -0.720123291015625, -0.6513671875, -0.582611083984375, -0.51385498046875, -0.445098876953125, -0.3763427734375, -0.307586669921875, -0.23883056640625, -0.170074462890625, -0.101318359375, -0.032562255859375, 0.03619384765625, 0.104949951171875, 0.1737060546875, 0.242462158203125, 0.31121826171875, 0.379974365234375, 0.44873046875, 0.517486572265625, 0.58624267578125, 0.654998779296875, 0.7237548828125, 0.792510986328125, 0.86126708984375, 0.930023193359375, 0.998779296875, 1.067535400390625, 1.13629150390625, 1.205047607421875, 1.2738037109375, 1.342559814453125, 1.41131591796875, 1.480072021484375, 1.548828125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 12.0, 9.0, 11.0, 12.0, 15.0, 21.0, 39.0, 61.0, 92.0, 157.0, 335.0, 939.0, 1501.0, 441.0, 171.0, 101.0, 54.0, 30.0, 16.0, 9.0, 15.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.73681640625, -0.7169952392578125, -0.697174072265625, -0.6773529052734375, -0.65753173828125, -0.6377105712890625, -0.617889404296875, -0.5980682373046875, -0.5782470703125, -0.5584259033203125, -0.538604736328125, -0.5187835693359375, -0.49896240234375, -0.4791412353515625, -0.459320068359375, -0.4394989013671875, -0.419677734375, -0.3998565673828125, -0.380035400390625, -0.3602142333984375, -0.34039306640625, -0.3205718994140625, -0.300750732421875, -0.2809295654296875, -0.2611083984375, -0.2412872314453125, -0.221466064453125, -0.2016448974609375, -0.18182373046875, -0.1620025634765625, -0.142181396484375, -0.1223602294921875, -0.1025390625, -0.0827178955078125, -0.062896728515625, -0.0430755615234375, -0.02325439453125, -0.0034332275390625, 0.016387939453125, 0.0362091064453125, 0.0560302734375, 0.0758514404296875, 0.095672607421875, 0.1154937744140625, 0.13531494140625, 0.1551361083984375, 0.174957275390625, 0.1947784423828125, 0.214599609375, 0.2344207763671875, 0.254241943359375, 0.2740631103515625, 0.29388427734375, 0.3137054443359375, 0.333526611328125, 0.3533477783203125, 0.3731689453125, 0.3929901123046875, 0.412811279296875, 0.4326324462890625, 0.45245361328125, 0.4722747802734375, 0.492095947265625, 0.5119171142578125, 0.53173828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 6.0, 16.0, 36.0, 62.0, 96.0, 186.0, 221.0, 162.0, 122.0, 45.0, 19.0, 7.0, 8.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.845273971557617, -5.666065692901611, -5.486856937408447, -5.307648658752441, -5.1284403800964355, -4.94923210144043, -4.770023345947266, -4.59081506729126, -4.411606788635254, -4.232398509979248, -4.053189754486084, -3.873981475830078, -3.6947731971740723, -3.5155646800994873, -3.3363561630249023, -3.1571478843688965, -2.9779391288757324, -2.7987306118011475, -2.6195223331451416, -2.4403138160705566, -2.261105537414551, -2.081897020339966, -1.9026885032653809, -1.7234801054000854, -1.54427170753479, -1.3650633096694946, -1.1858549118041992, -1.0066463947296143, -0.8274379968643188, -0.6482295989990234, -0.4690210819244385, -0.28981268405914307, -0.11060380935668945, 0.06860461831092834, 0.24781304597854614, 0.42702150344848633, 0.6062299013137817, 0.7854382991790771, 0.9646468162536621, 1.1438552141189575, 1.323063611984253, 1.5022720098495483, 1.6814804077148438, 1.8606889247894287, 2.0398974418640137, 2.2191057205200195, 2.3983142375946045, 2.5775227546691895, 2.7567310333251953, 2.9359395503997803, 3.115147829055786, 3.294356346130371, 3.473564624786377, 3.652773141860962, 3.831981658935547, 4.011189937591553, 4.190398216247559, 4.3696064949035645, 4.5488152503967285, 4.728023529052734, 4.90723180770874, 5.086440086364746, 5.26564884185791, 5.444857120513916, 5.62406587600708]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 3.0, 0.0, 2.0, 3.0, 13.0, 6.0, 12.0, 17.0, 21.0, 24.0, 40.0, 45.0, 49.0, 46.0, 66.0, 53.0, 62.0, 59.0, 57.0, 68.0, 76.0, 57.0, 42.0, 49.0, 43.0, 27.0, 19.0, 14.0, 13.0, 9.0, 2.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.837348222732544, -1.7499698400497437, -1.6625914573669434, -1.5752129554748535, -1.4878345727920532, -1.400456190109253, -1.3130778074264526, -1.2256994247436523, -1.1383209228515625, -1.0509425401687622, -0.9635640978813171, -0.8761857151985168, -0.7888072729110718, -0.7014288902282715, -0.6140505075454712, -0.5266720652580261, -0.4392937421798706, -0.3519153296947479, -0.26453691720962524, -0.17715853452682495, -0.08978012204170227, -0.00240170955657959, 0.0849766731262207, 0.17235511541366577, 0.25973349809646606, 0.34711191058158875, 0.4344903230667114, 0.5218687057495117, 0.609247088432312, 0.6966255307197571, 0.7840039134025574, 0.8713823556900024, 0.9587607383728027, 1.046139121055603, 1.1335175037384033, 1.2208960056304932, 1.3082743883132935, 1.3956527709960938, 1.483031153678894, 1.5704095363616943, 1.6577880382537842, 1.7451664209365845, 1.8325448036193848, 1.9199233055114746, 2.0073015689849854, 2.094680070877075, 2.182058334350586, 2.269436836242676, 2.3568153381347656, 2.4441938400268555, 2.531572103500366, 2.618950605392456, 2.706328868865967, 2.7937073707580566, 2.8810858726501465, 2.9684641361236572, 3.055842399597168, 3.143220901489258, 3.2305991649627686, 3.3179776668548584, 3.405355930328369, 3.492734432220459, 3.580112934112549, 3.6674911975860596, 3.7548696994781494]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 6.0, 7.0, 8.0, 16.0, 23.0, 35.0, 48.0, 66.0, 141.0, 323.0, 697.0, 1792.0, 6236.0, 33286.0, 455555.0, 503910.0, 36421.0, 6647.0, 1953.0, 682.0, 285.0, 157.0, 84.0, 60.0, 32.0, 28.0, 15.0, 10.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.90234375, -2.823944091796875, -2.74554443359375, -2.667144775390625, -2.5887451171875, -2.510345458984375, -2.43194580078125, -2.353546142578125, -2.275146484375, -2.196746826171875, -2.11834716796875, -2.039947509765625, -1.9615478515625, -1.883148193359375, -1.80474853515625, -1.726348876953125, -1.64794921875, -1.569549560546875, -1.49114990234375, -1.412750244140625, -1.3343505859375, -1.255950927734375, -1.17755126953125, -1.099151611328125, -1.020751953125, -0.942352294921875, -0.86395263671875, -0.785552978515625, -0.7071533203125, -0.628753662109375, -0.55035400390625, -0.471954345703125, -0.3935546875, -0.315155029296875, -0.23675537109375, -0.158355712890625, -0.0799560546875, -0.001556396484375, 0.07684326171875, 0.155242919921875, 0.233642578125, 0.312042236328125, 0.39044189453125, 0.468841552734375, 0.5472412109375, 0.625640869140625, 0.70404052734375, 0.782440185546875, 0.86083984375, 0.939239501953125, 1.01763916015625, 1.096038818359375, 1.1744384765625, 1.252838134765625, 1.33123779296875, 1.409637451171875, 1.488037109375, 1.566436767578125, 1.64483642578125, 1.723236083984375, 1.8016357421875, 1.880035400390625, 1.95843505859375, 2.036834716796875, 2.115234375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 11.0, 11.0, 13.0, 13.0, 25.0, 43.0, 45.0, 46.0, 49.0, 71.0, 55.0, 82.0, 92.0, 74.0, 77.0, 60.0, 53.0, 44.0, 46.0, 22.0, 22.0, 14.0, 11.0, 12.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.412353515625, -0.4012794494628906, -0.39020538330078125, -0.3791313171386719, -0.3680572509765625, -0.3569831848144531, -0.34590911865234375, -0.3348350524902344, -0.323760986328125, -0.3126869201660156, -0.30161285400390625, -0.2905387878417969, -0.2794647216796875, -0.2683906555175781, -0.25731658935546875, -0.24624252319335938, -0.23516845703125, -0.22409439086914062, -0.21302032470703125, -0.20194625854492188, -0.1908721923828125, -0.17979812622070312, -0.16872406005859375, -0.15764999389648438, -0.146575927734375, -0.13550186157226562, -0.12442779541015625, -0.11335372924804688, -0.1022796630859375, -0.09120559692382812, -0.08013153076171875, -0.06905746459960938, -0.0579833984375, -0.046909332275390625, -0.03583526611328125, -0.024761199951171875, -0.0136871337890625, -0.002613067626953125, 0.00846099853515625, 0.019535064697265625, 0.030609130859375, 0.041683197021484375, 0.05275726318359375, 0.06383132934570312, 0.0749053955078125, 0.08597946166992188, 0.09705352783203125, 0.10812759399414062, 0.11920166015625, 0.13027572631835938, 0.14134979248046875, 0.15242385864257812, 0.1634979248046875, 0.17457199096679688, 0.18564605712890625, 0.19672012329101562, 0.207794189453125, 0.21886825561523438, 0.22994232177734375, 0.24101638793945312, 0.2520904541015625, 0.2631645202636719, 0.27423858642578125, 0.2853126525878906, 0.29638671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 6.0, 8.0, 11.0, 21.0, 31.0, 36.0, 52.0, 110.0, 186.0, 386.0, 948.0, 2782.0, 10089.0, 54059.0, 419163.0, 480419.0, 63717.0, 11435.0, 3022.0, 1041.0, 444.0, 212.0, 98.0, 57.0, 50.0, 28.0, 21.0, 14.0, 15.0, 14.0, 10.0, 10.0, 7.0, 11.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5634765625, -1.517547607421875, -1.47161865234375, -1.425689697265625, -1.3797607421875, -1.333831787109375, -1.28790283203125, -1.241973876953125, -1.196044921875, -1.150115966796875, -1.10418701171875, -1.058258056640625, -1.0123291015625, -0.966400146484375, -0.92047119140625, -0.874542236328125, -0.82861328125, -0.782684326171875, -0.73675537109375, -0.690826416015625, -0.6448974609375, -0.598968505859375, -0.55303955078125, -0.507110595703125, -0.461181640625, -0.415252685546875, -0.36932373046875, -0.323394775390625, -0.2774658203125, -0.231536865234375, -0.18560791015625, -0.139678955078125, -0.09375, -0.047821044921875, -0.00189208984375, 0.044036865234375, 0.0899658203125, 0.135894775390625, 0.18182373046875, 0.227752685546875, 0.273681640625, 0.319610595703125, 0.36553955078125, 0.411468505859375, 0.4573974609375, 0.503326416015625, 0.54925537109375, 0.595184326171875, 0.64111328125, 0.687042236328125, 0.73297119140625, 0.778900146484375, 0.8248291015625, 0.870758056640625, 0.91668701171875, 0.962615966796875, 1.008544921875, 1.054473876953125, 1.10040283203125, 1.146331787109375, 1.1922607421875, 1.238189697265625, 1.28411865234375, 1.330047607421875, 1.3759765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 7.0, 3.0, 5.0, 11.0, 13.0, 15.0, 22.0, 28.0, 24.0, 27.0, 28.0, 30.0, 40.0, 54.0, 68.0, 48.0, 39.0, 70.0, 47.0, 74.0, 54.0, 48.0, 44.0, 38.0, 29.0, 20.0, 23.0, 16.0, 16.0, 15.0, 13.0, 5.0, 6.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.978515625, -0.9448089599609375, -0.911102294921875, -0.8773956298828125, -0.84368896484375, -0.8099822998046875, -0.776275634765625, -0.7425689697265625, -0.7088623046875, -0.6751556396484375, -0.641448974609375, -0.6077423095703125, -0.57403564453125, -0.5403289794921875, -0.506622314453125, -0.4729156494140625, -0.439208984375, -0.4055023193359375, -0.371795654296875, -0.3380889892578125, -0.30438232421875, -0.2706756591796875, -0.236968994140625, -0.2032623291015625, -0.1695556640625, -0.1358489990234375, -0.102142333984375, -0.0684356689453125, -0.03472900390625, -0.0010223388671875, 0.032684326171875, 0.0663909912109375, 0.10009765625, 0.1338043212890625, 0.167510986328125, 0.2012176513671875, 0.23492431640625, 0.2686309814453125, 0.302337646484375, 0.3360443115234375, 0.3697509765625, 0.4034576416015625, 0.437164306640625, 0.4708709716796875, 0.50457763671875, 0.5382843017578125, 0.571990966796875, 0.6056976318359375, 0.639404296875, 0.6731109619140625, 0.706817626953125, 0.7405242919921875, 0.77423095703125, 0.8079376220703125, 0.841644287109375, 0.8753509521484375, 0.9090576171875, 0.9427642822265625, 0.976470947265625, 1.0101776123046875, 1.04388427734375, 1.0775909423828125, 1.111297607421875, 1.1450042724609375, 1.1787109375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 7.0, 16.0, 44.0, 88.0, 209.0, 818.0, 17675.0, 1022860.0, 6027.0, 510.0, 158.0, 88.0, 28.0, 12.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.51171875, -3.3785400390625, -3.245361328125, -3.1121826171875, -2.97900390625, -2.8458251953125, -2.712646484375, -2.5794677734375, -2.4462890625, -2.3131103515625, -2.179931640625, -2.0467529296875, -1.91357421875, -1.7803955078125, -1.647216796875, -1.5140380859375, -1.380859375, -1.2476806640625, -1.114501953125, -0.9813232421875, -0.84814453125, -0.7149658203125, -0.581787109375, -0.4486083984375, -0.3154296875, -0.1822509765625, -0.049072265625, 0.0841064453125, 0.21728515625, 0.3504638671875, 0.483642578125, 0.6168212890625, 0.75, 0.8831787109375, 1.016357421875, 1.1495361328125, 1.28271484375, 1.4158935546875, 1.549072265625, 1.6822509765625, 1.8154296875, 1.9486083984375, 2.081787109375, 2.2149658203125, 2.34814453125, 2.4813232421875, 2.614501953125, 2.7476806640625, 2.880859375, 3.0140380859375, 3.147216796875, 3.2803955078125, 3.41357421875, 3.5467529296875, 3.679931640625, 3.8131103515625, 3.9462890625, 4.0794677734375, 4.212646484375, 4.3458251953125, 4.47900390625, 4.6121826171875, 4.745361328125, 4.8785400390625, 5.01171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 18.0, 22.0, 39.0, 72.0, 114.0, 167.0, 213.0, 135.0, 87.0, 42.0, 33.0, 22.0, 11.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002493858337402344, -0.00024287402629852295, -0.00023636221885681152, -0.0002298504114151001, -0.00022333860397338867, -0.00021682679653167725, -0.00021031498908996582, -0.0002038031816482544, -0.00019729137420654297, -0.00019077956676483154, -0.00018426775932312012, -0.0001777559518814087, -0.00017124414443969727, -0.00016473233699798584, -0.00015822052955627441, -0.000151708722114563, -0.00014519691467285156, -0.00013868510723114014, -0.0001321732997894287, -0.00012566149234771729, -0.00011914968490600586, -0.00011263787746429443, -0.00010612607002258301, -9.961426258087158e-05, -9.310245513916016e-05, -8.659064769744873e-05, -8.00788402557373e-05, -7.356703281402588e-05, -6.705522537231445e-05, -6.054341793060303e-05, -5.40316104888916e-05, -4.7519803047180176e-05, -4.100799560546875e-05, -3.4496188163757324e-05, -2.79843807220459e-05, -2.1472573280334473e-05, -1.4960765838623047e-05, -8.448958396911621e-06, -1.9371509552001953e-06, 4.5746564865112305e-06, 1.1086463928222656e-05, 1.7598271369934082e-05, 2.4110078811645508e-05, 3.0621886253356934e-05, 3.713369369506836e-05, 4.3645501136779785e-05, 5.015730857849121e-05, 5.666911602020264e-05, 6.318092346191406e-05, 6.969273090362549e-05, 7.620453834533691e-05, 8.271634578704834e-05, 8.922815322875977e-05, 9.573996067047119e-05, 0.00010225176811218262, 0.00010876357555389404, 0.00011527538299560547, 0.0001217871904373169, 0.00012829899787902832, 0.00013481080532073975, 0.00014132261276245117, 0.0001478344202041626, 0.00015434622764587402, 0.00016085803508758545, 0.00016736984252929688]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 20.0, 52.0, 80.0, 199.0, 621.0, 8565.0, 1030102.0, 7949.0, 623.0, 181.0, 69.0, 43.0, 24.0, 12.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.7421875, -4.6005859375, -4.458984375, -4.3173828125, -4.17578125, -4.0341796875, -3.892578125, -3.7509765625, -3.609375, -3.4677734375, -3.326171875, -3.1845703125, -3.04296875, -2.9013671875, -2.759765625, -2.6181640625, -2.4765625, -2.3349609375, -2.193359375, -2.0517578125, -1.91015625, -1.7685546875, -1.626953125, -1.4853515625, -1.34375, -1.2021484375, -1.060546875, -0.9189453125, -0.77734375, -0.6357421875, -0.494140625, -0.3525390625, -0.2109375, -0.0693359375, 0.072265625, 0.2138671875, 0.35546875, 0.4970703125, 0.638671875, 0.7802734375, 0.921875, 1.0634765625, 1.205078125, 1.3466796875, 1.48828125, 1.6298828125, 1.771484375, 1.9130859375, 2.0546875, 2.1962890625, 2.337890625, 2.4794921875, 2.62109375, 2.7626953125, 2.904296875, 3.0458984375, 3.1875, 3.3291015625, 3.470703125, 3.6123046875, 3.75390625, 3.8955078125, 4.037109375, 4.1787109375, 4.3203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 24.0, 96.0, 417.0, 339.0, 85.0, 26.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.513671875, -2.4324951171875, -2.351318359375, -2.2701416015625, -2.18896484375, -2.1077880859375, -2.026611328125, -1.9454345703125, -1.8642578125, -1.7830810546875, -1.701904296875, -1.6207275390625, -1.53955078125, -1.4583740234375, -1.377197265625, -1.2960205078125, -1.21484375, -1.1336669921875, -1.052490234375, -0.9713134765625, -0.89013671875, -0.8089599609375, -0.727783203125, -0.6466064453125, -0.5654296875, -0.4842529296875, -0.403076171875, -0.3218994140625, -0.24072265625, -0.1595458984375, -0.078369140625, 0.0028076171875, 0.083984375, 0.1651611328125, 0.246337890625, 0.3275146484375, 0.40869140625, 0.4898681640625, 0.571044921875, 0.6522216796875, 0.7333984375, 0.8145751953125, 0.895751953125, 0.9769287109375, 1.05810546875, 1.1392822265625, 1.220458984375, 1.3016357421875, 1.3828125, 1.4639892578125, 1.545166015625, 1.6263427734375, 1.70751953125, 1.7886962890625, 1.869873046875, 1.9510498046875, 2.0322265625, 2.1134033203125, 2.194580078125, 2.2757568359375, 2.35693359375, 2.4381103515625, 2.519287109375, 2.6004638671875, 2.681640625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 8.0, 26.0, 86.0, 277.0, 347.0, 171.0, 63.0, 17.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-37.4338264465332, -36.72834777832031, -36.02286911010742, -35.31739044189453, -34.61191177368164, -33.90643310546875, -33.200950622558594, -32.4954719543457, -31.789993286132812, -31.084514617919922, -30.37903594970703, -29.67355728149414, -28.968076705932617, -28.262598037719727, -27.557119369506836, -26.851640701293945, -26.146162033081055, -25.440683364868164, -24.735204696655273, -24.02972412109375, -23.32424545288086, -22.61876678466797, -21.913288116455078, -21.207809448242188, -20.502330780029297, -19.796852111816406, -19.091373443603516, -18.385894775390625, -17.6804141998291, -16.97493553161621, -16.26945686340332, -15.56397819519043, -14.858497619628906, -14.153018951416016, -13.447539329528809, -12.742060661315918, -12.036581039428711, -11.33110237121582, -10.62562370300293, -9.920145034790039, -9.214665412902832, -8.509186744689941, -7.803707122802734, -7.098228454589844, -6.392749309539795, -5.687270164489746, -4.9817914962768555, -4.276312351226807, -3.570833206176758, -2.865354061126709, -2.1598751544952393, -1.4543962478637695, -0.7489171028137207, -0.043437957763671875, 0.6620407104492188, 1.3675198554992676, 2.0729990005493164, 2.7784781455993652, 3.483957052230835, 4.189435958862305, 4.8949151039123535, 5.600394248962402, 6.305872917175293, 7.011352062225342, 7.716831207275391]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 3.0, 7.0, 6.0, 13.0, 17.0, 4.0, 13.0, 24.0, 17.0, 24.0, 27.0, 28.0, 30.0, 38.0, 43.0, 44.0, 50.0, 41.0, 38.0, 53.0, 36.0, 39.0, 44.0, 36.0, 36.0, 39.0, 34.0, 35.0, 27.0, 18.0, 18.0, 19.0, 16.0, 15.0, 7.0, 14.0, 11.0, 5.0, 6.0, 3.0, 3.0, 2.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.314615726470947, -5.158224582672119, -5.001832962036133, -4.845441818237305, -4.689050674438477, -4.532659530639648, -4.376267910003662, -4.219876766204834, -4.063485145568848, -3.9070937633514404, -3.7507026195526123, -3.594311237335205, -3.437920093536377, -3.2815287113189697, -3.1251373291015625, -2.9687461853027344, -2.8123550415039062, -2.655963659286499, -2.499572515487671, -2.3431811332702637, -2.1867899894714355, -2.0303986072540283, -1.874007225036621, -1.7176159620285034, -1.5612246990203857, -1.404833436012268, -1.2484421730041504, -1.0920507907867432, -0.9356595277786255, -0.7792682647705078, -0.6228769421577454, -0.4664856195449829, -0.31009387969970703, -0.15370258688926697, 0.0026887059211730957, 0.15907999873161316, 0.3154712915420532, 0.4718625545501709, 0.6282538771629333, 0.7846451997756958, 0.9410364627838135, 1.0974277257919312, 1.2538189888000488, 1.410210371017456, 1.5666016340255737, 1.7229928970336914, 1.8793842792510986, 2.035775661468506, 2.192166805267334, 2.348558187484741, 2.5049493312835693, 2.6613407135009766, 2.8177318572998047, 2.974123239517212, 3.130514621734619, 3.2869057655334473, 3.4432971477508545, 3.5996885299682617, 3.75607967376709, 3.912471055984497, 4.068862438201904, 4.225253582000732, 4.3816447257995605, 4.538036346435547, 4.694427490234375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 8.0, 11.0, 14.0, 18.0, 21.0, 35.0, 56.0, 74.0, 137.0, 215.0, 485.0, 1201.0, 3802.0, 16340.0, 201843.0, 3913791.0, 44584.0, 7808.0, 2276.0, 829.0, 335.0, 177.0, 88.0, 51.0, 31.0, 19.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.642578125, -3.554290771484375, -3.46600341796875, -3.377716064453125, -3.2894287109375, -3.201141357421875, -3.11285400390625, -3.024566650390625, -2.936279296875, -2.847991943359375, -2.75970458984375, -2.671417236328125, -2.5831298828125, -2.494842529296875, -2.40655517578125, -2.318267822265625, -2.22998046875, -2.141693115234375, -2.05340576171875, -1.965118408203125, -1.8768310546875, -1.788543701171875, -1.70025634765625, -1.611968994140625, -1.523681640625, -1.435394287109375, -1.34710693359375, -1.258819580078125, -1.1705322265625, -1.082244873046875, -0.99395751953125, -0.905670166015625, -0.8173828125, -0.729095458984375, -0.64080810546875, -0.552520751953125, -0.4642333984375, -0.375946044921875, -0.28765869140625, -0.199371337890625, -0.111083984375, -0.022796630859375, 0.06549072265625, 0.153778076171875, 0.2420654296875, 0.330352783203125, 0.41864013671875, 0.506927490234375, 0.59521484375, 0.683502197265625, 0.77178955078125, 0.860076904296875, 0.9483642578125, 1.036651611328125, 1.12493896484375, 1.213226318359375, 1.301513671875, 1.389801025390625, 1.47808837890625, 1.566375732421875, 1.6546630859375, 1.742950439453125, 1.83123779296875, 1.919525146484375, 2.0078125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 5.0, 13.0, 17.0, 21.0, 20.0, 21.0, 33.0, 42.0, 50.0, 67.0, 65.0, 57.0, 62.0, 68.0, 62.0, 70.0, 60.0, 61.0, 52.0, 30.0, 28.0, 29.0, 25.0, 11.0, 13.0, 8.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.440673828125, -0.42914581298828125, -0.4176177978515625, -0.40608978271484375, -0.394561767578125, -0.38303375244140625, -0.3715057373046875, -0.35997772216796875, -0.34844970703125, -0.33692169189453125, -0.3253936767578125, -0.31386566162109375, -0.302337646484375, -0.29080963134765625, -0.2792816162109375, -0.26775360107421875, -0.2562255859375, -0.24469757080078125, -0.2331695556640625, -0.22164154052734375, -0.210113525390625, -0.19858551025390625, -0.1870574951171875, -0.17552947998046875, -0.16400146484375, -0.15247344970703125, -0.1409454345703125, -0.12941741943359375, -0.117889404296875, -0.10636138916015625, -0.0948333740234375, -0.08330535888671875, -0.07177734375, -0.06024932861328125, -0.0487213134765625, -0.03719329833984375, -0.025665283203125, -0.01413726806640625, -0.0026092529296875, 0.00891876220703125, 0.02044677734375, 0.03197479248046875, 0.0435028076171875, 0.05503082275390625, 0.066558837890625, 0.07808685302734375, 0.0896148681640625, 0.10114288330078125, 0.1126708984375, 0.12419891357421875, 0.1357269287109375, 0.14725494384765625, 0.158782958984375, 0.17031097412109375, 0.1818389892578125, 0.19336700439453125, 0.20489501953125, 0.21642303466796875, 0.2279510498046875, 0.23947906494140625, 0.251007080078125, 0.26253509521484375, 0.2740631103515625, 0.28559112548828125, 0.297119140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 0.0, 11.0, 11.0, 11.0, 19.0, 44.0, 62.0, 82.0, 107.0, 152.0, 256.0, 636.0, 2453.0, 26626.0, 4112781.0, 46305.0, 3125.0, 748.0, 299.0, 165.0, 120.0, 84.0, 71.0, 44.0, 23.0, 25.0, 13.0, 10.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69921875, -5.52423095703125, -5.3492431640625, -5.17425537109375, -4.999267578125, -4.82427978515625, -4.6492919921875, -4.47430419921875, -4.29931640625, -4.12432861328125, -3.9493408203125, -3.77435302734375, -3.599365234375, -3.42437744140625, -3.2493896484375, -3.07440185546875, -2.8994140625, -2.72442626953125, -2.5494384765625, -2.37445068359375, -2.199462890625, -2.02447509765625, -1.8494873046875, -1.67449951171875, -1.49951171875, -1.32452392578125, -1.1495361328125, -0.97454833984375, -0.799560546875, -0.62457275390625, -0.4495849609375, -0.27459716796875, -0.099609375, 0.07537841796875, 0.2503662109375, 0.42535400390625, 0.600341796875, 0.77532958984375, 0.9503173828125, 1.12530517578125, 1.30029296875, 1.47528076171875, 1.6502685546875, 1.82525634765625, 2.000244140625, 2.17523193359375, 2.3502197265625, 2.52520751953125, 2.7001953125, 2.87518310546875, 3.0501708984375, 3.22515869140625, 3.400146484375, 3.57513427734375, 3.7501220703125, 3.92510986328125, 4.10009765625, 4.27508544921875, 4.4500732421875, 4.62506103515625, 4.800048828125, 4.97503662109375, 5.1500244140625, 5.32501220703125, 5.5]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 14.0, 38.0, 130.0, 2249.0, 1502.0, 91.0, 32.0, 13.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.930389404296875, -1.85882568359375, -1.787261962890625, -1.7156982421875, -1.644134521484375, -1.57257080078125, -1.501007080078125, -1.429443359375, -1.357879638671875, -1.28631591796875, -1.214752197265625, -1.1431884765625, -1.071624755859375, -1.00006103515625, -0.928497314453125, -0.85693359375, -0.785369873046875, -0.71380615234375, -0.642242431640625, -0.5706787109375, -0.499114990234375, -0.42755126953125, -0.355987548828125, -0.284423828125, -0.212860107421875, -0.14129638671875, -0.069732666015625, 0.0018310546875, 0.073394775390625, 0.14495849609375, 0.216522216796875, 0.2880859375, 0.359649658203125, 0.43121337890625, 0.502777099609375, 0.5743408203125, 0.645904541015625, 0.71746826171875, 0.789031982421875, 0.860595703125, 0.932159423828125, 1.00372314453125, 1.075286865234375, 1.1468505859375, 1.218414306640625, 1.28997802734375, 1.361541748046875, 1.43310546875, 1.504669189453125, 1.57623291015625, 1.647796630859375, 1.7193603515625, 1.790924072265625, 1.86248779296875, 1.934051513671875, 2.005615234375, 2.077178955078125, 2.14874267578125, 2.220306396484375, 2.2918701171875, 2.363433837890625, 2.43499755859375, 2.506561279296875, 2.578125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 6.0, 15.0, 22.0, 49.0, 141.0, 279.0, 247.0, 123.0, 66.0, 29.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.467264175415039, -6.251947402954102, -6.036631107330322, -5.821314334869385, -5.6059980392456055, -5.390681266784668, -5.175364971160889, -4.960048198699951, -4.744731903076172, -4.529415130615234, -4.314098834991455, -4.098782062530518, -3.8834657669067383, -3.668148994445801, -3.4528326988220215, -3.237515926361084, -3.0221993923187256, -2.806882858276367, -2.591566324234009, -2.3762497901916504, -2.160933256149292, -1.945616602897644, -1.7303000688552856, -1.5149835348129272, -1.2996670007705688, -1.0843504667282104, -0.869033932685852, -0.6537173390388489, -0.4384008049964905, -0.2230842113494873, -0.007767677307128906, 0.2075488567352295, 0.4228653907775879, 0.6381819248199463, 0.8534984588623047, 1.068814992904663, 1.2841315269470215, 1.4994481801986694, 1.7147647142410278, 1.9300812482833862, 2.145397663116455, 2.3607141971588135, 2.576030731201172, 2.7913472652435303, 3.0066637992858887, 3.221980571746826, 3.4372968673706055, 3.652613639831543, 3.8679301738739014, 4.08324670791626, 4.298563480377197, 4.513879776000977, 4.729196548461914, 4.944512844085693, 5.159829616546631, 5.37514591217041, 5.590462684631348, 5.805779457092285, 6.0210957527160645, 6.236412525177002, 6.451728820800781, 6.667045593261719, 6.882361888885498, 7.0976786613464355, 7.312994956970215]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 21.0, 33.0, 62.0, 83.0, 103.0, 117.0, 118.0, 126.0, 103.0, 77.0, 50.0, 27.0, 31.0, 21.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5036702156066895, -5.349239349365234, -5.194808006286621, -5.040376663208008, -4.885945796966553, -4.731514930725098, -4.577083587646484, -4.422652244567871, -4.268221378326416, -4.113790512084961, -3.9593591690063477, -3.8049280643463135, -3.6504969596862793, -3.496065855026245, -3.341634750366211, -3.1872036457061768, -3.0327725410461426, -2.8783414363861084, -2.723910331726074, -2.56947922706604, -2.415048122406006, -2.2606170177459717, -2.1061859130859375, -1.9517548084259033, -1.7973237037658691, -1.642892599105835, -1.4884614944458008, -1.3340303897857666, -1.1795992851257324, -1.0251681804656982, -0.8707370758056641, -0.7163059711456299, -0.5618753433227539, -0.4074442386627197, -0.25301313400268555, -0.09858202934265137, 0.05584907531738281, 0.210280179977417, 0.36471128463745117, 0.5191423892974854, 0.6735734939575195, 0.8280045986175537, 0.9824357032775879, 1.136866807937622, 1.2912979125976562, 1.4457290172576904, 1.6001601219177246, 1.7545912265777588, 1.909022331237793, 2.063453435897827, 2.2178845405578613, 2.3723156452178955, 2.5267467498779297, 2.681177854537964, 2.835608959197998, 2.9900400638580322, 3.1444711685180664, 3.2989022731781006, 3.4533333778381348, 3.607764482498169, 3.762195587158203, 3.9166266918182373, 4.0710577964782715, 4.225488662719727, 4.37992000579834]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 1.0, 10.0, 18.0, 27.0, 32.0, 68.0, 144.0, 266.0, 818.0, 3570.0, 35419.0, 774144.0, 220485.0, 10932.0, 1678.0, 497.0, 188.0, 105.0, 56.0, 29.0, 22.0, 15.0, 7.0, 9.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.5703125, -4.460906982421875, -4.35150146484375, -4.242095947265625, -4.1326904296875, -4.023284912109375, -3.91387939453125, -3.804473876953125, -3.695068359375, -3.585662841796875, -3.47625732421875, -3.366851806640625, -3.2574462890625, -3.148040771484375, -3.03863525390625, -2.929229736328125, -2.81982421875, -2.710418701171875, -2.60101318359375, -2.491607666015625, -2.3822021484375, -2.272796630859375, -2.16339111328125, -2.053985595703125, -1.944580078125, -1.835174560546875, -1.72576904296875, -1.616363525390625, -1.5069580078125, -1.397552490234375, -1.28814697265625, -1.178741455078125, -1.0693359375, -0.959930419921875, -0.85052490234375, -0.741119384765625, -0.6317138671875, -0.522308349609375, -0.41290283203125, -0.303497314453125, -0.194091796875, -0.084686279296875, 0.02471923828125, 0.134124755859375, 0.2435302734375, 0.352935791015625, 0.46234130859375, 0.571746826171875, 0.68115234375, 0.790557861328125, 0.89996337890625, 1.009368896484375, 1.1187744140625, 1.228179931640625, 1.33758544921875, 1.446990966796875, 1.556396484375, 1.665802001953125, 1.77520751953125, 1.884613037109375, 1.9940185546875, 2.103424072265625, 2.21282958984375, 2.322235107421875, 2.431640625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 11.0, 20.0, 18.0, 21.0, 41.0, 58.0, 69.0, 77.0, 82.0, 85.0, 85.0, 74.0, 75.0, 63.0, 63.0, 31.0, 34.0, 25.0, 23.0, 17.0, 8.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.59326171875, -0.5784912109375, -0.563720703125, -0.5489501953125, -0.5341796875, -0.5194091796875, -0.504638671875, -0.4898681640625, -0.47509765625, -0.4603271484375, -0.445556640625, -0.4307861328125, -0.416015625, -0.4012451171875, -0.386474609375, -0.3717041015625, -0.35693359375, -0.3421630859375, -0.327392578125, -0.3126220703125, -0.2978515625, -0.2830810546875, -0.268310546875, -0.2535400390625, -0.23876953125, -0.2239990234375, -0.209228515625, -0.1944580078125, -0.1796875, -0.1649169921875, -0.150146484375, -0.1353759765625, -0.12060546875, -0.1058349609375, -0.091064453125, -0.0762939453125, -0.0615234375, -0.0467529296875, -0.031982421875, -0.0172119140625, -0.00244140625, 0.0123291015625, 0.027099609375, 0.0418701171875, 0.056640625, 0.0714111328125, 0.086181640625, 0.1009521484375, 0.11572265625, 0.1304931640625, 0.145263671875, 0.1600341796875, 0.1748046875, 0.1895751953125, 0.204345703125, 0.2191162109375, 0.23388671875, 0.2486572265625, 0.263427734375, 0.2781982421875, 0.29296875, 0.3077392578125, 0.322509765625, 0.3372802734375, 0.35205078125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 5.0, 10.0, 17.0, 17.0, 9.0, 30.0, 29.0, 53.0, 73.0, 144.0, 259.0, 722.0, 2454.0, 10843.0, 66950.0, 488243.0, 411068.0, 55003.0, 9162.0, 2194.0, 653.0, 254.0, 120.0, 76.0, 46.0, 29.0, 18.0, 12.0, 10.0, 12.0, 10.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.31927490234375, -1.2684326171875, -1.21759033203125, -1.166748046875, -1.11590576171875, -1.0650634765625, -1.01422119140625, -0.96337890625, -0.91253662109375, -0.8616943359375, -0.81085205078125, -0.760009765625, -0.70916748046875, -0.6583251953125, -0.60748291015625, -0.556640625, -0.50579833984375, -0.4549560546875, -0.40411376953125, -0.353271484375, -0.30242919921875, -0.2515869140625, -0.20074462890625, -0.14990234375, -0.09906005859375, -0.0482177734375, 0.00262451171875, 0.053466796875, 0.10430908203125, 0.1551513671875, 0.20599365234375, 0.2568359375, 0.30767822265625, 0.3585205078125, 0.40936279296875, 0.460205078125, 0.51104736328125, 0.5618896484375, 0.61273193359375, 0.66357421875, 0.71441650390625, 0.7652587890625, 0.81610107421875, 0.866943359375, 0.91778564453125, 0.9686279296875, 1.01947021484375, 1.0703125, 1.12115478515625, 1.1719970703125, 1.22283935546875, 1.273681640625, 1.32452392578125, 1.3753662109375, 1.42620849609375, 1.47705078125, 1.52789306640625, 1.5787353515625, 1.62957763671875, 1.680419921875, 1.73126220703125, 1.7821044921875, 1.83294677734375, 1.8837890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 8.0, 10.0, 11.0, 8.0, 20.0, 19.0, 25.0, 30.0, 30.0, 32.0, 44.0, 35.0, 34.0, 53.0, 39.0, 47.0, 44.0, 59.0, 41.0, 49.0, 35.0, 37.0, 38.0, 38.0, 29.0, 21.0, 32.0, 23.0, 17.0, 22.0, 6.0, 16.0, 10.0, 7.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93408203125, -0.9002914428710938, -0.8665008544921875, -0.8327102661132812, -0.798919677734375, -0.7651290893554688, -0.7313385009765625, -0.6975479125976562, -0.66375732421875, -0.6299667358398438, -0.5961761474609375, -0.5623855590820312, -0.528594970703125, -0.49480438232421875, -0.4610137939453125, -0.42722320556640625, -0.3934326171875, -0.35964202880859375, -0.3258514404296875, -0.29206085205078125, -0.258270263671875, -0.22447967529296875, -0.1906890869140625, -0.15689849853515625, -0.12310791015625, -0.08931732177734375, -0.0555267333984375, -0.02173614501953125, 0.012054443359375, 0.04584503173828125, 0.0796356201171875, 0.11342620849609375, 0.147216796875, 0.18100738525390625, 0.2147979736328125, 0.24858856201171875, 0.282379150390625, 0.31616973876953125, 0.3499603271484375, 0.38375091552734375, 0.41754150390625, 0.45133209228515625, 0.4851226806640625, 0.5189132690429688, 0.552703857421875, 0.5864944458007812, 0.6202850341796875, 0.6540756225585938, 0.6878662109375, 0.7216567993164062, 0.7554473876953125, 0.7892379760742188, 0.823028564453125, 0.8568191528320312, 0.8906097412109375, 0.9244003295898438, 0.95819091796875, 0.9919815063476562, 1.0257720947265625, 1.0595626831054688, 1.093353271484375, 1.1271438598632812, 1.1609344482421875, 1.1947250366210938, 1.228515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 9.0, 12.0, 12.0, 23.0, 27.0, 45.0, 79.0, 168.0, 293.0, 620.0, 1551.0, 4887.0, 24093.0, 206654.0, 667490.0, 120611.0, 15813.0, 3740.0, 1288.0, 539.0, 271.0, 137.0, 80.0, 40.0, 27.0, 17.0, 8.0, 9.0, 2.0, 8.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.515625, -0.49745941162109375, -0.4792938232421875, -0.46112823486328125, -0.442962646484375, -0.42479705810546875, -0.4066314697265625, -0.38846588134765625, -0.37030029296875, -0.35213470458984375, -0.3339691162109375, -0.31580352783203125, -0.297637939453125, -0.27947235107421875, -0.2613067626953125, -0.24314117431640625, -0.2249755859375, -0.20680999755859375, -0.1886444091796875, -0.17047882080078125, -0.152313232421875, -0.13414764404296875, -0.1159820556640625, -0.09781646728515625, -0.07965087890625, -0.06148529052734375, -0.0433197021484375, -0.02515411376953125, -0.006988525390625, 0.01117706298828125, 0.0293426513671875, 0.04750823974609375, 0.065673828125, 0.08383941650390625, 0.1020050048828125, 0.12017059326171875, 0.138336181640625, 0.15650177001953125, 0.1746673583984375, 0.19283294677734375, 0.21099853515625, 0.22916412353515625, 0.2473297119140625, 0.26549530029296875, 0.283660888671875, 0.30182647705078125, 0.3199920654296875, 0.33815765380859375, 0.3563232421875, 0.37448883056640625, 0.3926544189453125, 0.41082000732421875, 0.428985595703125, 0.44715118408203125, 0.4653167724609375, 0.48348236083984375, 0.50164794921875, 0.5198135375976562, 0.5379791259765625, 0.5561447143554688, 0.574310302734375, 0.5924758911132812, 0.6106414794921875, 0.6288070678710938, 0.64697265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 9.0, 8.0, 17.0, 16.0, 32.0, 39.0, 51.0, 82.0, 125.0, 153.0, 138.0, 96.0, 81.0, 49.0, 34.0, 16.0, 17.0, 11.0, 10.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015926361083984375, -0.00015561282634735107, -0.0001519620418548584, -0.00014831125736236572, -0.00014466047286987305, -0.00014100968837738037, -0.0001373589038848877, -0.00013370811939239502, -0.00013005733489990234, -0.00012640655040740967, -0.000122755765914917, -0.00011910498142242432, -0.00011545419692993164, -0.00011180341243743896, -0.00010815262794494629, -0.00010450184345245361, -0.00010085105895996094, -9.720027446746826e-05, -9.354948997497559e-05, -8.989870548248291e-05, -8.624792098999023e-05, -8.259713649749756e-05, -7.894635200500488e-05, -7.529556751251221e-05, -7.164478302001953e-05, -6.799399852752686e-05, -6.434321403503418e-05, -6.0692429542541504e-05, -5.704164505004883e-05, -5.339086055755615e-05, -4.9740076065063477e-05, -4.60892915725708e-05, -4.2438507080078125e-05, -3.878772258758545e-05, -3.5136938095092773e-05, -3.14861536026001e-05, -2.7835369110107422e-05, -2.4184584617614746e-05, -2.053380012512207e-05, -1.6883015632629395e-05, -1.3232231140136719e-05, -9.581446647644043e-06, -5.930662155151367e-06, -2.2798776626586914e-06, 1.3709068298339844e-06, 5.02169132232666e-06, 8.672475814819336e-06, 1.2323260307312012e-05, 1.5974044799804688e-05, 1.9624829292297363e-05, 2.327561378479004e-05, 2.6926398277282715e-05, 3.057718276977539e-05, 3.4227967262268066e-05, 3.787875175476074e-05, 4.152953624725342e-05, 4.5180320739746094e-05, 4.883110523223877e-05, 5.2481889724731445e-05, 5.613267421722412e-05, 5.97834587097168e-05, 6.343424320220947e-05, 6.708502769470215e-05, 7.073581218719482e-05, 7.43865966796875e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 5.0, 10.0, 5.0, 10.0, 20.0, 33.0, 70.0, 161.0, 364.0, 1170.0, 4589.0, 30293.0, 412589.0, 551910.0, 39579.0, 5544.0, 1354.0, 488.0, 171.0, 77.0, 49.0, 23.0, 15.0, 9.0, 3.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.0126953125, -0.9891777038574219, -0.9656600952148438, -0.9421424865722656, -0.9186248779296875, -0.8951072692871094, -0.8715896606445312, -0.8480720520019531, -0.824554443359375, -0.8010368347167969, -0.7775192260742188, -0.7540016174316406, -0.7304840087890625, -0.7069664001464844, -0.6834487915039062, -0.6599311828613281, -0.63641357421875, -0.6128959655761719, -0.5893783569335938, -0.5658607482910156, -0.5423431396484375, -0.5188255310058594, -0.49530792236328125, -0.4717903137207031, -0.448272705078125, -0.4247550964355469, -0.40123748779296875, -0.3777198791503906, -0.3542022705078125, -0.3306846618652344, -0.30716705322265625, -0.2836494445800781, -0.2601318359375, -0.23661422729492188, -0.21309661865234375, -0.18957901000976562, -0.1660614013671875, -0.14254379272460938, -0.11902618408203125, -0.09550857543945312, -0.071990966796875, -0.048473358154296875, -0.02495574951171875, -0.001438140869140625, 0.0220794677734375, 0.045597076416015625, 0.06911468505859375, 0.09263229370117188, 0.11614990234375, 0.13966751098632812, 0.16318511962890625, 0.18670272827148438, 0.2102203369140625, 0.23373794555664062, 0.25725555419921875, 0.2807731628417969, 0.304290771484375, 0.3278083801269531, 0.35132598876953125, 0.3748435974121094, 0.3983612060546875, 0.4218788146972656, 0.44539642333984375, 0.4689140319824219, 0.492431640625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 5.0, 17.0, 12.0, 15.0, 25.0, 22.0, 49.0, 71.0, 86.0, 116.0, 114.0, 112.0, 99.0, 69.0, 55.0, 30.0, 30.0, 18.0, 15.0, 11.0, 11.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.533203125, -0.5189895629882812, -0.5047760009765625, -0.49056243896484375, -0.476348876953125, -0.46213531494140625, -0.4479217529296875, -0.43370819091796875, -0.41949462890625, -0.40528106689453125, -0.3910675048828125, -0.37685394287109375, -0.362640380859375, -0.34842681884765625, -0.3342132568359375, -0.31999969482421875, -0.3057861328125, -0.29157257080078125, -0.2773590087890625, -0.26314544677734375, -0.248931884765625, -0.23471832275390625, -0.2205047607421875, -0.20629119873046875, -0.19207763671875, -0.17786407470703125, -0.1636505126953125, -0.14943695068359375, -0.135223388671875, -0.12100982666015625, -0.1067962646484375, -0.09258270263671875, -0.078369140625, -0.06415557861328125, -0.0499420166015625, -0.03572845458984375, -0.021514892578125, -0.00730133056640625, 0.0069122314453125, 0.02112579345703125, 0.03533935546875, 0.04955291748046875, 0.0637664794921875, 0.07798004150390625, 0.092193603515625, 0.10640716552734375, 0.1206207275390625, 0.13483428955078125, 0.1490478515625, 0.16326141357421875, 0.1774749755859375, 0.19168853759765625, 0.205902099609375, 0.22011566162109375, 0.2343292236328125, 0.24854278564453125, 0.26275634765625, 0.27696990966796875, 0.2911834716796875, 0.30539703369140625, 0.319610595703125, 0.33382415771484375, 0.3480377197265625, 0.36225128173828125, 0.37646484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 13.0, 24.0, 43.0, 83.0, 110.0, 169.0, 162.0, 141.0, 121.0, 58.0, 39.0, 17.0, 5.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.583742618560791, -5.280097007751465, -4.976451396942139, -4.6728057861328125, -4.369159698486328, -4.06551456451416, -3.761868476867676, -3.4582228660583496, -3.1545772552490234, -2.8509316444396973, -2.547286033630371, -2.243640184402466, -1.9399945735931396, -1.6363489627838135, -1.3327032327651978, -1.029057502746582, -0.7254118919372559, -0.4217662215232849, -0.11812055110931396, 0.18552511930465698, 0.48917078971862793, 0.7928164005279541, 1.0964621305465698, 1.4001078605651855, 1.7037534713745117, 2.007399082183838, 2.311044692993164, 2.6146905422210693, 2.9183361530303955, 3.2219817638397217, 3.525627613067627, 3.829273223876953, 4.1329193115234375, 4.436564922332764, 4.74021053314209, 5.043856143951416, 5.347501754760742, 5.651147842407227, 5.954793453216553, 6.258439064025879, 6.562084674835205, 6.865730285644531, 7.169375896453857, 7.473021507263184, 7.776667594909668, 8.080312728881836, 8.38395881652832, 8.687604904174805, 8.991250038146973, 9.294896125793457, 9.598541259765625, 9.90218734741211, 10.205832481384277, 10.509478569030762, 10.81312370300293, 11.116769790649414, 11.420415878295898, 11.724061965942383, 12.02770709991455, 12.331353187561035, 12.634998321533203, 12.938644409179688, 13.242289543151855, 13.54593563079834, 13.849580764770508]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 7.0, 1.0, 8.0, 11.0, 14.0, 6.0, 8.0, 11.0, 16.0, 17.0, 15.0, 26.0, 27.0, 23.0, 21.0, 34.0, 27.0, 22.0, 29.0, 44.0, 36.0, 25.0, 45.0, 42.0, 42.0, 34.0, 40.0, 44.0, 29.0, 30.0, 27.0, 28.0, 25.0, 23.0, 21.0, 20.0, 15.0, 24.0, 13.0, 14.0, 5.0, 6.0, 13.0, 8.0, 4.0, 7.0, 8.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.377024173736572, -4.24040412902832, -4.103784084320068, -3.9671640396118164, -3.8305439949035645, -3.6939239501953125, -3.5573041439056396, -3.4206840991973877, -3.2840640544891357, -3.147444009780884, -3.010823965072632, -2.87420392036438, -2.737584114074707, -2.600964069366455, -2.464344024658203, -2.327723979949951, -2.191103935241699, -2.0544838905334473, -1.9178638458251953, -1.781243920326233, -1.644623875617981, -1.508003830909729, -1.3713839054107666, -1.2347638607025146, -1.0981438159942627, -0.9615237712860107, -0.8249037861824036, -0.6882838010787964, -0.5516637563705444, -0.4150437116622925, -0.2784237265586853, -0.14180374145507812, -0.005184173583984375, 0.1314358413219452, 0.26805585622787476, 0.4046758711338043, 0.5412958860397339, 0.6779159307479858, 0.814535915851593, 0.9511559009552002, 1.0877759456634521, 1.224395990371704, 1.361016035079956, 1.4976359605789185, 1.6342560052871704, 1.7708760499954224, 1.9074959754943848, 2.0441160202026367, 2.1807360649108887, 2.3173561096191406, 2.4539761543273926, 2.5905961990356445, 2.7272162437438965, 2.8638362884521484, 3.0004560947418213, 3.1370761394500732, 3.273696184158325, 3.410316228866577, 3.546936273574829, 3.683556318283081, 3.820176124572754, 3.956796169281006, 4.093416213989258, 4.23003625869751, 4.366656303405762]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 4.0, 7.0, 5.0, 15.0, 14.0, 13.0, 13.0, 23.0, 28.0, 38.0, 44.0, 69.0, 111.0, 163.0, 279.0, 555.0, 1147.0, 2822.0, 8206.0, 30196.0, 844059.0, 3257799.0, 33665.0, 8948.0, 3219.0, 1404.0, 625.0, 320.0, 196.0, 98.0, 72.0, 39.0, 34.0, 17.0, 12.0, 4.0, 9.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.237884521484375, -4.13201904296875, -4.026153564453125, -3.9202880859375, -3.814422607421875, -3.70855712890625, -3.602691650390625, -3.496826171875, -3.390960693359375, -3.28509521484375, -3.179229736328125, -3.0733642578125, -2.967498779296875, -2.86163330078125, -2.755767822265625, -2.64990234375, -2.544036865234375, -2.43817138671875, -2.332305908203125, -2.2264404296875, -2.120574951171875, -2.01470947265625, -1.908843994140625, -1.802978515625, -1.697113037109375, -1.59124755859375, -1.485382080078125, -1.3795166015625, -1.273651123046875, -1.16778564453125, -1.061920166015625, -0.9560546875, -0.850189208984375, -0.74432373046875, -0.638458251953125, -0.5325927734375, -0.426727294921875, -0.32086181640625, -0.214996337890625, -0.109130859375, -0.003265380859375, 0.10260009765625, 0.208465576171875, 0.3143310546875, 0.420196533203125, 0.52606201171875, 0.631927490234375, 0.73779296875, 0.843658447265625, 0.94952392578125, 1.055389404296875, 1.1612548828125, 1.267120361328125, 1.37298583984375, 1.478851318359375, 1.584716796875, 1.690582275390625, 1.79644775390625, 1.902313232421875, 2.0081787109375, 2.114044189453125, 2.21990966796875, 2.325775146484375, 2.431640625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 8.0, 8.0, 11.0, 9.0, 21.0, 20.0, 20.0, 43.0, 45.0, 60.0, 60.0, 69.0, 71.0, 73.0, 81.0, 60.0, 62.0, 59.0, 54.0, 32.0, 42.0, 35.0, 15.0, 14.0, 14.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.5498046875, -0.5359840393066406, -0.5221633911132812, -0.5083427429199219, -0.4945220947265625, -0.4807014465332031, -0.46688079833984375, -0.4530601501464844, -0.439239501953125, -0.4254188537597656, -0.41159820556640625, -0.3977775573730469, -0.3839569091796875, -0.3701362609863281, -0.35631561279296875, -0.3424949645996094, -0.32867431640625, -0.3148536682128906, -0.30103302001953125, -0.2872123718261719, -0.2733917236328125, -0.2595710754394531, -0.24575042724609375, -0.23192977905273438, -0.218109130859375, -0.20428848266601562, -0.19046783447265625, -0.17664718627929688, -0.1628265380859375, -0.14900588989257812, -0.13518524169921875, -0.12136459350585938, -0.1075439453125, -0.09372329711914062, -0.07990264892578125, -0.06608200073242188, -0.0522613525390625, -0.038440704345703125, -0.02462005615234375, -0.010799407958984375, 0.003021240234375, 0.016841888427734375, 0.03066253662109375, 0.044483184814453125, 0.0583038330078125, 0.07212448120117188, 0.08594512939453125, 0.09976577758789062, 0.11358642578125, 0.12740707397460938, 0.14122772216796875, 0.15504837036132812, 0.1688690185546875, 0.18268966674804688, 0.19651031494140625, 0.21033096313476562, 0.224151611328125, 0.23797225952148438, 0.25179290771484375, 0.2656135559082031, 0.2794342041015625, 0.2932548522949219, 0.30707550048828125, 0.3208961486816406, 0.334716796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 16.0, 6.0, 17.0, 31.0, 30.0, 42.0, 48.0, 79.0, 94.0, 119.0, 172.0, 251.0, 289.0, 485.0, 806.0, 1553.0, 3364.0, 8745.0, 31024.0, 252845.0, 3766816.0, 96374.0, 18960.0, 6149.0, 2509.0, 1264.0, 707.0, 400.0, 279.0, 198.0, 147.0, 96.0, 100.0, 70.0, 49.0, 35.0, 26.0, 18.0, 15.0, 9.0, 8.0, 8.0, 6.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.04736328125, -1.9775390625, -1.90771484375, -1.837890625, -1.76806640625, -1.6982421875, -1.62841796875, -1.55859375, -1.48876953125, -1.4189453125, -1.34912109375, -1.279296875, -1.20947265625, -1.1396484375, -1.06982421875, -1.0, -0.93017578125, -0.8603515625, -0.79052734375, -0.720703125, -0.65087890625, -0.5810546875, -0.51123046875, -0.44140625, -0.37158203125, -0.3017578125, -0.23193359375, -0.162109375, -0.09228515625, -0.0224609375, 0.04736328125, 0.1171875, 0.18701171875, 0.2568359375, 0.32666015625, 0.396484375, 0.46630859375, 0.5361328125, 0.60595703125, 0.67578125, 0.74560546875, 0.8154296875, 0.88525390625, 0.955078125, 1.02490234375, 1.0947265625, 1.16455078125, 1.234375, 1.30419921875, 1.3740234375, 1.44384765625, 1.513671875, 1.58349609375, 1.6533203125, 1.72314453125, 1.79296875, 1.86279296875, 1.9326171875, 2.00244140625, 2.072265625, 2.14208984375, 2.2119140625, 2.28173828125, 2.3515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 12.0, 10.0, 21.0, 29.0, 62.0, 174.0, 839.0, 2488.0, 223.0, 92.0, 45.0, 25.0, 13.0, 10.0, 6.0, 4.0, 5.0, 5.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.201171875, -1.1660003662109375, -1.130828857421875, -1.0956573486328125, -1.06048583984375, -1.0253143310546875, -0.990142822265625, -0.9549713134765625, -0.9197998046875, -0.8846282958984375, -0.849456787109375, -0.8142852783203125, -0.77911376953125, -0.7439422607421875, -0.708770751953125, -0.6735992431640625, -0.638427734375, -0.6032562255859375, -0.568084716796875, -0.5329132080078125, -0.49774169921875, -0.4625701904296875, -0.427398681640625, -0.3922271728515625, -0.3570556640625, -0.3218841552734375, -0.286712646484375, -0.2515411376953125, -0.21636962890625, -0.1811981201171875, -0.146026611328125, -0.1108551025390625, -0.07568359375, -0.0405120849609375, -0.005340576171875, 0.0298309326171875, 0.06500244140625, 0.1001739501953125, 0.135345458984375, 0.1705169677734375, 0.2056884765625, 0.2408599853515625, 0.276031494140625, 0.3112030029296875, 0.34637451171875, 0.3815460205078125, 0.416717529296875, 0.4518890380859375, 0.487060546875, 0.5222320556640625, 0.557403564453125, 0.5925750732421875, 0.62774658203125, 0.6629180908203125, 0.698089599609375, 0.7332611083984375, 0.7684326171875, 0.8036041259765625, 0.838775634765625, 0.8739471435546875, 0.90911865234375, 0.9442901611328125, 0.979461669921875, 1.0146331787109375, 1.0498046875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 8.0, 16.0, 33.0, 97.0, 300.0, 352.0, 145.0, 35.0, 12.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.955515384674072, -6.655892372131348, -6.356269359588623, -6.056646347045898, -5.757023811340332, -5.457400798797607, -5.157777786254883, -4.858155250549316, -4.558531761169434, -4.258908748626709, -3.9592859745025635, -3.659662961959839, -3.3600401878356934, -3.0604171752929688, -2.760794162750244, -2.4611713886260986, -2.161548614501953, -1.861925721168518, -1.562302827835083, -1.2626798152923584, -0.9630569219589233, -0.6634340286254883, -0.36381101608276367, -0.06418824195861816, 0.23543477058410645, 0.5350576639175415, 0.8346806168556213, 1.1343035697937012, 1.4339264631271362, 1.7335493564605713, 2.033172369003296, 2.3327951431274414, 2.632417678833008, 2.9320406913757324, 3.231663465499878, 3.5312864780426025, 3.830909252166748, 4.130532264709473, 4.430155277252197, 4.729778289794922, 5.029400825500488, 5.329023838043213, 5.6286468505859375, 5.928269386291504, 6.2278923988342285, 6.527515411376953, 6.827138423919678, 7.126761436462402, 7.426384449005127, 7.726007461547852, 8.025629997253418, 8.3252534866333, 8.624876022338867, 8.92449951171875, 9.224122047424316, 9.523744583129883, 9.823368072509766, 10.122990608215332, 10.422614097595215, 10.722236633300781, 11.021860122680664, 11.32148265838623, 11.621105194091797, 11.92072868347168, 12.220351219177246]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 13.0, 17.0, 17.0, 24.0, 38.0, 47.0, 71.0, 65.0, 70.0, 85.0, 87.0, 86.0, 84.0, 70.0, 53.0, 56.0, 26.0, 34.0, 16.0, 12.0, 5.0, 0.0, 5.0, 3.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.753364086151123, -3.634342670440674, -3.5153210163116455, -3.3962996006011963, -3.277278184890747, -3.1582565307617188, -3.0392351150512695, -2.9202136993408203, -2.801192283630371, -2.682170867919922, -2.5631492137908936, -2.4441277980804443, -2.325106382369995, -2.206084728240967, -2.0870633125305176, -1.9680418968200684, -1.8490203619003296, -1.7299988269805908, -1.6109774112701416, -1.4919558763504028, -1.3729344606399536, -1.2539129257202148, -1.1348915100097656, -1.0158699750900269, -0.8968484997749329, -0.7778270244598389, -0.6588055491447449, -0.5397840738296509, -0.4207625687122345, -0.3017410635948181, -0.18271958827972412, -0.06369811296463013, 0.05532336235046387, 0.17434483766555786, 0.29336631298065186, 0.41238781809806824, 0.5314092636108398, 0.6504307985305786, 0.7694522738456726, 0.8884737491607666, 1.0074951648712158, 1.1265166997909546, 1.2455381155014038, 1.3645596504211426, 1.4835810661315918, 1.6026026010513306, 1.7216241359710693, 1.8406455516815186, 1.9596670866012573, 2.078688621520996, 2.1977100372314453, 2.3167314529418945, 2.435753107070923, 2.554774522781372, 2.6737959384918213, 2.7928175926208496, 2.911839008331299, 3.030860424041748, 3.1498820781707764, 3.2689034938812256, 3.387924909591675, 3.506946563720703, 3.6259679794311523, 3.7449893951416016, 3.864010810852051]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 13.0, 12.0, 12.0, 20.0, 25.0, 38.0, 68.0, 119.0, 205.0, 362.0, 713.0, 1964.0, 5882.0, 24417.0, 155221.0, 633606.0, 186653.0, 28762.0, 6679.0, 2088.0, 804.0, 415.0, 180.0, 79.0, 65.0, 53.0, 23.0, 16.0, 21.0, 10.0, 6.0, 6.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.375, -2.299713134765625, -2.22442626953125, -2.149139404296875, -2.0738525390625, -1.998565673828125, -1.92327880859375, -1.847991943359375, -1.772705078125, -1.697418212890625, -1.62213134765625, -1.546844482421875, -1.4715576171875, -1.396270751953125, -1.32098388671875, -1.245697021484375, -1.17041015625, -1.095123291015625, -1.01983642578125, -0.944549560546875, -0.8692626953125, -0.793975830078125, -0.71868896484375, -0.643402099609375, -0.568115234375, -0.492828369140625, -0.41754150390625, -0.342254638671875, -0.2669677734375, -0.191680908203125, -0.11639404296875, -0.041107177734375, 0.0341796875, 0.109466552734375, 0.18475341796875, 0.260040283203125, 0.3353271484375, 0.410614013671875, 0.48590087890625, 0.561187744140625, 0.636474609375, 0.711761474609375, 0.78704833984375, 0.862335205078125, 0.9376220703125, 1.012908935546875, 1.08819580078125, 1.163482666015625, 1.23876953125, 1.314056396484375, 1.38934326171875, 1.464630126953125, 1.5399169921875, 1.615203857421875, 1.69049072265625, 1.765777587890625, 1.841064453125, 1.916351318359375, 1.99163818359375, 2.066925048828125, 2.1422119140625, 2.217498779296875, 2.29278564453125, 2.368072509765625, 2.443359375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 11.0, 16.0, 18.0, 23.0, 40.0, 50.0, 40.0, 53.0, 72.0, 74.0, 80.0, 92.0, 65.0, 79.0, 77.0, 45.0, 41.0, 30.0, 24.0, 18.0, 16.0, 10.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.62451171875, -0.60888671875, -0.59326171875, -0.57763671875, -0.56201171875, -0.54638671875, -0.53076171875, -0.51513671875, -0.49951171875, -0.48388671875, -0.46826171875, -0.45263671875, -0.43701171875, -0.42138671875, -0.40576171875, -0.39013671875, -0.37451171875, -0.35888671875, -0.34326171875, -0.32763671875, -0.31201171875, -0.29638671875, -0.28076171875, -0.26513671875, -0.24951171875, -0.23388671875, -0.21826171875, -0.20263671875, -0.18701171875, -0.17138671875, -0.15576171875, -0.14013671875, -0.12451171875, -0.10888671875, -0.09326171875, -0.07763671875, -0.06201171875, -0.04638671875, -0.03076171875, -0.01513671875, 0.00048828125, 0.01611328125, 0.03173828125, 0.04736328125, 0.06298828125, 0.07861328125, 0.09423828125, 0.10986328125, 0.12548828125, 0.14111328125, 0.15673828125, 0.17236328125, 0.18798828125, 0.20361328125, 0.21923828125, 0.23486328125, 0.25048828125, 0.26611328125, 0.28173828125, 0.29736328125, 0.31298828125, 0.32861328125, 0.34423828125, 0.35986328125, 0.37548828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 8.0, 1.0, 5.0, 6.0, 10.0, 7.0, 16.0, 27.0, 32.0, 36.0, 66.0, 89.0, 130.0, 218.0, 362.0, 640.0, 1220.0, 2454.0, 5213.0, 12005.0, 30018.0, 83844.0, 231306.0, 374153.0, 192808.0, 69160.0, 25308.0, 10255.0, 4389.0, 2100.0, 1120.0, 589.0, 324.0, 212.0, 133.0, 73.0, 54.0, 39.0, 33.0, 18.0, 20.0, 11.0, 11.0, 13.0, 2.0, 3.0, 10.0, 5.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89453125, -0.8651123046875, -0.835693359375, -0.8062744140625, -0.77685546875, -0.7474365234375, -0.718017578125, -0.6885986328125, -0.6591796875, -0.6297607421875, -0.600341796875, -0.5709228515625, -0.54150390625, -0.5120849609375, -0.482666015625, -0.4532470703125, -0.423828125, -0.3944091796875, -0.364990234375, -0.3355712890625, -0.30615234375, -0.2767333984375, -0.247314453125, -0.2178955078125, -0.1884765625, -0.1590576171875, -0.129638671875, -0.1002197265625, -0.07080078125, -0.0413818359375, -0.011962890625, 0.0174560546875, 0.046875, 0.0762939453125, 0.105712890625, 0.1351318359375, 0.16455078125, 0.1939697265625, 0.223388671875, 0.2528076171875, 0.2822265625, 0.3116455078125, 0.341064453125, 0.3704833984375, 0.39990234375, 0.4293212890625, 0.458740234375, 0.4881591796875, 0.517578125, 0.5469970703125, 0.576416015625, 0.6058349609375, 0.63525390625, 0.6646728515625, 0.694091796875, 0.7235107421875, 0.7529296875, 0.7823486328125, 0.811767578125, 0.8411865234375, 0.87060546875, 0.9000244140625, 0.929443359375, 0.9588623046875, 0.98828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 7.0, 12.0, 9.0, 11.0, 16.0, 22.0, 22.0, 13.0, 34.0, 26.0, 34.0, 36.0, 29.0, 47.0, 51.0, 48.0, 66.0, 46.0, 56.0, 30.0, 41.0, 45.0, 38.0, 31.0, 43.0, 32.0, 21.0, 16.0, 29.0, 22.0, 7.0, 12.0, 9.0, 5.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2236328125, -1.18072509765625, -1.1378173828125, -1.09490966796875, -1.052001953125, -1.00909423828125, -0.9661865234375, -0.92327880859375, -0.88037109375, -0.83746337890625, -0.7945556640625, -0.75164794921875, -0.708740234375, -0.66583251953125, -0.6229248046875, -0.58001708984375, -0.537109375, -0.49420166015625, -0.4512939453125, -0.40838623046875, -0.365478515625, -0.32257080078125, -0.2796630859375, -0.23675537109375, -0.19384765625, -0.15093994140625, -0.1080322265625, -0.06512451171875, -0.022216796875, 0.02069091796875, 0.0635986328125, 0.10650634765625, 0.1494140625, 0.19232177734375, 0.2352294921875, 0.27813720703125, 0.321044921875, 0.36395263671875, 0.4068603515625, 0.44976806640625, 0.49267578125, 0.53558349609375, 0.5784912109375, 0.62139892578125, 0.664306640625, 0.70721435546875, 0.7501220703125, 0.79302978515625, 0.8359375, 0.87884521484375, 0.9217529296875, 0.96466064453125, 1.007568359375, 1.05047607421875, 1.0933837890625, 1.13629150390625, 1.17919921875, 1.22210693359375, 1.2650146484375, 1.30792236328125, 1.350830078125, 1.39373779296875, 1.4366455078125, 1.47955322265625, 1.5224609375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 19.0, 20.0, 42.0, 49.0, 58.0, 96.0, 165.0, 216.0, 372.0, 670.0, 1408.0, 3565.0, 11993.0, 94883.0, 776643.0, 136286.0, 14642.0, 4112.0, 1531.0, 728.0, 374.0, 224.0, 151.0, 79.0, 50.0, 50.0, 40.0, 25.0, 14.0, 7.0, 7.0, 9.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.02734375, -0.9937286376953125, -0.960113525390625, -0.9264984130859375, -0.89288330078125, -0.8592681884765625, -0.825653076171875, -0.7920379638671875, -0.7584228515625, -0.7248077392578125, -0.691192626953125, -0.6575775146484375, -0.62396240234375, -0.5903472900390625, -0.556732177734375, -0.5231170654296875, -0.489501953125, -0.4558868408203125, -0.422271728515625, -0.3886566162109375, -0.35504150390625, -0.3214263916015625, -0.287811279296875, -0.2541961669921875, -0.2205810546875, -0.1869659423828125, -0.153350830078125, -0.1197357177734375, -0.08612060546875, -0.0525054931640625, -0.018890380859375, 0.0147247314453125, 0.04833984375, 0.0819549560546875, 0.115570068359375, 0.1491851806640625, 0.18280029296875, 0.2164154052734375, 0.250030517578125, 0.2836456298828125, 0.3172607421875, 0.3508758544921875, 0.384490966796875, 0.4181060791015625, 0.45172119140625, 0.4853363037109375, 0.518951416015625, 0.5525665283203125, 0.586181640625, 0.6197967529296875, 0.653411865234375, 0.6870269775390625, 0.72064208984375, 0.7542572021484375, 0.787872314453125, 0.8214874267578125, 0.8551025390625, 0.8887176513671875, 0.922332763671875, 0.9559478759765625, 0.98956298828125, 1.0231781005859375, 1.056793212890625, 1.0904083251953125, 1.1240234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 9.0, 10.0, 19.0, 32.0, 34.0, 65.0, 102.0, 172.0, 187.0, 141.0, 80.0, 71.0, 35.0, 18.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021910667419433594, -0.00021290406584739685, -0.00020670145750045776, -0.00020049884915351868, -0.0001942962408065796, -0.0001880936324596405, -0.00018189102411270142, -0.00017568841576576233, -0.00016948580741882324, -0.00016328319907188416, -0.00015708059072494507, -0.00015087798237800598, -0.0001446753740310669, -0.0001384727656841278, -0.00013227015733718872, -0.00012606754899024963, -0.00011986494064331055, -0.00011366233229637146, -0.00010745972394943237, -0.00010125711560249329, -9.50545072555542e-05, -8.885189890861511e-05, -8.264929056167603e-05, -7.644668221473694e-05, -7.024407386779785e-05, -6.404146552085876e-05, -5.783885717391968e-05, -5.163624882698059e-05, -4.5433640480041504e-05, -3.923103213310242e-05, -3.302842378616333e-05, -2.6825815439224243e-05, -2.0623207092285156e-05, -1.442059874534607e-05, -8.217990398406982e-06, -2.0153820514678955e-06, 4.187226295471191e-06, 1.0389834642410278e-05, 1.6592442989349365e-05, 2.2795051336288452e-05, 2.899765968322754e-05, 3.5200268030166626e-05, 4.140287637710571e-05, 4.76054847240448e-05, 5.380809307098389e-05, 6.0010701417922974e-05, 6.621330976486206e-05, 7.241591811180115e-05, 7.861852645874023e-05, 8.482113480567932e-05, 9.102374315261841e-05, 9.72263514995575e-05, 0.00010342895984649658, 0.00010963156819343567, 0.00011583417654037476, 0.00012203678488731384, 0.00012823939323425293, 0.00013444200158119202, 0.0001406446099281311, 0.0001468472182750702, 0.00015304982662200928, 0.00015925243496894836, 0.00016545504331588745, 0.00017165765166282654, 0.00017786026000976562]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 15.0, 18.0, 27.0, 44.0, 61.0, 98.0, 143.0, 315.0, 831.0, 2190.0, 8277.0, 76833.0, 794976.0, 147772.0, 12163.0, 2932.0, 965.0, 403.0, 177.0, 100.0, 73.0, 46.0, 31.0, 22.0, 14.0, 9.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.9881591796875, -0.947998046875, -0.9078369140625, -0.86767578125, -0.8275146484375, -0.787353515625, -0.7471923828125, -0.70703125, -0.6668701171875, -0.626708984375, -0.5865478515625, -0.54638671875, -0.5062255859375, -0.466064453125, -0.4259033203125, -0.3857421875, -0.3455810546875, -0.305419921875, -0.2652587890625, -0.22509765625, -0.1849365234375, -0.144775390625, -0.1046142578125, -0.064453125, -0.0242919921875, 0.015869140625, 0.0560302734375, 0.09619140625, 0.1363525390625, 0.176513671875, 0.2166748046875, 0.2568359375, 0.2969970703125, 0.337158203125, 0.3773193359375, 0.41748046875, 0.4576416015625, 0.497802734375, 0.5379638671875, 0.578125, 0.6182861328125, 0.658447265625, 0.6986083984375, 0.73876953125, 0.7789306640625, 0.819091796875, 0.8592529296875, 0.8994140625, 0.9395751953125, 0.979736328125, 1.0198974609375, 1.06005859375, 1.1002197265625, 1.140380859375, 1.1805419921875, 1.220703125, 1.2608642578125, 1.301025390625, 1.3411865234375, 1.38134765625, 1.4215087890625, 1.461669921875, 1.5018310546875, 1.5419921875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 3.0, 8.0, 13.0, 10.0, 31.0, 51.0, 53.0, 94.0, 119.0, 144.0, 137.0, 97.0, 84.0, 52.0, 34.0, 26.0, 14.0, 3.0, 4.0, 7.0, 4.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.12890625, -1.0980300903320312, -1.0671539306640625, -1.0362777709960938, -1.005401611328125, -0.9745254516601562, -0.9436492919921875, -0.9127731323242188, -0.88189697265625, -0.8510208129882812, -0.8201446533203125, -0.7892684936523438, -0.758392333984375, -0.7275161743164062, -0.6966400146484375, -0.6657638549804688, -0.6348876953125, -0.6040115356445312, -0.5731353759765625, -0.5422592163085938, -0.511383056640625, -0.48050689697265625, -0.4496307373046875, -0.41875457763671875, -0.38787841796875, -0.35700225830078125, -0.3261260986328125, -0.29524993896484375, -0.264373779296875, -0.23349761962890625, -0.2026214599609375, -0.17174530029296875, -0.140869140625, -0.10999298095703125, -0.0791168212890625, -0.04824066162109375, -0.017364501953125, 0.01351165771484375, 0.0443878173828125, 0.07526397705078125, 0.10614013671875, 0.13701629638671875, 0.1678924560546875, 0.19876861572265625, 0.229644775390625, 0.26052093505859375, 0.2913970947265625, 0.32227325439453125, 0.3531494140625, 0.38402557373046875, 0.4149017333984375, 0.44577789306640625, 0.476654052734375, 0.5075302124023438, 0.5384063720703125, 0.5692825317382812, 0.60015869140625, 0.6310348510742188, 0.6619110107421875, 0.6927871704101562, 0.723663330078125, 0.7545394897460938, 0.7854156494140625, 0.8162918090820312, 0.84716796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 9.0, 11.0, 16.0, 29.0, 64.0, 112.0, 142.0, 196.0, 177.0, 130.0, 59.0, 35.0, 13.0, 9.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.208967208862305, -8.721240043640137, -8.233511924743652, -7.745784282684326, -7.258056640625, -6.770329475402832, -6.282601356506348, -5.79487419128418, -5.307146072387695, -4.819418430328369, -4.331690788269043, -3.843963146209717, -3.3562355041503906, -2.8685081005096436, -2.3807804584503174, -1.8930528163909912, -1.4053254127502441, -0.917597770690918, -0.4298701882362366, 0.057857394218444824, 0.545585036277771, 1.0333125591278076, 1.5210402011871338, 2.00876784324646, 2.496495485305786, 2.9842231273651123, 3.4719507694244385, 3.9596781730651855, 4.447405815124512, 4.935133457183838, 5.422861099243164, 5.91058874130249, 6.398316383361816, 6.886044025421143, 7.373771667480469, 7.861499309539795, 8.349226951599121, 8.836954116821289, 9.324682235717773, 9.812409400939941, 10.300137519836426, 10.787864685058594, 11.275592803955078, 11.763319969177246, 12.25104808807373, 12.738775253295898, 13.226503372192383, 13.71423053741455, 14.201957702636719, 14.689684867858887, 15.177412986755371, 15.665140151977539, 16.152868270874023, 16.640596389770508, 17.12832260131836, 17.616050720214844, 18.103778839111328, 18.591506958007812, 19.079233169555664, 19.56696128845215, 20.054689407348633, 20.542417526245117, 21.03014373779297, 21.517871856689453, 22.005599975585938]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 6.0, 6.0, 5.0, 9.0, 9.0, 6.0, 8.0, 16.0, 12.0, 13.0, 14.0, 22.0, 15.0, 25.0, 24.0, 27.0, 31.0, 35.0, 15.0, 41.0, 36.0, 54.0, 43.0, 41.0, 41.0, 39.0, 25.0, 41.0, 44.0, 42.0, 37.0, 33.0, 26.0, 31.0, 19.0, 21.0, 13.0, 16.0, 14.0, 11.0, 8.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.625533580780029, -6.410942554473877, -6.196352005004883, -5.9817609786987305, -5.767169952392578, -5.552578926086426, -5.337987899780273, -5.123397350311279, -4.908806324005127, -4.694215297698975, -4.4796247482299805, -4.265033721923828, -4.050442695617676, -3.8358516693115234, -3.62126088142395, -3.406670093536377, -3.1920790672302246, -2.9774880409240723, -2.762897253036499, -2.548306465148926, -2.3337154388427734, -2.119124412536621, -1.9045336246490479, -1.689942717552185, -1.4753518104553223, -1.2607609033584595, -1.0461699962615967, -0.8315790891647339, -0.6169881820678711, -0.4023972749710083, -0.1878063678741455, 0.026784539222717285, 0.24137544631958008, 0.45596635341644287, 0.6705572605133057, 0.8851481676101685, 1.0997390747070312, 1.314329981803894, 1.5289208889007568, 1.7435117959976196, 1.9581027030944824, 2.1726937294006348, 2.387284517288208, 2.6018753051757812, 2.8164663314819336, 3.031057357788086, 3.245648145675659, 3.4602389335632324, 3.6748299598693848, 3.889420986175537, 4.104011535644531, 4.318602561950684, 4.533193588256836, 4.747784614562988, 4.962375640869141, 5.176966190338135, 5.391557216644287, 5.6061482429504395, 5.820738792419434, 6.035329818725586, 6.249920845031738, 6.464511871337891, 6.679102897644043, 6.893693447113037, 7.1082844734191895]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 6.0, 3.0, 2.0, 6.0, 8.0, 16.0, 15.0, 24.0, 30.0, 36.0, 44.0, 81.0, 125.0, 185.0, 388.0, 867.0, 2393.0, 7723.0, 40197.0, 3689287.0, 418364.0, 25093.0, 5818.0, 1962.0, 815.0, 387.0, 159.0, 104.0, 52.0, 26.0, 29.0, 9.0, 10.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0], "bins": [-5.484375, -5.362152099609375, -5.23992919921875, -5.117706298828125, -4.9954833984375, -4.873260498046875, -4.75103759765625, -4.628814697265625, -4.506591796875, -4.384368896484375, -4.26214599609375, -4.139923095703125, -4.0177001953125, -3.895477294921875, -3.77325439453125, -3.651031494140625, -3.52880859375, -3.406585693359375, -3.28436279296875, -3.162139892578125, -3.0399169921875, -2.917694091796875, -2.79547119140625, -2.673248291015625, -2.551025390625, -2.428802490234375, -2.30657958984375, -2.184356689453125, -2.0621337890625, -1.939910888671875, -1.81768798828125, -1.695465087890625, -1.5732421875, -1.451019287109375, -1.32879638671875, -1.206573486328125, -1.0843505859375, -0.962127685546875, -0.83990478515625, -0.717681884765625, -0.595458984375, -0.473236083984375, -0.35101318359375, -0.228790283203125, -0.1065673828125, 0.015655517578125, 0.13787841796875, 0.260101318359375, 0.38232421875, 0.504547119140625, 0.62677001953125, 0.748992919921875, 0.8712158203125, 0.993438720703125, 1.11566162109375, 1.237884521484375, 1.360107421875, 1.482330322265625, 1.60455322265625, 1.726776123046875, 1.8489990234375, 1.971221923828125, 2.09344482421875, 2.215667724609375, 2.337890625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 9.0, 11.0, 8.0, 19.0, 14.0, 16.0, 24.0, 35.0, 34.0, 33.0, 64.0, 54.0, 59.0, 52.0, 67.0, 60.0, 79.0, 74.0, 60.0, 37.0, 34.0, 35.0, 31.0, 19.0, 20.0, 15.0, 12.0, 10.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.58984375, -0.5746307373046875, -0.559417724609375, -0.5442047119140625, -0.52899169921875, -0.5137786865234375, -0.498565673828125, -0.4833526611328125, -0.4681396484375, -0.4529266357421875, -0.437713623046875, -0.4225006103515625, -0.40728759765625, -0.3920745849609375, -0.376861572265625, -0.3616485595703125, -0.346435546875, -0.3312225341796875, -0.316009521484375, -0.3007965087890625, -0.28558349609375, -0.2703704833984375, -0.255157470703125, -0.2399444580078125, -0.2247314453125, -0.2095184326171875, -0.194305419921875, -0.1790924072265625, -0.16387939453125, -0.1486663818359375, -0.133453369140625, -0.1182403564453125, -0.10302734375, -0.0878143310546875, -0.072601318359375, -0.0573883056640625, -0.04217529296875, -0.0269622802734375, -0.011749267578125, 0.0034637451171875, 0.0186767578125, 0.0338897705078125, 0.049102783203125, 0.0643157958984375, 0.07952880859375, 0.0947418212890625, 0.109954833984375, 0.1251678466796875, 0.140380859375, 0.1555938720703125, 0.170806884765625, 0.1860198974609375, 0.20123291015625, 0.2164459228515625, 0.231658935546875, 0.2468719482421875, 0.2620849609375, 0.2772979736328125, 0.292510986328125, 0.3077239990234375, 0.32293701171875, 0.3381500244140625, 0.353363037109375, 0.3685760498046875, 0.3837890625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 7.0, 3.0, 9.0, 6.0, 7.0, 5.0, 8.0, 18.0, 26.0, 23.0, 46.0, 67.0, 68.0, 96.0, 154.0, 269.0, 430.0, 613.0, 1069.0, 2045.0, 4390.0, 10817.0, 42055.0, 444024.0, 3554445.0, 101146.0, 19329.0, 6485.0, 2889.0, 1435.0, 809.0, 527.0, 286.0, 191.0, 140.0, 95.0, 64.0, 44.0, 26.0, 30.0, 30.0, 13.0, 8.0, 4.0, 8.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.1953125, -2.125030517578125, -2.05474853515625, -1.984466552734375, -1.9141845703125, -1.843902587890625, -1.77362060546875, -1.703338623046875, -1.633056640625, -1.562774658203125, -1.49249267578125, -1.422210693359375, -1.3519287109375, -1.281646728515625, -1.21136474609375, -1.141082763671875, -1.07080078125, -1.000518798828125, -0.93023681640625, -0.859954833984375, -0.7896728515625, -0.719390869140625, -0.64910888671875, -0.578826904296875, -0.508544921875, -0.438262939453125, -0.36798095703125, -0.297698974609375, -0.2274169921875, -0.157135009765625, -0.08685302734375, -0.016571044921875, 0.0537109375, 0.123992919921875, 0.19427490234375, 0.264556884765625, 0.3348388671875, 0.405120849609375, 0.47540283203125, 0.545684814453125, 0.615966796875, 0.686248779296875, 0.75653076171875, 0.826812744140625, 0.8970947265625, 0.967376708984375, 1.03765869140625, 1.107940673828125, 1.17822265625, 1.248504638671875, 1.31878662109375, 1.389068603515625, 1.4593505859375, 1.529632568359375, 1.59991455078125, 1.670196533203125, 1.740478515625, 1.810760498046875, 1.88104248046875, 1.951324462890625, 2.0216064453125, 2.091888427734375, 2.16217041015625, 2.232452392578125, 2.302734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 4.0, 3.0, 5.0, 13.0, 14.0, 22.0, 26.0, 54.0, 158.0, 456.0, 2427.0, 512.0, 161.0, 88.0, 37.0, 27.0, 17.0, 10.0, 12.0, 9.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.314453125, -1.2740631103515625, -1.233673095703125, -1.1932830810546875, -1.15289306640625, -1.1125030517578125, -1.072113037109375, -1.0317230224609375, -0.9913330078125, -0.9509429931640625, -0.910552978515625, -0.8701629638671875, -0.82977294921875, -0.7893829345703125, -0.748992919921875, -0.7086029052734375, -0.668212890625, -0.6278228759765625, -0.587432861328125, -0.5470428466796875, -0.50665283203125, -0.4662628173828125, -0.425872802734375, -0.3854827880859375, -0.3450927734375, -0.3047027587890625, -0.264312744140625, -0.2239227294921875, -0.18353271484375, -0.1431427001953125, -0.102752685546875, -0.0623626708984375, -0.02197265625, 0.0184173583984375, 0.058807373046875, 0.0991973876953125, 0.13958740234375, 0.1799774169921875, 0.220367431640625, 0.2607574462890625, 0.3011474609375, 0.3415374755859375, 0.381927490234375, 0.4223175048828125, 0.46270751953125, 0.5030975341796875, 0.543487548828125, 0.5838775634765625, 0.624267578125, 0.6646575927734375, 0.705047607421875, 0.7454376220703125, 0.78582763671875, 0.8262176513671875, 0.866607666015625, 0.9069976806640625, 0.9473876953125, 0.9877777099609375, 1.028167724609375, 1.0685577392578125, 1.10894775390625, 1.1493377685546875, 1.189727783203125, 1.2301177978515625, 1.2705078125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 10.0, 23.0, 72.0, 194.0, 270.0, 247.0, 94.0, 54.0, 21.0, 5.0, 3.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.648687362670898, -4.309000015258789, -3.9693121910095215, -3.629624843597412, -3.2899370193481445, -2.950249671936035, -2.6105620861053467, -2.270874500274658, -1.9311869144439697, -1.5914993286132812, -1.2518117427825928, -0.9121242761611938, -0.5724366903305054, -0.2327491044998169, 0.10693836212158203, 0.4466259479522705, 0.786313533782959, 1.1260011196136475, 1.465688705444336, 1.8053761720657349, 2.145063877105713, 2.4847512245178223, 2.8244388103485107, 3.164126396179199, 3.5038139820098877, 3.843501567840576, 4.1831889152526855, 4.522876739501953, 4.8625640869140625, 5.20225191116333, 5.5419392585754395, 5.881627082824707, 6.221314430236816, 6.561001777648926, 6.900689601898193, 7.240376949310303, 7.58006477355957, 7.91975212097168, 8.259439468383789, 8.599126815795898, 8.938815116882324, 9.278502464294434, 9.618189811706543, 9.957878112792969, 10.297565460205078, 10.637252807617188, 10.976940155029297, 11.316627502441406, 11.656314849853516, 11.996002197265625, 12.335689544677734, 12.67537784576416, 13.01506519317627, 13.354752540588379, 13.694439888000488, 14.034128189086914, 14.373815536499023, 14.713502883911133, 15.053190231323242, 15.392878532409668, 15.732565879821777, 16.072254180908203, 16.411941528320312, 16.751628875732422, 17.09131622314453]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 9.0, 8.0, 13.0, 33.0, 31.0, 39.0, 64.0, 71.0, 90.0, 75.0, 89.0, 105.0, 84.0, 68.0, 54.0, 47.0, 42.0, 26.0, 22.0, 17.0, 5.0, 7.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.562389373779297, -5.396784782409668, -5.231180191040039, -5.06557559967041, -4.899971008300781, -4.734366416931152, -4.568761825561523, -4.4031572341918945, -4.237552642822266, -4.071948051452637, -3.906343460083008, -3.740738868713379, -3.57513427734375, -3.409529685974121, -3.243924856185913, -3.078320264816284, -2.912715435028076, -2.7471108436584473, -2.5815062522888184, -2.4159016609191895, -2.2502970695495605, -2.0846924781799316, -1.9190876483917236, -1.7534830570220947, -1.5878784656524658, -1.422273874282837, -1.256669282913208, -1.0910645723342896, -0.9254599809646606, -0.7598553895950317, -0.5942507386207581, -0.4286460876464844, -0.26304149627685547, -0.09743687510490417, 0.06816774606704712, 0.2337723672389984, 0.3993769884109497, 0.5649815797805786, 0.7305862307548523, 0.896190881729126, 1.0617954730987549, 1.2274000644683838, 1.3930046558380127, 1.5586093664169312, 1.72421395778656, 1.889818549156189, 2.0554232597351074, 2.2210278511047363, 2.3866324424743652, 2.552237033843994, 2.717841625213623, 2.883446216583252, 3.049050807952881, 3.2146553993225098, 3.3802602291107178, 3.5458648204803467, 3.7114694118499756, 3.8770740032196045, 4.0426788330078125, 4.208283424377441, 4.37388801574707, 4.539492607116699, 4.705097198486328, 4.870701789855957, 5.036306381225586]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 9.0, 5.0, 5.0, 8.0, 16.0, 19.0, 34.0, 55.0, 76.0, 153.0, 306.0, 666.0, 1633.0, 4864.0, 17796.0, 84524.0, 434452.0, 403895.0, 76191.0, 16503.0, 4620.0, 1510.0, 568.0, 275.0, 145.0, 81.0, 38.0, 35.0, 18.0, 15.0, 11.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.70361328125, -2.6240234375, -2.54443359375, -2.46484375, -2.38525390625, -2.3056640625, -2.22607421875, -2.146484375, -2.06689453125, -1.9873046875, -1.90771484375, -1.828125, -1.74853515625, -1.6689453125, -1.58935546875, -1.509765625, -1.43017578125, -1.3505859375, -1.27099609375, -1.19140625, -1.11181640625, -1.0322265625, -0.95263671875, -0.873046875, -0.79345703125, -0.7138671875, -0.63427734375, -0.5546875, -0.47509765625, -0.3955078125, -0.31591796875, -0.236328125, -0.15673828125, -0.0771484375, 0.00244140625, 0.08203125, 0.16162109375, 0.2412109375, 0.32080078125, 0.400390625, 0.47998046875, 0.5595703125, 0.63916015625, 0.71875, 0.79833984375, 0.8779296875, 0.95751953125, 1.037109375, 1.11669921875, 1.1962890625, 1.27587890625, 1.35546875, 1.43505859375, 1.5146484375, 1.59423828125, 1.673828125, 1.75341796875, 1.8330078125, 1.91259765625, 1.9921875, 2.07177734375, 2.1513671875, 2.23095703125, 2.310546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 7.0, 8.0, 9.0, 15.0, 15.0, 19.0, 21.0, 44.0, 44.0, 35.0, 36.0, 40.0, 68.0, 54.0, 81.0, 67.0, 77.0, 70.0, 50.0, 44.0, 37.0, 36.0, 29.0, 22.0, 20.0, 17.0, 9.0, 6.0, 5.0, 10.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.64599609375, -0.6293830871582031, -0.6127700805664062, -0.5961570739746094, -0.5795440673828125, -0.5629310607910156, -0.5463180541992188, -0.5297050476074219, -0.513092041015625, -0.4964790344238281, -0.47986602783203125, -0.4632530212402344, -0.4466400146484375, -0.4300270080566406, -0.41341400146484375, -0.3968009948730469, -0.38018798828125, -0.3635749816894531, -0.34696197509765625, -0.3303489685058594, -0.3137359619140625, -0.2971229553222656, -0.28050994873046875, -0.2638969421386719, -0.247283935546875, -0.23067092895507812, -0.21405792236328125, -0.19744491577148438, -0.1808319091796875, -0.16421890258789062, -0.14760589599609375, -0.13099288940429688, -0.1143798828125, -0.09776687622070312, -0.08115386962890625, -0.06454086303710938, -0.0479278564453125, -0.031314849853515625, -0.01470184326171875, 0.001911163330078125, 0.018524169921875, 0.035137176513671875, 0.05175018310546875, 0.06836318969726562, 0.0849761962890625, 0.10158920288085938, 0.11820220947265625, 0.13481521606445312, 0.15142822265625, 0.16804122924804688, 0.18465423583984375, 0.20126724243164062, 0.2178802490234375, 0.23449325561523438, 0.25110626220703125, 0.2677192687988281, 0.284332275390625, 0.3009452819824219, 0.31755828857421875, 0.3341712951660156, 0.3507843017578125, 0.3673973083496094, 0.38401031494140625, 0.4006233215332031, 0.417236328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 22.0, 11.0, 15.0, 27.0, 56.0, 94.0, 109.0, 206.0, 467.0, 924.0, 1896.0, 4329.0, 10595.0, 29847.0, 109112.0, 397174.0, 356843.0, 93565.0, 26708.0, 9271.0, 3789.0, 1718.0, 825.0, 388.0, 238.0, 133.0, 59.0, 39.0, 28.0, 26.0, 19.0, 7.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.384765625, -1.331390380859375, -1.27801513671875, -1.224639892578125, -1.1712646484375, -1.117889404296875, -1.06451416015625, -1.011138916015625, -0.957763671875, -0.904388427734375, -0.85101318359375, -0.797637939453125, -0.7442626953125, -0.690887451171875, -0.63751220703125, -0.584136962890625, -0.53076171875, -0.477386474609375, -0.42401123046875, -0.370635986328125, -0.3172607421875, -0.263885498046875, -0.21051025390625, -0.157135009765625, -0.103759765625, -0.050384521484375, 0.00299072265625, 0.056365966796875, 0.1097412109375, 0.163116455078125, 0.21649169921875, 0.269866943359375, 0.3232421875, 0.376617431640625, 0.42999267578125, 0.483367919921875, 0.5367431640625, 0.590118408203125, 0.64349365234375, 0.696868896484375, 0.750244140625, 0.803619384765625, 0.85699462890625, 0.910369873046875, 0.9637451171875, 1.017120361328125, 1.07049560546875, 1.123870849609375, 1.17724609375, 1.230621337890625, 1.28399658203125, 1.337371826171875, 1.3907470703125, 1.444122314453125, 1.49749755859375, 1.550872802734375, 1.604248046875, 1.657623291015625, 1.71099853515625, 1.764373779296875, 1.8177490234375, 1.871124267578125, 1.92449951171875, 1.977874755859375, 2.03125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 9.0, 5.0, 7.0, 2.0, 11.0, 9.0, 21.0, 15.0, 17.0, 18.0, 18.0, 32.0, 25.0, 51.0, 51.0, 45.0, 55.0, 54.0, 57.0, 55.0, 47.0, 59.0, 55.0, 48.0, 40.0, 41.0, 28.0, 29.0, 19.0, 16.0, 13.0, 9.0, 8.0, 10.0, 5.0, 8.0, 2.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.034698486328125, -1.96392822265625, -1.893157958984375, -1.8223876953125, -1.751617431640625, -1.68084716796875, -1.610076904296875, -1.539306640625, -1.468536376953125, -1.39776611328125, -1.326995849609375, -1.2562255859375, -1.185455322265625, -1.11468505859375, -1.043914794921875, -0.97314453125, -0.902374267578125, -0.83160400390625, -0.760833740234375, -0.6900634765625, -0.619293212890625, -0.54852294921875, -0.477752685546875, -0.406982421875, -0.336212158203125, -0.26544189453125, -0.194671630859375, -0.1239013671875, -0.053131103515625, 0.01763916015625, 0.088409423828125, 0.1591796875, 0.229949951171875, 0.30072021484375, 0.371490478515625, 0.4422607421875, 0.513031005859375, 0.58380126953125, 0.654571533203125, 0.725341796875, 0.796112060546875, 0.86688232421875, 0.937652587890625, 1.0084228515625, 1.079193115234375, 1.14996337890625, 1.220733642578125, 1.29150390625, 1.362274169921875, 1.43304443359375, 1.503814697265625, 1.5745849609375, 1.645355224609375, 1.71612548828125, 1.786895751953125, 1.857666015625, 1.928436279296875, 1.99920654296875, 2.069976806640625, 2.1407470703125, 2.211517333984375, 2.28228759765625, 2.353057861328125, 2.423828125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 12.0, 12.0, 16.0, 36.0, 38.0, 74.0, 115.0, 220.0, 382.0, 739.0, 1682.0, 5380.0, 24594.0, 165052.0, 642676.0, 172988.0, 25366.0, 5763.0, 1801.0, 706.0, 373.0, 228.0, 106.0, 81.0, 36.0, 20.0, 19.0, 11.0, 4.0, 3.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.248046875, -1.211883544921875, -1.17572021484375, -1.139556884765625, -1.1033935546875, -1.067230224609375, -1.03106689453125, -0.994903564453125, -0.958740234375, -0.922576904296875, -0.88641357421875, -0.850250244140625, -0.8140869140625, -0.777923583984375, -0.74176025390625, -0.705596923828125, -0.66943359375, -0.633270263671875, -0.59710693359375, -0.560943603515625, -0.5247802734375, -0.488616943359375, -0.45245361328125, -0.416290283203125, -0.380126953125, -0.343963623046875, -0.30780029296875, -0.271636962890625, -0.2354736328125, -0.199310302734375, -0.16314697265625, -0.126983642578125, -0.0908203125, -0.054656982421875, -0.01849365234375, 0.017669677734375, 0.0538330078125, 0.089996337890625, 0.12615966796875, 0.162322998046875, 0.198486328125, 0.234649658203125, 0.27081298828125, 0.306976318359375, 0.3431396484375, 0.379302978515625, 0.41546630859375, 0.451629638671875, 0.48779296875, 0.523956298828125, 0.56011962890625, 0.596282958984375, 0.6324462890625, 0.668609619140625, 0.70477294921875, 0.740936279296875, 0.777099609375, 0.813262939453125, 0.84942626953125, 0.885589599609375, 0.9217529296875, 0.957916259765625, 0.99407958984375, 1.030242919921875, 1.06640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 11.0, 14.0, 16.0, 24.0, 53.0, 66.0, 75.0, 112.0, 135.0, 132.0, 104.0, 71.0, 68.0, 35.0, 27.0, 18.0, 9.0, 19.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001571178436279297, -0.0001510903239250183, -0.00014506280422210693, -0.00013903528451919556, -0.00013300776481628418, -0.0001269802451133728, -0.00012095272541046143, -0.00011492520570755005, -0.00010889768600463867, -0.0001028701663017273, -9.684264659881592e-05, -9.081512689590454e-05, -8.478760719299316e-05, -7.876008749008179e-05, -7.273256778717041e-05, -6.670504808425903e-05, -6.0677528381347656e-05, -5.465000867843628e-05, -4.86224889755249e-05, -4.2594969272613525e-05, -3.656744956970215e-05, -3.053992986679077e-05, -2.4512410163879395e-05, -1.8484890460968018e-05, -1.245737075805664e-05, -6.429851055145264e-06, -4.023313522338867e-07, 5.62518835067749e-06, 1.1652708053588867e-05, 1.7680227756500244e-05, 2.370774745941162e-05, 2.9735267162322998e-05, 3.5762786865234375e-05, 4.179030656814575e-05, 4.781782627105713e-05, 5.3845345973968506e-05, 5.987286567687988e-05, 6.590038537979126e-05, 7.192790508270264e-05, 7.795542478561401e-05, 8.398294448852539e-05, 9.001046419143677e-05, 9.603798389434814e-05, 0.00010206550359725952, 0.0001080930233001709, 0.00011412054300308228, 0.00012014806270599365, 0.00012617558240890503, 0.0001322031021118164, 0.00013823062181472778, 0.00014425814151763916, 0.00015028566122055054, 0.00015631318092346191, 0.0001623407006263733, 0.00016836822032928467, 0.00017439574003219604, 0.00018042325973510742, 0.0001864507794380188, 0.00019247829914093018, 0.00019850581884384155, 0.00020453333854675293, 0.0002105608582496643, 0.00021658837795257568, 0.00022261589765548706, 0.00022864341735839844]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 11.0, 4.0, 10.0, 4.0, 9.0, 23.0, 32.0, 35.0, 67.0, 98.0, 241.0, 464.0, 1161.0, 3943.0, 17746.0, 122127.0, 606771.0, 253001.0, 33406.0, 6367.0, 1755.0, 640.0, 271.0, 157.0, 83.0, 47.0, 36.0, 20.0, 13.0, 12.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.5205078125, -1.4840240478515625, -1.447540283203125, -1.4110565185546875, -1.37457275390625, -1.3380889892578125, -1.301605224609375, -1.2651214599609375, -1.2286376953125, -1.1921539306640625, -1.155670166015625, -1.1191864013671875, -1.08270263671875, -1.0462188720703125, -1.009735107421875, -0.9732513427734375, -0.936767578125, -0.9002838134765625, -0.863800048828125, -0.8273162841796875, -0.79083251953125, -0.7543487548828125, -0.717864990234375, -0.6813812255859375, -0.6448974609375, -0.6084136962890625, -0.571929931640625, -0.5354461669921875, -0.49896240234375, -0.4624786376953125, -0.425994873046875, -0.3895111083984375, -0.35302734375, -0.3165435791015625, -0.280059814453125, -0.2435760498046875, -0.20709228515625, -0.1706085205078125, -0.134124755859375, -0.0976409912109375, -0.0611572265625, -0.0246734619140625, 0.011810302734375, 0.0482940673828125, 0.08477783203125, 0.1212615966796875, 0.157745361328125, 0.1942291259765625, 0.230712890625, 0.2671966552734375, 0.303680419921875, 0.3401641845703125, 0.37664794921875, 0.4131317138671875, 0.449615478515625, 0.4860992431640625, 0.5225830078125, 0.5590667724609375, 0.595550537109375, 0.6320343017578125, 0.66851806640625, 0.7050018310546875, 0.741485595703125, 0.7779693603515625, 0.814453125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 11.0, 16.0, 29.0, 32.0, 32.0, 62.0, 101.0, 140.0, 163.0, 113.0, 88.0, 58.0, 39.0, 26.0, 26.0, 17.0, 6.0, 15.0, 7.0, 3.0, 8.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.826171875, -1.7821502685546875, -1.738128662109375, -1.6941070556640625, -1.65008544921875, -1.6060638427734375, -1.562042236328125, -1.5180206298828125, -1.4739990234375, -1.4299774169921875, -1.385955810546875, -1.3419342041015625, -1.29791259765625, -1.2538909912109375, -1.209869384765625, -1.1658477783203125, -1.121826171875, -1.0778045654296875, -1.033782958984375, -0.9897613525390625, -0.94573974609375, -0.9017181396484375, -0.857696533203125, -0.8136749267578125, -0.7696533203125, -0.7256317138671875, -0.681610107421875, -0.6375885009765625, -0.59356689453125, -0.5495452880859375, -0.505523681640625, -0.4615020751953125, -0.41748046875, -0.3734588623046875, -0.329437255859375, -0.2854156494140625, -0.24139404296875, -0.1973724365234375, -0.153350830078125, -0.1093292236328125, -0.0653076171875, -0.0212860107421875, 0.022735595703125, 0.0667572021484375, 0.11077880859375, 0.1548004150390625, 0.198822021484375, 0.2428436279296875, 0.286865234375, 0.3308868408203125, 0.374908447265625, 0.4189300537109375, 0.46295166015625, 0.5069732666015625, 0.550994873046875, 0.5950164794921875, 0.6390380859375, 0.6830596923828125, 0.727081298828125, 0.7711029052734375, 0.81512451171875, 0.8591461181640625, 0.903167724609375, 0.9471893310546875, 0.9912109375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 24.0, 38.0, 180.0, 330.0, 287.0, 115.0, 28.0, 10.0], "bins": [-77.53179931640625, -76.23814392089844, -74.9444808959961, -73.65082550048828, -72.35717010498047, -71.06350708007812, -69.76985168457031, -68.4761962890625, -67.18254089355469, -65.88888549804688, -64.59522247314453, -63.30156707763672, -62.007911682128906, -60.71425247192383, -59.42059326171875, -58.12693786621094, -56.833274841308594, -55.539615631103516, -54.2459602355957, -52.952301025390625, -51.65864562988281, -50.364986419677734, -49.071327209472656, -47.777671813964844, -46.484012603759766, -45.19035339355469, -43.896697998046875, -42.6030387878418, -41.30937957763672, -40.015724182128906, -38.72206497192383, -37.42840576171875, -36.13474655151367, -34.841087341308594, -33.54743194580078, -32.2537727355957, -30.960115432739258, -29.666458129882812, -28.372798919677734, -27.07914161682129, -25.785486221313477, -24.49182891845703, -23.198169708251953, -21.904512405395508, -20.610855102539062, -19.317197799682617, -18.023540496826172, -16.729881286621094, -15.436223983764648, -14.142566680908203, -12.848908424377441, -11.55525016784668, -10.261592864990234, -8.967935562133789, -7.674277305603027, -6.380619049072266, -5.086961269378662, -3.7933034896850586, -2.499645709991455, -1.2059879302978516, 0.08766984939575195, 1.3813276290893555, 2.674985408782959, 3.9686436653137207, 5.262300968170166]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 12.0, 10.0, 10.0, 27.0, 17.0, 17.0, 24.0, 34.0, 37.0, 36.0, 38.0, 57.0, 54.0, 63.0, 62.0, 51.0, 77.0, 56.0, 53.0, 35.0, 43.0, 28.0, 34.0, 28.0, 27.0, 27.0, 16.0, 18.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.77413558959961, -13.325748443603516, -12.877361297607422, -12.428975105285645, -11.98058795928955, -11.532200813293457, -11.08381462097168, -10.635427474975586, -10.187040328979492, -9.738653182983398, -9.290266036987305, -8.841879844665527, -8.393492698669434, -7.94510555267334, -7.496718883514404, -7.048332214355469, -6.599945068359375, -6.151557922363281, -5.703171253204346, -5.25478458404541, -4.806397438049316, -4.358010292053223, -3.909623622894287, -3.4612367153167725, -3.012849807739258, -2.564462900161743, -2.1160759925842285, -1.6676890850067139, -1.2193021774291992, -0.7709152698516846, -0.3225283622741699, 0.12585854530334473, 0.5742454528808594, 1.022632360458374, 1.4710192680358887, 1.9194061756134033, 2.367793083190918, 2.8161799907684326, 3.2645668983459473, 3.712953805923462, 4.161340713500977, 4.60972785949707, 5.058114528656006, 5.506501197814941, 5.954888343811035, 6.403275489807129, 6.8516621589660645, 7.300048828125, 7.748435974121094, 8.196823120117188, 8.645210266113281, 9.093596458435059, 9.541983604431152, 9.990370750427246, 10.438756942749023, 10.887144088745117, 11.335531234741211, 11.783918380737305, 12.232305526733398, 12.680691719055176, 13.12907886505127, 13.577466011047363, 14.02585220336914, 14.474239349365234, 14.922626495361328]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 8.0, 5.0, 4.0, 10.0, 9.0, 8.0, 18.0, 49.0, 71.0, 132.0, 323.0, 866.0, 2506.0, 13404.0, 4098100.0, 70732.0, 5577.0, 1454.0, 538.0, 203.0, 102.0, 71.0, 24.0, 22.0, 17.0, 9.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 4.0], "bins": [-7.82421875, -7.653289794921875, -7.48236083984375, -7.311431884765625, -7.1405029296875, -6.969573974609375, -6.79864501953125, -6.627716064453125, -6.456787109375, -6.285858154296875, -6.11492919921875, -5.944000244140625, -5.7730712890625, -5.602142333984375, -5.43121337890625, -5.260284423828125, -5.08935546875, -4.918426513671875, -4.74749755859375, -4.576568603515625, -4.4056396484375, -4.234710693359375, -4.06378173828125, -3.892852783203125, -3.721923828125, -3.550994873046875, -3.38006591796875, -3.209136962890625, -3.0382080078125, -2.867279052734375, -2.69635009765625, -2.525421142578125, -2.3544921875, -2.183563232421875, -2.01263427734375, -1.841705322265625, -1.6707763671875, -1.499847412109375, -1.32891845703125, -1.157989501953125, -0.987060546875, -0.816131591796875, -0.64520263671875, -0.474273681640625, -0.3033447265625, -0.132415771484375, 0.03851318359375, 0.209442138671875, 0.38037109375, 0.551300048828125, 0.72222900390625, 0.893157958984375, 1.0640869140625, 1.235015869140625, 1.40594482421875, 1.576873779296875, 1.747802734375, 1.918731689453125, 2.08966064453125, 2.260589599609375, 2.4315185546875, 2.602447509765625, 2.77337646484375, 2.944305419921875, 3.115234375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 7.0, 8.0, 8.0, 8.0, 14.0, 14.0, 15.0, 13.0, 21.0, 24.0, 30.0, 45.0, 51.0, 30.0, 45.0, 49.0, 50.0, 51.0, 49.0, 46.0, 46.0, 51.0, 35.0, 41.0, 45.0, 33.0, 37.0, 26.0, 22.0, 9.0, 11.0, 15.0, 11.0, 11.0, 9.0, 1.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.60986328125, -0.5930099487304688, -0.5761566162109375, -0.5593032836914062, -0.542449951171875, -0.5255966186523438, -0.5087432861328125, -0.49188995361328125, -0.47503662109375, -0.45818328857421875, -0.4413299560546875, -0.42447662353515625, -0.407623291015625, -0.39076995849609375, -0.3739166259765625, -0.35706329345703125, -0.3402099609375, -0.32335662841796875, -0.3065032958984375, -0.28964996337890625, -0.272796630859375, -0.25594329833984375, -0.2390899658203125, -0.22223663330078125, -0.20538330078125, -0.18852996826171875, -0.1716766357421875, -0.15482330322265625, -0.137969970703125, -0.12111663818359375, -0.1042633056640625, -0.08740997314453125, -0.070556640625, -0.05370330810546875, -0.0368499755859375, -0.01999664306640625, -0.003143310546875, 0.01371002197265625, 0.0305633544921875, 0.04741668701171875, 0.06427001953125, 0.08112335205078125, 0.0979766845703125, 0.11483001708984375, 0.131683349609375, 0.14853668212890625, 0.1653900146484375, 0.18224334716796875, 0.1990966796875, 0.21595001220703125, 0.2328033447265625, 0.24965667724609375, 0.266510009765625, 0.28336334228515625, 0.3002166748046875, 0.31707000732421875, 0.33392333984375, 0.35077667236328125, 0.3676300048828125, 0.38448333740234375, 0.401336669921875, 0.41819000244140625, 0.4350433349609375, 0.45189666748046875, 0.46875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 7.0, 10.0, 14.0, 12.0, 21.0, 32.0, 46.0, 62.0, 95.0, 143.0, 228.0, 416.0, 706.0, 1391.0, 3121.0, 8290.0, 31716.0, 3795295.0, 316725.0, 23716.0, 6766.0, 2604.0, 1200.0, 657.0, 341.0, 213.0, 152.0, 94.0, 47.0, 39.0, 29.0, 19.0, 6.0, 10.0, 13.0, 6.0, 6.0, 5.0, 2.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.31640625, -3.221405029296875, -3.12640380859375, -3.031402587890625, -2.9364013671875, -2.841400146484375, -2.74639892578125, -2.651397705078125, -2.556396484375, -2.461395263671875, -2.36639404296875, -2.271392822265625, -2.1763916015625, -2.081390380859375, -1.98638916015625, -1.891387939453125, -1.79638671875, -1.701385498046875, -1.60638427734375, -1.511383056640625, -1.4163818359375, -1.321380615234375, -1.22637939453125, -1.131378173828125, -1.036376953125, -0.941375732421875, -0.84637451171875, -0.751373291015625, -0.6563720703125, -0.561370849609375, -0.46636962890625, -0.371368408203125, -0.2763671875, -0.181365966796875, -0.08636474609375, 0.008636474609375, 0.1036376953125, 0.198638916015625, 0.29364013671875, 0.388641357421875, 0.483642578125, 0.578643798828125, 0.67364501953125, 0.768646240234375, 0.8636474609375, 0.958648681640625, 1.05364990234375, 1.148651123046875, 1.24365234375, 1.338653564453125, 1.43365478515625, 1.528656005859375, 1.6236572265625, 1.718658447265625, 1.81365966796875, 1.908660888671875, 2.003662109375, 2.098663330078125, 2.19366455078125, 2.288665771484375, 2.3836669921875, 2.478668212890625, 2.57366943359375, 2.668670654296875, 2.763671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 10.0, 8.0, 6.0, 5.0, 21.0, 32.0, 54.0, 215.0, 3421.0, 179.0, 51.0, 22.0, 23.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.83251953125, -0.8113784790039062, -0.7902374267578125, -0.7690963745117188, -0.747955322265625, -0.7268142700195312, -0.7056732177734375, -0.6845321655273438, -0.66339111328125, -0.6422500610351562, -0.6211090087890625, -0.5999679565429688, -0.578826904296875, -0.5576858520507812, -0.5365447998046875, -0.5154037475585938, -0.4942626953125, -0.47312164306640625, -0.4519805908203125, -0.43083953857421875, -0.409698486328125, -0.38855743408203125, -0.3674163818359375, -0.34627532958984375, -0.32513427734375, -0.30399322509765625, -0.2828521728515625, -0.26171112060546875, -0.240570068359375, -0.21942901611328125, -0.1982879638671875, -0.17714691162109375, -0.156005859375, -0.13486480712890625, -0.1137237548828125, -0.09258270263671875, -0.071441650390625, -0.05030059814453125, -0.0291595458984375, -0.00801849365234375, 0.01312255859375, 0.03426361083984375, 0.0554046630859375, 0.07654571533203125, 0.097686767578125, 0.11882781982421875, 0.1399688720703125, 0.16110992431640625, 0.1822509765625, 0.20339202880859375, 0.2245330810546875, 0.24567413330078125, 0.266815185546875, 0.28795623779296875, 0.3090972900390625, 0.33023834228515625, 0.35137939453125, 0.37252044677734375, 0.3936614990234375, 0.41480255126953125, 0.435943603515625, 0.45708465576171875, 0.4782257080078125, 0.49936676025390625, 0.5205078125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 3.0, 4.0, 6.0, 14.0, 28.0, 40.0, 60.0, 120.0, 147.0, 166.0, 134.0, 124.0, 76.0, 40.0, 22.0, 11.0, 3.0, 6.0, 6.0, 2.0, 2.0], "bins": [-4.905620574951172, -4.812600135803223, -4.719579696655273, -4.626559257507324, -4.533538341522217, -4.440517902374268, -4.347497463226318, -4.254477024078369, -4.16145658493042, -4.068436145782471, -3.9754154682159424, -3.882395029067993, -3.789374589920044, -3.6963541507720947, -3.6033334732055664, -3.510313034057617, -3.417292594909668, -3.3242721557617188, -3.2312514781951904, -3.138231039047241, -3.045210599899292, -2.9521901607513428, -2.8591694831848145, -2.7661490440368652, -2.673128366470337, -2.5801079273223877, -2.4870872497558594, -2.39406681060791, -2.301046371459961, -2.2080259323120117, -2.1150052547454834, -2.021984815597534, -1.928964376449585, -1.8359438180923462, -1.742923378944397, -1.6499028205871582, -1.556882381439209, -1.4638618230819702, -1.3708412647247314, -1.2778208255767822, -1.184800386428833, -1.0917798280715942, -0.998759388923645, -0.9057388305664062, -0.812718391418457, -0.7196978330612183, -0.6266773343086243, -0.5336568355560303, -0.4406362771987915, -0.3476157784461975, -0.2545952796936035, -0.16157475113868713, -0.06855425238609314, 0.024466246366500854, 0.11748677492141724, 0.21050727367401123, 0.3035277724266052, 0.3965482711791992, 0.4895687699317932, 0.5825892686843872, 0.675609827041626, 0.7686302661895752, 0.861650824546814, 0.954671323299408, 1.047691822052002]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 6.0, 8.0, 20.0, 10.0, 10.0, 9.0, 16.0, 23.0, 26.0, 32.0, 34.0, 29.0, 46.0, 40.0, 35.0, 34.0, 61.0, 46.0, 56.0, 40.0, 38.0, 49.0, 43.0, 30.0, 36.0, 31.0, 31.0, 23.0, 18.0, 18.0, 23.0, 18.0, 7.0, 9.0, 7.0, 5.0, 12.0, 5.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.1453073024749756, -1.1123360395431519, -1.0793648958206177, -1.046393632888794, -1.0134224891662598, -0.980451226234436, -0.9474800229072571, -0.9145088195800781, -0.8815376162528992, -0.8485664129257202, -0.8155952095985413, -0.7826240062713623, -0.7496527433395386, -0.7166815996170044, -0.6837103366851807, -0.6507391333580017, -0.6177679300308228, -0.5847967267036438, -0.5518255233764648, -0.5188543200492859, -0.48588308691978455, -0.4529118835926056, -0.41994065046310425, -0.3869694471359253, -0.35399824380874634, -0.3210270404815674, -0.2880558371543884, -0.2550846040248871, -0.22211340069770813, -0.18914219737052917, -0.15617097914218903, -0.12319976091384888, -0.09022867679595947, -0.05725746601819992, -0.02428625524044037, 0.008684955537319183, 0.041656166315078735, 0.07462736964225769, 0.10759858787059784, 0.140569806098938, 0.17354100942611694, 0.2065122127532959, 0.23948343098163605, 0.2724546492099762, 0.30542585253715515, 0.3383970558643341, 0.37136828899383545, 0.4043394923210144, 0.43731069564819336, 0.4702818989753723, 0.5032531023025513, 0.5362243056297302, 0.5691955089569092, 0.6021667718887329, 0.6351379752159119, 0.6681091785430908, 0.7010803818702698, 0.7340515851974487, 0.7670227885246277, 0.7999939918518066, 0.8329652547836304, 0.8659363985061646, 0.8989076614379883, 0.9318788647651672, 0.9648500680923462]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 6.0, 7.0, 10.0, 24.0, 23.0, 36.0, 52.0, 84.0, 195.0, 436.0, 970.0, 2413.0, 6829.0, 22070.0, 78555.0, 269174.0, 419266.0, 177908.0, 48562.0, 14148.0, 4646.0, 1737.0, 703.0, 333.0, 141.0, 89.0, 47.0, 29.0, 12.0, 13.0, 7.0, 7.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.509765625, -2.42962646484375, -2.3494873046875, -2.26934814453125, -2.189208984375, -2.10906982421875, -2.0289306640625, -1.94879150390625, -1.86865234375, -1.78851318359375, -1.7083740234375, -1.62823486328125, -1.548095703125, -1.46795654296875, -1.3878173828125, -1.30767822265625, -1.2275390625, -1.14739990234375, -1.0672607421875, -0.98712158203125, -0.906982421875, -0.82684326171875, -0.7467041015625, -0.66656494140625, -0.58642578125, -0.50628662109375, -0.4261474609375, -0.34600830078125, -0.265869140625, -0.18572998046875, -0.1055908203125, -0.02545166015625, 0.0546875, 0.13482666015625, 0.2149658203125, 0.29510498046875, 0.375244140625, 0.45538330078125, 0.5355224609375, 0.61566162109375, 0.69580078125, 0.77593994140625, 0.8560791015625, 0.93621826171875, 1.016357421875, 1.09649658203125, 1.1766357421875, 1.25677490234375, 1.3369140625, 1.41705322265625, 1.4971923828125, 1.57733154296875, 1.657470703125, 1.73760986328125, 1.8177490234375, 1.89788818359375, 1.97802734375, 2.05816650390625, 2.1383056640625, 2.21844482421875, 2.298583984375, 2.37872314453125, 2.4588623046875, 2.53900146484375, 2.619140625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 6.0, 5.0, 5.0, 9.0, 5.0, 19.0, 9.0, 17.0, 20.0, 19.0, 34.0, 29.0, 26.0, 44.0, 35.0, 44.0, 49.0, 48.0, 43.0, 46.0, 37.0, 45.0, 49.0, 40.0, 40.0, 38.0, 41.0, 29.0, 33.0, 30.0, 22.0, 14.0, 16.0, 13.0, 13.0, 10.0, 6.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6240234375, -0.6060409545898438, -0.5880584716796875, -0.5700759887695312, -0.552093505859375, -0.5341110229492188, -0.5161285400390625, -0.49814605712890625, -0.48016357421875, -0.46218109130859375, -0.4441986083984375, -0.42621612548828125, -0.408233642578125, -0.39025115966796875, -0.3722686767578125, -0.35428619384765625, -0.3363037109375, -0.31832122802734375, -0.3003387451171875, -0.28235626220703125, -0.264373779296875, -0.24639129638671875, -0.2284088134765625, -0.21042633056640625, -0.19244384765625, -0.17446136474609375, -0.1564788818359375, -0.13849639892578125, -0.120513916015625, -0.10253143310546875, -0.0845489501953125, -0.06656646728515625, -0.048583984375, -0.03060150146484375, -0.0126190185546875, 0.00536346435546875, 0.023345947265625, 0.04132843017578125, 0.0593109130859375, 0.07729339599609375, 0.09527587890625, 0.11325836181640625, 0.1312408447265625, 0.14922332763671875, 0.167205810546875, 0.18518829345703125, 0.2031707763671875, 0.22115325927734375, 0.2391357421875, 0.25711822509765625, 0.2751007080078125, 0.29308319091796875, 0.311065673828125, 0.32904815673828125, 0.3470306396484375, 0.36501312255859375, 0.38299560546875, 0.40097808837890625, 0.4189605712890625, 0.43694305419921875, 0.454925537109375, 0.47290802001953125, 0.4908905029296875, 0.5088729858398438, 0.52685546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 8.0, 13.0, 13.0, 34.0, 27.0, 67.0, 76.0, 158.0, 203.0, 385.0, 765.0, 1376.0, 2657.0, 5655.0, 12495.0, 29933.0, 76586.0, 199486.0, 374617.0, 208500.0, 79083.0, 31016.0, 13309.0, 5953.0, 2829.0, 1446.0, 758.0, 435.0, 246.0, 167.0, 94.0, 42.0, 35.0, 22.0, 13.0, 13.0, 15.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.64453125, -1.5923614501953125, -1.540191650390625, -1.4880218505859375, -1.43585205078125, -1.3836822509765625, -1.331512451171875, -1.2793426513671875, -1.2271728515625, -1.1750030517578125, -1.122833251953125, -1.0706634521484375, -1.01849365234375, -0.9663238525390625, -0.914154052734375, -0.8619842529296875, -0.809814453125, -0.7576446533203125, -0.705474853515625, -0.6533050537109375, -0.60113525390625, -0.5489654541015625, -0.496795654296875, -0.4446258544921875, -0.3924560546875, -0.3402862548828125, -0.288116455078125, -0.2359466552734375, -0.18377685546875, -0.1316070556640625, -0.079437255859375, -0.0272674560546875, 0.02490234375, 0.0770721435546875, 0.129241943359375, 0.1814117431640625, 0.23358154296875, 0.2857513427734375, 0.337921142578125, 0.3900909423828125, 0.4422607421875, 0.4944305419921875, 0.546600341796875, 0.5987701416015625, 0.65093994140625, 0.7031097412109375, 0.755279541015625, 0.8074493408203125, 0.859619140625, 0.9117889404296875, 0.963958740234375, 1.0161285400390625, 1.06829833984375, 1.1204681396484375, 1.172637939453125, 1.2248077392578125, 1.2769775390625, 1.3291473388671875, 1.381317138671875, 1.4334869384765625, 1.48565673828125, 1.5378265380859375, 1.589996337890625, 1.6421661376953125, 1.6943359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 10.0, 10.0, 15.0, 28.0, 21.0, 22.0, 21.0, 49.0, 34.0, 37.0, 58.0, 49.0, 56.0, 63.0, 51.0, 65.0, 54.0, 46.0, 42.0, 43.0, 38.0, 32.0, 24.0, 22.0, 23.0, 15.0, 8.0, 11.0, 13.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.173828125, -3.056732177734375, -2.93963623046875, -2.822540283203125, -2.7054443359375, -2.588348388671875, -2.47125244140625, -2.354156494140625, -2.237060546875, -2.119964599609375, -2.00286865234375, -1.885772705078125, -1.7686767578125, -1.651580810546875, -1.53448486328125, -1.417388916015625, -1.30029296875, -1.183197021484375, -1.06610107421875, -0.949005126953125, -0.8319091796875, -0.714813232421875, -0.59771728515625, -0.480621337890625, -0.363525390625, -0.246429443359375, -0.12933349609375, -0.012237548828125, 0.1048583984375, 0.221954345703125, 0.33905029296875, 0.456146240234375, 0.5732421875, 0.690338134765625, 0.80743408203125, 0.924530029296875, 1.0416259765625, 1.158721923828125, 1.27581787109375, 1.392913818359375, 1.510009765625, 1.627105712890625, 1.74420166015625, 1.861297607421875, 1.9783935546875, 2.095489501953125, 2.21258544921875, 2.329681396484375, 2.44677734375, 2.563873291015625, 2.68096923828125, 2.798065185546875, 2.9151611328125, 3.032257080078125, 3.14935302734375, 3.266448974609375, 3.383544921875, 3.500640869140625, 3.61773681640625, 3.734832763671875, 3.8519287109375, 3.969024658203125, 4.08612060546875, 4.203216552734375, 4.3203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 9.0, 17.0, 31.0, 53.0, 87.0, 172.0, 412.0, 1173.0, 6321.0, 199505.0, 825101.0, 12858.0, 1851.0, 494.0, 213.0, 95.0, 57.0, 48.0, 16.0, 6.0, 13.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.5078125, -4.36761474609375, -4.2274169921875, -4.08721923828125, -3.947021484375, -3.80682373046875, -3.6666259765625, -3.52642822265625, -3.38623046875, -3.24603271484375, -3.1058349609375, -2.96563720703125, -2.825439453125, -2.68524169921875, -2.5450439453125, -2.40484619140625, -2.2646484375, -2.12445068359375, -1.9842529296875, -1.84405517578125, -1.703857421875, -1.56365966796875, -1.4234619140625, -1.28326416015625, -1.14306640625, -1.00286865234375, -0.8626708984375, -0.72247314453125, -0.582275390625, -0.44207763671875, -0.3018798828125, -0.16168212890625, -0.021484375, 0.11871337890625, 0.2589111328125, 0.39910888671875, 0.539306640625, 0.67950439453125, 0.8197021484375, 0.95989990234375, 1.10009765625, 1.24029541015625, 1.3804931640625, 1.52069091796875, 1.660888671875, 1.80108642578125, 1.9412841796875, 2.08148193359375, 2.2216796875, 2.36187744140625, 2.5020751953125, 2.64227294921875, 2.782470703125, 2.92266845703125, 3.0628662109375, 3.20306396484375, 3.34326171875, 3.48345947265625, 3.6236572265625, 3.76385498046875, 3.904052734375, 4.04425048828125, 4.1844482421875, 4.32464599609375, 4.46484375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 16.0, 27.0, 25.0, 43.0, 58.0, 83.0, 91.0, 136.0, 119.0, 100.0, 104.0, 66.0, 29.0, 30.0, 24.0, 16.0, 8.0, 8.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014734268188476562, -0.00013963505625724792, -0.00013192743062973022, -0.00012421980500221252, -0.00011651217937469482, -0.00010880455374717712, -0.00010109692811965942, -9.338930249214172e-05, -8.568167686462402e-05, -7.797405123710632e-05, -7.026642560958862e-05, -6.255879998207092e-05, -5.485117435455322e-05, -4.714354872703552e-05, -3.943592309951782e-05, -3.172829747200012e-05, -2.4020671844482422e-05, -1.631304621696472e-05, -8.605420589447021e-06, -8.977949619293213e-07, 6.809830665588379e-06, 1.4517456293106079e-05, 2.222508192062378e-05, 2.993270754814148e-05, 3.764033317565918e-05, 4.534795880317688e-05, 5.305558443069458e-05, 6.076321005821228e-05, 6.847083568572998e-05, 7.617846131324768e-05, 8.388608694076538e-05, 9.159371256828308e-05, 9.930133819580078e-05, 0.00010700896382331848, 0.00011471658945083618, 0.00012242421507835388, 0.00013013184070587158, 0.00013783946633338928, 0.00014554709196090698, 0.00015325471758842468, 0.00016096234321594238, 0.00016866996884346008, 0.00017637759447097778, 0.00018408522009849548, 0.00019179284572601318, 0.00019950047135353088, 0.00020720809698104858, 0.00021491572260856628, 0.00022262334823608398, 0.00023033097386360168, 0.00023803859949111938, 0.0002457462251186371, 0.0002534538507461548, 0.0002611614763736725, 0.0002688691020011902, 0.0002765767276287079, 0.0002842843532562256, 0.0002919919788837433, 0.000299699604511261, 0.0003074072301387787, 0.0003151148557662964, 0.0003228224813938141, 0.0003305301070213318, 0.0003382377326488495, 0.0003459453582763672]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 9.0, 10.0, 27.0, 41.0, 91.0, 221.0, 678.0, 2332.0, 12879.0, 325334.0, 681136.0, 21214.0, 3222.0, 845.0, 294.0, 102.0, 62.0, 24.0, 9.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.416015625, -3.31585693359375, -3.2156982421875, -3.11553955078125, -3.015380859375, -2.91522216796875, -2.8150634765625, -2.71490478515625, -2.61474609375, -2.51458740234375, -2.4144287109375, -2.31427001953125, -2.214111328125, -2.11395263671875, -2.0137939453125, -1.91363525390625, -1.8134765625, -1.71331787109375, -1.6131591796875, -1.51300048828125, -1.412841796875, -1.31268310546875, -1.2125244140625, -1.11236572265625, -1.01220703125, -0.91204833984375, -0.8118896484375, -0.71173095703125, -0.611572265625, -0.51141357421875, -0.4112548828125, -0.31109619140625, -0.2109375, -0.11077880859375, -0.0106201171875, 0.08953857421875, 0.189697265625, 0.28985595703125, 0.3900146484375, 0.49017333984375, 0.59033203125, 0.69049072265625, 0.7906494140625, 0.89080810546875, 0.990966796875, 1.09112548828125, 1.1912841796875, 1.29144287109375, 1.3916015625, 1.49176025390625, 1.5919189453125, 1.69207763671875, 1.792236328125, 1.89239501953125, 1.9925537109375, 2.09271240234375, 2.19287109375, 2.29302978515625, 2.3931884765625, 2.49334716796875, 2.593505859375, 2.69366455078125, 2.7938232421875, 2.89398193359375, 2.994140625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 4.0, 10.0, 6.0, 9.0, 20.0, 32.0, 85.0, 142.0, 204.0, 230.0, 118.0, 61.0, 31.0, 18.0, 7.0, 7.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.546875, -4.42962646484375, -4.3123779296875, -4.19512939453125, -4.077880859375, -3.96063232421875, -3.8433837890625, -3.72613525390625, -3.60888671875, -3.49163818359375, -3.3743896484375, -3.25714111328125, -3.139892578125, -3.02264404296875, -2.9053955078125, -2.78814697265625, -2.6708984375, -2.55364990234375, -2.4364013671875, -2.31915283203125, -2.201904296875, -2.08465576171875, -1.9674072265625, -1.85015869140625, -1.73291015625, -1.61566162109375, -1.4984130859375, -1.38116455078125, -1.263916015625, -1.14666748046875, -1.0294189453125, -0.91217041015625, -0.794921875, -0.67767333984375, -0.5604248046875, -0.44317626953125, -0.325927734375, -0.20867919921875, -0.0914306640625, 0.02581787109375, 0.14306640625, 0.26031494140625, 0.3775634765625, 0.49481201171875, 0.612060546875, 0.72930908203125, 0.8465576171875, 0.96380615234375, 1.0810546875, 1.19830322265625, 1.3155517578125, 1.43280029296875, 1.550048828125, 1.66729736328125, 1.7845458984375, 1.90179443359375, 2.01904296875, 2.13629150390625, 2.2535400390625, 2.37078857421875, 2.488037109375, 2.60528564453125, 2.7225341796875, 2.83978271484375, 2.95703125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 14.0, 28.0, 74.0, 170.0, 270.0, 231.0, 144.0, 60.0, 12.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.5616569519043, -31.949108123779297, -30.336559295654297, -28.724008560180664, -27.111459732055664, -25.498910903930664, -23.88636016845703, -22.27381134033203, -20.66126251220703, -19.04871368408203, -17.43616485595703, -15.823614120483398, -14.211065292358398, -12.598516464233398, -10.985966682434082, -9.373416900634766, -7.760868072509766, -6.148318767547607, -4.535769462585449, -2.923220157623291, -1.3106708526611328, 0.3018779754638672, 1.9144277572631836, 3.5269775390625, 5.1395263671875, 6.752075672149658, 8.364624977111816, 9.977174758911133, 11.589723587036133, 13.202272415161133, 14.81482219696045, 16.427371978759766, 18.03992462158203, 19.65247344970703, 21.26502227783203, 22.877573013305664, 24.490121841430664, 26.102670669555664, 27.715221405029297, 29.327770233154297, 30.940319061279297, 32.5528678894043, 34.1654167175293, 35.7779655456543, 37.39051818847656, 39.00306701660156, 40.61561584472656, 42.22816467285156, 43.84071350097656, 45.45326232910156, 47.06581115722656, 48.67835998535156, 50.29090881347656, 51.90345764160156, 53.51601028442383, 55.12855911254883, 56.74110794067383, 58.35365676879883, 59.96620559692383, 61.57875442504883, 63.191307067871094, 64.8038558959961, 66.4164047241211, 68.0289535522461, 69.6415023803711]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 0.0, 10.0, 9.0, 7.0, 10.0, 11.0, 17.0, 15.0, 19.0, 27.0, 25.0, 17.0, 27.0, 33.0, 44.0, 52.0, 44.0, 47.0, 39.0, 48.0, 60.0, 47.0, 57.0, 43.0, 29.0, 39.0, 28.0, 22.0, 24.0, 18.0, 21.0, 28.0, 18.0, 6.0, 12.0, 10.0, 7.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-17.513343811035156, -16.96009635925293, -16.40684700012207, -15.853599548339844, -15.300352096557617, -14.747103691101074, -14.193855285644531, -13.640607833862305, -13.087359428405762, -12.534111022949219, -11.980863571166992, -11.42761516571045, -10.874366760253906, -10.32111930847168, -9.767870903015137, -9.214622497558594, -8.661375045776367, -8.108126640319824, -7.554879188537598, -7.001630783081055, -6.44838285446167, -5.895134925842285, -5.341886520385742, -4.788638591766357, -4.235390663146973, -3.682142734527588, -3.128894567489624, -2.57564640045166, -2.0223984718322754, -1.4691505432128906, -0.9159023761749268, -0.3626542091369629, 0.19059371948242188, 0.7438417673110962, 1.2970898151397705, 1.8503378629684448, 2.403585910797119, 2.956833839416504, 3.5100820064544678, 4.063330173492432, 4.616578102111816, 5.169826030731201, 5.723073959350586, 6.276322364807129, 6.829570293426514, 7.382818222045898, 7.936066627502441, 8.489315032958984, 9.042562484741211, 9.595810890197754, 10.14905834197998, 10.702306747436523, 11.25555419921875, 11.808802604675293, 12.362051010131836, 12.915298461914062, 13.468546867370605, 14.021795272827148, 14.575042724609375, 15.128291130065918, 15.681539535522461, 16.234786987304688, 16.788034439086914, 17.341283798217773, 17.89453125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 15.0, 17.0, 36.0, 69.0, 151.0, 405.0, 1382.0, 7261.0, 4007031.0, 170849.0, 5407.0, 1052.0, 340.0, 128.0, 53.0, 34.0, 14.0, 8.0, 10.0, 1.0, 8.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.453125, -13.1536865234375, -12.854248046875, -12.5548095703125, -12.25537109375, -11.9559326171875, -11.656494140625, -11.3570556640625, -11.0576171875, -10.7581787109375, -10.458740234375, -10.1593017578125, -9.85986328125, -9.5604248046875, -9.260986328125, -8.9615478515625, -8.662109375, -8.3626708984375, -8.063232421875, -7.7637939453125, -7.46435546875, -7.1649169921875, -6.865478515625, -6.5660400390625, -6.2666015625, -5.9671630859375, -5.667724609375, -5.3682861328125, -5.06884765625, -4.7694091796875, -4.469970703125, -4.1705322265625, -3.87109375, -3.5716552734375, -3.272216796875, -2.9727783203125, -2.67333984375, -2.3739013671875, -2.074462890625, -1.7750244140625, -1.4755859375, -1.1761474609375, -0.876708984375, -0.5772705078125, -0.27783203125, 0.0216064453125, 0.321044921875, 0.6204833984375, 0.919921875, 1.2193603515625, 1.518798828125, 1.8182373046875, 2.11767578125, 2.4171142578125, 2.716552734375, 3.0159912109375, 3.3154296875, 3.6148681640625, 3.914306640625, 4.2137451171875, 4.51318359375, 4.8126220703125, 5.112060546875, 5.4114990234375, 5.7109375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 1.0, 4.0, 6.0, 9.0, 4.0, 7.0, 14.0, 23.0, 22.0, 27.0, 36.0, 31.0, 32.0, 57.0, 54.0, 42.0, 45.0, 56.0, 46.0, 53.0, 60.0, 54.0, 43.0, 43.0, 48.0, 33.0, 25.0, 22.0, 20.0, 11.0, 13.0, 8.0, 12.0, 7.0, 9.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.87548828125, -0.849853515625, -0.82421875, -0.798583984375, -0.77294921875, -0.747314453125, -0.7216796875, -0.696044921875, -0.67041015625, -0.644775390625, -0.619140625, -0.593505859375, -0.56787109375, -0.542236328125, -0.5166015625, -0.490966796875, -0.46533203125, -0.439697265625, -0.4140625, -0.388427734375, -0.36279296875, -0.337158203125, -0.3115234375, -0.285888671875, -0.26025390625, -0.234619140625, -0.208984375, -0.183349609375, -0.15771484375, -0.132080078125, -0.1064453125, -0.080810546875, -0.05517578125, -0.029541015625, -0.00390625, 0.021728515625, 0.04736328125, 0.072998046875, 0.0986328125, 0.124267578125, 0.14990234375, 0.175537109375, 0.201171875, 0.226806640625, 0.25244140625, 0.278076171875, 0.3037109375, 0.329345703125, 0.35498046875, 0.380615234375, 0.40625, 0.431884765625, 0.45751953125, 0.483154296875, 0.5087890625, 0.534423828125, 0.56005859375, 0.585693359375, 0.611328125, 0.636962890625, 0.66259765625, 0.688232421875, 0.7138671875, 0.739501953125, 0.76513671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 8.0, 10.0, 23.0, 19.0, 35.0, 53.0, 71.0, 99.0, 155.0, 220.0, 320.0, 536.0, 815.0, 1297.0, 2004.0, 3446.0, 6132.0, 12130.0, 32057.0, 140761.0, 3827171.0, 112899.0, 28401.0, 11456.0, 5677.0, 3157.0, 1838.0, 1246.0, 725.0, 506.0, 306.0, 203.0, 143.0, 114.0, 74.0, 56.0, 34.0, 32.0, 18.0, 9.0, 4.0, 10.0, 1.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.46875, -2.387664794921875, -2.30657958984375, -2.225494384765625, -2.1444091796875, -2.063323974609375, -1.98223876953125, -1.901153564453125, -1.820068359375, -1.738983154296875, -1.65789794921875, -1.576812744140625, -1.4957275390625, -1.414642333984375, -1.33355712890625, -1.252471923828125, -1.17138671875, -1.090301513671875, -1.00921630859375, -0.928131103515625, -0.8470458984375, -0.765960693359375, -0.68487548828125, -0.603790283203125, -0.522705078125, -0.441619873046875, -0.36053466796875, -0.279449462890625, -0.1983642578125, -0.117279052734375, -0.03619384765625, 0.044891357421875, 0.1259765625, 0.207061767578125, 0.28814697265625, 0.369232177734375, 0.4503173828125, 0.531402587890625, 0.61248779296875, 0.693572998046875, 0.774658203125, 0.855743408203125, 0.93682861328125, 1.017913818359375, 1.0989990234375, 1.180084228515625, 1.26116943359375, 1.342254638671875, 1.42333984375, 1.504425048828125, 1.58551025390625, 1.666595458984375, 1.7476806640625, 1.828765869140625, 1.90985107421875, 1.990936279296875, 2.072021484375, 2.153106689453125, 2.23419189453125, 2.315277099609375, 2.3963623046875, 2.477447509765625, 2.55853271484375, 2.639617919921875, 2.720703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 5.0, 7.0, 10.0, 11.0, 11.0, 16.0, 18.0, 37.0, 56.0, 156.0, 2979.0, 487.0, 105.0, 56.0, 34.0, 31.0, 15.0, 4.0, 8.0, 2.0, 7.0, 7.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.984375, -0.9576873779296875, -0.930999755859375, -0.9043121337890625, -0.87762451171875, -0.8509368896484375, -0.824249267578125, -0.7975616455078125, -0.7708740234375, -0.7441864013671875, -0.717498779296875, -0.6908111572265625, -0.66412353515625, -0.6374359130859375, -0.610748291015625, -0.5840606689453125, -0.557373046875, -0.5306854248046875, -0.503997802734375, -0.4773101806640625, -0.45062255859375, -0.4239349365234375, -0.397247314453125, -0.3705596923828125, -0.3438720703125, -0.3171844482421875, -0.290496826171875, -0.2638092041015625, -0.23712158203125, -0.2104339599609375, -0.183746337890625, -0.1570587158203125, -0.13037109375, -0.1036834716796875, -0.076995849609375, -0.0503082275390625, -0.02362060546875, 0.0030670166015625, 0.029754638671875, 0.0564422607421875, 0.0831298828125, 0.1098175048828125, 0.136505126953125, 0.1631927490234375, 0.18988037109375, 0.2165679931640625, 0.243255615234375, 0.2699432373046875, 0.296630859375, 0.3233184814453125, 0.350006103515625, 0.3766937255859375, 0.40338134765625, 0.4300689697265625, 0.456756591796875, 0.4834442138671875, 0.5101318359375, 0.5368194580078125, 0.563507080078125, 0.5901947021484375, 0.61688232421875, 0.6435699462890625, 0.670257568359375, 0.6969451904296875, 0.7236328125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 11.0, 17.0, 29.0, 39.0, 64.0, 102.0, 127.0, 147.0, 131.0, 107.0, 69.0, 60.0, 36.0, 36.0, 12.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.696760654449463, -6.558041572570801, -6.419322490692139, -6.280602931976318, -6.141883850097656, -6.003164768218994, -5.864445686340332, -5.72572660446167, -5.587007522583008, -5.448288440704346, -5.309569358825684, -5.170849800109863, -5.032130718231201, -4.893411636352539, -4.754692554473877, -4.615973472595215, -4.4772539138793945, -4.338534832000732, -4.19981575012207, -4.06109619140625, -3.922377109527588, -3.783658027648926, -3.6449389457702637, -3.5062198638916016, -3.3675005435943604, -3.2287814617156982, -3.090062141418457, -2.951343059539795, -2.812623977661133, -2.6739046573638916, -2.5351855754852295, -2.3964662551879883, -2.2577476501464844, -2.1190285682678223, -1.980309247970581, -1.841590166091919, -1.7028709650039673, -1.5641517639160156, -1.4254326820373535, -1.2867134809494019, -1.1479942798614502, -1.0092750787734985, -0.8705559372901917, -0.7318367958068848, -0.5931175947189331, -0.45439839363098145, -0.31567925214767456, -0.17696011066436768, -0.038240909576416016, 0.10047826170921326, 0.23919743299484253, 0.3779166042804718, 0.5166357755661011, 0.6553549766540527, 0.7940741181373596, 0.9327932596206665, 1.0715124607086182, 1.2102316617965698, 1.3489508628845215, 1.4876699447631836, 1.6263891458511353, 1.765108346939087, 1.903827428817749, 2.0425467491149902, 2.1812658309936523]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 11.0, 13.0, 12.0, 15.0, 21.0, 17.0, 25.0, 24.0, 34.0, 23.0, 38.0, 34.0, 48.0, 47.0, 49.0, 47.0, 55.0, 40.0, 47.0, 55.0, 41.0, 39.0, 39.0, 44.0, 22.0, 23.0, 23.0, 13.0, 15.0, 15.0, 14.0, 20.0, 11.0, 3.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8557887077331543, -1.7828123569488525, -1.7098360061645508, -1.636859655380249, -1.5638831853866577, -1.490906834602356, -1.4179304838180542, -1.344954013824463, -1.2719776630401611, -1.1990013122558594, -1.1260249614715576, -1.0530486106872559, -0.9800721406936646, -0.9070957899093628, -0.834119439125061, -0.7611430287361145, -0.6881667375564575, -0.6151903867721558, -0.5422139763832092, -0.46923762559890747, -0.3962612450122833, -0.3232848644256592, -0.2503085136413574, -0.1773321032524109, -0.10435575246810913, -0.03137937933206558, 0.041596993803977966, 0.11457335948944092, 0.18754974007606506, 0.2605261206626892, 0.33350247144699097, 0.4064788818359375, 0.47945523262023926, 0.552431583404541, 0.6254079937934875, 0.6983843445777893, 0.7713607549667358, 0.8443371057510376, 0.9173134565353394, 0.9902898669242859, 1.0632662773132324, 1.1362426280975342, 1.209218978881836, 1.2821953296661377, 1.355171799659729, 1.4281481504440308, 1.5011245012283325, 1.5741009712219238, 1.647077202796936, 1.7200535535812378, 1.7930299043655396, 1.8660063743591309, 1.9389827251434326, 2.0119590759277344, 2.084935426712036, 2.157911777496338, 2.2308881282806396, 2.3038644790649414, 2.376840829849243, 2.449817180633545, 2.5227935314178467, 2.5957698822021484, 2.6687464714050293, 2.741722822189331, 2.814699172973633]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 4.0, 17.0, 12.0, 17.0, 22.0, 25.0, 58.0, 146.0, 256.0, 681.0, 1589.0, 4692.0, 15615.0, 61018.0, 257586.0, 470802.0, 177988.0, 41372.0, 10917.0, 3424.0, 1258.0, 582.0, 236.0, 96.0, 62.0, 34.0, 10.0, 14.0, 9.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.751953125, -2.658233642578125, -2.56451416015625, -2.470794677734375, -2.3770751953125, -2.283355712890625, -2.18963623046875, -2.095916748046875, -2.002197265625, -1.908477783203125, -1.81475830078125, -1.721038818359375, -1.6273193359375, -1.533599853515625, -1.43988037109375, -1.346160888671875, -1.25244140625, -1.158721923828125, -1.06500244140625, -0.971282958984375, -0.8775634765625, -0.783843994140625, -0.69012451171875, -0.596405029296875, -0.502685546875, -0.408966064453125, -0.31524658203125, -0.221527099609375, -0.1278076171875, -0.034088134765625, 0.05963134765625, 0.153350830078125, 0.2470703125, 0.340789794921875, 0.43450927734375, 0.528228759765625, 0.6219482421875, 0.715667724609375, 0.80938720703125, 0.903106689453125, 0.996826171875, 1.090545654296875, 1.18426513671875, 1.277984619140625, 1.3717041015625, 1.465423583984375, 1.55914306640625, 1.652862548828125, 1.74658203125, 1.840301513671875, 1.93402099609375, 2.027740478515625, 2.1214599609375, 2.215179443359375, 2.30889892578125, 2.402618408203125, 2.496337890625, 2.590057373046875, 2.68377685546875, 2.777496337890625, 2.8712158203125, 2.964935302734375, 3.05865478515625, 3.152374267578125, 3.24609375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 10.0, 11.0, 9.0, 11.0, 11.0, 22.0, 20.0, 26.0, 34.0, 42.0, 26.0, 49.0, 47.0, 56.0, 53.0, 51.0, 48.0, 38.0, 61.0, 61.0, 44.0, 50.0, 36.0, 36.0, 36.0, 27.0, 13.0, 7.0, 10.0, 13.0, 7.0, 10.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.95166015625, -0.924560546875, -0.8974609375, -0.870361328125, -0.84326171875, -0.816162109375, -0.7890625, -0.761962890625, -0.73486328125, -0.707763671875, -0.6806640625, -0.653564453125, -0.62646484375, -0.599365234375, -0.572265625, -0.545166015625, -0.51806640625, -0.490966796875, -0.4638671875, -0.436767578125, -0.40966796875, -0.382568359375, -0.35546875, -0.328369140625, -0.30126953125, -0.274169921875, -0.2470703125, -0.219970703125, -0.19287109375, -0.165771484375, -0.138671875, -0.111572265625, -0.08447265625, -0.057373046875, -0.0302734375, -0.003173828125, 0.02392578125, 0.051025390625, 0.078125, 0.105224609375, 0.13232421875, 0.159423828125, 0.1865234375, 0.213623046875, 0.24072265625, 0.267822265625, 0.294921875, 0.322021484375, 0.34912109375, 0.376220703125, 0.4033203125, 0.430419921875, 0.45751953125, 0.484619140625, 0.51171875, 0.538818359375, 0.56591796875, 0.593017578125, 0.6201171875, 0.647216796875, 0.67431640625, 0.701416015625, 0.728515625, 0.755615234375, 0.78271484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 15.0, 23.0, 20.0, 59.0, 86.0, 168.0, 326.0, 798.0, 2198.0, 7265.0, 33364.0, 225980.0, 622885.0, 126617.0, 20822.0, 5080.0, 1557.0, 636.0, 266.0, 158.0, 78.0, 40.0, 31.0, 13.0, 8.0, 10.0, 14.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.103546142578125, -3.98052978515625, -3.857513427734375, -3.7344970703125, -3.611480712890625, -3.48846435546875, -3.365447998046875, -3.242431640625, -3.119415283203125, -2.99639892578125, -2.873382568359375, -2.7503662109375, -2.627349853515625, -2.50433349609375, -2.381317138671875, -2.25830078125, -2.135284423828125, -2.01226806640625, -1.889251708984375, -1.7662353515625, -1.643218994140625, -1.52020263671875, -1.397186279296875, -1.274169921875, -1.151153564453125, -1.02813720703125, -0.905120849609375, -0.7821044921875, -0.659088134765625, -0.53607177734375, -0.413055419921875, -0.2900390625, -0.167022705078125, -0.04400634765625, 0.079010009765625, 0.2020263671875, 0.325042724609375, 0.44805908203125, 0.571075439453125, 0.694091796875, 0.817108154296875, 0.94012451171875, 1.063140869140625, 1.1861572265625, 1.309173583984375, 1.43218994140625, 1.555206298828125, 1.67822265625, 1.801239013671875, 1.92425537109375, 2.047271728515625, 2.1702880859375, 2.293304443359375, 2.41632080078125, 2.539337158203125, 2.662353515625, 2.785369873046875, 2.90838623046875, 3.031402587890625, 3.1544189453125, 3.277435302734375, 3.40045166015625, 3.523468017578125, 3.646484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 5.0, 9.0, 12.0, 14.0, 30.0, 25.0, 35.0, 30.0, 44.0, 55.0, 64.0, 65.0, 63.0, 67.0, 60.0, 56.0, 68.0, 59.0, 48.0, 38.0, 37.0, 28.0, 21.0, 21.0, 16.0, 4.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.6973876953125, -5.515869140625, -5.3343505859375, -5.15283203125, -4.9713134765625, -4.789794921875, -4.6082763671875, -4.4267578125, -4.2452392578125, -4.063720703125, -3.8822021484375, -3.70068359375, -3.5191650390625, -3.337646484375, -3.1561279296875, -2.974609375, -2.7930908203125, -2.611572265625, -2.4300537109375, -2.24853515625, -2.0670166015625, -1.885498046875, -1.7039794921875, -1.5224609375, -1.3409423828125, -1.159423828125, -0.9779052734375, -0.79638671875, -0.6148681640625, -0.433349609375, -0.2518310546875, -0.0703125, 0.1112060546875, 0.292724609375, 0.4742431640625, 0.65576171875, 0.8372802734375, 1.018798828125, 1.2003173828125, 1.3818359375, 1.5633544921875, 1.744873046875, 1.9263916015625, 2.10791015625, 2.2894287109375, 2.470947265625, 2.6524658203125, 2.833984375, 3.0155029296875, 3.197021484375, 3.3785400390625, 3.56005859375, 3.7415771484375, 3.923095703125, 4.1046142578125, 4.2861328125, 4.4676513671875, 4.649169921875, 4.8306884765625, 5.01220703125, 5.1937255859375, 5.375244140625, 5.5567626953125, 5.73828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 16.0, 29.0, 44.0, 98.0, 237.0, 777.0, 6991.0, 667853.0, 366382.0, 5068.0, 673.0, 197.0, 84.0, 50.0, 33.0, 5.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.52734375, -7.35205078125, -7.1767578125, -7.00146484375, -6.826171875, -6.65087890625, -6.4755859375, -6.30029296875, -6.125, -5.94970703125, -5.7744140625, -5.59912109375, -5.423828125, -5.24853515625, -5.0732421875, -4.89794921875, -4.72265625, -4.54736328125, -4.3720703125, -4.19677734375, -4.021484375, -3.84619140625, -3.6708984375, -3.49560546875, -3.3203125, -3.14501953125, -2.9697265625, -2.79443359375, -2.619140625, -2.44384765625, -2.2685546875, -2.09326171875, -1.91796875, -1.74267578125, -1.5673828125, -1.39208984375, -1.216796875, -1.04150390625, -0.8662109375, -0.69091796875, -0.515625, -0.34033203125, -0.1650390625, 0.01025390625, 0.185546875, 0.36083984375, 0.5361328125, 0.71142578125, 0.88671875, 1.06201171875, 1.2373046875, 1.41259765625, 1.587890625, 1.76318359375, 1.9384765625, 2.11376953125, 2.2890625, 2.46435546875, 2.6396484375, 2.81494140625, 2.990234375, 3.16552734375, 3.3408203125, 3.51611328125, 3.69140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 13.0, 15.0, 13.0, 22.0, 28.0, 55.0, 79.0, 98.0, 129.0, 136.0, 102.0, 86.0, 79.0, 45.0, 36.0, 20.0, 12.0, 8.0, 12.0, 5.0, 1.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002484321594238281, -0.00023790448904037476, -0.0002273768186569214, -0.00021684914827346802, -0.00020632147789001465, -0.00019579380750656128, -0.0001852661371231079, -0.00017473846673965454, -0.00016421079635620117, -0.0001536831259727478, -0.00014315545558929443, -0.00013262778520584106, -0.0001221001148223877, -0.00011157244443893433, -0.00010104477405548096, -9.051710367202759e-05, -7.998943328857422e-05, -6.946176290512085e-05, -5.893409252166748e-05, -4.840642213821411e-05, -3.787875175476074e-05, -2.7351081371307373e-05, -1.6823410987854004e-05, -6.295740604400635e-06, 4.231929779052734e-06, 1.4759600162506104e-05, 2.5287270545959473e-05, 3.581494092941284e-05, 4.634261131286621e-05, 5.687028169631958e-05, 6.739795207977295e-05, 7.792562246322632e-05, 8.845329284667969e-05, 9.898096323013306e-05, 0.00010950863361358643, 0.0001200363039970398, 0.00013056397438049316, 0.00014109164476394653, 0.0001516193151473999, 0.00016214698553085327, 0.00017267465591430664, 0.00018320232629776, 0.00019372999668121338, 0.00020425766706466675, 0.00021478533744812012, 0.00022531300783157349, 0.00023584067821502686, 0.0002463683485984802, 0.0002568960189819336, 0.00026742368936538696, 0.00027795135974884033, 0.0002884790301322937, 0.00029900670051574707, 0.00030953437089920044, 0.0003200620412826538, 0.0003305897116661072, 0.00034111738204956055, 0.0003516450524330139, 0.0003621727228164673, 0.00037270039319992065, 0.000383228063583374, 0.0003937557339668274, 0.00040428340435028076, 0.00041481107473373413, 0.0004253387451171875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 12.0, 18.0, 36.0, 77.0, 122.0, 241.0, 808.0, 7681.0, 764613.0, 269840.0, 4062.0, 619.0, 221.0, 88.0, 52.0, 22.0, 22.0, 9.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2734375, -5.10272216796875, -4.9320068359375, -4.76129150390625, -4.590576171875, -4.41986083984375, -4.2491455078125, -4.07843017578125, -3.90771484375, -3.73699951171875, -3.5662841796875, -3.39556884765625, -3.224853515625, -3.05413818359375, -2.8834228515625, -2.71270751953125, -2.5419921875, -2.37127685546875, -2.2005615234375, -2.02984619140625, -1.859130859375, -1.68841552734375, -1.5177001953125, -1.34698486328125, -1.17626953125, -1.00555419921875, -0.8348388671875, -0.66412353515625, -0.493408203125, -0.32269287109375, -0.1519775390625, 0.01873779296875, 0.189453125, 0.36016845703125, 0.5308837890625, 0.70159912109375, 0.872314453125, 1.04302978515625, 1.2137451171875, 1.38446044921875, 1.55517578125, 1.72589111328125, 1.8966064453125, 2.06732177734375, 2.238037109375, 2.40875244140625, 2.5794677734375, 2.75018310546875, 2.9208984375, 3.09161376953125, 3.2623291015625, 3.43304443359375, 3.603759765625, 3.77447509765625, 3.9451904296875, 4.11590576171875, 4.28662109375, 4.45733642578125, 4.6280517578125, 4.79876708984375, 4.969482421875, 5.14019775390625, 5.3109130859375, 5.48162841796875, 5.65234375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 22.0, 45.0, 121.0, 219.0, 258.0, 191.0, 77.0, 33.0, 16.0, 8.0, 8.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.814453125, -1.637542724609375, -1.46063232421875, -1.283721923828125, -1.1068115234375, -0.929901123046875, -0.75299072265625, -0.576080322265625, -0.399169921875, -0.222259521484375, -0.04534912109375, 0.131561279296875, 0.3084716796875, 0.485382080078125, 0.66229248046875, 0.839202880859375, 1.01611328125, 1.193023681640625, 1.36993408203125, 1.546844482421875, 1.7237548828125, 1.900665283203125, 2.07757568359375, 2.254486083984375, 2.431396484375, 2.608306884765625, 2.78521728515625, 2.962127685546875, 3.1390380859375, 3.315948486328125, 3.49285888671875, 3.669769287109375, 3.8466796875, 4.023590087890625, 4.20050048828125, 4.377410888671875, 4.5543212890625, 4.731231689453125, 4.90814208984375, 5.085052490234375, 5.261962890625, 5.438873291015625, 5.61578369140625, 5.792694091796875, 5.9696044921875, 6.146514892578125, 6.32342529296875, 6.500335693359375, 6.67724609375, 6.854156494140625, 7.03106689453125, 7.207977294921875, 7.3848876953125, 7.561798095703125, 7.73870849609375, 7.915618896484375, 8.092529296875, 8.269439697265625, 8.44635009765625, 8.623260498046875, 8.8001708984375, 8.977081298828125, 9.15399169921875, 9.330902099609375, 9.5078125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 10.0, 20.0, 50.0, 103.0, 186.0, 228.0, 183.0, 120.0, 50.0, 25.0, 10.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.940765380859375, -56.25018310546875, -54.55960464477539, -52.869022369384766, -51.178443908691406, -49.48786163330078, -47.797279357910156, -46.10669708251953, -44.41611862182617, -42.72553634643555, -41.03495788574219, -39.34437561035156, -37.65379333496094, -35.96321487426758, -34.27263259887695, -32.582054138183594, -30.89147186279297, -29.200891494750977, -27.510311126708984, -25.81972885131836, -24.129148483276367, -22.438568115234375, -20.74798583984375, -19.057405471801758, -17.366825103759766, -15.676244735717773, -13.985663414001465, -12.295082092285156, -10.604501724243164, -8.913921356201172, -7.223340034484863, -5.532758712768555, -3.8421783447265625, -2.151597499847412, -0.4610166549682617, 1.2295641899108887, 2.920145034790039, 4.610725402832031, 6.30130672454834, 7.991888046264648, 9.68246841430664, 11.373048782348633, 13.063630104064941, 14.75421142578125, 16.444791793823242, 18.135372161865234, 19.82595443725586, 21.51653480529785, 23.207115173339844, 24.897695541381836, 26.588275909423828, 28.278858184814453, 29.969438552856445, 31.660018920898438, 33.35060119628906, 35.04118347167969, 36.73176193237305, 38.42234420776367, 40.11292266845703, 41.803504943847656, 43.49408721923828, 45.18466567993164, 46.875247955322266, 48.565826416015625, 50.25640869140625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 4.0, 4.0, 10.0, 11.0, 14.0, 15.0, 16.0, 23.0, 14.0, 39.0, 36.0, 46.0, 54.0, 45.0, 42.0, 58.0, 47.0, 66.0, 64.0, 63.0, 46.0, 50.0, 37.0, 38.0, 32.0, 20.0, 24.0, 20.0, 13.0, 17.0, 9.0, 14.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.285371780395508, -25.575790405273438, -24.866209030151367, -24.156627655029297, -23.447046279907227, -22.737464904785156, -22.027883529663086, -21.318302154541016, -20.608720779418945, -19.899139404296875, -19.189558029174805, -18.479976654052734, -17.770395278930664, -17.060813903808594, -16.351232528686523, -15.641651153564453, -14.932069778442383, -14.222488403320312, -13.512907028198242, -12.803325653076172, -12.093744277954102, -11.384162902832031, -10.674581527709961, -9.96500015258789, -9.25541877746582, -8.54583740234375, -7.83625602722168, -7.126674652099609, -6.417093276977539, -5.707511901855469, -4.997930526733398, -4.288349151611328, -3.5787696838378906, -2.8691883087158203, -2.15960693359375, -1.4500255584716797, -0.7404441833496094, -0.030862808227539062, 0.6787185668945312, 1.3882999420166016, 2.097881317138672, 2.807462692260742, 3.5170440673828125, 4.226625442504883, 4.936206817626953, 5.645788192749023, 6.355369567871094, 7.064950942993164, 7.774532318115234, 8.484113693237305, 9.193695068359375, 9.903276443481445, 10.612857818603516, 11.322439193725586, 12.032020568847656, 12.741601943969727, 13.451183319091797, 14.160764694213867, 14.870346069335938, 15.579927444458008, 16.289508819580078, 16.99909019470215, 17.70867156982422, 18.41825294494629, 19.12783432006836]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 0.0, 4.0, 12.0, 7.0, 19.0, 14.0, 30.0, 72.0, 140.0, 309.0, 752.0, 2063.0, 9281.0, 4119988.0, 54457.0, 4836.0, 1347.0, 505.0, 210.0, 86.0, 56.0, 27.0, 23.0, 16.0, 9.0, 9.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -12.0096435546875, -11.683349609375, -11.3570556640625, -11.03076171875, -10.7044677734375, -10.378173828125, -10.0518798828125, -9.7255859375, -9.3992919921875, -9.072998046875, -8.7467041015625, -8.42041015625, -8.0941162109375, -7.767822265625, -7.4415283203125, -7.115234375, -6.7889404296875, -6.462646484375, -6.1363525390625, -5.81005859375, -5.4837646484375, -5.157470703125, -4.8311767578125, -4.5048828125, -4.1785888671875, -3.852294921875, -3.5260009765625, -3.19970703125, -2.8734130859375, -2.547119140625, -2.2208251953125, -1.89453125, -1.5682373046875, -1.241943359375, -0.9156494140625, -0.58935546875, -0.2630615234375, 0.063232421875, 0.3895263671875, 0.7158203125, 1.0421142578125, 1.368408203125, 1.6947021484375, 2.02099609375, 2.3472900390625, 2.673583984375, 2.9998779296875, 3.326171875, 3.6524658203125, 3.978759765625, 4.3050537109375, 4.63134765625, 4.9576416015625, 5.283935546875, 5.6102294921875, 5.9365234375, 6.2628173828125, 6.589111328125, 6.9154052734375, 7.24169921875, 7.5679931640625, 7.894287109375, 8.2205810546875, 8.546875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 4.0, 14.0, 13.0, 20.0, 24.0, 21.0, 33.0, 25.0, 53.0, 52.0, 48.0, 67.0, 58.0, 70.0, 71.0, 68.0, 66.0, 46.0, 48.0, 28.0, 32.0, 22.0, 22.0, 18.0, 12.0, 15.0, 7.0, 4.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.154296875, -1.1186676025390625, -1.083038330078125, -1.0474090576171875, -1.01177978515625, -0.9761505126953125, -0.940521240234375, -0.9048919677734375, -0.8692626953125, -0.8336334228515625, -0.798004150390625, -0.7623748779296875, -0.72674560546875, -0.6911163330078125, -0.655487060546875, -0.6198577880859375, -0.584228515625, -0.5485992431640625, -0.512969970703125, -0.4773406982421875, -0.44171142578125, -0.4060821533203125, -0.370452880859375, -0.3348236083984375, -0.2991943359375, -0.2635650634765625, -0.227935791015625, -0.1923065185546875, -0.15667724609375, -0.1210479736328125, -0.085418701171875, -0.0497894287109375, -0.01416015625, 0.0214691162109375, 0.057098388671875, 0.0927276611328125, 0.12835693359375, 0.1639862060546875, 0.199615478515625, 0.2352447509765625, 0.2708740234375, 0.3065032958984375, 0.342132568359375, 0.3777618408203125, 0.41339111328125, 0.4490203857421875, 0.484649658203125, 0.5202789306640625, 0.555908203125, 0.5915374755859375, 0.627166748046875, 0.6627960205078125, 0.69842529296875, 0.7340545654296875, 0.769683837890625, 0.8053131103515625, 0.8409423828125, 0.8765716552734375, 0.912200927734375, 0.9478302001953125, 0.98345947265625, 1.0190887451171875, 1.054718017578125, 1.0903472900390625, 1.1259765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 10.0, 10.0, 7.0, 11.0, 16.0, 31.0, 27.0, 45.0, 55.0, 68.0, 114.0, 169.0, 249.0, 512.0, 1347.0, 4498.0, 22864.0, 4058779.0, 90962.0, 10051.0, 2483.0, 889.0, 422.0, 198.0, 105.0, 96.0, 69.0, 43.0, 42.0, 32.0, 23.0, 12.0, 17.0, 9.0, 3.0, 4.0, 0.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.17578125, -6.93475341796875, -6.6937255859375, -6.45269775390625, -6.211669921875, -5.97064208984375, -5.7296142578125, -5.48858642578125, -5.24755859375, -5.00653076171875, -4.7655029296875, -4.52447509765625, -4.283447265625, -4.04241943359375, -3.8013916015625, -3.56036376953125, -3.3193359375, -3.07830810546875, -2.8372802734375, -2.59625244140625, -2.355224609375, -2.11419677734375, -1.8731689453125, -1.63214111328125, -1.39111328125, -1.15008544921875, -0.9090576171875, -0.66802978515625, -0.427001953125, -0.18597412109375, 0.0550537109375, 0.29608154296875, 0.537109375, 0.77813720703125, 1.0191650390625, 1.26019287109375, 1.501220703125, 1.74224853515625, 1.9832763671875, 2.22430419921875, 2.46533203125, 2.70635986328125, 2.9473876953125, 3.18841552734375, 3.429443359375, 3.67047119140625, 3.9114990234375, 4.15252685546875, 4.3935546875, 4.63458251953125, 4.8756103515625, 5.11663818359375, 5.357666015625, 5.59869384765625, 5.8397216796875, 6.08074951171875, 6.32177734375, 6.56280517578125, 6.8038330078125, 7.04486083984375, 7.285888671875, 7.52691650390625, 7.7679443359375, 8.00897216796875, 8.25]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 7.0, 6.0, 20.0, 34.0, 74.0, 3641.0, 197.0, 48.0, 19.0, 14.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6650390625, -1.6029510498046875, -1.540863037109375, -1.4787750244140625, -1.41668701171875, -1.3545989990234375, -1.292510986328125, -1.2304229736328125, -1.1683349609375, -1.1062469482421875, -1.044158935546875, -0.9820709228515625, -0.91998291015625, -0.8578948974609375, -0.795806884765625, -0.7337188720703125, -0.671630859375, -0.6095428466796875, -0.547454833984375, -0.4853668212890625, -0.42327880859375, -0.3611907958984375, -0.299102783203125, -0.2370147705078125, -0.1749267578125, -0.1128387451171875, -0.050750732421875, 0.0113372802734375, 0.07342529296875, 0.1355133056640625, 0.197601318359375, 0.2596893310546875, 0.32177734375, 0.3838653564453125, 0.445953369140625, 0.5080413818359375, 0.57012939453125, 0.6322174072265625, 0.694305419921875, 0.7563934326171875, 0.8184814453125, 0.8805694580078125, 0.942657470703125, 1.0047454833984375, 1.06683349609375, 1.1289215087890625, 1.191009521484375, 1.2530975341796875, 1.315185546875, 1.3772735595703125, 1.439361572265625, 1.5014495849609375, 1.56353759765625, 1.6256256103515625, 1.687713623046875, 1.7498016357421875, 1.8118896484375, 1.8739776611328125, 1.936065673828125, 1.9981536865234375, 2.06024169921875, 2.1223297119140625, 2.184417724609375, 2.2465057373046875, 2.30859375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 7.0, 4.0, 12.0, 13.0, 17.0, 24.0, 32.0, 38.0, 41.0, 57.0, 79.0, 68.0, 65.0, 73.0, 94.0, 68.0, 68.0, 59.0, 51.0, 35.0, 23.0, 14.0, 18.0, 9.0, 11.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.427734375, -3.3411476612091064, -3.254560947418213, -3.1679739952087402, -3.0813872814178467, -2.994800567626953, -2.9082138538360596, -2.821627140045166, -2.7350401878356934, -2.6484534740448, -2.5618667602539062, -2.4752798080444336, -2.38869309425354, -2.3021063804626465, -2.215519666671753, -2.1289329528808594, -2.0423460006713867, -1.9557592868804932, -1.86917245388031, -1.7825857400894165, -1.6959989070892334, -1.6094121932983398, -1.5228254795074463, -1.4362386465072632, -1.3496520519256592, -1.2630653381347656, -1.1764785051345825, -1.089891791343689, -1.0033049583435059, -0.9167182445526123, -0.830131471157074, -0.7435446977615356, -0.6569578647613525, -0.5703710913658142, -0.4837843179702759, -0.39719757437705994, -0.3106108009815216, -0.22402402758598328, -0.13743728399276733, -0.050850510597229004, 0.035736262798309326, 0.12232302874326706, 0.2089097946882248, 0.29549655318260193, 0.38208332657814026, 0.4686700999736786, 0.5552568435668945, 0.6418436169624329, 0.7284303903579712, 0.8150171637535095, 0.9016039371490479, 0.9881906509399414, 1.0747774839401245, 1.161364197731018, 1.2479510307312012, 1.3345377445220947, 1.4211244583129883, 1.5077111721038818, 1.594298005104065, 1.6808847188949585, 1.7674715518951416, 1.8540582656860352, 1.9406449794769287, 2.0272316932678223, 2.113818645477295]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 13.0, 13.0, 6.0, 12.0, 13.0, 15.0, 18.0, 22.0, 21.0, 33.0, 33.0, 40.0, 34.0, 38.0, 39.0, 42.0, 57.0, 49.0, 39.0, 38.0, 32.0, 42.0, 32.0, 44.0, 30.0, 28.0, 34.0, 21.0, 24.0, 20.0, 15.0, 18.0, 12.0, 18.0, 5.0, 12.0, 11.0, 3.0, 2.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.3478598594665527, -2.2728610038757324, -2.197861909866333, -2.1228628158569336, -2.0478639602661133, -1.9728649854660034, -1.8978660106658936, -1.8228670358657837, -1.7478680610656738, -1.672869086265564, -1.597870111465454, -1.5228711366653442, -1.4478721618652344, -1.3728731870651245, -1.2978742122650146, -1.2228752374649048, -1.147876262664795, -1.072877287864685, -0.9978783130645752, -0.9228793382644653, -0.8478803634643555, -0.7728813886642456, -0.6978824138641357, -0.6228834390640259, -0.547884464263916, -0.47288548946380615, -0.3978865146636963, -0.3228875398635864, -0.24788856506347656, -0.1728895902633667, -0.09789061546325684, -0.022891640663146973, 0.05210709571838379, 0.12710607051849365, 0.20210504531860352, 0.2771040201187134, 0.35210299491882324, 0.4271019697189331, 0.502100944519043, 0.5770999193191528, 0.6520988941192627, 0.7270978689193726, 0.8020968437194824, 0.8770958185195923, 0.9520947933197021, 1.027093768119812, 1.1020927429199219, 1.1770917177200317, 1.2520906925201416, 1.3270896673202515, 1.4020886421203613, 1.4770876169204712, 1.552086591720581, 1.627085566520691, 1.7020845413208008, 1.7770835161209106, 1.8520824909210205, 1.9270814657211304, 2.0020804405212402, 2.0770792961120605, 2.15207839012146, 2.2270774841308594, 2.3020763397216797, 2.3770751953125, 2.4520742893218994]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 1.0, 8.0, 6.0, 7.0, 7.0, 19.0, 24.0, 33.0, 64.0, 88.0, 157.0, 289.0, 590.0, 1078.0, 2492.0, 5797.0, 15155.0, 45330.0, 148427.0, 386642.0, 297648.0, 96095.0, 30043.0, 10500.0, 4199.0, 1877.0, 892.0, 481.0, 236.0, 138.0, 75.0, 60.0, 28.0, 25.0, 11.0, 13.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-3.119140625, -3.034423828125, -2.94970703125, -2.864990234375, -2.7802734375, -2.695556640625, -2.61083984375, -2.526123046875, -2.44140625, -2.356689453125, -2.27197265625, -2.187255859375, -2.1025390625, -2.017822265625, -1.93310546875, -1.848388671875, -1.763671875, -1.678955078125, -1.59423828125, -1.509521484375, -1.4248046875, -1.340087890625, -1.25537109375, -1.170654296875, -1.0859375, -1.001220703125, -0.91650390625, -0.831787109375, -0.7470703125, -0.662353515625, -0.57763671875, -0.492919921875, -0.408203125, -0.323486328125, -0.23876953125, -0.154052734375, -0.0693359375, 0.015380859375, 0.10009765625, 0.184814453125, 0.26953125, 0.354248046875, 0.43896484375, 0.523681640625, 0.6083984375, 0.693115234375, 0.77783203125, 0.862548828125, 0.947265625, 1.031982421875, 1.11669921875, 1.201416015625, 1.2861328125, 1.370849609375, 1.45556640625, 1.540283203125, 1.625, 1.709716796875, 1.79443359375, 1.879150390625, 1.9638671875, 2.048583984375, 2.13330078125, 2.218017578125, 2.302734375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 4.0, 8.0, 3.0, 3.0, 11.0, 16.0, 20.0, 11.0, 18.0, 18.0, 31.0, 32.0, 36.0, 36.0, 51.0, 48.0, 55.0, 54.0, 56.0, 54.0, 54.0, 50.0, 48.0, 40.0, 35.0, 41.0, 28.0, 30.0, 23.0, 13.0, 13.0, 10.0, 9.0, 11.0, 4.0, 2.0, 7.0, 1.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.203125, -1.168212890625, -1.13330078125, -1.098388671875, -1.0634765625, -1.028564453125, -0.99365234375, -0.958740234375, -0.923828125, -0.888916015625, -0.85400390625, -0.819091796875, -0.7841796875, -0.749267578125, -0.71435546875, -0.679443359375, -0.64453125, -0.609619140625, -0.57470703125, -0.539794921875, -0.5048828125, -0.469970703125, -0.43505859375, -0.400146484375, -0.365234375, -0.330322265625, -0.29541015625, -0.260498046875, -0.2255859375, -0.190673828125, -0.15576171875, -0.120849609375, -0.0859375, -0.051025390625, -0.01611328125, 0.018798828125, 0.0537109375, 0.088623046875, 0.12353515625, 0.158447265625, 0.193359375, 0.228271484375, 0.26318359375, 0.298095703125, 0.3330078125, 0.367919921875, 0.40283203125, 0.437744140625, 0.47265625, 0.507568359375, 0.54248046875, 0.577392578125, 0.6123046875, 0.647216796875, 0.68212890625, 0.717041015625, 0.751953125, 0.786865234375, 0.82177734375, 0.856689453125, 0.8916015625, 0.926513671875, 0.96142578125, 0.996337890625, 1.03125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 5.0, 11.0, 23.0, 28.0, 37.0, 55.0, 116.0, 212.0, 400.0, 859.0, 2287.0, 8027.0, 40721.0, 334975.0, 570693.0, 72603.0, 12197.0, 3192.0, 1084.0, 486.0, 231.0, 121.0, 64.0, 30.0, 29.0, 20.0, 13.0, 7.0, 3.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.10418701171875, -3.9583740234375, -3.81256103515625, -3.666748046875, -3.52093505859375, -3.3751220703125, -3.22930908203125, -3.08349609375, -2.93768310546875, -2.7918701171875, -2.64605712890625, -2.500244140625, -2.35443115234375, -2.2086181640625, -2.06280517578125, -1.9169921875, -1.77117919921875, -1.6253662109375, -1.47955322265625, -1.333740234375, -1.18792724609375, -1.0421142578125, -0.89630126953125, -0.75048828125, -0.60467529296875, -0.4588623046875, -0.31304931640625, -0.167236328125, -0.02142333984375, 0.1243896484375, 0.27020263671875, 0.416015625, 0.56182861328125, 0.7076416015625, 0.85345458984375, 0.999267578125, 1.14508056640625, 1.2908935546875, 1.43670654296875, 1.58251953125, 1.72833251953125, 1.8741455078125, 2.01995849609375, 2.165771484375, 2.31158447265625, 2.4573974609375, 2.60321044921875, 2.7490234375, 2.89483642578125, 3.0406494140625, 3.18646240234375, 3.332275390625, 3.47808837890625, 3.6239013671875, 3.76971435546875, 3.91552734375, 4.06134033203125, 4.2071533203125, 4.35296630859375, 4.498779296875, 4.64459228515625, 4.7904052734375, 4.93621826171875, 5.08203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 8.0, 18.0, 19.0, 23.0, 26.0, 36.0, 44.0, 46.0, 46.0, 51.0, 62.0, 58.0, 57.0, 58.0, 54.0, 50.0, 64.0, 46.0, 43.0, 32.0, 37.0, 28.0, 25.0, 19.0, 13.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6796875, -6.4505615234375, -6.221435546875, -5.9923095703125, -5.76318359375, -5.5340576171875, -5.304931640625, -5.0758056640625, -4.8466796875, -4.6175537109375, -4.388427734375, -4.1593017578125, -3.93017578125, -3.7010498046875, -3.471923828125, -3.2427978515625, -3.013671875, -2.7845458984375, -2.555419921875, -2.3262939453125, -2.09716796875, -1.8680419921875, -1.638916015625, -1.4097900390625, -1.1806640625, -0.9515380859375, -0.722412109375, -0.4932861328125, -0.26416015625, -0.0350341796875, 0.194091796875, 0.4232177734375, 0.65234375, 0.8814697265625, 1.110595703125, 1.3397216796875, 1.56884765625, 1.7979736328125, 2.027099609375, 2.2562255859375, 2.4853515625, 2.7144775390625, 2.943603515625, 3.1727294921875, 3.40185546875, 3.6309814453125, 3.860107421875, 4.0892333984375, 4.318359375, 4.5474853515625, 4.776611328125, 5.0057373046875, 5.23486328125, 5.4639892578125, 5.693115234375, 5.9222412109375, 6.1513671875, 6.3804931640625, 6.609619140625, 6.8387451171875, 7.06787109375, 7.2969970703125, 7.526123046875, 7.7552490234375, 7.984375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 12.0, 3.0, 8.0, 14.0, 16.0, 40.0, 72.0, 120.0, 212.0, 548.0, 1716.0, 11132.0, 472981.0, 546893.0, 11970.0, 1756.0, 535.0, 237.0, 124.0, 64.0, 42.0, 17.0, 13.0, 8.0, 5.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08203125, -4.92327880859375, -4.7645263671875, -4.60577392578125, -4.447021484375, -4.28826904296875, -4.1295166015625, -3.97076416015625, -3.81201171875, -3.65325927734375, -3.4945068359375, -3.33575439453125, -3.177001953125, -3.01824951171875, -2.8594970703125, -2.70074462890625, -2.5419921875, -2.38323974609375, -2.2244873046875, -2.06573486328125, -1.906982421875, -1.74822998046875, -1.5894775390625, -1.43072509765625, -1.27197265625, -1.11322021484375, -0.9544677734375, -0.79571533203125, -0.636962890625, -0.47821044921875, -0.3194580078125, -0.16070556640625, -0.001953125, 0.15679931640625, 0.3155517578125, 0.47430419921875, 0.633056640625, 0.79180908203125, 0.9505615234375, 1.10931396484375, 1.26806640625, 1.42681884765625, 1.5855712890625, 1.74432373046875, 1.903076171875, 2.06182861328125, 2.2205810546875, 2.37933349609375, 2.5380859375, 2.69683837890625, 2.8555908203125, 3.01434326171875, 3.173095703125, 3.33184814453125, 3.4906005859375, 3.64935302734375, 3.80810546875, 3.96685791015625, 4.1256103515625, 4.28436279296875, 4.443115234375, 4.60186767578125, 4.7606201171875, 4.91937255859375, 5.078125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 3.0, 6.0, 9.0, 27.0, 30.0, 50.0, 49.0, 103.0, 118.0, 128.0, 145.0, 107.0, 77.0, 49.0, 31.0, 21.0, 15.0, 9.0, 11.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005693435668945312, -0.0005553476512432098, -0.0005413517355918884, -0.000527355819940567, -0.0005133599042892456, -0.0004993639886379242, -0.0004853680729866028, -0.00047137215733528137, -0.00045737624168395996, -0.00044338032603263855, -0.00042938441038131714, -0.00041538849472999573, -0.0004013925790786743, -0.0003873966634273529, -0.0003734007477760315, -0.0003594048321247101, -0.00034540891647338867, -0.00033141300082206726, -0.00031741708517074585, -0.00030342116951942444, -0.00028942525386810303, -0.0002754293382167816, -0.0002614334225654602, -0.0002474375069141388, -0.00023344159126281738, -0.00021944567561149597, -0.00020544975996017456, -0.00019145384430885315, -0.00017745792865753174, -0.00016346201300621033, -0.00014946609735488892, -0.0001354701817035675, -0.0001214742660522461, -0.00010747835040092468, -9.348243474960327e-05, -7.948651909828186e-05, -6.549060344696045e-05, -5.149468779563904e-05, -3.749877214431763e-05, -2.3502856492996216e-05, -9.506940841674805e-06, 4.4889748096466064e-06, 1.8484890460968018e-05, 3.248080611228943e-05, 4.647672176361084e-05, 6.047263741493225e-05, 7.446855306625366e-05, 8.846446871757507e-05, 0.00010246038436889648, 0.0001164563000202179, 0.0001304522156715393, 0.00014444813132286072, 0.00015844404697418213, 0.00017243996262550354, 0.00018643587827682495, 0.00020043179392814636, 0.00021442770957946777, 0.00022842362523078918, 0.0002424195408821106, 0.000256415456533432, 0.0002704113721847534, 0.00028440728783607483, 0.00029840320348739624, 0.00031239911913871765, 0.00032639503479003906]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 6.0, 9.0, 15.0, 16.0, 48.0, 68.0, 115.0, 237.0, 450.0, 1078.0, 2924.0, 11790.0, 89217.0, 795351.0, 126864.0, 14523.0, 3607.0, 1206.0, 494.0, 239.0, 111.0, 74.0, 40.0, 28.0, 10.0, 8.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.970703125, -2.8765869140625, -2.782470703125, -2.6883544921875, -2.59423828125, -2.5001220703125, -2.406005859375, -2.3118896484375, -2.2177734375, -2.1236572265625, -2.029541015625, -1.9354248046875, -1.84130859375, -1.7471923828125, -1.653076171875, -1.5589599609375, -1.46484375, -1.3707275390625, -1.276611328125, -1.1824951171875, -1.08837890625, -0.9942626953125, -0.900146484375, -0.8060302734375, -0.7119140625, -0.6177978515625, -0.523681640625, -0.4295654296875, -0.33544921875, -0.2413330078125, -0.147216796875, -0.0531005859375, 0.041015625, 0.1351318359375, 0.229248046875, 0.3233642578125, 0.41748046875, 0.5115966796875, 0.605712890625, 0.6998291015625, 0.7939453125, 0.8880615234375, 0.982177734375, 1.0762939453125, 1.17041015625, 1.2645263671875, 1.358642578125, 1.4527587890625, 1.546875, 1.6409912109375, 1.735107421875, 1.8292236328125, 1.92333984375, 2.0174560546875, 2.111572265625, 2.2056884765625, 2.2998046875, 2.3939208984375, 2.488037109375, 2.5821533203125, 2.67626953125, 2.7703857421875, 2.864501953125, 2.9586181640625, 3.052734375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 7.0, 1.0, 6.0, 8.0, 15.0, 13.0, 20.0, 29.0, 43.0, 50.0, 75.0, 101.0, 120.0, 134.0, 109.0, 70.0, 63.0, 32.0, 25.0, 21.0, 15.0, 11.0, 9.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.40234375, -3.30487060546875, -3.2073974609375, -3.10992431640625, -3.012451171875, -2.91497802734375, -2.8175048828125, -2.72003173828125, -2.62255859375, -2.52508544921875, -2.4276123046875, -2.33013916015625, -2.232666015625, -2.13519287109375, -2.0377197265625, -1.94024658203125, -1.8427734375, -1.74530029296875, -1.6478271484375, -1.55035400390625, -1.452880859375, -1.35540771484375, -1.2579345703125, -1.16046142578125, -1.06298828125, -0.96551513671875, -0.8680419921875, -0.77056884765625, -0.673095703125, -0.57562255859375, -0.4781494140625, -0.38067626953125, -0.283203125, -0.18572998046875, -0.0882568359375, 0.00921630859375, 0.106689453125, 0.20416259765625, 0.3016357421875, 0.39910888671875, 0.49658203125, 0.59405517578125, 0.6915283203125, 0.78900146484375, 0.886474609375, 0.98394775390625, 1.0814208984375, 1.17889404296875, 1.2763671875, 1.37384033203125, 1.4713134765625, 1.56878662109375, 1.666259765625, 1.76373291015625, 1.8612060546875, 1.95867919921875, 2.05615234375, 2.15362548828125, 2.2510986328125, 2.34857177734375, 2.446044921875, 2.54351806640625, 2.6409912109375, 2.73846435546875, 2.8359375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 12.0, 14.0, 17.0, 29.0, 57.0, 94.0, 118.0, 161.0, 156.0, 96.0, 95.0, 64.0, 33.0, 20.0, 8.0, 14.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.67017364501953, -44.55193328857422, -43.433692932128906, -42.31545639038086, -41.19721603393555, -40.078975677490234, -38.96073913574219, -37.842498779296875, -36.72425842285156, -35.60601806640625, -34.48777770996094, -33.36954116821289, -32.25130081176758, -31.133060455322266, -30.014822006225586, -28.896583557128906, -27.778343200683594, -26.66010284423828, -25.5418643951416, -24.423625946044922, -23.30538558959961, -22.187145233154297, -21.068906784057617, -19.950668334960938, -18.832427978515625, -17.714187622070312, -16.595949172973633, -15.477709770202637, -14.35947036743164, -13.241230964660645, -12.122991561889648, -11.004752159118652, -9.886512756347656, -8.76827335357666, -7.650033950805664, -6.531794548034668, -5.413555145263672, -4.295315742492676, -3.1770763397216797, -2.0588369369506836, -0.9405975341796875, 0.1776418685913086, 1.2958812713623047, 2.414120674133301, 3.532360076904297, 4.650599479675293, 5.768838882446289, 6.887078285217285, 8.005317687988281, 9.123557090759277, 10.241796493530273, 11.36003589630127, 12.478275299072266, 13.596514701843262, 14.714754104614258, 15.832993507385254, 16.95123291015625, 18.069473266601562, 19.187711715698242, 20.305950164794922, 21.424190521240234, 22.542430877685547, 23.660669326782227, 24.778907775878906, 25.89714813232422]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 1.0, 7.0, 10.0, 12.0, 9.0, 18.0, 13.0, 18.0, 20.0, 24.0, 22.0, 24.0, 22.0, 36.0, 39.0, 36.0, 47.0, 52.0, 41.0, 42.0, 48.0, 43.0, 47.0, 41.0, 36.0, 40.0, 37.0, 22.0, 28.0, 25.0, 18.0, 18.0, 19.0, 9.0, 13.0, 13.0, 7.0, 6.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.017623901367188, -22.295289993286133, -21.572956085205078, -20.850622177124023, -20.12828826904297, -19.405956268310547, -18.683622360229492, -17.961288452148438, -17.238954544067383, -16.516620635986328, -15.794286727905273, -15.071953773498535, -14.34961986541748, -13.627285957336426, -12.904953002929688, -12.182619094848633, -11.460285186767578, -10.737951278686523, -10.015617370605469, -9.29328441619873, -8.570950508117676, -7.848616600036621, -7.126283168792725, -6.403949737548828, -5.681615829467773, -4.959281921386719, -4.236948490142822, -3.5146148204803467, -2.792281150817871, -2.0699474811553955, -1.34761381149292, -0.6252803802490234, 0.09705352783203125, 0.8193871974945068, 1.5417208671569824, 2.264054536819458, 2.9863882064819336, 3.708721876144409, 4.431055545806885, 5.153388977050781, 5.875722885131836, 6.598056793212891, 7.320390224456787, 8.042723655700684, 8.765057563781738, 9.487391471862793, 10.209724426269531, 10.932058334350586, 11.65439224243164, 12.376726150512695, 13.09906005859375, 13.821393013000488, 14.543726921081543, 15.266060829162598, 15.988393783569336, 16.71072769165039, 17.433061599731445, 18.1553955078125, 18.877729415893555, 19.60006332397461, 20.32239532470703, 21.044729232788086, 21.76706314086914, 22.489397048950195, 23.21173095703125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 11.0, 14.0, 22.0, 37.0, 63.0, 112.0, 216.0, 455.0, 1021.0, 3057.0, 12103.0, 148594.0, 3998169.0, 23362.0, 4563.0, 1403.0, 548.0, 269.0, 109.0, 62.0, 38.0, 25.0, 9.0, 8.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66796875, -7.46710205078125, -7.2662353515625, -7.06536865234375, -6.864501953125, -6.66363525390625, -6.4627685546875, -6.26190185546875, -6.06103515625, -5.86016845703125, -5.6593017578125, -5.45843505859375, -5.257568359375, -5.05670166015625, -4.8558349609375, -4.65496826171875, -4.4541015625, -4.25323486328125, -4.0523681640625, -3.85150146484375, -3.650634765625, -3.44976806640625, -3.2489013671875, -3.04803466796875, -2.84716796875, -2.64630126953125, -2.4454345703125, -2.24456787109375, -2.043701171875, -1.84283447265625, -1.6419677734375, -1.44110107421875, -1.240234375, -1.03936767578125, -0.8385009765625, -0.63763427734375, -0.436767578125, -0.23590087890625, -0.0350341796875, 0.16583251953125, 0.36669921875, 0.56756591796875, 0.7684326171875, 0.96929931640625, 1.170166015625, 1.37103271484375, 1.5718994140625, 1.77276611328125, 1.9736328125, 2.17449951171875, 2.3753662109375, 2.57623291015625, 2.777099609375, 2.97796630859375, 3.1788330078125, 3.37969970703125, 3.58056640625, 3.78143310546875, 3.9822998046875, 4.18316650390625, 4.384033203125, 4.58489990234375, 4.7857666015625, 4.98663330078125, 5.1875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 9.0, 10.0, 8.0, 5.0, 16.0, 27.0, 31.0, 46.0, 64.0, 79.0, 76.0, 83.0, 92.0, 84.0, 64.0, 89.0, 71.0, 37.0, 36.0, 14.0, 15.0, 9.0, 8.0, 7.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2109375, -2.153106689453125, -2.09527587890625, -2.037445068359375, -1.9796142578125, -1.921783447265625, -1.86395263671875, -1.806121826171875, -1.748291015625, -1.690460205078125, -1.63262939453125, -1.574798583984375, -1.5169677734375, -1.459136962890625, -1.40130615234375, -1.343475341796875, -1.28564453125, -1.227813720703125, -1.16998291015625, -1.112152099609375, -1.0543212890625, -0.996490478515625, -0.93865966796875, -0.880828857421875, -0.822998046875, -0.765167236328125, -0.70733642578125, -0.649505615234375, -0.5916748046875, -0.533843994140625, -0.47601318359375, -0.418182373046875, -0.3603515625, -0.302520751953125, -0.24468994140625, -0.186859130859375, -0.1290283203125, -0.071197509765625, -0.01336669921875, 0.044464111328125, 0.102294921875, 0.160125732421875, 0.21795654296875, 0.275787353515625, 0.3336181640625, 0.391448974609375, 0.44927978515625, 0.507110595703125, 0.56494140625, 0.622772216796875, 0.68060302734375, 0.738433837890625, 0.7962646484375, 0.854095458984375, 0.91192626953125, 0.969757080078125, 1.027587890625, 1.085418701171875, 1.14324951171875, 1.201080322265625, 1.2589111328125, 1.316741943359375, 1.37457275390625, 1.432403564453125, 1.490234375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 7.0, 9.0, 6.0, 3.0, 19.0, 18.0, 26.0, 29.0, 49.0, 53.0, 81.0, 189.0, 358.0, 922.0, 2764.0, 17681.0, 4051306.0, 111600.0, 6395.0, 1532.0, 561.0, 245.0, 149.0, 81.0, 61.0, 41.0, 26.0, 23.0, 12.0, 11.0, 9.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5234375, -7.1611328125, -6.798828125, -6.4365234375, -6.07421875, -5.7119140625, -5.349609375, -4.9873046875, -4.625, -4.2626953125, -3.900390625, -3.5380859375, -3.17578125, -2.8134765625, -2.451171875, -2.0888671875, -1.7265625, -1.3642578125, -1.001953125, -0.6396484375, -0.27734375, 0.0849609375, 0.447265625, 0.8095703125, 1.171875, 1.5341796875, 1.896484375, 2.2587890625, 2.62109375, 2.9833984375, 3.345703125, 3.7080078125, 4.0703125, 4.4326171875, 4.794921875, 5.1572265625, 5.51953125, 5.8818359375, 6.244140625, 6.6064453125, 6.96875, 7.3310546875, 7.693359375, 8.0556640625, 8.41796875, 8.7802734375, 9.142578125, 9.5048828125, 9.8671875, 10.2294921875, 10.591796875, 10.9541015625, 11.31640625, 11.6787109375, 12.041015625, 12.4033203125, 12.765625, 13.1279296875, 13.490234375, 13.8525390625, 14.21484375, 14.5771484375, 14.939453125, 15.3017578125, 15.6640625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 10.0, 24.0, 50.0, 210.0, 3458.0, 206.0, 60.0, 27.0, 13.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53515625, -2.381103515625, -2.22705078125, -2.072998046875, -1.9189453125, -1.764892578125, -1.61083984375, -1.456787109375, -1.302734375, -1.148681640625, -0.99462890625, -0.840576171875, -0.6865234375, -0.532470703125, -0.37841796875, -0.224365234375, -0.0703125, 0.083740234375, 0.23779296875, 0.391845703125, 0.5458984375, 0.699951171875, 0.85400390625, 1.008056640625, 1.162109375, 1.316162109375, 1.47021484375, 1.624267578125, 1.7783203125, 1.932373046875, 2.08642578125, 2.240478515625, 2.39453125, 2.548583984375, 2.70263671875, 2.856689453125, 3.0107421875, 3.164794921875, 3.31884765625, 3.472900390625, 3.626953125, 3.781005859375, 3.93505859375, 4.089111328125, 4.2431640625, 4.397216796875, 4.55126953125, 4.705322265625, 4.859375, 5.013427734375, 5.16748046875, 5.321533203125, 5.4755859375, 5.629638671875, 5.78369140625, 5.937744140625, 6.091796875, 6.245849609375, 6.39990234375, 6.553955078125, 6.7080078125, 6.862060546875, 7.01611328125, 7.170166015625, 7.32421875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 36.0, 88.0, 245.0, 348.0, 201.0, 57.0, 18.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.21238899230957, -16.321622848510742, -15.430856704711914, -14.540090560913086, -13.649324417114258, -12.75855827331543, -11.867791175842285, -10.977025032043457, -10.086258888244629, -9.1954927444458, -8.304726600646973, -7.413959980010986, -6.523193836212158, -5.63242769241333, -4.741661071777344, -3.8508949279785156, -2.9601287841796875, -2.0693626403808594, -1.1785962581634521, -0.2878298759460449, 0.6029362678527832, 1.4937024116516113, 2.3844690322875977, 3.275235176086426, 4.166001319885254, 5.056767463684082, 5.94753360748291, 6.8383002281188965, 7.729066371917725, 8.619832992553711, 9.510599136352539, 10.401365280151367, 11.292133331298828, 12.182899475097656, 13.073665618896484, 13.964431762695312, 14.85519790649414, 15.745964050292969, 16.636730194091797, 17.527496337890625, 18.418262481689453, 19.30902862548828, 20.19979476928711, 21.090560913085938, 21.981327056884766, 22.872093200683594, 23.762859344482422, 24.65362548828125, 25.54439353942871, 26.43515968322754, 27.325925827026367, 28.216691970825195, 29.107458114624023, 29.99822425842285, 30.888992309570312, 31.77975845336914, 32.67052459716797, 33.5612907409668, 34.452056884765625, 35.34282302856445, 36.23358917236328, 37.12435531616211, 38.01512145996094, 38.905887603759766, 39.796653747558594]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 7.0, 10.0, 11.0, 21.0, 29.0, 39.0, 72.0, 66.0, 82.0, 106.0, 92.0, 89.0, 96.0, 70.0, 67.0, 49.0, 33.0, 25.0, 19.0, 9.0, 4.0, 8.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.999860763549805, -12.589277267456055, -12.178694725036621, -11.768112182617188, -11.357528686523438, -10.946945190429688, -10.536362648010254, -10.12578010559082, -9.71519660949707, -9.30461311340332, -8.894030570983887, -8.483448028564453, -8.072864532470703, -7.662281513214111, -7.2516984939575195, -6.841115474700928, -6.430532455444336, -6.019949436187744, -5.609366416931152, -5.1987833976745605, -4.788200378417969, -4.377617359161377, -3.967034339904785, -3.5564513206481934, -3.1458683013916016, -2.7352852821350098, -2.324702262878418, -1.9141192436218262, -1.5035362243652344, -1.0929532051086426, -0.6823701858520508, -0.271787166595459, 0.1387948989868164, 0.5493779182434082, 0.9599609375, 1.3705439567565918, 1.7811269760131836, 2.1917099952697754, 2.602293014526367, 3.012876033782959, 3.423459053039551, 3.8340420722961426, 4.244625091552734, 4.655208110809326, 5.065791130065918, 5.47637414932251, 5.886957168579102, 6.297540187835693, 6.708123207092285, 7.118706226348877, 7.529289245605469, 7.9398722648620605, 8.350455284118652, 8.761037826538086, 9.171621322631836, 9.582204818725586, 9.99278736114502, 10.403369903564453, 10.813953399658203, 11.224536895751953, 11.635119438171387, 12.04570198059082, 12.45628547668457, 12.86686897277832, 13.277451515197754]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 4.0, 7.0, 12.0, 15.0, 24.0, 37.0, 57.0, 75.0, 113.0, 164.0, 270.0, 455.0, 808.0, 1514.0, 3023.0, 6976.0, 19208.0, 65711.0, 255612.0, 461734.0, 165517.0, 43141.0, 13476.0, 5229.0, 2456.0, 1204.0, 675.0, 389.0, 209.0, 153.0, 102.0, 62.0, 36.0, 23.0, 13.0, 15.0, 8.0, 11.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.646484375, -3.533721923828125, -3.42095947265625, -3.308197021484375, -3.1954345703125, -3.082672119140625, -2.96990966796875, -2.857147216796875, -2.744384765625, -2.631622314453125, -2.51885986328125, -2.406097412109375, -2.2933349609375, -2.180572509765625, -2.06781005859375, -1.955047607421875, -1.84228515625, -1.729522705078125, -1.61676025390625, -1.503997802734375, -1.3912353515625, -1.278472900390625, -1.16571044921875, -1.052947998046875, -0.940185546875, -0.827423095703125, -0.71466064453125, -0.601898193359375, -0.4891357421875, -0.376373291015625, -0.26361083984375, -0.150848388671875, -0.0380859375, 0.074676513671875, 0.18743896484375, 0.300201416015625, 0.4129638671875, 0.525726318359375, 0.63848876953125, 0.751251220703125, 0.864013671875, 0.976776123046875, 1.08953857421875, 1.202301025390625, 1.3150634765625, 1.427825927734375, 1.54058837890625, 1.653350830078125, 1.76611328125, 1.878875732421875, 1.99163818359375, 2.104400634765625, 2.2171630859375, 2.329925537109375, 2.44268798828125, 2.555450439453125, 2.668212890625, 2.780975341796875, 2.89373779296875, 3.006500244140625, 3.1192626953125, 3.232025146484375, 3.34478759765625, 3.457550048828125, 3.5703125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 0.0, 3.0, 6.0, 7.0, 7.0, 15.0, 15.0, 15.0, 26.0, 34.0, 30.0, 66.0, 69.0, 58.0, 77.0, 79.0, 82.0, 60.0, 61.0, 65.0, 60.0, 44.0, 30.0, 33.0, 18.0, 7.0, 10.0, 5.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.111328125, -2.052337646484375, -1.99334716796875, -1.934356689453125, -1.8753662109375, -1.816375732421875, -1.75738525390625, -1.698394775390625, -1.639404296875, -1.580413818359375, -1.52142333984375, -1.462432861328125, -1.4034423828125, -1.344451904296875, -1.28546142578125, -1.226470947265625, -1.16748046875, -1.108489990234375, -1.04949951171875, -0.990509033203125, -0.9315185546875, -0.872528076171875, -0.81353759765625, -0.754547119140625, -0.695556640625, -0.636566162109375, -0.57757568359375, -0.518585205078125, -0.4595947265625, -0.400604248046875, -0.34161376953125, -0.282623291015625, -0.2236328125, -0.164642333984375, -0.10565185546875, -0.046661376953125, 0.0123291015625, 0.071319580078125, 0.13031005859375, 0.189300537109375, 0.248291015625, 0.307281494140625, 0.36627197265625, 0.425262451171875, 0.4842529296875, 0.543243408203125, 0.60223388671875, 0.661224365234375, 0.72021484375, 0.779205322265625, 0.83819580078125, 0.897186279296875, 0.9561767578125, 1.015167236328125, 1.07415771484375, 1.133148193359375, 1.192138671875, 1.251129150390625, 1.31011962890625, 1.369110107421875, 1.4281005859375, 1.487091064453125, 1.54608154296875, 1.605072021484375, 1.6640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 10.0, 10.0, 19.0, 48.0, 93.0, 221.0, 778.0, 3417.0, 48226.0, 920596.0, 69864.0, 4043.0, 783.0, 241.0, 97.0, 40.0, 35.0, 10.0, 8.0, 5.0, 3.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.92578125, -7.57427978515625, -7.2227783203125, -6.87127685546875, -6.519775390625, -6.16827392578125, -5.8167724609375, -5.46527099609375, -5.11376953125, -4.76226806640625, -4.4107666015625, -4.05926513671875, -3.707763671875, -3.35626220703125, -3.0047607421875, -2.65325927734375, -2.3017578125, -1.95025634765625, -1.5987548828125, -1.24725341796875, -0.895751953125, -0.54425048828125, -0.1927490234375, 0.15875244140625, 0.51025390625, 0.86175537109375, 1.2132568359375, 1.56475830078125, 1.916259765625, 2.26776123046875, 2.6192626953125, 2.97076416015625, 3.322265625, 3.67376708984375, 4.0252685546875, 4.37677001953125, 4.728271484375, 5.07977294921875, 5.4312744140625, 5.78277587890625, 6.13427734375, 6.48577880859375, 6.8372802734375, 7.18878173828125, 7.540283203125, 7.89178466796875, 8.2432861328125, 8.59478759765625, 8.9462890625, 9.29779052734375, 9.6492919921875, 10.00079345703125, 10.352294921875, 10.70379638671875, 11.0552978515625, 11.40679931640625, 11.75830078125, 12.10980224609375, 12.4613037109375, 12.81280517578125, 13.164306640625, 13.51580810546875, 13.8673095703125, 14.21881103515625, 14.5703125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 11.0, 11.0, 11.0, 22.0, 30.0, 28.0, 36.0, 38.0, 55.0, 66.0, 72.0, 70.0, 83.0, 81.0, 64.0, 57.0, 52.0, 52.0, 48.0, 26.0, 20.0, 15.0, 11.0, 17.0, 7.0, 6.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.734375, -5.4593505859375, -5.184326171875, -4.9093017578125, -4.63427734375, -4.3592529296875, -4.084228515625, -3.8092041015625, -3.5341796875, -3.2591552734375, -2.984130859375, -2.7091064453125, -2.43408203125, -2.1590576171875, -1.884033203125, -1.6090087890625, -1.333984375, -1.0589599609375, -0.783935546875, -0.5089111328125, -0.23388671875, 0.0411376953125, 0.316162109375, 0.5911865234375, 0.8662109375, 1.1412353515625, 1.416259765625, 1.6912841796875, 1.96630859375, 2.2413330078125, 2.516357421875, 2.7913818359375, 3.06640625, 3.3414306640625, 3.616455078125, 3.8914794921875, 4.16650390625, 4.4415283203125, 4.716552734375, 4.9915771484375, 5.2666015625, 5.5416259765625, 5.816650390625, 6.0916748046875, 6.36669921875, 6.6417236328125, 6.916748046875, 7.1917724609375, 7.466796875, 7.7418212890625, 8.016845703125, 8.2918701171875, 8.56689453125, 8.8419189453125, 9.116943359375, 9.3919677734375, 9.6669921875, 9.9420166015625, 10.217041015625, 10.4920654296875, 10.76708984375, 11.0421142578125, 11.317138671875, 11.5921630859375, 11.8671875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 4.0, 14.0, 7.0, 8.0, 18.0, 18.0, 16.0, 30.0, 45.0, 94.0, 132.0, 181.0, 335.0, 583.0, 1237.0, 3189.0, 11082.0, 65106.0, 568168.0, 347003.0, 38894.0, 7671.0, 2411.0, 1010.0, 505.0, 268.0, 178.0, 104.0, 80.0, 41.0, 31.0, 32.0, 11.0, 6.0, 10.0, 2.0, 5.0, 5.0, 2.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.658203125, -1.607757568359375, -1.55731201171875, -1.506866455078125, -1.4564208984375, -1.405975341796875, -1.35552978515625, -1.305084228515625, -1.254638671875, -1.204193115234375, -1.15374755859375, -1.103302001953125, -1.0528564453125, -1.002410888671875, -0.95196533203125, -0.901519775390625, -0.85107421875, -0.800628662109375, -0.75018310546875, -0.699737548828125, -0.6492919921875, -0.598846435546875, -0.54840087890625, -0.497955322265625, -0.447509765625, -0.397064208984375, -0.34661865234375, -0.296173095703125, -0.2457275390625, -0.195281982421875, -0.14483642578125, -0.094390869140625, -0.0439453125, 0.006500244140625, 0.05694580078125, 0.107391357421875, 0.1578369140625, 0.208282470703125, 0.25872802734375, 0.309173583984375, 0.359619140625, 0.410064697265625, 0.46051025390625, 0.510955810546875, 0.5614013671875, 0.611846923828125, 0.66229248046875, 0.712738037109375, 0.76318359375, 0.813629150390625, 0.86407470703125, 0.914520263671875, 0.9649658203125, 1.015411376953125, 1.06585693359375, 1.116302490234375, 1.166748046875, 1.217193603515625, 1.26763916015625, 1.318084716796875, 1.3685302734375, 1.418975830078125, 1.46942138671875, 1.519866943359375, 1.5703125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 11.0, 14.0, 19.0, 22.0, 29.0, 35.0, 46.0, 45.0, 63.0, 53.0, 77.0, 79.0, 70.0, 75.0, 44.0, 59.0, 49.0, 35.0, 29.0, 20.0, 19.0, 13.0, 20.0, 11.0, 13.0, 10.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00022077560424804688, -0.0002142973244190216, -0.00020781904458999634, -0.00020134076476097107, -0.0001948624849319458, -0.00018838420510292053, -0.00018190592527389526, -0.00017542764544487, -0.00016894936561584473, -0.00016247108578681946, -0.0001559928059577942, -0.00014951452612876892, -0.00014303624629974365, -0.00013655796647071838, -0.00013007968664169312, -0.00012360140681266785, -0.00011712312698364258, -0.00011064484715461731, -0.00010416656732559204, -9.768828749656677e-05, -9.12100076675415e-05, -8.473172783851624e-05, -7.825344800949097e-05, -7.17751681804657e-05, -6.529688835144043e-05, -5.881860852241516e-05, -5.234032869338989e-05, -4.5862048864364624e-05, -3.9383769035339355e-05, -3.290548920631409e-05, -2.642720937728882e-05, -1.994892954826355e-05, -1.3470649719238281e-05, -6.992369890213013e-06, -5.140900611877441e-07, 5.964189767837524e-06, 1.2442469596862793e-05, 1.892074942588806e-05, 2.539902925491333e-05, 3.18773090839386e-05, 3.835558891296387e-05, 4.4833868741989136e-05, 5.1312148571014404e-05, 5.779042840003967e-05, 6.426870822906494e-05, 7.074698805809021e-05, 7.722526788711548e-05, 8.370354771614075e-05, 9.018182754516602e-05, 9.666010737419128e-05, 0.00010313838720321655, 0.00010961666703224182, 0.00011609494686126709, 0.00012257322669029236, 0.00012905150651931763, 0.0001355297863483429, 0.00014200806617736816, 0.00014848634600639343, 0.0001549646258354187, 0.00016144290566444397, 0.00016792118549346924, 0.0001743994653224945, 0.00018087774515151978, 0.00018735602498054504, 0.0001938343048095703]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 12.0, 12.0, 21.0, 45.0, 99.0, 192.0, 522.0, 1704.0, 11326.0, 523906.0, 497016.0, 11021.0, 1735.0, 555.0, 227.0, 77.0, 36.0, 26.0, 9.0, 7.0, 3.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.20562744140625, -3.0987548828125, -2.99188232421875, -2.885009765625, -2.77813720703125, -2.6712646484375, -2.56439208984375, -2.45751953125, -2.35064697265625, -2.2437744140625, -2.13690185546875, -2.030029296875, -1.92315673828125, -1.8162841796875, -1.70941162109375, -1.6025390625, -1.49566650390625, -1.3887939453125, -1.28192138671875, -1.175048828125, -1.06817626953125, -0.9613037109375, -0.85443115234375, -0.74755859375, -0.64068603515625, -0.5338134765625, -0.42694091796875, -0.320068359375, -0.21319580078125, -0.1063232421875, 0.00054931640625, 0.107421875, 0.21429443359375, 0.3211669921875, 0.42803955078125, 0.534912109375, 0.64178466796875, 0.7486572265625, 0.85552978515625, 0.96240234375, 1.06927490234375, 1.1761474609375, 1.28302001953125, 1.389892578125, 1.49676513671875, 1.6036376953125, 1.71051025390625, 1.8173828125, 1.92425537109375, 2.0311279296875, 2.13800048828125, 2.244873046875, 2.35174560546875, 2.4586181640625, 2.56549072265625, 2.67236328125, 2.77923583984375, 2.8861083984375, 2.99298095703125, 3.099853515625, 3.20672607421875, 3.3135986328125, 3.42047119140625, 3.52734375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 3.0, 10.0, 9.0, 20.0, 32.0, 45.0, 61.0, 91.0, 98.0, 145.0, 105.0, 107.0, 86.0, 74.0, 34.0, 32.0, 19.0, 12.0, 11.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2646484375, -1.1865386962890625, -1.108428955078125, -1.0303192138671875, -0.95220947265625, -0.8740997314453125, -0.795989990234375, -0.7178802490234375, -0.6397705078125, -0.5616607666015625, -0.483551025390625, -0.4054412841796875, -0.32733154296875, -0.2492218017578125, -0.171112060546875, -0.0930023193359375, -0.014892578125, 0.0632171630859375, 0.141326904296875, 0.2194366455078125, 0.29754638671875, 0.3756561279296875, 0.453765869140625, 0.5318756103515625, 0.6099853515625, 0.6880950927734375, 0.766204833984375, 0.8443145751953125, 0.92242431640625, 1.0005340576171875, 1.078643798828125, 1.1567535400390625, 1.23486328125, 1.3129730224609375, 1.391082763671875, 1.4691925048828125, 1.54730224609375, 1.6254119873046875, 1.703521728515625, 1.7816314697265625, 1.8597412109375, 1.9378509521484375, 2.015960693359375, 2.0940704345703125, 2.17218017578125, 2.2502899169921875, 2.328399658203125, 2.4065093994140625, 2.484619140625, 2.5627288818359375, 2.640838623046875, 2.7189483642578125, 2.79705810546875, 2.8751678466796875, 2.953277587890625, 3.0313873291015625, 3.1094970703125, 3.1876068115234375, 3.265716552734375, 3.3438262939453125, 3.42193603515625, 3.5000457763671875, 3.578155517578125, 3.6562652587890625, 3.734375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 5.0, 36.0, 75.0, 122.0, 226.0, 228.0, 134.0, 91.0, 46.0, 18.0, 7.0, 6.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.32183074951172, -56.514591217041016, -54.70735168457031, -52.900108337402344, -51.09286880493164, -49.28562927246094, -47.478389739990234, -45.67115020751953, -43.86390686035156, -42.05666732788086, -40.249427795410156, -38.44218444824219, -36.634944915771484, -34.82770538330078, -33.02046585083008, -31.213226318359375, -29.405986785888672, -27.59874725341797, -25.791505813598633, -23.98426628112793, -22.177024841308594, -20.36978530883789, -18.562545776367188, -16.755306243896484, -14.948064804077148, -13.140824317932129, -11.33358383178711, -9.526344299316406, -7.719103813171387, -5.911863327026367, -4.104623794555664, -2.2973833084106445, -0.490142822265625, 1.3170974254608154, 3.124337673187256, 4.931577682495117, 6.738818168640137, 8.546058654785156, 10.35329818725586, 12.160538673400879, 13.967779159545898, 15.775019645690918, 17.582260131835938, 19.38949966430664, 21.196739196777344, 23.00398063659668, 24.811220169067383, 26.61846160888672, 28.425701141357422, 30.232940673828125, 32.04018020629883, 33.84741973876953, 35.6546630859375, 37.4619026184082, 39.269142150878906, 41.07638168334961, 42.88362121582031, 44.690860748291016, 46.49810028076172, 48.30534362792969, 50.11258316040039, 51.919822692871094, 53.7270622253418, 55.5343017578125, 57.34154510498047]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 3.0, 6.0, 9.0, 12.0, 13.0, 20.0, 16.0, 25.0, 16.0, 27.0, 37.0, 40.0, 40.0, 34.0, 62.0, 65.0, 62.0, 58.0, 69.0, 50.0, 52.0, 43.0, 46.0, 32.0, 37.0, 19.0, 25.0, 17.0, 22.0, 11.0, 7.0, 6.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-34.696685791015625, -33.67158889770508, -32.64649200439453, -31.62139129638672, -30.596294403076172, -29.571197509765625, -28.546098709106445, -27.520999908447266, -26.49590301513672, -25.470806121826172, -24.445707321166992, -23.420608520507812, -22.395511627197266, -21.37041473388672, -20.34531593322754, -19.32021713256836, -18.295120239257812, -17.270023345947266, -16.244924545288086, -15.219826698303223, -14.19472885131836, -13.169631004333496, -12.144533157348633, -11.11943531036377, -10.094337463378906, -9.069239616394043, -8.04414176940918, -7.019043922424316, -5.993946075439453, -4.96884822845459, -3.9437503814697266, -2.9186525344848633, -1.8935585021972656, -0.8684606552124023, 0.15663719177246094, 1.1817350387573242, 2.2068328857421875, 3.231930732727051, 4.257028579711914, 5.282126426696777, 6.307224273681641, 7.332322120666504, 8.357419967651367, 9.38251781463623, 10.407615661621094, 11.432713508605957, 12.45781135559082, 13.482909202575684, 14.508007049560547, 15.53310489654541, 16.558202743530273, 17.583301544189453, 18.6083984375, 19.633495330810547, 20.658594131469727, 21.683692932128906, 22.708789825439453, 23.73388671875, 24.75898551940918, 25.78408432006836, 26.809181213378906, 27.834278106689453, 28.859376907348633, 29.884475708007812, 30.90957260131836]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 11.0, 15.0, 20.0, 10.0, 23.0, 49.0, 59.0, 86.0, 166.0, 271.0, 590.0, 1344.0, 3577.0, 12022.0, 62283.0, 2812317.0, 1236787.0, 49023.0, 10328.0, 3156.0, 1163.0, 495.0, 214.0, 134.0, 57.0, 35.0, 13.0, 12.0, 5.0, 4.0, 2.0, 1.0, 1.0], "bins": [-6.15234375, -6.021240234375, -5.89013671875, -5.759033203125, -5.6279296875, -5.496826171875, -5.36572265625, -5.234619140625, -5.103515625, -4.972412109375, -4.84130859375, -4.710205078125, -4.5791015625, -4.447998046875, -4.31689453125, -4.185791015625, -4.0546875, -3.923583984375, -3.79248046875, -3.661376953125, -3.5302734375, -3.399169921875, -3.26806640625, -3.136962890625, -3.005859375, -2.874755859375, -2.74365234375, -2.612548828125, -2.4814453125, -2.350341796875, -2.21923828125, -2.088134765625, -1.95703125, -1.825927734375, -1.69482421875, -1.563720703125, -1.4326171875, -1.301513671875, -1.17041015625, -1.039306640625, -0.908203125, -0.777099609375, -0.64599609375, -0.514892578125, -0.3837890625, -0.252685546875, -0.12158203125, 0.009521484375, 0.140625, 0.271728515625, 0.40283203125, 0.533935546875, 0.6650390625, 0.796142578125, 0.92724609375, 1.058349609375, 1.189453125, 1.320556640625, 1.45166015625, 1.582763671875, 1.7138671875, 1.844970703125, 1.97607421875, 2.107177734375, 2.23828125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 10.0, 3.0, 8.0, 6.0, 14.0, 19.0, 17.0, 33.0, 30.0, 30.0, 44.0, 49.0, 57.0, 75.0, 58.0, 64.0, 56.0, 65.0, 60.0, 47.0, 48.0, 37.0, 45.0, 27.0, 25.0, 27.0, 10.0, 16.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4951171875, -1.45074462890625, -1.4063720703125, -1.36199951171875, -1.317626953125, -1.27325439453125, -1.2288818359375, -1.18450927734375, -1.14013671875, -1.09576416015625, -1.0513916015625, -1.00701904296875, -0.962646484375, -0.91827392578125, -0.8739013671875, -0.82952880859375, -0.78515625, -0.74078369140625, -0.6964111328125, -0.65203857421875, -0.607666015625, -0.56329345703125, -0.5189208984375, -0.47454833984375, -0.43017578125, -0.38580322265625, -0.3414306640625, -0.29705810546875, -0.252685546875, -0.20831298828125, -0.1639404296875, -0.11956787109375, -0.0751953125, -0.03082275390625, 0.0135498046875, 0.05792236328125, 0.102294921875, 0.14666748046875, 0.1910400390625, 0.23541259765625, 0.27978515625, 0.32415771484375, 0.3685302734375, 0.41290283203125, 0.457275390625, 0.50164794921875, 0.5460205078125, 0.59039306640625, 0.634765625, 0.67913818359375, 0.7235107421875, 0.76788330078125, 0.812255859375, 0.85662841796875, 0.9010009765625, 0.94537353515625, 0.98974609375, 1.03411865234375, 1.0784912109375, 1.12286376953125, 1.167236328125, 1.21160888671875, 1.2559814453125, 1.30035400390625, 1.3447265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 6.0, 4.0, 5.0, 4.0, 5.0, 8.0, 14.0, 22.0, 25.0, 37.0, 58.0, 107.0, 154.0, 291.0, 490.0, 1049.0, 2151.0, 5176.0, 15101.0, 58055.0, 503586.0, 3390864.0, 167979.0, 32564.0, 9694.0, 3566.0, 1567.0, 742.0, 368.0, 226.0, 151.0, 81.0, 41.0, 23.0, 24.0, 11.0, 12.0, 10.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-4.203125, -4.090423583984375, -3.97772216796875, -3.865020751953125, -3.7523193359375, -3.639617919921875, -3.52691650390625, -3.414215087890625, -3.301513671875, -3.188812255859375, -3.07611083984375, -2.963409423828125, -2.8507080078125, -2.738006591796875, -2.62530517578125, -2.512603759765625, -2.39990234375, -2.287200927734375, -2.17449951171875, -2.061798095703125, -1.9490966796875, -1.836395263671875, -1.72369384765625, -1.610992431640625, -1.498291015625, -1.385589599609375, -1.27288818359375, -1.160186767578125, -1.0474853515625, -0.934783935546875, -0.82208251953125, -0.709381103515625, -0.5966796875, -0.483978271484375, -0.37127685546875, -0.258575439453125, -0.1458740234375, -0.033172607421875, 0.07952880859375, 0.192230224609375, 0.304931640625, 0.417633056640625, 0.53033447265625, 0.643035888671875, 0.7557373046875, 0.868438720703125, 0.98114013671875, 1.093841552734375, 1.20654296875, 1.319244384765625, 1.43194580078125, 1.544647216796875, 1.6573486328125, 1.770050048828125, 1.88275146484375, 1.995452880859375, 2.108154296875, 2.220855712890625, 2.33355712890625, 2.446258544921875, 2.5589599609375, 2.671661376953125, 2.78436279296875, 2.897064208984375, 3.009765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 3.0, 6.0, 7.0, 5.0, 14.0, 7.0, 16.0, 31.0, 34.0, 43.0, 71.0, 117.0, 188.0, 408.0, 846.0, 1104.0, 501.0, 215.0, 129.0, 85.0, 55.0, 37.0, 42.0, 23.0, 19.0, 11.0, 13.0, 11.0, 4.0, 5.0, 3.0, 6.0, 0.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.171875, -4.056671142578125, -3.94146728515625, -3.826263427734375, -3.7110595703125, -3.595855712890625, -3.48065185546875, -3.365447998046875, -3.250244140625, -3.135040283203125, -3.01983642578125, -2.904632568359375, -2.7894287109375, -2.674224853515625, -2.55902099609375, -2.443817138671875, -2.32861328125, -2.213409423828125, -2.09820556640625, -1.983001708984375, -1.8677978515625, -1.752593994140625, -1.63739013671875, -1.522186279296875, -1.406982421875, -1.291778564453125, -1.17657470703125, -1.061370849609375, -0.9461669921875, -0.830963134765625, -0.71575927734375, -0.600555419921875, -0.4853515625, -0.370147705078125, -0.25494384765625, -0.139739990234375, -0.0245361328125, 0.090667724609375, 0.20587158203125, 0.321075439453125, 0.436279296875, 0.551483154296875, 0.66668701171875, 0.781890869140625, 0.8970947265625, 1.012298583984375, 1.12750244140625, 1.242706298828125, 1.35791015625, 1.473114013671875, 1.58831787109375, 1.703521728515625, 1.8187255859375, 1.933929443359375, 2.04913330078125, 2.164337158203125, 2.279541015625, 2.394744873046875, 2.50994873046875, 2.625152587890625, 2.7403564453125, 2.855560302734375, 2.97076416015625, 3.085968017578125, 3.201171875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 18.0, 34.0, 58.0, 107.0, 173.0, 203.0, 149.0, 115.0, 55.0, 29.0, 18.0, 5.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.90979766845703, -41.7921257019043, -40.67445373535156, -39.55678176879883, -38.439109802246094, -37.321441650390625, -36.203765869140625, -35.086097717285156, -33.96842575073242, -32.85075378417969, -31.733081817626953, -30.61540985107422, -29.497739791870117, -28.380067825317383, -27.26239585876465, -26.144723892211914, -25.02705192565918, -23.909379959106445, -22.79170799255371, -21.67403793334961, -20.556365966796875, -19.43869400024414, -18.321022033691406, -17.203350067138672, -16.085678100585938, -14.968006134033203, -13.850335121154785, -12.73266315460205, -11.614992141723633, -10.497320175170898, -9.379648208618164, -8.26197624206543, -7.144306182861328, -6.026634693145752, -4.908963203430176, -3.7912912368774414, -2.6736197471618652, -1.555948257446289, -0.4382762908935547, 0.6793951988220215, 1.7970666885375977, 2.914738178253174, 4.03240966796875, 5.150081634521484, 6.2677531242370605, 7.385424613952637, 8.503096580505371, 9.620767593383789, 10.738439559936523, 11.856111526489258, 12.973782539367676, 14.09145450592041, 15.209125518798828, 16.326797485351562, 17.444469451904297, 18.56214141845703, 19.679813385009766, 20.7974853515625, 21.915157318115234, 23.03282928466797, 24.15049934387207, 25.268171310424805, 26.38584327697754, 27.503515243530273, 28.621185302734375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 7.0, 10.0, 8.0, 14.0, 7.0, 25.0, 13.0, 31.0, 27.0, 41.0, 39.0, 36.0, 46.0, 56.0, 40.0, 77.0, 52.0, 53.0, 46.0, 43.0, 47.0, 39.0, 30.0, 34.0, 26.0, 33.0, 26.0, 9.0, 12.0, 15.0, 9.0, 13.0, 11.0, 4.0, 2.0, 6.0, 4.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.761592864990234, -18.23255157470703, -17.70351219177246, -17.174470901489258, -16.645431518554688, -16.116390228271484, -15.587348937988281, -15.058308601379395, -14.529268264770508, -14.000227928161621, -13.471187591552734, -12.942146301269531, -12.413105964660645, -11.884065628051758, -11.355024337768555, -10.825984001159668, -10.296943664550781, -9.767903327941895, -9.238862991333008, -8.709821701049805, -8.180781364440918, -7.651741027832031, -7.122700214385986, -6.593659400939941, -6.064619064331055, -5.535578727722168, -5.006537914276123, -4.477497100830078, -3.9484567642211914, -3.4194161891937256, -2.8903756141662598, -2.361335039138794, -1.832296371459961, -1.3032557964324951, -0.7742152214050293, -0.24517464637756348, 0.28386592864990234, 0.8129065036773682, 1.341947078704834, 1.8709876537322998, 2.4000282287597656, 2.9290688037872314, 3.4581093788146973, 3.987149953842163, 4.516190528869629, 5.045230865478516, 5.5742716789245605, 6.1033124923706055, 6.632352828979492, 7.161393165588379, 7.690433979034424, 8.219474792480469, 8.748515129089355, 9.277555465698242, 9.806596755981445, 10.335637092590332, 10.864677429199219, 11.393717765808105, 11.922758102416992, 12.451799392700195, 12.980839729309082, 13.509880065917969, 14.038921356201172, 14.567961692810059, 15.097002029418945]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 4.0, 9.0, 13.0, 14.0, 39.0, 44.0, 57.0, 87.0, 136.0, 225.0, 372.0, 611.0, 1027.0, 1745.0, 2925.0, 5218.0, 10125.0, 20121.0, 41219.0, 86659.0, 171492.0, 259526.0, 215197.0, 117379.0, 57169.0, 27396.0, 13557.0, 7027.0, 3845.0, 2116.0, 1196.0, 734.0, 435.0, 279.0, 188.0, 119.0, 89.0, 60.0, 33.0, 22.0, 17.0, 4.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0], "bins": [-1.9013671875, -1.8509521484375, -1.800537109375, -1.7501220703125, -1.69970703125, -1.6492919921875, -1.598876953125, -1.5484619140625, -1.498046875, -1.4476318359375, -1.397216796875, -1.3468017578125, -1.29638671875, -1.2459716796875, -1.195556640625, -1.1451416015625, -1.0947265625, -1.0443115234375, -0.993896484375, -0.9434814453125, -0.89306640625, -0.8426513671875, -0.792236328125, -0.7418212890625, -0.69140625, -0.6409912109375, -0.590576171875, -0.5401611328125, -0.48974609375, -0.4393310546875, -0.388916015625, -0.3385009765625, -0.2880859375, -0.2376708984375, -0.187255859375, -0.1368408203125, -0.08642578125, -0.0360107421875, 0.014404296875, 0.0648193359375, 0.115234375, 0.1656494140625, 0.216064453125, 0.2664794921875, 0.31689453125, 0.3673095703125, 0.417724609375, 0.4681396484375, 0.5185546875, 0.5689697265625, 0.619384765625, 0.6697998046875, 0.72021484375, 0.7706298828125, 0.821044921875, 0.8714599609375, 0.921875, 0.9722900390625, 1.022705078125, 1.0731201171875, 1.12353515625, 1.1739501953125, 1.224365234375, 1.2747802734375, 1.3251953125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 2.0, 7.0, 11.0, 13.0, 23.0, 20.0, 24.0, 24.0, 22.0, 25.0, 50.0, 56.0, 42.0, 44.0, 46.0, 51.0, 46.0, 52.0, 46.0, 44.0, 50.0, 42.0, 33.0, 36.0, 36.0, 23.0, 23.0, 29.0, 13.0, 10.0, 16.0, 10.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0185546875, -0.983154296875, -0.94775390625, -0.912353515625, -0.876953125, -0.841552734375, -0.80615234375, -0.770751953125, -0.7353515625, -0.699951171875, -0.66455078125, -0.629150390625, -0.59375, -0.558349609375, -0.52294921875, -0.487548828125, -0.4521484375, -0.416748046875, -0.38134765625, -0.345947265625, -0.310546875, -0.275146484375, -0.23974609375, -0.204345703125, -0.1689453125, -0.133544921875, -0.09814453125, -0.062744140625, -0.02734375, 0.008056640625, 0.04345703125, 0.078857421875, 0.1142578125, 0.149658203125, 0.18505859375, 0.220458984375, 0.255859375, 0.291259765625, 0.32666015625, 0.362060546875, 0.3974609375, 0.432861328125, 0.46826171875, 0.503662109375, 0.5390625, 0.574462890625, 0.60986328125, 0.645263671875, 0.6806640625, 0.716064453125, 0.75146484375, 0.786865234375, 0.822265625, 0.857666015625, 0.89306640625, 0.928466796875, 0.9638671875, 0.999267578125, 1.03466796875, 1.070068359375, 1.10546875, 1.140869140625, 1.17626953125, 1.211669921875, 1.2470703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 6.0, 9.0, 8.0, 14.0, 16.0, 43.0, 57.0, 97.0, 159.0, 232.0, 373.0, 622.0, 1161.0, 2628.0, 7727.0, 35589.0, 243117.0, 623211.0, 106751.0, 17871.0, 4677.0, 1900.0, 929.0, 529.0, 293.0, 192.0, 103.0, 75.0, 59.0, 38.0, 23.0, 13.0, 11.0, 6.0, 1.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.82421875, -4.701446533203125, -4.57867431640625, -4.455902099609375, -4.3331298828125, -4.210357666015625, -4.08758544921875, -3.964813232421875, -3.842041015625, -3.719268798828125, -3.59649658203125, -3.473724365234375, -3.3509521484375, -3.228179931640625, -3.10540771484375, -2.982635498046875, -2.85986328125, -2.737091064453125, -2.61431884765625, -2.491546630859375, -2.3687744140625, -2.246002197265625, -2.12322998046875, -2.000457763671875, -1.877685546875, -1.754913330078125, -1.63214111328125, -1.509368896484375, -1.3865966796875, -1.263824462890625, -1.14105224609375, -1.018280029296875, -0.8955078125, -0.772735595703125, -0.64996337890625, -0.527191162109375, -0.4044189453125, -0.281646728515625, -0.15887451171875, -0.036102294921875, 0.086669921875, 0.209442138671875, 0.33221435546875, 0.454986572265625, 0.5777587890625, 0.700531005859375, 0.82330322265625, 0.946075439453125, 1.06884765625, 1.191619873046875, 1.31439208984375, 1.437164306640625, 1.5599365234375, 1.682708740234375, 1.80548095703125, 1.928253173828125, 2.051025390625, 2.173797607421875, 2.29656982421875, 2.419342041015625, 2.5421142578125, 2.664886474609375, 2.78765869140625, 2.910430908203125, 3.033203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 12.0, 9.0, 15.0, 16.0, 20.0, 21.0, 33.0, 34.0, 34.0, 36.0, 48.0, 46.0, 65.0, 50.0, 53.0, 50.0, 60.0, 47.0, 59.0, 41.0, 40.0, 36.0, 30.0, 30.0, 22.0, 24.0, 13.0, 13.0, 5.0, 12.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.671875, -5.50421142578125, -5.3365478515625, -5.16888427734375, -5.001220703125, -4.83355712890625, -4.6658935546875, -4.49822998046875, -4.33056640625, -4.16290283203125, -3.9952392578125, -3.82757568359375, -3.659912109375, -3.49224853515625, -3.3245849609375, -3.15692138671875, -2.9892578125, -2.82159423828125, -2.6539306640625, -2.48626708984375, -2.318603515625, -2.15093994140625, -1.9832763671875, -1.81561279296875, -1.64794921875, -1.48028564453125, -1.3126220703125, -1.14495849609375, -0.977294921875, -0.80963134765625, -0.6419677734375, -0.47430419921875, -0.306640625, -0.13897705078125, 0.0286865234375, 0.19635009765625, 0.364013671875, 0.53167724609375, 0.6993408203125, 0.86700439453125, 1.03466796875, 1.20233154296875, 1.3699951171875, 1.53765869140625, 1.705322265625, 1.87298583984375, 2.0406494140625, 2.20831298828125, 2.3759765625, 2.54364013671875, 2.7113037109375, 2.87896728515625, 3.046630859375, 3.21429443359375, 3.3819580078125, 3.54962158203125, 3.71728515625, 3.88494873046875, 4.0526123046875, 4.22027587890625, 4.387939453125, 4.55560302734375, 4.7232666015625, 4.89093017578125, 5.05859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 10.0, 7.0, 16.0, 11.0, 22.0, 33.0, 57.0, 81.0, 154.0, 307.0, 710.0, 1911.0, 7896.0, 63118.0, 802604.0, 153452.0, 13506.0, 2884.0, 962.0, 365.0, 180.0, 99.0, 62.0, 31.0, 29.0, 19.0, 14.0, 6.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9207763671875, -1.851318359375, -1.7818603515625, -1.71240234375, -1.6429443359375, -1.573486328125, -1.5040283203125, -1.4345703125, -1.3651123046875, -1.295654296875, -1.2261962890625, -1.15673828125, -1.0872802734375, -1.017822265625, -0.9483642578125, -0.87890625, -0.8094482421875, -0.739990234375, -0.6705322265625, -0.60107421875, -0.5316162109375, -0.462158203125, -0.3927001953125, -0.3232421875, -0.2537841796875, -0.184326171875, -0.1148681640625, -0.04541015625, 0.0240478515625, 0.093505859375, 0.1629638671875, 0.232421875, 0.3018798828125, 0.371337890625, 0.4407958984375, 0.51025390625, 0.5797119140625, 0.649169921875, 0.7186279296875, 0.7880859375, 0.8575439453125, 0.927001953125, 0.9964599609375, 1.06591796875, 1.1353759765625, 1.204833984375, 1.2742919921875, 1.34375, 1.4132080078125, 1.482666015625, 1.5521240234375, 1.62158203125, 1.6910400390625, 1.760498046875, 1.8299560546875, 1.8994140625, 1.9688720703125, 2.038330078125, 2.1077880859375, 2.17724609375, 2.2467041015625, 2.316162109375, 2.3856201171875, 2.455078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 8.0, 8.0, 16.0, 12.0, 27.0, 51.0, 64.0, 108.0, 128.0, 141.0, 130.0, 105.0, 63.0, 38.0, 33.0, 24.0, 10.0, 15.0, 6.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005822181701660156, -0.0005674064159393311, -0.0005525946617126465, -0.0005377829074859619, -0.0005229711532592773, -0.0005081593990325928, -0.0004933476448059082, -0.00047853589057922363, -0.00046372413635253906, -0.0004489123821258545, -0.0004341006278991699, -0.00041928887367248535, -0.0004044771194458008, -0.0003896653652191162, -0.00037485361099243164, -0.00036004185676574707, -0.0003452301025390625, -0.00033041834831237793, -0.00031560659408569336, -0.0003007948398590088, -0.0002859830856323242, -0.00027117133140563965, -0.0002563595771789551, -0.0002415478229522705, -0.00022673606872558594, -0.00021192431449890137, -0.0001971125602722168, -0.00018230080604553223, -0.00016748905181884766, -0.00015267729759216309, -0.00013786554336547852, -0.00012305378913879395, -0.00010824203491210938, -9.34302806854248e-05, -7.861852645874023e-05, -6.380677223205566e-05, -4.8995018005371094e-05, -3.4183263778686523e-05, -1.9371509552001953e-05, -4.559755325317383e-06, 1.0251998901367188e-05, 2.5063753128051758e-05, 3.987550735473633e-05, 5.46872615814209e-05, 6.949901580810547e-05, 8.431077003479004e-05, 9.912252426147461e-05, 0.00011393427848815918, 0.00012874603271484375, 0.00014355778694152832, 0.0001583695411682129, 0.00017318129539489746, 0.00018799304962158203, 0.0002028048038482666, 0.00021761655807495117, 0.00023242831230163574, 0.0002472400665283203, 0.0002620518207550049, 0.00027686357498168945, 0.000291675329208374, 0.0003064870834350586, 0.00032129883766174316, 0.00033611059188842773, 0.0003509223461151123, 0.0003657341003417969]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 9.0, 16.0, 12.0, 30.0, 44.0, 50.0, 115.0, 166.0, 295.0, 508.0, 1032.0, 2471.0, 7251.0, 33325.0, 305636.0, 616634.0, 63603.0, 11193.0, 3291.0, 1327.0, 677.0, 337.0, 202.0, 108.0, 73.0, 49.0, 26.0, 23.0, 11.0, 8.0, 5.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2021484375, -1.1523895263671875, -1.102630615234375, -1.0528717041015625, -1.00311279296875, -0.9533538818359375, -0.903594970703125, -0.8538360595703125, -0.8040771484375, -0.7543182373046875, -0.704559326171875, -0.6548004150390625, -0.60504150390625, -0.5552825927734375, -0.505523681640625, -0.4557647705078125, -0.406005859375, -0.3562469482421875, -0.306488037109375, -0.2567291259765625, -0.20697021484375, -0.1572113037109375, -0.107452392578125, -0.0576934814453125, -0.0079345703125, 0.0418243408203125, 0.091583251953125, 0.1413421630859375, 0.19110107421875, 0.2408599853515625, 0.290618896484375, 0.3403778076171875, 0.39013671875, 0.4398956298828125, 0.489654541015625, 0.5394134521484375, 0.58917236328125, 0.6389312744140625, 0.688690185546875, 0.7384490966796875, 0.7882080078125, 0.8379669189453125, 0.887725830078125, 0.9374847412109375, 0.98724365234375, 1.0370025634765625, 1.086761474609375, 1.1365203857421875, 1.186279296875, 1.2360382080078125, 1.285797119140625, 1.3355560302734375, 1.38531494140625, 1.4350738525390625, 1.484832763671875, 1.5345916748046875, 1.5843505859375, 1.6341094970703125, 1.683868408203125, 1.7336273193359375, 1.78338623046875, 1.8331451416015625, 1.882904052734375, 1.9326629638671875, 1.982421875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 4.0, 3.0, 3.0, 11.0, 27.0, 24.0, 45.0, 46.0, 71.0, 93.0, 126.0, 118.0, 110.0, 85.0, 73.0, 43.0, 36.0, 26.0, 16.0, 15.0, 7.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.03863525390625, -1.9718017578125, -1.90496826171875, -1.838134765625, -1.77130126953125, -1.7044677734375, -1.63763427734375, -1.57080078125, -1.50396728515625, -1.4371337890625, -1.37030029296875, -1.303466796875, -1.23663330078125, -1.1697998046875, -1.10296630859375, -1.0361328125, -0.96929931640625, -0.9024658203125, -0.83563232421875, -0.768798828125, -0.70196533203125, -0.6351318359375, -0.56829833984375, -0.50146484375, -0.43463134765625, -0.3677978515625, -0.30096435546875, -0.234130859375, -0.16729736328125, -0.1004638671875, -0.03363037109375, 0.033203125, 0.10003662109375, 0.1668701171875, 0.23370361328125, 0.300537109375, 0.36737060546875, 0.4342041015625, 0.50103759765625, 0.56787109375, 0.63470458984375, 0.7015380859375, 0.76837158203125, 0.835205078125, 0.90203857421875, 0.9688720703125, 1.03570556640625, 1.1025390625, 1.16937255859375, 1.2362060546875, 1.30303955078125, 1.369873046875, 1.43670654296875, 1.5035400390625, 1.57037353515625, 1.63720703125, 1.70404052734375, 1.7708740234375, 1.83770751953125, 1.904541015625, 1.97137451171875, 2.0382080078125, 2.10504150390625, 2.171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 20.0, 27.0, 108.0, 183.0, 302.0, 211.0, 91.0, 34.0, 15.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.68215942382812, -68.04549407958984, -66.40882110595703, -64.77215576171875, -63.13548278808594, -61.49881362915039, -59.862144470214844, -58.22547912597656, -56.58880615234375, -54.9521369934082, -53.315467834472656, -51.67879867553711, -50.04212951660156, -48.405460357666016, -46.76879119873047, -45.13212585449219, -43.49545669555664, -41.858787536621094, -40.22211837768555, -38.58544921875, -36.94878005981445, -35.312110900878906, -33.675445556640625, -32.03877258300781, -30.4021053314209, -28.76543617248535, -27.128767013549805, -25.49209976196289, -23.855430603027344, -22.218761444091797, -20.58209228515625, -18.945423126220703, -17.308757781982422, -15.672088623046875, -14.035419464111328, -12.398751258850098, -10.76208209991455, -9.125412940979004, -7.488744735717773, -5.852075576782227, -4.21540641784668, -2.578737497329712, -0.9420685768127441, 0.6946001052856445, 2.3312692642211914, 3.9679384231567383, 5.604606628417969, 7.241275787353516, 8.877944946289062, 10.51461410522461, 12.151283264160156, 13.787951469421387, 15.424620628356934, 17.061290740966797, 18.69795799255371, 20.334627151489258, 21.971296310424805, 23.60796546936035, 25.2446346282959, 26.881301879882812, 28.51797103881836, 30.154640197753906, 31.791309356689453, 33.427978515625, 35.06464767456055]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 7.0, 6.0, 13.0, 13.0, 16.0, 20.0, 22.0, 33.0, 29.0, 52.0, 41.0, 51.0, 51.0, 64.0, 81.0, 81.0, 66.0, 68.0, 61.0, 43.0, 30.0, 35.0, 22.0, 22.0, 21.0, 17.0, 10.0, 8.0, 7.0, 1.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.02332305908203, -28.27657127380371, -27.52981948852539, -26.78306770324707, -26.03631591796875, -25.289566040039062, -24.542814254760742, -23.796062469482422, -23.0493106842041, -22.30255889892578, -21.55580711364746, -20.80905532836914, -20.062305450439453, -19.315553665161133, -18.568801879882812, -17.822050094604492, -17.075298309326172, -16.32854652404785, -15.581794738769531, -14.835043907165527, -14.088292121887207, -13.341540336608887, -12.594789505004883, -11.848037719726562, -11.101285934448242, -10.354534149169922, -9.607782363891602, -8.861031532287598, -8.114279747009277, -7.367527961730957, -6.620776653289795, -5.874025344848633, -5.1272735595703125, -4.380521774291992, -3.63377046585083, -2.887018918991089, -2.1402673721313477, -1.3935158252716064, -0.6467642784118652, 0.09998703002929688, 0.8467388153076172, 1.5934903621673584, 2.3402419090270996, 3.086993455886841, 3.833745002746582, 4.580496788024902, 5.3272480964660645, 6.073999404907227, 6.820751190185547, 7.567502975463867, 8.314254760742188, 9.061005592346191, 9.807757377624512, 10.554509162902832, 11.301259994506836, 12.048011779785156, 12.794763565063477, 13.541515350341797, 14.288267135620117, 15.035017967224121, 15.781769752502441, 16.528520584106445, 17.275272369384766, 18.022024154663086, 18.768775939941406]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 5.0, 9.0, 12.0, 25.0, 31.0, 40.0, 74.0, 105.0, 204.0, 504.0, 1642.0, 7166.0, 51631.0, 3670771.0, 436626.0, 19822.0, 3949.0, 969.0, 332.0, 120.0, 69.0, 58.0, 21.0, 31.0, 7.0, 8.0, 7.0, 4.0, 12.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.890625, -4.753936767578125, -4.61724853515625, -4.480560302734375, -4.3438720703125, -4.207183837890625, -4.07049560546875, -3.933807373046875, -3.797119140625, -3.660430908203125, -3.52374267578125, -3.387054443359375, -3.2503662109375, -3.113677978515625, -2.97698974609375, -2.840301513671875, -2.70361328125, -2.566925048828125, -2.43023681640625, -2.293548583984375, -2.1568603515625, -2.020172119140625, -1.88348388671875, -1.746795654296875, -1.610107421875, -1.473419189453125, -1.33673095703125, -1.200042724609375, -1.0633544921875, -0.926666259765625, -0.78997802734375, -0.653289794921875, -0.5166015625, -0.379913330078125, -0.24322509765625, -0.106536865234375, 0.0301513671875, 0.166839599609375, 0.30352783203125, 0.440216064453125, 0.576904296875, 0.713592529296875, 0.85028076171875, 0.986968994140625, 1.1236572265625, 1.260345458984375, 1.39703369140625, 1.533721923828125, 1.67041015625, 1.807098388671875, 1.94378662109375, 2.080474853515625, 2.2171630859375, 2.353851318359375, 2.49053955078125, 2.627227783203125, 2.763916015625, 2.900604248046875, 3.03729248046875, 3.173980712890625, 3.3106689453125, 3.447357177734375, 3.58404541015625, 3.720733642578125, 3.857421875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 9.0, 15.0, 17.0, 36.0, 57.0, 54.0, 76.0, 102.0, 103.0, 109.0, 98.0, 82.0, 80.0, 51.0, 45.0, 31.0, 21.0, 11.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.08984375, -3.0200958251953125, -2.950347900390625, -2.8805999755859375, -2.81085205078125, -2.7411041259765625, -2.671356201171875, -2.6016082763671875, -2.5318603515625, -2.4621124267578125, -2.392364501953125, -2.3226165771484375, -2.25286865234375, -2.1831207275390625, -2.113372802734375, -2.0436248779296875, -1.973876953125, -1.9041290283203125, -1.834381103515625, -1.7646331787109375, -1.69488525390625, -1.6251373291015625, -1.555389404296875, -1.4856414794921875, -1.4158935546875, -1.3461456298828125, -1.276397705078125, -1.2066497802734375, -1.13690185546875, -1.0671539306640625, -0.997406005859375, -0.9276580810546875, -0.85791015625, -0.7881622314453125, -0.718414306640625, -0.6486663818359375, -0.57891845703125, -0.5091705322265625, -0.439422607421875, -0.3696746826171875, -0.2999267578125, -0.2301788330078125, -0.160430908203125, -0.0906829833984375, -0.02093505859375, 0.0488128662109375, 0.118560791015625, 0.1883087158203125, 0.258056640625, 0.3278045654296875, 0.397552490234375, 0.4673004150390625, 0.53704833984375, 0.6067962646484375, 0.676544189453125, 0.7462921142578125, 0.8160400390625, 0.8857879638671875, 0.955535888671875, 1.0252838134765625, 1.09503173828125, 1.1647796630859375, 1.234527587890625, 1.3042755126953125, 1.3740234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 13.0, 19.0, 16.0, 36.0, 54.0, 102.0, 203.0, 372.0, 863.0, 1899.0, 4603.0, 12051.0, 35270.0, 153371.0, 2743889.0, 1107364.0, 93040.0, 25451.0, 8954.0, 3487.0, 1555.0, 765.0, 398.0, 222.0, 115.0, 65.0, 35.0, 31.0, 12.0, 8.0, 4.0, 4.0, 7.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.740234375, -2.656829833984375, -2.57342529296875, -2.490020751953125, -2.4066162109375, -2.323211669921875, -2.23980712890625, -2.156402587890625, -2.072998046875, -1.989593505859375, -1.90618896484375, -1.822784423828125, -1.7393798828125, -1.655975341796875, -1.57257080078125, -1.489166259765625, -1.40576171875, -1.322357177734375, -1.23895263671875, -1.155548095703125, -1.0721435546875, -0.988739013671875, -0.90533447265625, -0.821929931640625, -0.738525390625, -0.655120849609375, -0.57171630859375, -0.488311767578125, -0.4049072265625, -0.321502685546875, -0.23809814453125, -0.154693603515625, -0.0712890625, 0.012115478515625, 0.09552001953125, 0.178924560546875, 0.2623291015625, 0.345733642578125, 0.42913818359375, 0.512542724609375, 0.595947265625, 0.679351806640625, 0.76275634765625, 0.846160888671875, 0.9295654296875, 1.012969970703125, 1.09637451171875, 1.179779052734375, 1.26318359375, 1.346588134765625, 1.42999267578125, 1.513397216796875, 1.5968017578125, 1.680206298828125, 1.76361083984375, 1.847015380859375, 1.930419921875, 2.013824462890625, 2.09722900390625, 2.180633544921875, 2.2640380859375, 2.347442626953125, 2.43084716796875, 2.514251708984375, 2.59765625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 10.0, 5.0, 7.0, 4.0, 10.0, 15.0, 14.0, 19.0, 12.0, 35.0, 32.0, 67.0, 86.0, 137.0, 288.0, 529.0, 858.0, 783.0, 458.0, 237.0, 158.0, 88.0, 60.0, 28.0, 23.0, 27.0, 14.0, 24.0, 9.0, 3.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.01348876953125, -1.9293212890625, -1.84515380859375, -1.760986328125, -1.67681884765625, -1.5926513671875, -1.50848388671875, -1.42431640625, -1.34014892578125, -1.2559814453125, -1.17181396484375, -1.087646484375, -1.00347900390625, -0.9193115234375, -0.83514404296875, -0.7509765625, -0.66680908203125, -0.5826416015625, -0.49847412109375, -0.414306640625, -0.33013916015625, -0.2459716796875, -0.16180419921875, -0.07763671875, 0.00653076171875, 0.0906982421875, 0.17486572265625, 0.259033203125, 0.34320068359375, 0.4273681640625, 0.51153564453125, 0.595703125, 0.67987060546875, 0.7640380859375, 0.84820556640625, 0.932373046875, 1.01654052734375, 1.1007080078125, 1.18487548828125, 1.26904296875, 1.35321044921875, 1.4373779296875, 1.52154541015625, 1.605712890625, 1.68988037109375, 1.7740478515625, 1.85821533203125, 1.9423828125, 2.02655029296875, 2.1107177734375, 2.19488525390625, 2.279052734375, 2.36322021484375, 2.4473876953125, 2.53155517578125, 2.61572265625, 2.69989013671875, 2.7840576171875, 2.86822509765625, 2.952392578125, 3.03656005859375, 3.1207275390625, 3.20489501953125, 3.2890625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 14.0, 93.0, 186.0, 314.0, 224.0, 100.0, 34.0, 10.0, 8.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.85332489013672, -39.42203903198242, -37.990753173828125, -36.55946350097656, -35.128177642822266, -33.69689178466797, -32.26560592651367, -30.834320068359375, -29.403032302856445, -27.97174644470215, -26.54045867919922, -25.109172821044922, -23.677886962890625, -22.246599197387695, -20.8153133392334, -19.38402557373047, -17.952739715576172, -16.521453857421875, -15.090166091918945, -13.658880233764648, -12.227593421936035, -10.796306610107422, -9.365020751953125, -7.933733940124512, -6.502447128295898, -5.071160316467285, -3.63987398147583, -2.208587646484375, -0.7773008346557617, 0.6539859771728516, 2.0852718353271484, 3.5165586471557617, 4.947845458984375, 6.379132270812988, 7.810418605804443, 9.241704940795898, 10.672991752624512, 12.104278564453125, 13.535564422607422, 14.966851234436035, 16.39813804626465, 17.829423904418945, 19.260711669921875, 20.691997528076172, 22.12328338623047, 23.5545711517334, 24.985857009887695, 26.417144775390625, 27.848430633544922, 29.27971649169922, 30.71100425720215, 32.14228820800781, 33.573577880859375, 35.00486373901367, 36.43614959716797, 37.867435455322266, 39.29872131347656, 40.73000717163086, 42.161293029785156, 43.59258270263672, 45.023868560791016, 46.45515441894531, 47.88644027709961, 49.317726135253906, 50.74901580810547]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 7.0, 4.0, 2.0, 5.0, 10.0, 15.0, 12.0, 15.0, 24.0, 24.0, 24.0, 46.0, 30.0, 47.0, 55.0, 56.0, 48.0, 60.0, 62.0, 55.0, 58.0, 49.0, 47.0, 51.0, 33.0, 29.0, 32.0, 18.0, 25.0, 15.0, 13.0, 10.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.802183151245117, -14.299299240112305, -13.796415328979492, -13.29353141784668, -12.790647506713867, -12.287763595581055, -11.784880638122559, -11.281996726989746, -10.779112815856934, -10.276228904724121, -9.773344993591309, -9.270461082458496, -8.767578125, -8.264694213867188, -7.761810302734375, -7.2589263916015625, -6.75604248046875, -6.2531585693359375, -5.750274658203125, -5.247391223907471, -4.744507312774658, -4.241623401641846, -3.7387397289276123, -3.235856056213379, -2.7329721450805664, -2.230088233947754, -1.7272045612335205, -1.2243207693099976, -0.7214369773864746, -0.2185530662536621, 0.2843306064605713, 0.7872142791748047, 1.29010009765625, 1.792983889579773, 2.295867681503296, 2.7987513542175293, 3.301635265350342, 3.8045191764831543, 4.307402610778809, 4.810286521911621, 5.313170433044434, 5.816054344177246, 6.318938255310059, 6.821821689605713, 7.324705600738525, 7.827589511871338, 8.330472946166992, 8.833356857299805, 9.336240768432617, 9.83912467956543, 10.342008590698242, 10.844892501831055, 11.347776412963867, 11.85066032409668, 12.353543281555176, 12.856427192687988, 13.3593111038208, 13.862195014953613, 14.365078926086426, 14.867962837219238, 15.370845794677734, 15.873729705810547, 16.37661361694336, 16.879497528076172, 17.382381439208984]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 0.0, 6.0, 5.0, 9.0, 9.0, 15.0, 24.0, 47.0, 70.0, 130.0, 190.0, 298.0, 532.0, 945.0, 1740.0, 3162.0, 6097.0, 12525.0, 26576.0, 59283.0, 135082.0, 275526.0, 277093.0, 136126.0, 59832.0, 27211.0, 12598.0, 6323.0, 3127.0, 1728.0, 945.0, 535.0, 294.0, 180.0, 104.0, 59.0, 40.0, 36.0, 13.0, 8.0, 12.0, 9.0, 2.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.828125, -1.7691650390625, -1.710205078125, -1.6512451171875, -1.59228515625, -1.5333251953125, -1.474365234375, -1.4154052734375, -1.3564453125, -1.2974853515625, -1.238525390625, -1.1795654296875, -1.12060546875, -1.0616455078125, -1.002685546875, -0.9437255859375, -0.884765625, -0.8258056640625, -0.766845703125, -0.7078857421875, -0.64892578125, -0.5899658203125, -0.531005859375, -0.4720458984375, -0.4130859375, -0.3541259765625, -0.295166015625, -0.2362060546875, -0.17724609375, -0.1182861328125, -0.059326171875, -0.0003662109375, 0.05859375, 0.1175537109375, 0.176513671875, 0.2354736328125, 0.29443359375, 0.3533935546875, 0.412353515625, 0.4713134765625, 0.5302734375, 0.5892333984375, 0.648193359375, 0.7071533203125, 0.76611328125, 0.8250732421875, 0.884033203125, 0.9429931640625, 1.001953125, 1.0609130859375, 1.119873046875, 1.1788330078125, 1.23779296875, 1.2967529296875, 1.355712890625, 1.4146728515625, 1.4736328125, 1.5325927734375, 1.591552734375, 1.6505126953125, 1.70947265625, 1.7684326171875, 1.827392578125, 1.8863525390625, 1.9453125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 15.0, 19.0, 25.0, 28.0, 31.0, 40.0, 52.0, 55.0, 65.0, 83.0, 62.0, 71.0, 75.0, 70.0, 49.0, 61.0, 38.0, 31.0, 30.0, 25.0, 24.0, 22.0, 10.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.515625, -1.465087890625, -1.41455078125, -1.364013671875, -1.3134765625, -1.262939453125, -1.21240234375, -1.161865234375, -1.111328125, -1.060791015625, -1.01025390625, -0.959716796875, -0.9091796875, -0.858642578125, -0.80810546875, -0.757568359375, -0.70703125, -0.656494140625, -0.60595703125, -0.555419921875, -0.5048828125, -0.454345703125, -0.40380859375, -0.353271484375, -0.302734375, -0.252197265625, -0.20166015625, -0.151123046875, -0.1005859375, -0.050048828125, 0.00048828125, 0.051025390625, 0.1015625, 0.152099609375, 0.20263671875, 0.253173828125, 0.3037109375, 0.354248046875, 0.40478515625, 0.455322265625, 0.505859375, 0.556396484375, 0.60693359375, 0.657470703125, 0.7080078125, 0.758544921875, 0.80908203125, 0.859619140625, 0.91015625, 0.960693359375, 1.01123046875, 1.061767578125, 1.1123046875, 1.162841796875, 1.21337890625, 1.263916015625, 1.314453125, 1.364990234375, 1.41552734375, 1.466064453125, 1.5166015625, 1.567138671875, 1.61767578125, 1.668212890625, 1.71875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 7.0, 14.0, 13.0, 25.0, 13.0, 32.0, 54.0, 62.0, 117.0, 136.0, 238.0, 430.0, 743.0, 1473.0, 3575.0, 11269.0, 45617.0, 236241.0, 583365.0, 126492.0, 26365.0, 7127.0, 2532.0, 1137.0, 589.0, 302.0, 187.0, 120.0, 71.0, 55.0, 31.0, 26.0, 14.0, 15.0, 13.0, 13.0, 3.0, 7.0, 8.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.62109375, -3.505462646484375, -3.38983154296875, -3.274200439453125, -3.1585693359375, -3.042938232421875, -2.92730712890625, -2.811676025390625, -2.696044921875, -2.580413818359375, -2.46478271484375, -2.349151611328125, -2.2335205078125, -2.117889404296875, -2.00225830078125, -1.886627197265625, -1.77099609375, -1.655364990234375, -1.53973388671875, -1.424102783203125, -1.3084716796875, -1.192840576171875, -1.07720947265625, -0.961578369140625, -0.845947265625, -0.730316162109375, -0.61468505859375, -0.499053955078125, -0.3834228515625, -0.267791748046875, -0.15216064453125, -0.036529541015625, 0.0791015625, 0.194732666015625, 0.31036376953125, 0.425994873046875, 0.5416259765625, 0.657257080078125, 0.77288818359375, 0.888519287109375, 1.004150390625, 1.119781494140625, 1.23541259765625, 1.351043701171875, 1.4666748046875, 1.582305908203125, 1.69793701171875, 1.813568115234375, 1.92919921875, 2.044830322265625, 2.16046142578125, 2.276092529296875, 2.3917236328125, 2.507354736328125, 2.62298583984375, 2.738616943359375, 2.854248046875, 2.969879150390625, 3.08551025390625, 3.201141357421875, 3.3167724609375, 3.432403564453125, 3.54803466796875, 3.663665771484375, 3.779296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 4.0, 8.0, 13.0, 13.0, 16.0, 19.0, 23.0, 42.0, 25.0, 36.0, 44.0, 46.0, 52.0, 46.0, 52.0, 60.0, 52.0, 57.0, 53.0, 56.0, 40.0, 46.0, 39.0, 30.0, 27.0, 20.0, 12.0, 15.0, 13.0, 12.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8125, -4.646484375, -4.48046875, -4.314453125, -4.1484375, -3.982421875, -3.81640625, -3.650390625, -3.484375, -3.318359375, -3.15234375, -2.986328125, -2.8203125, -2.654296875, -2.48828125, -2.322265625, -2.15625, -1.990234375, -1.82421875, -1.658203125, -1.4921875, -1.326171875, -1.16015625, -0.994140625, -0.828125, -0.662109375, -0.49609375, -0.330078125, -0.1640625, 0.001953125, 0.16796875, 0.333984375, 0.5, 0.666015625, 0.83203125, 0.998046875, 1.1640625, 1.330078125, 1.49609375, 1.662109375, 1.828125, 1.994140625, 2.16015625, 2.326171875, 2.4921875, 2.658203125, 2.82421875, 2.990234375, 3.15625, 3.322265625, 3.48828125, 3.654296875, 3.8203125, 3.986328125, 4.15234375, 4.318359375, 4.484375, 4.650390625, 4.81640625, 4.982421875, 5.1484375, 5.314453125, 5.48046875, 5.646484375, 5.8125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 6.0, 9.0, 7.0, 6.0, 7.0, 28.0, 32.0, 42.0, 66.0, 128.0, 269.0, 565.0, 1528.0, 5034.0, 31448.0, 666628.0, 317664.0, 19111.0, 3725.0, 1185.0, 523.0, 210.0, 126.0, 72.0, 34.0, 32.0, 14.0, 11.0, 9.0, 8.0, 7.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94921875, -2.86468505859375, -2.7801513671875, -2.69561767578125, -2.611083984375, -2.52655029296875, -2.4420166015625, -2.35748291015625, -2.27294921875, -2.18841552734375, -2.1038818359375, -2.01934814453125, -1.934814453125, -1.85028076171875, -1.7657470703125, -1.68121337890625, -1.5966796875, -1.51214599609375, -1.4276123046875, -1.34307861328125, -1.258544921875, -1.17401123046875, -1.0894775390625, -1.00494384765625, -0.92041015625, -0.83587646484375, -0.7513427734375, -0.66680908203125, -0.582275390625, -0.49774169921875, -0.4132080078125, -0.32867431640625, -0.244140625, -0.15960693359375, -0.0750732421875, 0.00946044921875, 0.093994140625, 0.17852783203125, 0.2630615234375, 0.34759521484375, 0.43212890625, 0.51666259765625, 0.6011962890625, 0.68572998046875, 0.770263671875, 0.85479736328125, 0.9393310546875, 1.02386474609375, 1.1083984375, 1.19293212890625, 1.2774658203125, 1.36199951171875, 1.446533203125, 1.53106689453125, 1.6156005859375, 1.70013427734375, 1.78466796875, 1.86920166015625, 1.9537353515625, 2.03826904296875, 2.122802734375, 2.20733642578125, 2.2918701171875, 2.37640380859375, 2.4609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 5.0, 3.0, 6.0, 13.0, 20.0, 19.0, 17.0, 61.0, 59.0, 75.0, 92.0, 106.0, 117.0, 94.0, 78.0, 59.0, 40.0, 44.0, 18.0, 14.0, 13.0, 7.0, 5.0, 11.0, 3.0, 3.0, 8.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00039124488830566406, -0.0003782697021961212, -0.00036529451608657837, -0.0003523193299770355, -0.0003393441438674927, -0.00032636895775794983, -0.000313393771648407, -0.00030041858553886414, -0.0002874433994293213, -0.00027446821331977844, -0.0002614930272102356, -0.00024851784110069275, -0.0002355426549911499, -0.00022256746888160706, -0.0002095922827720642, -0.00019661709666252136, -0.00018364191055297852, -0.00017066672444343567, -0.00015769153833389282, -0.00014471635222434998, -0.00013174116611480713, -0.00011876598000526428, -0.00010579079389572144, -9.281560778617859e-05, -7.984042167663574e-05, -6.68652355670929e-05, -5.389004945755005e-05, -4.09148633480072e-05, -2.7939677238464355e-05, -1.4964491128921509e-05, -1.989305019378662e-06, 1.0985881090164185e-05, 2.396106719970703e-05, 3.693625330924988e-05, 4.9911439418792725e-05, 6.288662552833557e-05, 7.586181163787842e-05, 8.883699774742126e-05, 0.00010181218385696411, 0.00011478736996650696, 0.0001277625560760498, 0.00014073774218559265, 0.0001537129282951355, 0.00016668811440467834, 0.0001796633005142212, 0.00019263848662376404, 0.00020561367273330688, 0.00021858885884284973, 0.00023156404495239258, 0.0002445392310619354, 0.00025751441717147827, 0.0002704896032810211, 0.00028346478939056396, 0.0002964399755001068, 0.00030941516160964966, 0.0003223903477191925, 0.00033536553382873535, 0.0003483407199382782, 0.00036131590604782104, 0.0003742910921573639, 0.00038726627826690674, 0.0004002414643764496, 0.00041321665048599243, 0.0004261918365955353, 0.0004391670227050781]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 11.0, 16.0, 21.0, 30.0, 55.0, 75.0, 153.0, 271.0, 595.0, 1427.0, 4605.0, 24619.0, 282303.0, 668993.0, 54128.0, 7587.0, 2047.0, 814.0, 353.0, 162.0, 102.0, 67.0, 38.0, 22.0, 15.0, 11.0, 7.0, 6.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.115234375, -2.051483154296875, -1.98773193359375, -1.923980712890625, -1.8602294921875, -1.796478271484375, -1.73272705078125, -1.668975830078125, -1.605224609375, -1.541473388671875, -1.47772216796875, -1.413970947265625, -1.3502197265625, -1.286468505859375, -1.22271728515625, -1.158966064453125, -1.09521484375, -1.031463623046875, -0.96771240234375, -0.903961181640625, -0.8402099609375, -0.776458740234375, -0.71270751953125, -0.648956298828125, -0.585205078125, -0.521453857421875, -0.45770263671875, -0.393951416015625, -0.3302001953125, -0.266448974609375, -0.20269775390625, -0.138946533203125, -0.0751953125, -0.011444091796875, 0.05230712890625, 0.116058349609375, 0.1798095703125, 0.243560791015625, 0.30731201171875, 0.371063232421875, 0.434814453125, 0.498565673828125, 0.56231689453125, 0.626068115234375, 0.6898193359375, 0.753570556640625, 0.81732177734375, 0.881072998046875, 0.94482421875, 1.008575439453125, 1.07232666015625, 1.136077880859375, 1.1998291015625, 1.263580322265625, 1.32733154296875, 1.391082763671875, 1.454833984375, 1.518585205078125, 1.58233642578125, 1.646087646484375, 1.7098388671875, 1.773590087890625, 1.83734130859375, 1.901092529296875, 1.96484375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 4.0, 6.0, 6.0, 8.0, 21.0, 25.0, 26.0, 30.0, 37.0, 56.0, 61.0, 69.0, 79.0, 80.0, 88.0, 73.0, 80.0, 63.0, 45.0, 35.0, 26.0, 22.0, 18.0, 10.0, 13.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7666015625, -1.7126007080078125, -1.658599853515625, -1.6045989990234375, -1.55059814453125, -1.4965972900390625, -1.442596435546875, -1.3885955810546875, -1.3345947265625, -1.2805938720703125, -1.226593017578125, -1.1725921630859375, -1.11859130859375, -1.0645904541015625, -1.010589599609375, -0.9565887451171875, -0.902587890625, -0.8485870361328125, -0.794586181640625, -0.7405853271484375, -0.68658447265625, -0.6325836181640625, -0.578582763671875, -0.5245819091796875, -0.4705810546875, -0.4165802001953125, -0.362579345703125, -0.3085784912109375, -0.25457763671875, -0.2005767822265625, -0.146575927734375, -0.0925750732421875, -0.03857421875, 0.0154266357421875, 0.069427490234375, 0.1234283447265625, 0.17742919921875, 0.2314300537109375, 0.285430908203125, 0.3394317626953125, 0.3934326171875, 0.4474334716796875, 0.501434326171875, 0.5554351806640625, 0.60943603515625, 0.6634368896484375, 0.717437744140625, 0.7714385986328125, 0.825439453125, 0.8794403076171875, 0.933441162109375, 0.9874420166015625, 1.04144287109375, 1.0954437255859375, 1.149444580078125, 1.2034454345703125, 1.2574462890625, 1.3114471435546875, 1.365447998046875, 1.4194488525390625, 1.47344970703125, 1.5274505615234375, 1.581451416015625, 1.6354522705078125, 1.689453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 19.0, 45.0, 112.0, 216.0, 265.0, 172.0, 85.0, 35.0, 21.0, 6.0, 6.0, 5.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.83061981201172, -35.3729133605957, -33.91520690917969, -32.45750427246094, -30.999797821044922, -29.542091369628906, -28.084386825561523, -26.62668228149414, -25.168975830078125, -23.71126937866211, -22.253564834594727, -20.795860290527344, -19.338153839111328, -17.880447387695312, -16.42274284362793, -14.96503734588623, -13.507331848144531, -12.049626350402832, -10.591920852661133, -9.134215354919434, -7.676509857177734, -6.218804359436035, -4.761098861694336, -3.3033933639526367, -1.8456878662109375, -0.3879823684692383, 1.069723129272461, 2.52742862701416, 3.9851341247558594, 5.442839622497559, 6.900545120239258, 8.358250617980957, 9.815959930419922, 11.273665428161621, 12.73137092590332, 14.18907642364502, 15.646781921386719, 17.104488372802734, 18.562192916870117, 20.0198974609375, 21.477603912353516, 22.93531036376953, 24.393014907836914, 25.850719451904297, 27.308425903320312, 28.766132354736328, 30.22383689880371, 31.681541442871094, 33.13924789428711, 34.596954345703125, 36.054656982421875, 37.51236343383789, 38.970069885253906, 40.42777633666992, 41.88548278808594, 43.34318542480469, 44.8008918762207, 46.25859832763672, 47.71630096435547, 49.174007415771484, 50.6317138671875, 52.089420318603516, 53.54712677001953, 55.00482940673828, 56.4625358581543]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 6.0, 14.0, 14.0, 23.0, 30.0, 27.0, 32.0, 46.0, 43.0, 56.0, 50.0, 64.0, 79.0, 88.0, 75.0, 61.0, 52.0, 54.0, 33.0, 37.0, 30.0, 16.0, 14.0, 14.0, 10.0, 8.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.305660247802734, -35.44225311279297, -34.5788459777832, -33.71543502807617, -32.852027893066406, -31.98862075805664, -31.125213623046875, -30.261804580688477, -29.398395538330078, -28.534988403320312, -27.671579360961914, -26.80817222595215, -25.94476318359375, -25.081356048583984, -24.21794891357422, -23.35453987121582, -22.491132736206055, -21.62772560119629, -20.76431655883789, -19.900909423828125, -19.037500381469727, -18.17409324645996, -17.310684204101562, -16.447277069091797, -15.583868980407715, -14.720460891723633, -13.85705280303955, -12.993644714355469, -12.130237579345703, -11.266828536987305, -10.403421401977539, -9.540013313293457, -8.676603317260742, -7.81319522857666, -6.949787139892578, -6.086379528045654, -5.222971439361572, -4.35956335067749, -3.4961557388305664, -2.6327476501464844, -1.7693395614624023, -0.9059315919876099, -0.04252362251281738, 0.8208842277526855, 1.6842923164367676, 2.5477004051208496, 3.4111080169677734, 4.2745161056518555, 5.1379241943359375, 6.0013322830200195, 6.864740371704102, 7.728147983551025, 8.591556549072266, 9.454963684082031, 10.318371772766113, 11.181779861450195, 12.045187950134277, 12.90859603881836, 13.772004127502441, 14.635412216186523, 15.498819351196289, 16.362228393554688, 17.225635528564453, 18.08904266357422, 18.952451705932617]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 5.0, 12.0, 16.0, 16.0, 25.0, 47.0, 47.0, 106.0, 224.0, 413.0, 902.0, 2046.0, 5131.0, 14957.0, 56694.0, 404992.0, 2827975.0, 760279.0, 86581.0, 21477.0, 7269.0, 2852.0, 1193.0, 525.0, 240.0, 112.0, 58.0, 38.0, 8.0, 15.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2734375, -2.216064453125, -2.15869140625, -2.101318359375, -2.0439453125, -1.986572265625, -1.92919921875, -1.871826171875, -1.814453125, -1.757080078125, -1.69970703125, -1.642333984375, -1.5849609375, -1.527587890625, -1.47021484375, -1.412841796875, -1.35546875, -1.298095703125, -1.24072265625, -1.183349609375, -1.1259765625, -1.068603515625, -1.01123046875, -0.953857421875, -0.896484375, -0.839111328125, -0.78173828125, -0.724365234375, -0.6669921875, -0.609619140625, -0.55224609375, -0.494873046875, -0.4375, -0.380126953125, -0.32275390625, -0.265380859375, -0.2080078125, -0.150634765625, -0.09326171875, -0.035888671875, 0.021484375, 0.078857421875, 0.13623046875, 0.193603515625, 0.2509765625, 0.308349609375, 0.36572265625, 0.423095703125, 0.48046875, 0.537841796875, 0.59521484375, 0.652587890625, 0.7099609375, 0.767333984375, 0.82470703125, 0.882080078125, 0.939453125, 0.996826171875, 1.05419921875, 1.111572265625, 1.1689453125, 1.226318359375, 1.28369140625, 1.341064453125, 1.3984375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 9.0, 19.0, 23.0, 34.0, 34.0, 66.0, 59.0, 97.0, 85.0, 89.0, 93.0, 99.0, 77.0, 74.0, 49.0, 41.0, 22.0, 20.0, 11.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.11328125, -3.0492782592773438, -2.9852752685546875, -2.9212722778320312, -2.857269287109375, -2.7932662963867188, -2.7292633056640625, -2.6652603149414062, -2.60125732421875, -2.5372543334960938, -2.4732513427734375, -2.4092483520507812, -2.345245361328125, -2.2812423706054688, -2.2172393798828125, -2.1532363891601562, -2.0892333984375, -2.0252304077148438, -1.9612274169921875, -1.8972244262695312, -1.833221435546875, -1.7692184448242188, -1.7052154541015625, -1.6412124633789062, -1.57720947265625, -1.5132064819335938, -1.4492034912109375, -1.3852005004882812, -1.321197509765625, -1.2571945190429688, -1.1931915283203125, -1.1291885375976562, -1.065185546875, -1.0011825561523438, -0.9371795654296875, -0.8731765747070312, -0.809173583984375, -0.7451705932617188, -0.6811676025390625, -0.6171646118164062, -0.55316162109375, -0.48915863037109375, -0.4251556396484375, -0.36115264892578125, -0.297149658203125, -0.23314666748046875, -0.1691436767578125, -0.10514068603515625, -0.0411376953125, 0.02286529541015625, 0.0868682861328125, 0.15087127685546875, 0.214874267578125, 0.27887725830078125, 0.3428802490234375, 0.40688323974609375, 0.47088623046875, 0.5348892211914062, 0.5988922119140625, 0.6628952026367188, 0.726898193359375, 0.7909011840820312, 0.8549041748046875, 0.9189071655273438, 0.98291015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 17.0, 12.0, 20.0, 24.0, 28.0, 54.0, 92.0, 156.0, 272.0, 488.0, 1014.0, 2345.0, 6415.0, 20541.0, 94655.0, 1299692.0, 2568616.0, 153942.0, 30748.0, 9033.0, 3234.0, 1338.0, 645.0, 337.0, 205.0, 110.0, 60.0, 46.0, 39.0, 31.0, 14.0, 15.0, 6.0, 6.0, 10.0, 6.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.578125, -2.48956298828125, -2.4010009765625, -2.31243896484375, -2.223876953125, -2.13531494140625, -2.0467529296875, -1.95819091796875, -1.86962890625, -1.78106689453125, -1.6925048828125, -1.60394287109375, -1.515380859375, -1.42681884765625, -1.3382568359375, -1.24969482421875, -1.1611328125, -1.07257080078125, -0.9840087890625, -0.89544677734375, -0.806884765625, -0.71832275390625, -0.6297607421875, -0.54119873046875, -0.45263671875, -0.36407470703125, -0.2755126953125, -0.18695068359375, -0.098388671875, -0.00982666015625, 0.0787353515625, 0.16729736328125, 0.255859375, 0.34442138671875, 0.4329833984375, 0.52154541015625, 0.610107421875, 0.69866943359375, 0.7872314453125, 0.87579345703125, 0.96435546875, 1.05291748046875, 1.1414794921875, 1.23004150390625, 1.318603515625, 1.40716552734375, 1.4957275390625, 1.58428955078125, 1.6728515625, 1.76141357421875, 1.8499755859375, 1.93853759765625, 2.027099609375, 2.11566162109375, 2.2042236328125, 2.29278564453125, 2.38134765625, 2.46990966796875, 2.5584716796875, 2.64703369140625, 2.735595703125, 2.82415771484375, 2.9127197265625, 3.00128173828125, 3.08984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 2.0, 6.0, 5.0, 5.0, 8.0, 18.0, 20.0, 21.0, 34.0, 47.0, 64.0, 105.0, 206.0, 321.0, 553.0, 825.0, 678.0, 404.0, 246.0, 130.0, 97.0, 63.0, 61.0, 42.0, 25.0, 19.0, 17.0, 10.0, 11.0, 7.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.2421875, -3.14324951171875, -3.0443115234375, -2.94537353515625, -2.846435546875, -2.74749755859375, -2.6485595703125, -2.54962158203125, -2.45068359375, -2.35174560546875, -2.2528076171875, -2.15386962890625, -2.054931640625, -1.95599365234375, -1.8570556640625, -1.75811767578125, -1.6591796875, -1.56024169921875, -1.4613037109375, -1.36236572265625, -1.263427734375, -1.16448974609375, -1.0655517578125, -0.96661376953125, -0.86767578125, -0.76873779296875, -0.6697998046875, -0.57086181640625, -0.471923828125, -0.37298583984375, -0.2740478515625, -0.17510986328125, -0.076171875, 0.02276611328125, 0.1217041015625, 0.22064208984375, 0.319580078125, 0.41851806640625, 0.5174560546875, 0.61639404296875, 0.71533203125, 0.81427001953125, 0.9132080078125, 1.01214599609375, 1.111083984375, 1.21002197265625, 1.3089599609375, 1.40789794921875, 1.5068359375, 1.60577392578125, 1.7047119140625, 1.80364990234375, 1.902587890625, 2.00152587890625, 2.1004638671875, 2.19940185546875, 2.29833984375, 2.39727783203125, 2.4962158203125, 2.59515380859375, 2.694091796875, 2.79302978515625, 2.8919677734375, 2.99090576171875, 3.08984375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 17.0, 38.0, 90.0, 217.0, 273.0, 204.0, 87.0, 39.0, 16.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.38591766357422, -22.97064208984375, -21.55536651611328, -20.140090942382812, -18.724817276000977, -17.309541702270508, -15.894266128540039, -14.478991508483887, -13.063715934753418, -11.64844036102295, -10.233165740966797, -8.817890167236328, -7.402615070343018, -5.987339973449707, -4.572064399719238, -3.156789779663086, -1.7415142059326172, -0.3262389898300171, 1.089036226272583, 2.5043115615844727, 3.919586658477783, 5.334861755371094, 6.7501373291015625, 8.165411949157715, 9.580687522888184, 10.995963096618652, 12.411237716674805, 13.826513290405273, 15.241788864135742, 16.657062530517578, 18.072338104248047, 19.487613677978516, 20.902889251708984, 22.318164825439453, 23.733440399169922, 25.14871597290039, 26.563989639282227, 27.979265213012695, 29.394540786743164, 30.809814453125, 32.22509002685547, 33.64036560058594, 35.055641174316406, 36.470916748046875, 37.886192321777344, 39.30146789550781, 40.71674346923828, 42.132015228271484, 43.54729461669922, 44.96257019042969, 46.377845764160156, 47.793121337890625, 49.208396911621094, 50.62367248535156, 52.03894805908203, 53.454219818115234, 54.8694953918457, 56.28477096557617, 57.70004653930664, 59.11532211303711, 60.53059768676758, 61.94586944580078, 63.36114501953125, 64.77642059326172, 66.19169616699219]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 10.0, 8.0, 11.0, 12.0, 8.0, 21.0, 22.0, 25.0, 25.0, 32.0, 30.0, 26.0, 39.0, 46.0, 47.0, 43.0, 49.0, 47.0, 45.0, 63.0, 52.0, 41.0, 41.0, 30.0, 28.0, 24.0, 20.0, 30.0, 20.0, 21.0, 13.0, 21.0, 11.0, 6.0, 6.0, 10.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.254129409790039, -13.804848670959473, -13.355567932128906, -12.90628719329834, -12.457006454467773, -12.00772476196289, -11.558444023132324, -11.109163284301758, -10.659882545471191, -10.210601806640625, -9.761321067810059, -9.312040328979492, -8.86275863647461, -8.41347885131836, -7.964197158813477, -7.51491641998291, -7.065635681152344, -6.616354942321777, -6.167074203491211, -5.717792987823486, -5.26851224899292, -4.8192315101623535, -4.369950294494629, -3.9206695556640625, -3.471388816833496, -3.0221080780029297, -2.572827100753784, -2.1235461235046387, -1.6742653846740723, -1.2249846458435059, -0.7757036685943604, -0.32642269134521484, 0.12285804748535156, 0.5721389055252075, 1.0214197635650635, 1.4707006216049194, 1.9199814796447754, 2.369262218475342, 2.8185431957244873, 3.267824172973633, 3.717104911804199, 4.166385650634766, 4.615666389465332, 5.064947605133057, 5.514228343963623, 5.9635090827941895, 6.412790298461914, 6.8620710372924805, 7.311351776123047, 7.760632514953613, 8.20991325378418, 8.659193992614746, 9.108474731445312, 9.557756423950195, 10.007037162780762, 10.456317901611328, 10.905598640441895, 11.354879379272461, 11.804160118103027, 12.253440856933594, 12.702722549438477, 13.152002334594727, 13.60128402709961, 14.050564765930176, 14.499845504760742]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 10.0, 7.0, 12.0, 31.0, 28.0, 45.0, 71.0, 152.0, 261.0, 457.0, 965.0, 1932.0, 4115.0, 9190.0, 21442.0, 49233.0, 110050.0, 214552.0, 276413.0, 191381.0, 93646.0, 41402.0, 18134.0, 7990.0, 3547.0, 1696.0, 754.0, 443.0, 225.0, 142.0, 82.0, 44.0, 28.0, 30.0, 26.0, 10.0, 4.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8544921875, -1.8035430908203125, -1.752593994140625, -1.7016448974609375, -1.65069580078125, -1.5997467041015625, -1.548797607421875, -1.4978485107421875, -1.4468994140625, -1.3959503173828125, -1.345001220703125, -1.2940521240234375, -1.24310302734375, -1.1921539306640625, -1.141204833984375, -1.0902557373046875, -1.039306640625, -0.9883575439453125, -0.937408447265625, -0.8864593505859375, -0.83551025390625, -0.7845611572265625, -0.733612060546875, -0.6826629638671875, -0.6317138671875, -0.5807647705078125, -0.529815673828125, -0.4788665771484375, -0.42791748046875, -0.3769683837890625, -0.326019287109375, -0.2750701904296875, -0.22412109375, -0.1731719970703125, -0.122222900390625, -0.0712738037109375, -0.02032470703125, 0.0306243896484375, 0.081573486328125, 0.1325225830078125, 0.1834716796875, 0.2344207763671875, 0.285369873046875, 0.3363189697265625, 0.38726806640625, 0.4382171630859375, 0.489166259765625, 0.5401153564453125, 0.591064453125, 0.6420135498046875, 0.692962646484375, 0.7439117431640625, 0.79486083984375, 0.8458099365234375, 0.896759033203125, 0.9477081298828125, 0.9986572265625, 1.0496063232421875, 1.100555419921875, 1.1515045166015625, 1.20245361328125, 1.2534027099609375, 1.304351806640625, 1.3553009033203125, 1.40625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 4.0, 9.0, 18.0, 10.0, 14.0, 27.0, 30.0, 32.0, 37.0, 55.0, 55.0, 54.0, 65.0, 61.0, 51.0, 42.0, 58.0, 52.0, 47.0, 51.0, 46.0, 30.0, 32.0, 34.0, 27.0, 18.0, 10.0, 9.0, 9.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.7373046875, -1.6965789794921875, -1.655853271484375, -1.6151275634765625, -1.57440185546875, -1.5336761474609375, -1.492950439453125, -1.4522247314453125, -1.4114990234375, -1.3707733154296875, -1.330047607421875, -1.2893218994140625, -1.24859619140625, -1.2078704833984375, -1.167144775390625, -1.1264190673828125, -1.085693359375, -1.0449676513671875, -1.004241943359375, -0.9635162353515625, -0.92279052734375, -0.8820648193359375, -0.841339111328125, -0.8006134033203125, -0.7598876953125, -0.7191619873046875, -0.678436279296875, -0.6377105712890625, -0.59698486328125, -0.5562591552734375, -0.515533447265625, -0.4748077392578125, -0.43408203125, -0.3933563232421875, -0.352630615234375, -0.3119049072265625, -0.27117919921875, -0.2304534912109375, -0.189727783203125, -0.1490020751953125, -0.1082763671875, -0.0675506591796875, -0.026824951171875, 0.0139007568359375, 0.05462646484375, 0.0953521728515625, 0.136077880859375, 0.1768035888671875, 0.217529296875, 0.2582550048828125, 0.298980712890625, 0.3397064208984375, 0.38043212890625, 0.4211578369140625, 0.461883544921875, 0.5026092529296875, 0.5433349609375, 0.5840606689453125, 0.624786376953125, 0.6655120849609375, 0.70623779296875, 0.7469635009765625, 0.787689208984375, 0.8284149169921875, 0.869140625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 13.0, 20.0, 21.0, 30.0, 42.0, 53.0, 85.0, 124.0, 199.0, 270.0, 449.0, 775.0, 1290.0, 2792.0, 8073.0, 41757.0, 310263.0, 591143.0, 71719.0, 11867.0, 3512.0, 1586.0, 879.0, 534.0, 357.0, 224.0, 141.0, 111.0, 60.0, 43.0, 37.0, 24.0, 16.0, 11.0, 4.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.47265625, -4.355377197265625, -4.23809814453125, -4.120819091796875, -4.0035400390625, -3.886260986328125, -3.76898193359375, -3.651702880859375, -3.534423828125, -3.417144775390625, -3.29986572265625, -3.182586669921875, -3.0653076171875, -2.948028564453125, -2.83074951171875, -2.713470458984375, -2.59619140625, -2.478912353515625, -2.36163330078125, -2.244354248046875, -2.1270751953125, -2.009796142578125, -1.89251708984375, -1.775238037109375, -1.657958984375, -1.540679931640625, -1.42340087890625, -1.306121826171875, -1.1888427734375, -1.071563720703125, -0.95428466796875, -0.837005615234375, -0.7197265625, -0.602447509765625, -0.48516845703125, -0.367889404296875, -0.2506103515625, -0.133331298828125, -0.01605224609375, 0.101226806640625, 0.218505859375, 0.335784912109375, 0.45306396484375, 0.570343017578125, 0.6876220703125, 0.804901123046875, 0.92218017578125, 1.039459228515625, 1.15673828125, 1.274017333984375, 1.39129638671875, 1.508575439453125, 1.6258544921875, 1.743133544921875, 1.86041259765625, 1.977691650390625, 2.094970703125, 2.212249755859375, 2.32952880859375, 2.446807861328125, 2.5640869140625, 2.681365966796875, 2.79864501953125, 2.915924072265625, 3.033203125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 7.0, 4.0, 7.0, 11.0, 13.0, 26.0, 30.0, 35.0, 35.0, 37.0, 43.0, 52.0, 61.0, 67.0, 52.0, 87.0, 65.0, 61.0, 62.0, 45.0, 43.0, 31.0, 29.0, 25.0, 21.0, 24.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.54296875, -7.35833740234375, -7.1737060546875, -6.98907470703125, -6.804443359375, -6.61981201171875, -6.4351806640625, -6.25054931640625, -6.06591796875, -5.88128662109375, -5.6966552734375, -5.51202392578125, -5.327392578125, -5.14276123046875, -4.9581298828125, -4.77349853515625, -4.5888671875, -4.40423583984375, -4.2196044921875, -4.03497314453125, -3.850341796875, -3.66571044921875, -3.4810791015625, -3.29644775390625, -3.11181640625, -2.92718505859375, -2.7425537109375, -2.55792236328125, -2.373291015625, -2.18865966796875, -2.0040283203125, -1.81939697265625, -1.634765625, -1.45013427734375, -1.2655029296875, -1.08087158203125, -0.896240234375, -0.71160888671875, -0.5269775390625, -0.34234619140625, -0.15771484375, 0.02691650390625, 0.2115478515625, 0.39617919921875, 0.580810546875, 0.76544189453125, 0.9500732421875, 1.13470458984375, 1.3193359375, 1.50396728515625, 1.6885986328125, 1.87322998046875, 2.057861328125, 2.24249267578125, 2.4271240234375, 2.61175537109375, 2.79638671875, 2.98101806640625, 3.1656494140625, 3.35028076171875, 3.534912109375, 3.71954345703125, 3.9041748046875, 4.08880615234375, 4.2734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 16.0, 13.0, 31.0, 90.0, 168.0, 557.0, 2035.0, 19816.0, 876368.0, 142508.0, 5368.0, 1024.0, 313.0, 121.0, 52.0, 29.0, 15.0, 8.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.044921875, -2.957305908203125, -2.86968994140625, -2.782073974609375, -2.6944580078125, -2.606842041015625, -2.51922607421875, -2.431610107421875, -2.343994140625, -2.256378173828125, -2.16876220703125, -2.081146240234375, -1.9935302734375, -1.905914306640625, -1.81829833984375, -1.730682373046875, -1.64306640625, -1.555450439453125, -1.46783447265625, -1.380218505859375, -1.2926025390625, -1.204986572265625, -1.11737060546875, -1.029754638671875, -0.942138671875, -0.854522705078125, -0.76690673828125, -0.679290771484375, -0.5916748046875, -0.504058837890625, -0.41644287109375, -0.328826904296875, -0.2412109375, -0.153594970703125, -0.06597900390625, 0.021636962890625, 0.1092529296875, 0.196868896484375, 0.28448486328125, 0.372100830078125, 0.459716796875, 0.547332763671875, 0.63494873046875, 0.722564697265625, 0.8101806640625, 0.897796630859375, 0.98541259765625, 1.073028564453125, 1.16064453125, 1.248260498046875, 1.33587646484375, 1.423492431640625, 1.5111083984375, 1.598724365234375, 1.68634033203125, 1.773956298828125, 1.861572265625, 1.949188232421875, 2.03680419921875, 2.124420166015625, 2.2120361328125, 2.299652099609375, 2.38726806640625, 2.474884033203125, 2.5625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 3.0, 2.0, 3.0, 13.0, 13.0, 10.0, 21.0, 19.0, 22.0, 28.0, 31.0, 47.0, 54.0, 52.0, 85.0, 67.0, 83.0, 90.0, 60.0, 50.0, 43.0, 46.0, 39.0, 30.0, 19.0, 13.0, 15.0, 9.0, 7.0, 9.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021457672119140625, -0.00020572543144226074, -0.00019687414169311523, -0.00018802285194396973, -0.00017917156219482422, -0.0001703202724456787, -0.0001614689826965332, -0.0001526176929473877, -0.0001437664031982422, -0.00013491511344909668, -0.00012606382369995117, -0.00011721253395080566, -0.00010836124420166016, -9.950995445251465e-05, -9.065866470336914e-05, -8.180737495422363e-05, -7.295608520507812e-05, -6.410479545593262e-05, -5.525350570678711e-05, -4.64022159576416e-05, -3.7550926208496094e-05, -2.8699636459350586e-05, -1.9848346710205078e-05, -1.099705696105957e-05, -2.1457672119140625e-06, 6.705522537231445e-06, 1.5556812286376953e-05, 2.440810203552246e-05, 3.325939178466797e-05, 4.2110681533813477e-05, 5.0961971282958984e-05, 5.981326103210449e-05, 6.866455078125e-05, 7.751584053039551e-05, 8.636713027954102e-05, 9.521842002868652e-05, 0.00010406970977783203, 0.00011292099952697754, 0.00012177228927612305, 0.00013062357902526855, 0.00013947486877441406, 0.00014832615852355957, 0.00015717744827270508, 0.00016602873802185059, 0.0001748800277709961, 0.0001837313175201416, 0.0001925826072692871, 0.00020143389701843262, 0.00021028518676757812, 0.00021913647651672363, 0.00022798776626586914, 0.00023683905601501465, 0.00024569034576416016, 0.00025454163551330566, 0.00026339292526245117, 0.0002722442150115967, 0.0002810955047607422, 0.0002899467945098877, 0.0002987980842590332, 0.0003076493740081787, 0.0003165006637573242, 0.0003253519535064697, 0.00033420324325561523, 0.00034305453300476074, 0.00035190582275390625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 5.0, 9.0, 9.0, 11.0, 21.0, 24.0, 49.0, 70.0, 85.0, 182.0, 265.0, 424.0, 777.0, 1589.0, 3690.0, 11771.0, 57742.0, 528702.0, 374913.0, 50672.0, 10681.0, 3495.0, 1510.0, 725.0, 404.0, 241.0, 148.0, 93.0, 61.0, 51.0, 30.0, 33.0, 14.0, 16.0, 12.0, 6.0, 5.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.9940032958984375, -0.959686279296875, -0.9253692626953125, -0.89105224609375, -0.8567352294921875, -0.822418212890625, -0.7881011962890625, -0.7537841796875, -0.7194671630859375, -0.685150146484375, -0.6508331298828125, -0.61651611328125, -0.5821990966796875, -0.547882080078125, -0.5135650634765625, -0.479248046875, -0.4449310302734375, -0.410614013671875, -0.3762969970703125, -0.34197998046875, -0.3076629638671875, -0.273345947265625, -0.2390289306640625, -0.2047119140625, -0.1703948974609375, -0.136077880859375, -0.1017608642578125, -0.06744384765625, -0.0331268310546875, 0.001190185546875, 0.0355072021484375, 0.06982421875, 0.1041412353515625, 0.138458251953125, 0.1727752685546875, 0.20709228515625, 0.2414093017578125, 0.275726318359375, 0.3100433349609375, 0.3443603515625, 0.3786773681640625, 0.412994384765625, 0.4473114013671875, 0.48162841796875, 0.5159454345703125, 0.550262451171875, 0.5845794677734375, 0.618896484375, 0.6532135009765625, 0.687530517578125, 0.7218475341796875, 0.75616455078125, 0.7904815673828125, 0.824798583984375, 0.8591156005859375, 0.8934326171875, 0.9277496337890625, 0.962066650390625, 0.9963836669921875, 1.03070068359375, 1.0650177001953125, 1.099334716796875, 1.1336517333984375, 1.16796875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 2.0, 8.0, 6.0, 12.0, 8.0, 12.0, 20.0, 20.0, 26.0, 31.0, 43.0, 37.0, 52.0, 61.0, 58.0, 75.0, 66.0, 56.0, 59.0, 49.0, 49.0, 45.0, 43.0, 39.0, 21.0, 28.0, 15.0, 16.0, 10.0, 2.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91015625, -0.8780517578125, -0.845947265625, -0.8138427734375, -0.78173828125, -0.7496337890625, -0.717529296875, -0.6854248046875, -0.6533203125, -0.6212158203125, -0.589111328125, -0.5570068359375, -0.52490234375, -0.4927978515625, -0.460693359375, -0.4285888671875, -0.396484375, -0.3643798828125, -0.332275390625, -0.3001708984375, -0.26806640625, -0.2359619140625, -0.203857421875, -0.1717529296875, -0.1396484375, -0.1075439453125, -0.075439453125, -0.0433349609375, -0.01123046875, 0.0208740234375, 0.052978515625, 0.0850830078125, 0.1171875, 0.1492919921875, 0.181396484375, 0.2135009765625, 0.24560546875, 0.2777099609375, 0.309814453125, 0.3419189453125, 0.3740234375, 0.4061279296875, 0.438232421875, 0.4703369140625, 0.50244140625, 0.5345458984375, 0.566650390625, 0.5987548828125, 0.630859375, 0.6629638671875, 0.695068359375, 0.7271728515625, 0.75927734375, 0.7913818359375, 0.823486328125, 0.8555908203125, 0.8876953125, 0.9197998046875, 0.951904296875, 0.9840087890625, 1.01611328125, 1.0482177734375, 1.080322265625, 1.1124267578125, 1.14453125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 4.0, 4.0, 2.0, 7.0, 16.0, 36.0, 57.0, 87.0, 119.0, 222.0, 169.0, 121.0, 74.0, 40.0, 21.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.81401824951172, -31.917997360229492, -31.021976470947266, -30.12595558166504, -29.229934692382812, -28.333913803100586, -27.43789291381836, -26.541872024536133, -25.645851135253906, -24.74983024597168, -23.853809356689453, -22.957788467407227, -22.061767578125, -21.165746688842773, -20.269725799560547, -19.37370491027832, -18.477684020996094, -17.581663131713867, -16.68564224243164, -15.789621353149414, -14.893600463867188, -13.997579574584961, -13.101558685302734, -12.205537796020508, -11.309516906738281, -10.413496017456055, -9.517475128173828, -8.621454238891602, -7.725433349609375, -6.829412460327148, -5.933391571044922, -5.037370681762695, -4.141349792480469, -3.245328903198242, -2.3493080139160156, -1.453287124633789, -0.5572662353515625, 0.33875465393066406, 1.2347755432128906, 2.130796432495117, 3.0268173217773438, 3.9228382110595703, 4.818859100341797, 5.714879989624023, 6.61090087890625, 7.506921768188477, 8.402942657470703, 9.29896354675293, 10.194984436035156, 11.091005325317383, 11.98702621459961, 12.883047103881836, 13.779067993164062, 14.675088882446289, 15.571109771728516, 16.467130661010742, 17.36315155029297, 18.259172439575195, 19.155193328857422, 20.05121421813965, 20.947235107421875, 21.8432559967041, 22.739276885986328, 23.635297775268555, 24.53131866455078]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 7.0, 5.0, 8.0, 3.0, 12.0, 19.0, 25.0, 28.0, 22.0, 22.0, 28.0, 33.0, 37.0, 37.0, 43.0, 55.0, 63.0, 67.0, 64.0, 64.0, 46.0, 34.0, 36.0, 27.0, 26.0, 35.0, 19.0, 25.0, 14.0, 15.0, 16.0, 8.0, 10.0, 10.0, 6.0, 8.0, 3.0, 2.0, 4.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.392358779907227, -16.842315673828125, -16.292272567749023, -15.742228507995605, -15.192185401916504, -14.642142295837402, -14.092098236083984, -13.542055130004883, -12.992012023925781, -12.44196891784668, -11.891925811767578, -11.34188175201416, -10.791838645935059, -10.241795539855957, -9.691751480102539, -9.141708374023438, -8.591665267944336, -8.041622161865234, -7.491578578948975, -6.941534996032715, -6.391491889953613, -5.841448783874512, -5.291405200958252, -4.741361618041992, -4.191318511962891, -3.64127516746521, -3.0912318229675293, -2.5411884784698486, -1.991145133972168, -1.4411017894744873, -0.8910584449768066, -0.341015100479126, 0.20902633666992188, 0.7590696811676025, 1.3091130256652832, 1.8591563701629639, 2.4091997146606445, 2.959243059158325, 3.509286403656006, 4.059329986572266, 4.609373092651367, 5.159416198730469, 5.7094597816467285, 6.259503364562988, 6.80954647064209, 7.359589576721191, 7.909633159637451, 8.459676742553711, 9.009719848632812, 9.559762954711914, 10.109806060791016, 10.659850120544434, 11.209893226623535, 11.759936332702637, 12.309980392456055, 12.860023498535156, 13.410066604614258, 13.96010971069336, 14.510152816772461, 15.060196876525879, 15.61023998260498, 16.1602840423584, 16.7103271484375, 17.2603702545166, 17.810413360595703]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 5.0, 14.0, 19.0, 23.0, 24.0, 46.0, 60.0, 96.0, 179.0, 303.0, 519.0, 947.0, 1550.0, 2999.0, 5851.0, 11603.0, 26092.0, 67307.0, 224594.0, 862959.0, 1826528.0, 832502.0, 214093.0, 65896.0, 25592.0, 11738.0, 5784.0, 3055.0, 1640.0, 930.0, 580.0, 280.0, 178.0, 112.0, 67.0, 58.0, 19.0, 18.0, 7.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0693359375, -1.0408096313476562, -1.0122833251953125, -0.9837570190429688, -0.955230712890625, -0.9267044067382812, -0.8981781005859375, -0.8696517944335938, -0.84112548828125, -0.8125991821289062, -0.7840728759765625, -0.7555465698242188, -0.727020263671875, -0.6984939575195312, -0.6699676513671875, -0.6414413452148438, -0.6129150390625, -0.5843887329101562, -0.5558624267578125, -0.5273361206054688, -0.498809814453125, -0.47028350830078125, -0.4417572021484375, -0.41323089599609375, -0.38470458984375, -0.35617828369140625, -0.3276519775390625, -0.29912567138671875, -0.270599365234375, -0.24207305908203125, -0.2135467529296875, -0.18502044677734375, -0.156494140625, -0.12796783447265625, -0.0994415283203125, -0.07091522216796875, -0.042388916015625, -0.01386260986328125, 0.0146636962890625, 0.04319000244140625, 0.07171630859375, 0.10024261474609375, 0.1287689208984375, 0.15729522705078125, 0.185821533203125, 0.21434783935546875, 0.2428741455078125, 0.27140045166015625, 0.2999267578125, 0.32845306396484375, 0.3569793701171875, 0.38550567626953125, 0.414031982421875, 0.44255828857421875, 0.4710845947265625, 0.49961090087890625, 0.52813720703125, 0.5566635131835938, 0.5851898193359375, 0.6137161254882812, 0.642242431640625, 0.6707687377929688, 0.6992950439453125, 0.7278213500976562, 0.75634765625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 10.0, 7.0, 6.0, 8.0, 10.0, 11.0, 12.0, 12.0, 16.0, 15.0, 21.0, 29.0, 34.0, 38.0, 35.0, 38.0, 35.0, 40.0, 33.0, 49.0, 44.0, 41.0, 46.0, 30.0, 33.0, 45.0, 36.0, 38.0, 25.0, 30.0, 24.0, 16.0, 18.0, 9.0, 15.0, 15.0, 16.0, 10.0, 13.0, 10.0, 6.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.8359375, -0.81036376953125, -0.7847900390625, -0.75921630859375, -0.733642578125, -0.70806884765625, -0.6824951171875, -0.65692138671875, -0.63134765625, -0.60577392578125, -0.5802001953125, -0.55462646484375, -0.529052734375, -0.50347900390625, -0.4779052734375, -0.45233154296875, -0.4267578125, -0.40118408203125, -0.3756103515625, -0.35003662109375, -0.324462890625, -0.29888916015625, -0.2733154296875, -0.24774169921875, -0.22216796875, -0.19659423828125, -0.1710205078125, -0.14544677734375, -0.119873046875, -0.09429931640625, -0.0687255859375, -0.04315185546875, -0.017578125, 0.00799560546875, 0.0335693359375, 0.05914306640625, 0.084716796875, 0.11029052734375, 0.1358642578125, 0.16143798828125, 0.18701171875, 0.21258544921875, 0.2381591796875, 0.26373291015625, 0.289306640625, 0.31488037109375, 0.3404541015625, 0.36602783203125, 0.3916015625, 0.41717529296875, 0.4427490234375, 0.46832275390625, 0.493896484375, 0.51947021484375, 0.5450439453125, 0.57061767578125, 0.59619140625, 0.62176513671875, 0.6473388671875, 0.67291259765625, 0.698486328125, 0.72406005859375, 0.7496337890625, 0.77520751953125, 0.80078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 9.0, 6.0, 9.0, 15.0, 26.0, 22.0, 42.0, 38.0, 74.0, 116.0, 164.0, 327.0, 630.0, 1498.0, 4174.0, 13982.0, 58478.0, 435522.0, 3220498.0, 381593.0, 55331.0, 13750.0, 4434.0, 1747.0, 777.0, 414.0, 221.0, 133.0, 71.0, 60.0, 39.0, 26.0, 16.0, 10.0, 5.0, 9.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.39453125, -2.322998046875, -2.25146484375, -2.179931640625, -2.1083984375, -2.036865234375, -1.96533203125, -1.893798828125, -1.822265625, -1.750732421875, -1.67919921875, -1.607666015625, -1.5361328125, -1.464599609375, -1.39306640625, -1.321533203125, -1.25, -1.178466796875, -1.10693359375, -1.035400390625, -0.9638671875, -0.892333984375, -0.82080078125, -0.749267578125, -0.677734375, -0.606201171875, -0.53466796875, -0.463134765625, -0.3916015625, -0.320068359375, -0.24853515625, -0.177001953125, -0.10546875, -0.033935546875, 0.03759765625, 0.109130859375, 0.1806640625, 0.252197265625, 0.32373046875, 0.395263671875, 0.466796875, 0.538330078125, 0.60986328125, 0.681396484375, 0.7529296875, 0.824462890625, 0.89599609375, 0.967529296875, 1.0390625, 1.110595703125, 1.18212890625, 1.253662109375, 1.3251953125, 1.396728515625, 1.46826171875, 1.539794921875, 1.611328125, 1.682861328125, 1.75439453125, 1.825927734375, 1.8974609375, 1.968994140625, 2.04052734375, 2.112060546875, 2.18359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 9.0, 18.0, 15.0, 25.0, 29.0, 36.0, 51.0, 103.0, 138.0, 269.0, 486.0, 668.0, 768.0, 536.0, 357.0, 166.0, 116.0, 80.0, 55.0, 36.0, 23.0, 15.0, 17.0, 14.0, 8.0, 6.0, 3.0, 2.0, 6.0, 1.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.615234375, -2.5286865234375, -2.442138671875, -2.3555908203125, -2.26904296875, -2.1824951171875, -2.095947265625, -2.0093994140625, -1.9228515625, -1.8363037109375, -1.749755859375, -1.6632080078125, -1.57666015625, -1.4901123046875, -1.403564453125, -1.3170166015625, -1.23046875, -1.1439208984375, -1.057373046875, -0.9708251953125, -0.88427734375, -0.7977294921875, -0.711181640625, -0.6246337890625, -0.5380859375, -0.4515380859375, -0.364990234375, -0.2784423828125, -0.19189453125, -0.1053466796875, -0.018798828125, 0.0677490234375, 0.154296875, 0.2408447265625, 0.327392578125, 0.4139404296875, 0.50048828125, 0.5870361328125, 0.673583984375, 0.7601318359375, 0.8466796875, 0.9332275390625, 1.019775390625, 1.1063232421875, 1.19287109375, 1.2794189453125, 1.365966796875, 1.4525146484375, 1.5390625, 1.6256103515625, 1.712158203125, 1.7987060546875, 1.88525390625, 1.9718017578125, 2.058349609375, 2.1448974609375, 2.2314453125, 2.3179931640625, 2.404541015625, 2.4910888671875, 2.57763671875, 2.6641845703125, 2.750732421875, 2.8372802734375, 2.923828125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 11.0, 35.0, 74.0, 259.0, 284.0, 220.0, 57.0, 26.0, 20.0, 2.0, 7.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.636878967285156, -43.29689025878906, -41.9568977355957, -40.616905212402344, -39.27691650390625, -37.936927795410156, -36.5969352722168, -35.25694274902344, -33.916954040527344, -32.57696533203125, -31.23697280883789, -29.896982192993164, -28.556991577148438, -27.21700096130371, -25.877010345458984, -24.537019729614258, -23.19702911376953, -21.857038497924805, -20.517047882080078, -19.17705726623535, -17.837066650390625, -16.4970760345459, -15.157085418701172, -13.817094802856445, -12.477104187011719, -11.137113571166992, -9.797122955322266, -8.457132339477539, -7.1171417236328125, -5.777151107788086, -4.437160491943359, -3.097169876098633, -1.7571754455566406, -0.41718482971191406, 0.9228057861328125, 2.262796401977539, 3.6027870178222656, 4.942777633666992, 6.282768249511719, 7.622758865356445, 8.962749481201172, 10.302740097045898, 11.642730712890625, 12.982721328735352, 14.322711944580078, 15.662702560424805, 17.00269317626953, 18.342683792114258, 19.682674407958984, 21.02266502380371, 22.362655639648438, 23.702646255493164, 25.04263687133789, 26.382627487182617, 27.722618103027344, 29.06260871887207, 30.402599334716797, 31.742589950561523, 33.08258056640625, 34.422569274902344, 35.7625617980957, 37.10255432128906, 38.442543029785156, 39.78253173828125, 41.12252426147461]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 12.0, 10.0, 8.0, 8.0, 10.0, 13.0, 15.0, 18.0, 23.0, 27.0, 33.0, 38.0, 39.0, 55.0, 46.0, 54.0, 54.0, 64.0, 58.0, 58.0, 59.0, 46.0, 45.0, 40.0, 29.0, 29.0, 20.0, 21.0, 13.0, 10.0, 16.0, 7.0, 8.0, 2.0, 8.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.405157089233398, -10.970491409301758, -10.535825729370117, -10.101160049438477, -9.666494369506836, -9.231828689575195, -8.797163009643555, -8.362497329711914, -7.927831649780273, -7.493165969848633, -7.058500289916992, -6.623834609985352, -6.189168930053711, -5.75450325012207, -5.31983757019043, -4.885171890258789, -4.45050573348999, -4.01584005355835, -3.581174373626709, -3.1465086936950684, -2.7118430137634277, -2.277177095413208, -1.8425114154815674, -1.4078457355499268, -0.9731800556182861, -0.5385143756866455, -0.10384863615036011, 0.3308171033859253, 0.7654827833175659, 1.200148582458496, 1.6348142623901367, 2.0694799423217773, 2.504145622253418, 2.9388113021850586, 3.373476982116699, 3.80814266204834, 4.2428083419799805, 4.677474021911621, 5.112139701843262, 5.546805381774902, 5.981471061706543, 6.416136741638184, 6.850802421569824, 7.285468101501465, 7.7201337814331055, 8.154799461364746, 8.589465141296387, 9.024130821228027, 9.458797454833984, 9.893463134765625, 10.328128814697266, 10.762794494628906, 11.197460174560547, 11.632125854492188, 12.066791534423828, 12.501457214355469, 12.93612289428711, 13.37078857421875, 13.80545425415039, 14.240119934082031, 14.674785614013672, 15.109451293945312, 15.544116973876953, 15.978782653808594, 16.413448333740234]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 2.0, 6.0, 11.0, 17.0, 22.0, 41.0, 47.0, 86.0, 120.0, 200.0, 296.0, 450.0, 721.0, 1266.0, 2099.0, 3736.0, 6752.0, 12405.0, 23564.0, 44899.0, 85543.0, 155699.0, 230588.0, 208434.0, 126814.0, 67570.0, 35239.0, 18756.0, 9957.0, 5443.0, 3106.0, 1803.0, 1105.0, 606.0, 402.0, 261.0, 161.0, 105.0, 76.0, 44.0, 36.0, 20.0, 13.0, 8.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.3134765625, -1.2708587646484375, -1.228240966796875, -1.1856231689453125, -1.14300537109375, -1.1003875732421875, -1.057769775390625, -1.0151519775390625, -0.9725341796875, -0.9299163818359375, -0.887298583984375, -0.8446807861328125, -0.80206298828125, -0.7594451904296875, -0.716827392578125, -0.6742095947265625, -0.631591796875, -0.5889739990234375, -0.546356201171875, -0.5037384033203125, -0.46112060546875, -0.4185028076171875, -0.375885009765625, -0.3332672119140625, -0.2906494140625, -0.2480316162109375, -0.205413818359375, -0.1627960205078125, -0.12017822265625, -0.0775604248046875, -0.034942626953125, 0.0076751708984375, 0.05029296875, 0.0929107666015625, 0.135528564453125, 0.1781463623046875, 0.22076416015625, 0.2633819580078125, 0.305999755859375, 0.3486175537109375, 0.3912353515625, 0.4338531494140625, 0.476470947265625, 0.5190887451171875, 0.56170654296875, 0.6043243408203125, 0.646942138671875, 0.6895599365234375, 0.732177734375, 0.7747955322265625, 0.817413330078125, 0.8600311279296875, 0.90264892578125, 0.9452667236328125, 0.987884521484375, 1.0305023193359375, 1.0731201171875, 1.1157379150390625, 1.158355712890625, 1.2009735107421875, 1.24359130859375, 1.2862091064453125, 1.328826904296875, 1.3714447021484375, 1.4140625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 7.0, 8.0, 9.0, 21.0, 19.0, 15.0, 26.0, 42.0, 39.0, 61.0, 69.0, 48.0, 61.0, 70.0, 59.0, 66.0, 54.0, 49.0, 55.0, 47.0, 36.0, 30.0, 31.0, 30.0, 15.0, 17.0, 5.0, 9.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-1.875, -1.8325729370117188, -1.7901458740234375, -1.7477188110351562, -1.705291748046875, -1.6628646850585938, -1.6204376220703125, -1.5780105590820312, -1.53558349609375, -1.4931564331054688, -1.4507293701171875, -1.4083023071289062, -1.365875244140625, -1.3234481811523438, -1.2810211181640625, -1.2385940551757812, -1.1961669921875, -1.1537399291992188, -1.1113128662109375, -1.0688858032226562, -1.026458740234375, -0.9840316772460938, -0.9416046142578125, -0.8991775512695312, -0.85675048828125, -0.8143234252929688, -0.7718963623046875, -0.7294692993164062, -0.687042236328125, -0.6446151733398438, -0.6021881103515625, -0.5597610473632812, -0.517333984375, -0.47490692138671875, -0.4324798583984375, -0.39005279541015625, -0.347625732421875, -0.30519866943359375, -0.2627716064453125, -0.22034454345703125, -0.17791748046875, -0.13549041748046875, -0.0930633544921875, -0.05063629150390625, -0.008209228515625, 0.03421783447265625, 0.0766448974609375, 0.11907196044921875, 0.1614990234375, 0.20392608642578125, 0.2463531494140625, 0.28878021240234375, 0.331207275390625, 0.37363433837890625, 0.4160614013671875, 0.45848846435546875, 0.50091552734375, 0.5433425903320312, 0.5857696533203125, 0.6281967163085938, 0.670623779296875, 0.7130508422851562, 0.7554779052734375, 0.7979049682617188, 0.84033203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 6.0, 6.0, 13.0, 23.0, 38.0, 43.0, 69.0, 100.0, 152.0, 238.0, 347.0, 548.0, 983.0, 2066.0, 5989.0, 26861.0, 182314.0, 683409.0, 117714.0, 18917.0, 4567.0, 1736.0, 864.0, 547.0, 318.0, 202.0, 147.0, 111.0, 67.0, 37.0, 41.0, 27.0, 24.0, 14.0, 6.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.527923583984375, -4.40350341796875, -4.279083251953125, -4.1546630859375, -4.030242919921875, -3.90582275390625, -3.781402587890625, -3.656982421875, -3.532562255859375, -3.40814208984375, -3.283721923828125, -3.1593017578125, -3.034881591796875, -2.91046142578125, -2.786041259765625, -2.66162109375, -2.537200927734375, -2.41278076171875, -2.288360595703125, -2.1639404296875, -2.039520263671875, -1.91510009765625, -1.790679931640625, -1.666259765625, -1.541839599609375, -1.41741943359375, -1.292999267578125, -1.1685791015625, -1.044158935546875, -0.91973876953125, -0.795318603515625, -0.6708984375, -0.546478271484375, -0.42205810546875, -0.297637939453125, -0.1732177734375, -0.048797607421875, 0.07562255859375, 0.200042724609375, 0.324462890625, 0.448883056640625, 0.57330322265625, 0.697723388671875, 0.8221435546875, 0.946563720703125, 1.07098388671875, 1.195404052734375, 1.31982421875, 1.444244384765625, 1.56866455078125, 1.693084716796875, 1.8175048828125, 1.941925048828125, 2.06634521484375, 2.190765380859375, 2.315185546875, 2.439605712890625, 2.56402587890625, 2.688446044921875, 2.8128662109375, 2.937286376953125, 3.06170654296875, 3.186126708984375, 3.310546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 8.0, 9.0, 11.0, 8.0, 16.0, 24.0, 16.0, 31.0, 33.0, 35.0, 41.0, 37.0, 42.0, 43.0, 43.0, 62.0, 51.0, 58.0, 46.0, 43.0, 39.0, 34.0, 36.0, 36.0, 32.0, 23.0, 15.0, 22.0, 21.0, 11.0, 16.0, 15.0, 10.0, 7.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.75, -4.618988037109375, -4.48797607421875, -4.356964111328125, -4.2259521484375, -4.094940185546875, -3.96392822265625, -3.832916259765625, -3.701904296875, -3.570892333984375, -3.43988037109375, -3.308868408203125, -3.1778564453125, -3.046844482421875, -2.91583251953125, -2.784820556640625, -2.65380859375, -2.522796630859375, -2.39178466796875, -2.260772705078125, -2.1297607421875, -1.998748779296875, -1.86773681640625, -1.736724853515625, -1.605712890625, -1.474700927734375, -1.34368896484375, -1.212677001953125, -1.0816650390625, -0.950653076171875, -0.81964111328125, -0.688629150390625, -0.5576171875, -0.426605224609375, -0.29559326171875, -0.164581298828125, -0.0335693359375, 0.097442626953125, 0.22845458984375, 0.359466552734375, 0.490478515625, 0.621490478515625, 0.75250244140625, 0.883514404296875, 1.0145263671875, 1.145538330078125, 1.27655029296875, 1.407562255859375, 1.53857421875, 1.669586181640625, 1.80059814453125, 1.931610107421875, 2.0626220703125, 2.193634033203125, 2.32464599609375, 2.455657958984375, 2.586669921875, 2.717681884765625, 2.84869384765625, 2.979705810546875, 3.1107177734375, 3.241729736328125, 3.37274169921875, 3.503753662109375, 3.634765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 7.0, 12.0, 13.0, 14.0, 14.0, 36.0, 50.0, 91.0, 140.0, 234.0, 458.0, 993.0, 2229.0, 6090.0, 19832.0, 88664.0, 562350.0, 288725.0, 56948.0, 13766.0, 4508.0, 1714.0, 754.0, 366.0, 198.0, 125.0, 75.0, 38.0, 25.0, 24.0, 15.0, 17.0, 10.0, 10.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86962890625, -0.8346481323242188, -0.7996673583984375, -0.7646865844726562, -0.729705810546875, -0.6947250366210938, -0.6597442626953125, -0.6247634887695312, -0.58978271484375, -0.5548019409179688, -0.5198211669921875, -0.48484039306640625, -0.449859619140625, -0.41487884521484375, -0.3798980712890625, -0.34491729736328125, -0.3099365234375, -0.27495574951171875, -0.2399749755859375, -0.20499420166015625, -0.170013427734375, -0.13503265380859375, -0.1000518798828125, -0.06507110595703125, -0.03009033203125, 0.00489044189453125, 0.0398712158203125, 0.07485198974609375, 0.109832763671875, 0.14481353759765625, 0.1797943115234375, 0.21477508544921875, 0.249755859375, 0.28473663330078125, 0.3197174072265625, 0.35469818115234375, 0.389678955078125, 0.42465972900390625, 0.4596405029296875, 0.49462127685546875, 0.52960205078125, 0.5645828247070312, 0.5995635986328125, 0.6345443725585938, 0.669525146484375, 0.7045059204101562, 0.7394866943359375, 0.7744674682617188, 0.8094482421875, 0.8444290161132812, 0.8794097900390625, 0.9143905639648438, 0.949371337890625, 0.9843521118164062, 1.0193328857421875, 1.0543136596679688, 1.08929443359375, 1.1242752075195312, 1.1592559814453125, 1.1942367553710938, 1.229217529296875, 1.2641983032226562, 1.2991790771484375, 1.3341598510742188, 1.369140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 13.0, 9.0, 14.0, 12.0, 23.0, 23.0, 28.0, 47.0, 53.0, 77.0, 82.0, 89.0, 95.0, 77.0, 67.0, 44.0, 51.0, 46.0, 26.0, 29.0, 16.0, 23.0, 8.0, 7.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031495094299316406, -0.00030369311571121216, -0.00029243528842926025, -0.00028117746114730835, -0.00026991963386535645, -0.00025866180658340454, -0.00024740397930145264, -0.00023614615201950073, -0.00022488832473754883, -0.00021363049745559692, -0.00020237267017364502, -0.00019111484289169312, -0.0001798570156097412, -0.0001685991883277893, -0.0001573413610458374, -0.0001460835337638855, -0.0001348257064819336, -0.0001235678791999817, -0.00011231005191802979, -0.00010105222463607788, -8.979439735412598e-05, -7.853657007217407e-05, -6.727874279022217e-05, -5.6020915508270264e-05, -4.476308822631836e-05, -3.3505260944366455e-05, -2.224743366241455e-05, -1.0989606380462646e-05, 2.682209014892578e-07, 1.1526048183441162e-05, 2.2783875465393066e-05, 3.404170274734497e-05, 4.5299530029296875e-05, 5.655735731124878e-05, 6.781518459320068e-05, 7.907301187515259e-05, 9.033083915710449e-05, 0.0001015886664390564, 0.0001128464937210083, 0.0001241043210029602, 0.0001353621482849121, 0.00014661997556686401, 0.00015787780284881592, 0.00016913563013076782, 0.00018039345741271973, 0.00019165128469467163, 0.00020290911197662354, 0.00021416693925857544, 0.00022542476654052734, 0.00023668259382247925, 0.00024794042110443115, 0.00025919824838638306, 0.00027045607566833496, 0.00028171390295028687, 0.00029297173023223877, 0.0003042295575141907, 0.0003154873847961426, 0.0003267452120780945, 0.0003380030393600464, 0.0003492608666419983, 0.0003605186939239502, 0.0003717765212059021, 0.000383034348487854, 0.0003942921757698059, 0.0004055500030517578]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 6.0, 7.0, 17.0, 21.0, 26.0, 34.0, 45.0, 73.0, 146.0, 217.0, 444.0, 725.0, 1355.0, 3186.0, 8419.0, 30212.0, 150035.0, 621420.0, 180160.0, 35455.0, 9616.0, 3558.0, 1555.0, 745.0, 416.0, 249.0, 135.0, 88.0, 63.0, 31.0, 19.0, 18.0, 10.0, 16.0, 10.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.0302734375, -0.998626708984375, -0.96697998046875, -0.935333251953125, -0.9036865234375, -0.872039794921875, -0.84039306640625, -0.808746337890625, -0.777099609375, -0.745452880859375, -0.71380615234375, -0.682159423828125, -0.6505126953125, -0.618865966796875, -0.58721923828125, -0.555572509765625, -0.52392578125, -0.492279052734375, -0.46063232421875, -0.428985595703125, -0.3973388671875, -0.365692138671875, -0.33404541015625, -0.302398681640625, -0.270751953125, -0.239105224609375, -0.20745849609375, -0.175811767578125, -0.1441650390625, -0.112518310546875, -0.08087158203125, -0.049224853515625, -0.017578125, 0.014068603515625, 0.04571533203125, 0.077362060546875, 0.1090087890625, 0.140655517578125, 0.17230224609375, 0.203948974609375, 0.235595703125, 0.267242431640625, 0.29888916015625, 0.330535888671875, 0.3621826171875, 0.393829345703125, 0.42547607421875, 0.457122802734375, 0.48876953125, 0.520416259765625, 0.55206298828125, 0.583709716796875, 0.6153564453125, 0.647003173828125, 0.67864990234375, 0.710296630859375, 0.741943359375, 0.773590087890625, 0.80523681640625, 0.836883544921875, 0.8685302734375, 0.900177001953125, 0.93182373046875, 0.963470458984375, 0.9951171875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 10.0, 12.0, 15.0, 34.0, 46.0, 64.0, 63.0, 92.0, 108.0, 109.0, 101.0, 78.0, 79.0, 57.0, 39.0, 31.0, 21.0, 16.0, 12.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.58203125, -1.533416748046875, -1.48480224609375, -1.436187744140625, -1.3875732421875, -1.338958740234375, -1.29034423828125, -1.241729736328125, -1.193115234375, -1.144500732421875, -1.09588623046875, -1.047271728515625, -0.9986572265625, -0.950042724609375, -0.90142822265625, -0.852813720703125, -0.80419921875, -0.755584716796875, -0.70697021484375, -0.658355712890625, -0.6097412109375, -0.561126708984375, -0.51251220703125, -0.463897705078125, -0.415283203125, -0.366668701171875, -0.31805419921875, -0.269439697265625, -0.2208251953125, -0.172210693359375, -0.12359619140625, -0.074981689453125, -0.0263671875, 0.022247314453125, 0.07086181640625, 0.119476318359375, 0.1680908203125, 0.216705322265625, 0.26531982421875, 0.313934326171875, 0.362548828125, 0.411163330078125, 0.45977783203125, 0.508392333984375, 0.5570068359375, 0.605621337890625, 0.65423583984375, 0.702850341796875, 0.75146484375, 0.800079345703125, 0.84869384765625, 0.897308349609375, 0.9459228515625, 0.994537353515625, 1.04315185546875, 1.091766357421875, 1.140380859375, 1.188995361328125, 1.23760986328125, 1.286224365234375, 1.3348388671875, 1.383453369140625, 1.43206787109375, 1.480682373046875, 1.529296875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 10.0, 42.0, 178.0, 431.0, 220.0, 77.0, 23.0, 10.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.16886138916016, -67.41625213623047, -65.66364288330078, -63.91102981567383, -62.15842056274414, -60.40580749511719, -58.6531982421875, -56.90058898925781, -55.147979736328125, -53.39537048339844, -51.642757415771484, -49.8901481628418, -48.13753890991211, -46.384925842285156, -44.63231658935547, -42.87970733642578, -41.12709426879883, -39.37448501586914, -37.62187194824219, -35.8692626953125, -34.11665344238281, -32.364044189453125, -30.611431121826172, -28.858821868896484, -27.106210708618164, -25.353599548339844, -23.600990295410156, -21.848379135131836, -20.095767974853516, -18.343158721923828, -16.590547561645508, -14.837937355041504, -13.0853271484375, -11.332716941833496, -9.580106735229492, -7.827495574951172, -6.074885368347168, -4.322275161743164, -2.5696640014648438, -0.8170537948608398, 0.9355564117431641, 2.688166856765747, 4.44077730178833, 6.193387985229492, 7.945998191833496, 9.6986083984375, 11.45121955871582, 13.203829765319824, 14.956439971923828, 16.70905113220215, 18.461660385131836, 20.214271545410156, 21.966880798339844, 23.719491958618164, 25.472103118896484, 27.224712371826172, 28.977323532104492, 30.729934692382812, 32.4825439453125, 34.23515319824219, 35.98776626586914, 37.74037551879883, 39.49298858642578, 41.24559783935547, 42.998207092285156]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 2.0, 3.0, 5.0, 10.0, 8.0, 8.0, 10.0, 10.0, 7.0, 17.0, 19.0, 18.0, 33.0, 28.0, 25.0, 27.0, 35.0, 37.0, 38.0, 58.0, 66.0, 75.0, 67.0, 52.0, 41.0, 38.0, 37.0, 31.0, 35.0, 24.0, 22.0, 16.0, 17.0, 13.0, 9.0, 9.0, 8.0, 7.0, 7.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-16.460195541381836, -15.962446212768555, -15.46469783782959, -14.966948509216309, -14.469200134277344, -13.971450805664062, -13.473701477050781, -12.975953102111816, -12.478204727172852, -11.98045539855957, -11.482707023620605, -10.984957695007324, -10.48720932006836, -9.989459991455078, -9.491710662841797, -8.993962287902832, -8.49621295928955, -7.998464107513428, -7.500715255737305, -7.002965927124023, -6.505217552185059, -6.007468223571777, -5.509719371795654, -5.011970520019531, -4.514221668243408, -4.016472816467285, -3.518723964691162, -3.02097487449646, -2.523226022720337, -2.025477170944214, -1.5277280807495117, -1.0299792289733887, -0.5322303771972656, -0.0344814658164978, 0.46326744556427, 0.9610164165496826, 1.4587652683258057, 1.9565141201019287, 2.454263210296631, 2.952012062072754, 3.449760913848877, 3.947509765625, 4.445258617401123, 4.943007469177246, 5.440756797790527, 5.938505172729492, 6.436254501342773, 6.9340033531188965, 7.4317522048950195, 7.929501056671143, 8.427249908447266, 8.924999237060547, 9.422747611999512, 9.920496940612793, 10.418245315551758, 10.915994644165039, 11.41374397277832, 11.911493301391602, 12.409241676330566, 12.906991004943848, 13.404739379882812, 13.902488708496094, 14.400238037109375, 14.89798641204834, 15.395734786987305]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 8.0, 6.0, 10.0, 17.0, 22.0, 27.0, 39.0, 64.0, 67.0, 119.0, 181.0, 291.0, 538.0, 1126.0, 2732.0, 7454.0, 27860.0, 167471.0, 1375864.0, 2209801.0, 334879.0, 47436.0, 11390.0, 3616.0, 1487.0, 721.0, 386.0, 210.0, 112.0, 103.0, 53.0, 37.0, 37.0, 26.0, 25.0, 21.0, 12.0, 11.0, 3.0, 8.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.396484375, -1.350189208984375, -1.30389404296875, -1.257598876953125, -1.2113037109375, -1.165008544921875, -1.11871337890625, -1.072418212890625, -1.026123046875, -0.979827880859375, -0.93353271484375, -0.887237548828125, -0.8409423828125, -0.794647216796875, -0.74835205078125, -0.702056884765625, -0.65576171875, -0.609466552734375, -0.56317138671875, -0.516876220703125, -0.4705810546875, -0.424285888671875, -0.37799072265625, -0.331695556640625, -0.285400390625, -0.239105224609375, -0.19281005859375, -0.146514892578125, -0.1002197265625, -0.053924560546875, -0.00762939453125, 0.038665771484375, 0.0849609375, 0.131256103515625, 0.17755126953125, 0.223846435546875, 0.2701416015625, 0.316436767578125, 0.36273193359375, 0.409027099609375, 0.455322265625, 0.501617431640625, 0.54791259765625, 0.594207763671875, 0.6405029296875, 0.686798095703125, 0.73309326171875, 0.779388427734375, 0.82568359375, 0.871978759765625, 0.91827392578125, 0.964569091796875, 1.0108642578125, 1.057159423828125, 1.10345458984375, 1.149749755859375, 1.196044921875, 1.242340087890625, 1.28863525390625, 1.334930419921875, 1.3812255859375, 1.427520751953125, 1.47381591796875, 1.520111083984375, 1.56640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 6.0, 5.0, 8.0, 9.0, 10.0, 11.0, 11.0, 19.0, 26.0, 31.0, 26.0, 35.0, 33.0, 39.0, 40.0, 40.0, 37.0, 45.0, 52.0, 43.0, 46.0, 42.0, 39.0, 33.0, 43.0, 44.0, 39.0, 28.0, 24.0, 19.0, 16.0, 22.0, 19.0, 12.0, 11.0, 9.0, 5.0, 7.0, 2.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.978515625, -0.95013427734375, -0.9217529296875, -0.89337158203125, -0.864990234375, -0.83660888671875, -0.8082275390625, -0.77984619140625, -0.75146484375, -0.72308349609375, -0.6947021484375, -0.66632080078125, -0.637939453125, -0.60955810546875, -0.5811767578125, -0.55279541015625, -0.5244140625, -0.49603271484375, -0.4676513671875, -0.43927001953125, -0.410888671875, -0.38250732421875, -0.3541259765625, -0.32574462890625, -0.29736328125, -0.26898193359375, -0.2406005859375, -0.21221923828125, -0.183837890625, -0.15545654296875, -0.1270751953125, -0.09869384765625, -0.0703125, -0.04193115234375, -0.0135498046875, 0.01483154296875, 0.043212890625, 0.07159423828125, 0.0999755859375, 0.12835693359375, 0.15673828125, 0.18511962890625, 0.2135009765625, 0.24188232421875, 0.270263671875, 0.29864501953125, 0.3270263671875, 0.35540771484375, 0.3837890625, 0.41217041015625, 0.4405517578125, 0.46893310546875, 0.497314453125, 0.52569580078125, 0.5540771484375, 0.58245849609375, 0.61083984375, 0.63922119140625, 0.6676025390625, 0.69598388671875, 0.724365234375, 0.75274658203125, 0.7811279296875, 0.80950927734375, 0.837890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 17.0, 34.0, 81.0, 115.0, 283.0, 670.0, 2470.0, 22823.0, 3594306.0, 561182.0, 9383.0, 1703.0, 633.0, 279.0, 126.0, 77.0, 44.0, 18.0, 11.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4609375, -6.27001953125, -6.0791015625, -5.88818359375, -5.697265625, -5.50634765625, -5.3154296875, -5.12451171875, -4.93359375, -4.74267578125, -4.5517578125, -4.36083984375, -4.169921875, -3.97900390625, -3.7880859375, -3.59716796875, -3.40625, -3.21533203125, -3.0244140625, -2.83349609375, -2.642578125, -2.45166015625, -2.2607421875, -2.06982421875, -1.87890625, -1.68798828125, -1.4970703125, -1.30615234375, -1.115234375, -0.92431640625, -0.7333984375, -0.54248046875, -0.3515625, -0.16064453125, 0.0302734375, 0.22119140625, 0.412109375, 0.60302734375, 0.7939453125, 0.98486328125, 1.17578125, 1.36669921875, 1.5576171875, 1.74853515625, 1.939453125, 2.13037109375, 2.3212890625, 2.51220703125, 2.703125, 2.89404296875, 3.0849609375, 3.27587890625, 3.466796875, 3.65771484375, 3.8486328125, 4.03955078125, 4.23046875, 4.42138671875, 4.6123046875, 4.80322265625, 4.994140625, 5.18505859375, 5.3759765625, 5.56689453125, 5.7578125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 9.0, 10.0, 16.0, 34.0, 50.0, 98.0, 218.0, 524.0, 1061.0, 1029.0, 544.0, 225.0, 111.0, 59.0, 31.0, 13.0, 11.0, 9.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.06640625, -2.93280029296875, -2.7991943359375, -2.66558837890625, -2.531982421875, -2.39837646484375, -2.2647705078125, -2.13116455078125, -1.99755859375, -1.86395263671875, -1.7303466796875, -1.59674072265625, -1.463134765625, -1.32952880859375, -1.1959228515625, -1.06231689453125, -0.9287109375, -0.79510498046875, -0.6614990234375, -0.52789306640625, -0.394287109375, -0.26068115234375, -0.1270751953125, 0.00653076171875, 0.14013671875, 0.27374267578125, 0.4073486328125, 0.54095458984375, 0.674560546875, 0.80816650390625, 0.9417724609375, 1.07537841796875, 1.208984375, 1.34259033203125, 1.4761962890625, 1.60980224609375, 1.743408203125, 1.87701416015625, 2.0106201171875, 2.14422607421875, 2.27783203125, 2.41143798828125, 2.5450439453125, 2.67864990234375, 2.812255859375, 2.94586181640625, 3.0794677734375, 3.21307373046875, 3.3466796875, 3.48028564453125, 3.6138916015625, 3.74749755859375, 3.881103515625, 4.01470947265625, 4.1483154296875, 4.28192138671875, 4.41552734375, 4.54913330078125, 4.6827392578125, 4.81634521484375, 4.949951171875, 5.08355712890625, 5.2171630859375, 5.35076904296875, 5.484375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 12.0, 45.0, 103.0, 221.0, 259.0, 200.0, 87.0, 34.0, 13.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.412261962890625, -32.137489318847656, -30.862712860107422, -29.58793830871582, -28.31316375732422, -27.03839111328125, -25.76361656188965, -24.488842010498047, -23.214067459106445, -21.939292907714844, -20.664518356323242, -19.38974380493164, -18.114971160888672, -16.840194702148438, -15.565422058105469, -14.290647506713867, -13.015872955322266, -11.741098403930664, -10.466323852539062, -9.191550254821777, -7.916775703430176, -6.642001152038574, -5.367227077484131, -4.0924530029296875, -2.817678451538086, -1.5429041385650635, -0.268129825592041, 1.0066444873809814, 2.281418800354004, 3.5561933517456055, 4.830967426300049, 6.105741500854492, 7.380516052246094, 8.655290603637695, 9.930065155029297, 11.204838752746582, 12.479613304138184, 13.754387855529785, 15.02916145324707, 16.303936004638672, 17.578710556030273, 18.853485107421875, 20.128259658813477, 21.403034210205078, 22.677806854248047, 23.95258331298828, 25.22735595703125, 26.50213050842285, 27.776905059814453, 29.051679611206055, 30.326454162597656, 31.601228713989258, 32.87600326538086, 34.15077590942383, 35.42555236816406, 36.70032501220703, 37.97509765625, 39.24987030029297, 40.5246467590332, 41.79941940307617, 43.074195861816406, 44.348968505859375, 45.62374496459961, 46.89851760864258, 48.17329406738281]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 4.0, 10.0, 6.0, 8.0, 17.0, 16.0, 15.0, 28.0, 44.0, 38.0, 39.0, 34.0, 49.0, 44.0, 59.0, 49.0, 51.0, 62.0, 53.0, 36.0, 37.0, 38.0, 37.0, 28.0, 31.0, 33.0, 30.0, 28.0, 12.0, 14.0, 8.0, 7.0, 11.0, 6.0, 7.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0], "bins": [-19.158945083618164, -18.691299438476562, -18.223655700683594, -17.756010055541992, -17.28836441040039, -16.820720672607422, -16.35307502746582, -15.885429382324219, -15.417784690856934, -14.950139999389648, -14.482494354248047, -14.014849662780762, -13.54720401763916, -13.079559326171875, -12.611913681030273, -12.144268989562988, -11.676624298095703, -11.208979606628418, -10.741333961486816, -10.273689270019531, -9.80604362487793, -9.338398933410645, -8.87075424194336, -8.403108596801758, -7.935462951660156, -7.467817783355713, -7.0001726150512695, -6.532527923583984, -6.064882755279541, -5.597237586975098, -5.129592418670654, -4.661947250366211, -4.194302558898926, -3.7266573905944824, -3.259012460708618, -2.791367292404175, -2.3237223625183105, -1.8560771942138672, -1.3884320259094238, -0.9207870960235596, -0.4531419277191162, 0.014503151178359985, 0.4821482300758362, 0.9497933387756348, 1.4174383878707886, 1.8850834369659424, 2.3527286052703857, 2.82037353515625, 3.2880187034606934, 3.7556638717651367, 4.22330904006958, 4.690954208374023, 5.158598899841309, 5.626244068145752, 6.093889236450195, 6.5615339279174805, 7.029179573059082, 7.496824741363525, 7.964469909667969, 8.432114601135254, 8.899760246276855, 9.36740493774414, 9.835050582885742, 10.302695274353027, 10.770339965820312]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 4.0, 11.0, 17.0, 30.0, 49.0, 66.0, 106.0, 178.0, 272.0, 429.0, 700.0, 1180.0, 2054.0, 3451.0, 6181.0, 11094.0, 20851.0, 40623.0, 77849.0, 139837.0, 209286.0, 212577.0, 146584.0, 82073.0, 43111.0, 22495.0, 12027.0, 6441.0, 3629.0, 2088.0, 1279.0, 765.0, 440.0, 289.0, 190.0, 104.0, 69.0, 44.0, 34.0, 15.0, 9.0, 12.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.3310546875, -1.2930755615234375, -1.255096435546875, -1.2171173095703125, -1.17913818359375, -1.1411590576171875, -1.103179931640625, -1.0652008056640625, -1.0272216796875, -0.9892425537109375, -0.951263427734375, -0.9132843017578125, -0.87530517578125, -0.8373260498046875, -0.799346923828125, -0.7613677978515625, -0.723388671875, -0.6854095458984375, -0.647430419921875, -0.6094512939453125, -0.57147216796875, -0.5334930419921875, -0.495513916015625, -0.4575347900390625, -0.4195556640625, -0.3815765380859375, -0.343597412109375, -0.3056182861328125, -0.26763916015625, -0.2296600341796875, -0.191680908203125, -0.1537017822265625, -0.11572265625, -0.0777435302734375, -0.039764404296875, -0.0017852783203125, 0.03619384765625, 0.0741729736328125, 0.112152099609375, 0.1501312255859375, 0.1881103515625, 0.2260894775390625, 0.264068603515625, 0.3020477294921875, 0.34002685546875, 0.3780059814453125, 0.415985107421875, 0.4539642333984375, 0.491943359375, 0.5299224853515625, 0.567901611328125, 0.6058807373046875, 0.64385986328125, 0.6818389892578125, 0.719818115234375, 0.7577972412109375, 0.7957763671875, 0.8337554931640625, 0.871734619140625, 0.9097137451171875, 0.94769287109375, 0.9856719970703125, 1.023651123046875, 1.0616302490234375, 1.099609375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 9.0, 9.0, 12.0, 18.0, 13.0, 18.0, 21.0, 20.0, 32.0, 20.0, 23.0, 39.0, 25.0, 39.0, 33.0, 39.0, 37.0, 46.0, 42.0, 51.0, 44.0, 41.0, 42.0, 34.0, 36.0, 32.0, 25.0, 30.0, 21.0, 23.0, 15.0, 18.0, 12.0, 7.0, 15.0, 11.0, 9.0, 5.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.875, -0.8453826904296875, -0.815765380859375, -0.7861480712890625, -0.75653076171875, -0.7269134521484375, -0.697296142578125, -0.6676788330078125, -0.6380615234375, -0.6084442138671875, -0.578826904296875, -0.5492095947265625, -0.51959228515625, -0.4899749755859375, -0.460357666015625, -0.4307403564453125, -0.401123046875, -0.3715057373046875, -0.341888427734375, -0.3122711181640625, -0.28265380859375, -0.2530364990234375, -0.223419189453125, -0.1938018798828125, -0.1641845703125, -0.1345672607421875, -0.104949951171875, -0.0753326416015625, -0.04571533203125, -0.0160980224609375, 0.013519287109375, 0.0431365966796875, 0.07275390625, 0.1023712158203125, 0.131988525390625, 0.1616058349609375, 0.19122314453125, 0.2208404541015625, 0.250457763671875, 0.2800750732421875, 0.3096923828125, 0.3393096923828125, 0.368927001953125, 0.3985443115234375, 0.42816162109375, 0.4577789306640625, 0.487396240234375, 0.5170135498046875, 0.546630859375, 0.5762481689453125, 0.605865478515625, 0.6354827880859375, 0.66510009765625, 0.6947174072265625, 0.724334716796875, 0.7539520263671875, 0.7835693359375, 0.8131866455078125, 0.842803955078125, 0.8724212646484375, 0.90203857421875, 0.9316558837890625, 0.961273193359375, 0.9908905029296875, 1.0205078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 8.0, 6.0, 13.0, 17.0, 20.0, 26.0, 50.0, 66.0, 98.0, 162.0, 250.0, 542.0, 1159.0, 2776.0, 8227.0, 30427.0, 142338.0, 600271.0, 201791.0, 43146.0, 10742.0, 3499.0, 1400.0, 653.0, 359.0, 157.0, 103.0, 68.0, 47.0, 27.0, 28.0, 20.0, 16.0, 10.0, 9.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.31640625, -3.225830078125, -3.13525390625, -3.044677734375, -2.9541015625, -2.863525390625, -2.77294921875, -2.682373046875, -2.591796875, -2.501220703125, -2.41064453125, -2.320068359375, -2.2294921875, -2.138916015625, -2.04833984375, -1.957763671875, -1.8671875, -1.776611328125, -1.68603515625, -1.595458984375, -1.5048828125, -1.414306640625, -1.32373046875, -1.233154296875, -1.142578125, -1.052001953125, -0.96142578125, -0.870849609375, -0.7802734375, -0.689697265625, -0.59912109375, -0.508544921875, -0.41796875, -0.327392578125, -0.23681640625, -0.146240234375, -0.0556640625, 0.034912109375, 0.12548828125, 0.216064453125, 0.306640625, 0.397216796875, 0.48779296875, 0.578369140625, 0.6689453125, 0.759521484375, 0.85009765625, 0.940673828125, 1.03125, 1.121826171875, 1.21240234375, 1.302978515625, 1.3935546875, 1.484130859375, 1.57470703125, 1.665283203125, 1.755859375, 1.846435546875, 1.93701171875, 2.027587890625, 2.1181640625, 2.208740234375, 2.29931640625, 2.389892578125, 2.48046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 13.0, 6.0, 7.0, 14.0, 12.0, 18.0, 21.0, 23.0, 29.0, 25.0, 34.0, 37.0, 38.0, 44.0, 49.0, 45.0, 54.0, 59.0, 59.0, 54.0, 51.0, 43.0, 38.0, 40.0, 36.0, 22.0, 18.0, 15.0, 18.0, 10.0, 12.0, 10.0, 8.0, 8.0, 8.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.01953125, -3.89141845703125, -3.7633056640625, -3.63519287109375, -3.507080078125, -3.37896728515625, -3.2508544921875, -3.12274169921875, -2.99462890625, -2.86651611328125, -2.7384033203125, -2.61029052734375, -2.482177734375, -2.35406494140625, -2.2259521484375, -2.09783935546875, -1.9697265625, -1.84161376953125, -1.7135009765625, -1.58538818359375, -1.457275390625, -1.32916259765625, -1.2010498046875, -1.07293701171875, -0.94482421875, -0.81671142578125, -0.6885986328125, -0.56048583984375, -0.432373046875, -0.30426025390625, -0.1761474609375, -0.04803466796875, 0.080078125, 0.20819091796875, 0.3363037109375, 0.46441650390625, 0.592529296875, 0.72064208984375, 0.8487548828125, 0.97686767578125, 1.10498046875, 1.23309326171875, 1.3612060546875, 1.48931884765625, 1.617431640625, 1.74554443359375, 1.8736572265625, 2.00177001953125, 2.1298828125, 2.25799560546875, 2.3861083984375, 2.51422119140625, 2.642333984375, 2.77044677734375, 2.8985595703125, 3.02667236328125, 3.15478515625, 3.28289794921875, 3.4110107421875, 3.53912353515625, 3.667236328125, 3.79534912109375, 3.9234619140625, 4.05157470703125, 4.1796875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 10.0, 13.0, 19.0, 22.0, 22.0, 36.0, 44.0, 75.0, 111.0, 174.0, 306.0, 434.0, 778.0, 1471.0, 3102.0, 7457.0, 23093.0, 100536.0, 620508.0, 223931.0, 44608.0, 12501.0, 4582.0, 2033.0, 1070.0, 616.0, 320.0, 218.0, 141.0, 85.0, 70.0, 40.0, 37.0, 17.0, 20.0, 15.0, 12.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0], "bins": [-1.2744140625, -1.2387542724609375, -1.203094482421875, -1.1674346923828125, -1.13177490234375, -1.0961151123046875, -1.060455322265625, -1.0247955322265625, -0.9891357421875, -0.9534759521484375, -0.917816162109375, -0.8821563720703125, -0.84649658203125, -0.8108367919921875, -0.775177001953125, -0.7395172119140625, -0.703857421875, -0.6681976318359375, -0.632537841796875, -0.5968780517578125, -0.56121826171875, -0.5255584716796875, -0.489898681640625, -0.4542388916015625, -0.4185791015625, -0.3829193115234375, -0.347259521484375, -0.3115997314453125, -0.27593994140625, -0.2402801513671875, -0.204620361328125, -0.1689605712890625, -0.13330078125, -0.0976409912109375, -0.061981201171875, -0.0263214111328125, 0.00933837890625, 0.0449981689453125, 0.080657958984375, 0.1163177490234375, 0.1519775390625, 0.1876373291015625, 0.223297119140625, 0.2589569091796875, 0.29461669921875, 0.3302764892578125, 0.365936279296875, 0.4015960693359375, 0.437255859375, 0.4729156494140625, 0.508575439453125, 0.5442352294921875, 0.57989501953125, 0.6155548095703125, 0.651214599609375, 0.6868743896484375, 0.7225341796875, 0.7581939697265625, 0.793853759765625, 0.8295135498046875, 0.86517333984375, 0.9008331298828125, 0.936492919921875, 0.9721527099609375, 1.0078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 16.0, 35.0, 99.0, 186.0, 288.0, 174.0, 101.0, 39.0, 23.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009074211120605469, -0.0008755847811698914, -0.0008437484502792358, -0.0008119121193885803, -0.0007800757884979248, -0.0007482394576072693, -0.0007164031267166138, -0.0006845667958259583, -0.0006527304649353027, -0.0006208941340446472, -0.0005890578031539917, -0.0005572214722633362, -0.0005253851413726807, -0.0004935488104820251, -0.00046171247959136963, -0.0004298761487007141, -0.0003980398178100586, -0.0003662034869194031, -0.00033436715602874756, -0.00030253082513809204, -0.0002706944942474365, -0.000238858163356781, -0.0002070218324661255, -0.00017518550157546997, -0.00014334917068481445, -0.00011151283979415894, -7.967650890350342e-05, -4.78401780128479e-05, -1.6003847122192383e-05, 1.5832483768463135e-05, 4.766881465911865e-05, 7.950514554977417e-05, 0.00011134147644042969, 0.0001431778073310852, 0.00017501413822174072, 0.00020685046911239624, 0.00023868680000305176, 0.0002705231308937073, 0.0003023594617843628, 0.0003341957926750183, 0.00036603212356567383, 0.00039786845445632935, 0.00042970478534698486, 0.0004615411162376404, 0.0004933774471282959, 0.0005252137780189514, 0.0005570501089096069, 0.0005888864398002625, 0.000620722770690918, 0.0006525591015815735, 0.000684395432472229, 0.0007162317633628845, 0.00074806809425354, 0.0007799044251441956, 0.0008117407560348511, 0.0008435770869255066, 0.0008754134178161621, 0.0009072497487068176, 0.0009390860795974731, 0.0009709224104881287, 0.0010027587413787842, 0.0010345950722694397, 0.0010664314031600952, 0.0010982677340507507, 0.0011301040649414062]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 12.0, 13.0, 7.0, 21.0, 38.0, 61.0, 113.0, 259.0, 637.0, 1681.0, 5895.0, 25898.0, 172151.0, 710633.0, 106804.0, 17611.0, 4286.0, 1466.0, 489.0, 202.0, 120.0, 57.0, 49.0, 20.0, 11.0, 5.0, 7.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1884765625, -1.1434326171875, -1.098388671875, -1.0533447265625, -1.00830078125, -0.9632568359375, -0.918212890625, -0.8731689453125, -0.828125, -0.7830810546875, -0.738037109375, -0.6929931640625, -0.64794921875, -0.6029052734375, -0.557861328125, -0.5128173828125, -0.4677734375, -0.4227294921875, -0.377685546875, -0.3326416015625, -0.28759765625, -0.2425537109375, -0.197509765625, -0.1524658203125, -0.107421875, -0.0623779296875, -0.017333984375, 0.0277099609375, 0.07275390625, 0.1177978515625, 0.162841796875, 0.2078857421875, 0.2529296875, 0.2979736328125, 0.343017578125, 0.3880615234375, 0.43310546875, 0.4781494140625, 0.523193359375, 0.5682373046875, 0.61328125, 0.6583251953125, 0.703369140625, 0.7484130859375, 0.79345703125, 0.8385009765625, 0.883544921875, 0.9285888671875, 0.9736328125, 1.0186767578125, 1.063720703125, 1.1087646484375, 1.15380859375, 1.1988525390625, 1.243896484375, 1.2889404296875, 1.333984375, 1.3790283203125, 1.424072265625, 1.4691162109375, 1.51416015625, 1.5592041015625, 1.604248046875, 1.6492919921875, 1.6943359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 2.0, 6.0, 8.0, 10.0, 13.0, 18.0, 17.0, 24.0, 25.0, 31.0, 33.0, 38.0, 58.0, 56.0, 66.0, 67.0, 78.0, 58.0, 60.0, 52.0, 51.0, 41.0, 27.0, 34.0, 12.0, 17.0, 18.0, 15.0, 8.0, 5.0, 10.0, 12.0, 6.0, 7.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.931640625, -0.90252685546875, -0.8734130859375, -0.84429931640625, -0.815185546875, -0.78607177734375, -0.7569580078125, -0.72784423828125, -0.69873046875, -0.66961669921875, -0.6405029296875, -0.61138916015625, -0.582275390625, -0.55316162109375, -0.5240478515625, -0.49493408203125, -0.4658203125, -0.43670654296875, -0.4075927734375, -0.37847900390625, -0.349365234375, -0.32025146484375, -0.2911376953125, -0.26202392578125, -0.23291015625, -0.20379638671875, -0.1746826171875, -0.14556884765625, -0.116455078125, -0.08734130859375, -0.0582275390625, -0.02911376953125, 0.0, 0.02911376953125, 0.0582275390625, 0.08734130859375, 0.116455078125, 0.14556884765625, 0.1746826171875, 0.20379638671875, 0.23291015625, 0.26202392578125, 0.2911376953125, 0.32025146484375, 0.349365234375, 0.37847900390625, 0.4075927734375, 0.43670654296875, 0.4658203125, 0.49493408203125, 0.5240478515625, 0.55316162109375, 0.582275390625, 0.61138916015625, 0.6405029296875, 0.66961669921875, 0.69873046875, 0.72784423828125, 0.7569580078125, 0.78607177734375, 0.815185546875, 0.84429931640625, 0.8734130859375, 0.90252685546875, 0.931640625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 17.0, 16.0, 26.0, 43.0, 74.0, 97.0, 129.0, 197.0, 112.0, 97.0, 58.0, 37.0, 27.0, 15.0, 12.0, 5.0, 2.0, 2.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.30418586730957, -17.682147979736328, -17.06011199951172, -16.438074111938477, -15.816036224365234, -15.193998336791992, -14.571961402893066, -13.94992446899414, -13.327886581420898, -12.705848693847656, -12.08381175994873, -11.461774826049805, -10.839736938476562, -10.21769905090332, -9.595662117004395, -8.973625183105469, -8.351587295532227, -7.729549884796143, -7.107512474060059, -6.485475063323975, -5.863437652587891, -5.241400241851807, -4.619362831115723, -3.9973254203796387, -3.3752880096435547, -2.7532505989074707, -2.1312131881713867, -1.5091757774353027, -0.8871383666992188, -0.26510095596313477, 0.3569364547729492, 0.9789738655090332, 1.6010093688964844, 2.2230467796325684, 2.8450841903686523, 3.4671216011047363, 4.08915901184082, 4.711196422576904, 5.333233833312988, 5.955271244049072, 6.577308654785156, 7.19934606552124, 7.821383476257324, 8.44342041015625, 9.065458297729492, 9.687496185302734, 10.30953311920166, 10.931570053100586, 11.553607940673828, 12.17564582824707, 12.797682762145996, 13.419719696044922, 14.041757583618164, 14.663795471191406, 15.285832405090332, 15.907869338989258, 16.5299072265625, 17.151945114135742, 17.773983001708984, 18.396018981933594, 19.018056869506836, 19.640094757080078, 20.262130737304688, 20.88416862487793, 21.506206512451172]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 5.0, 8.0, 8.0, 10.0, 10.0, 21.0, 15.0, 25.0, 22.0, 29.0, 28.0, 37.0, 33.0, 40.0, 55.0, 79.0, 97.0, 81.0, 40.0, 42.0, 40.0, 30.0, 23.0, 38.0, 29.0, 25.0, 19.0, 18.0, 20.0, 14.0, 13.0, 9.0, 7.0, 4.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.516998291015625, -17.951467514038086, -17.38593864440918, -16.82040786743164, -16.254878997802734, -15.689349174499512, -15.123819351196289, -14.55828857421875, -13.992759704589844, -13.427229881286621, -12.861700057983398, -12.296170234680176, -11.730640411376953, -11.16511058807373, -10.599580764770508, -10.034049987792969, -9.468520164489746, -8.902990341186523, -8.3374605178833, -7.771930694580078, -7.2064008712768555, -6.640871047973633, -6.075340747833252, -5.509810924530029, -4.944281101226807, -4.378751277923584, -3.8132214546203613, -3.2476913928985596, -2.682161569595337, -2.1166317462921143, -1.5511016845703125, -0.9855718612670898, -0.4200420379638672, 0.14548784494400024, 0.7110177278518677, 1.2765476703643799, 1.8420774936676025, 2.407607316970825, 2.973137378692627, 3.5386672019958496, 4.104197025299072, 4.669726848602295, 5.235256671905518, 5.800786972045898, 6.366316795349121, 6.931846618652344, 7.497376441955566, 8.062906265258789, 8.628436088562012, 9.193965911865234, 9.759495735168457, 10.32502555847168, 10.890555381774902, 11.456085205078125, 12.021615982055664, 12.58714485168457, 13.15267562866211, 13.718205451965332, 14.283735275268555, 14.849265098571777, 15.414794921875, 15.980324745178223, 16.545854568481445, 17.111385345458984, 17.67691421508789]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 4.0, 8.0, 15.0, 20.0, 36.0, 25.0, 51.0, 58.0, 79.0, 109.0, 158.0, 269.0, 363.0, 610.0, 1241.0, 2592.0, 5983.0, 16297.0, 59048.0, 281817.0, 1331996.0, 1869728.0, 490907.0, 93293.0, 24114.0, 8203.0, 3449.0, 1567.0, 832.0, 455.0, 289.0, 167.0, 143.0, 95.0, 60.0, 50.0, 30.0, 36.0, 12.0, 15.0, 13.0, 7.0, 7.0, 2.0, 4.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.2255859375, -1.1874847412109375, -1.149383544921875, -1.1112823486328125, -1.07318115234375, -1.0350799560546875, -0.996978759765625, -0.9588775634765625, -0.9207763671875, -0.8826751708984375, -0.844573974609375, -0.8064727783203125, -0.76837158203125, -0.7302703857421875, -0.692169189453125, -0.6540679931640625, -0.615966796875, -0.5778656005859375, -0.539764404296875, -0.5016632080078125, -0.46356201171875, -0.4254608154296875, -0.387359619140625, -0.3492584228515625, -0.3111572265625, -0.2730560302734375, -0.234954833984375, -0.1968536376953125, -0.15875244140625, -0.1206512451171875, -0.082550048828125, -0.0444488525390625, -0.00634765625, 0.0317535400390625, 0.069854736328125, 0.1079559326171875, 0.14605712890625, 0.1841583251953125, 0.222259521484375, 0.2603607177734375, 0.2984619140625, 0.3365631103515625, 0.374664306640625, 0.4127655029296875, 0.45086669921875, 0.4889678955078125, 0.527069091796875, 0.5651702880859375, 0.603271484375, 0.6413726806640625, 0.679473876953125, 0.7175750732421875, 0.75567626953125, 0.7937774658203125, 0.831878662109375, 0.8699798583984375, 0.9080810546875, 0.9461822509765625, 0.984283447265625, 1.0223846435546875, 1.06048583984375, 1.0985870361328125, 1.136688232421875, 1.1747894287109375, 1.212890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 6.0, 5.0, 9.0, 19.0, 16.0, 22.0, 29.0, 33.0, 37.0, 30.0, 41.0, 42.0, 46.0, 56.0, 48.0, 59.0, 56.0, 47.0, 54.0, 40.0, 39.0, 38.0, 33.0, 30.0, 31.0, 29.0, 21.0, 17.0, 16.0, 11.0, 10.0, 11.0, 3.0, 7.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.068084716796875, -1.03265380859375, -0.997222900390625, -0.9617919921875, -0.926361083984375, -0.89093017578125, -0.855499267578125, -0.820068359375, -0.784637451171875, -0.74920654296875, -0.713775634765625, -0.6783447265625, -0.642913818359375, -0.60748291015625, -0.572052001953125, -0.53662109375, -0.501190185546875, -0.46575927734375, -0.430328369140625, -0.3948974609375, -0.359466552734375, -0.32403564453125, -0.288604736328125, -0.253173828125, -0.217742919921875, -0.18231201171875, -0.146881103515625, -0.1114501953125, -0.076019287109375, -0.04058837890625, -0.005157470703125, 0.0302734375, 0.065704345703125, 0.10113525390625, 0.136566162109375, 0.1719970703125, 0.207427978515625, 0.24285888671875, 0.278289794921875, 0.313720703125, 0.349151611328125, 0.38458251953125, 0.420013427734375, 0.4554443359375, 0.490875244140625, 0.52630615234375, 0.561737060546875, 0.59716796875, 0.632598876953125, 0.66802978515625, 0.703460693359375, 0.7388916015625, 0.774322509765625, 0.80975341796875, 0.845184326171875, 0.880615234375, 0.916046142578125, 0.95147705078125, 0.986907958984375, 1.0223388671875, 1.057769775390625, 1.09320068359375, 1.128631591796875, 1.1640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 5.0, 6.0, 13.0, 20.0, 30.0, 38.0, 63.0, 98.0, 179.0, 365.0, 915.0, 2550.0, 11657.0, 127069.0, 3563651.0, 458596.0, 22868.0, 3929.0, 1195.0, 450.0, 244.0, 109.0, 76.0, 41.0, 34.0, 25.0, 11.0, 14.0, 6.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6328125, -3.521636962890625, -3.41046142578125, -3.299285888671875, -3.1881103515625, -3.076934814453125, -2.96575927734375, -2.854583740234375, -2.743408203125, -2.632232666015625, -2.52105712890625, -2.409881591796875, -2.2987060546875, -2.187530517578125, -2.07635498046875, -1.965179443359375, -1.85400390625, -1.742828369140625, -1.63165283203125, -1.520477294921875, -1.4093017578125, -1.298126220703125, -1.18695068359375, -1.075775146484375, -0.964599609375, -0.853424072265625, -0.74224853515625, -0.631072998046875, -0.5198974609375, -0.408721923828125, -0.29754638671875, -0.186370849609375, -0.0751953125, 0.035980224609375, 0.14715576171875, 0.258331298828125, 0.3695068359375, 0.480682373046875, 0.59185791015625, 0.703033447265625, 0.814208984375, 0.925384521484375, 1.03656005859375, 1.147735595703125, 1.2589111328125, 1.370086669921875, 1.48126220703125, 1.592437744140625, 1.70361328125, 1.814788818359375, 1.92596435546875, 2.037139892578125, 2.1483154296875, 2.259490966796875, 2.37066650390625, 2.481842041015625, 2.593017578125, 2.704193115234375, 2.81536865234375, 2.926544189453125, 3.0377197265625, 3.148895263671875, 3.26007080078125, 3.371246337890625, 3.482421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 9.0, 7.0, 15.0, 16.0, 26.0, 38.0, 38.0, 38.0, 67.0, 99.0, 129.0, 208.0, 270.0, 448.0, 493.0, 593.0, 482.0, 367.0, 228.0, 149.0, 103.0, 76.0, 35.0, 38.0, 24.0, 15.0, 18.0, 13.0, 5.0, 4.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.041015625, -1.973297119140625, -1.90557861328125, -1.837860107421875, -1.7701416015625, -1.702423095703125, -1.63470458984375, -1.566986083984375, -1.499267578125, -1.431549072265625, -1.36383056640625, -1.296112060546875, -1.2283935546875, -1.160675048828125, -1.09295654296875, -1.025238037109375, -0.95751953125, -0.889801025390625, -0.82208251953125, -0.754364013671875, -0.6866455078125, -0.618927001953125, -0.55120849609375, -0.483489990234375, -0.415771484375, -0.348052978515625, -0.28033447265625, -0.212615966796875, -0.1448974609375, -0.077178955078125, -0.00946044921875, 0.058258056640625, 0.1259765625, 0.193695068359375, 0.26141357421875, 0.329132080078125, 0.3968505859375, 0.464569091796875, 0.53228759765625, 0.600006103515625, 0.667724609375, 0.735443115234375, 0.80316162109375, 0.870880126953125, 0.9385986328125, 1.006317138671875, 1.07403564453125, 1.141754150390625, 1.20947265625, 1.277191162109375, 1.34490966796875, 1.412628173828125, 1.4803466796875, 1.548065185546875, 1.61578369140625, 1.683502197265625, 1.751220703125, 1.818939208984375, 1.88665771484375, 1.954376220703125, 2.0220947265625, 2.089813232421875, 2.15753173828125, 2.225250244140625, 2.29296875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 12.0, 22.0, 32.0, 57.0, 87.0, 153.0, 145.0, 165.0, 118.0, 93.0, 42.0, 33.0, 19.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.616308212280273, -24.925312042236328, -24.234315872192383, -23.543319702148438, -22.852325439453125, -22.16132926940918, -21.470333099365234, -20.77933692932129, -20.088340759277344, -19.3973445892334, -18.706348419189453, -18.01535415649414, -17.324357986450195, -16.63336181640625, -15.942365646362305, -15.25136947631836, -14.560375213623047, -13.869379043579102, -13.178383827209473, -12.487387657165527, -11.796392440795898, -11.105396270751953, -10.414400100708008, -9.723403930664062, -9.032408714294434, -8.341412544250488, -7.650417327880859, -6.959421157836914, -6.268425464630127, -5.57742977142334, -4.8864336013793945, -4.195437908172607, -3.504444122314453, -2.813448429107666, -2.1224524974823, -1.4314565658569336, -0.7404608726501465, -0.049465179443359375, 0.6415309906005859, 1.332526683807373, 2.02352237701416, 2.7145180702209473, 3.4055140018463135, 4.09650993347168, 4.787505626678467, 5.478501319885254, 6.169497489929199, 6.860493183135986, 7.551488876342773, 8.242485046386719, 8.933480262756348, 9.624476432800293, 10.315471649169922, 11.006467819213867, 11.697463989257812, 12.388460159301758, 13.079455375671387, 13.770451545715332, 14.461446762084961, 15.152442932128906, 15.843439102172852, 16.534435272216797, 17.22542953491211, 17.916425704956055, 18.607421875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 11.0, 9.0, 17.0, 11.0, 16.0, 16.0, 22.0, 30.0, 28.0, 27.0, 43.0, 44.0, 48.0, 39.0, 59.0, 40.0, 51.0, 59.0, 38.0, 49.0, 40.0, 37.0, 44.0, 27.0, 30.0, 32.0, 22.0, 22.0, 14.0, 16.0, 11.0, 5.0, 8.0, 5.0, 3.0, 8.0, 1.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.094172477722168, -9.75648021697998, -9.418787956237793, -9.081095695495605, -8.743402481079102, -8.405710220336914, -8.068017959594727, -7.730325698852539, -7.392633438110352, -7.054941177368164, -6.717248916625977, -6.379556179046631, -6.041863918304443, -5.704171657562256, -5.36647891998291, -5.028786659240723, -4.691094398498535, -4.353402137756348, -4.01570987701416, -3.6780171394348145, -3.340324878692627, -3.0026326179504395, -2.664940118789673, -2.3272476196289062, -1.9895553588867188, -1.6518629789352417, -1.3141705989837646, -0.9764782190322876, -0.6387858390808105, -0.3010934591293335, 0.036598920822143555, 0.37429141998291016, 0.7119836807250977, 1.0496760606765747, 1.3873684406280518, 1.7250608205795288, 2.062753200531006, 2.4004454612731934, 2.73813796043396, 3.0758304595947266, 3.413522720336914, 3.7512149810791016, 4.088907241821289, 4.426599979400635, 4.764292240142822, 5.10198450088501, 5.4396772384643555, 5.777369499206543, 6.1150617599487305, 6.452754020690918, 6.7904462814331055, 7.128139019012451, 7.465831279754639, 7.803523540496826, 8.141216278076172, 8.47890853881836, 8.816600799560547, 9.154293060302734, 9.491985321044922, 9.82967758178711, 10.167369842529297, 10.5050630569458, 10.842755317687988, 11.180447578430176, 11.518139839172363]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 5.0, 9.0, 9.0, 16.0, 31.0, 34.0, 45.0, 63.0, 96.0, 148.0, 257.0, 421.0, 681.0, 1236.0, 2188.0, 3830.0, 7380.0, 14065.0, 26180.0, 50202.0, 94722.0, 169900.0, 238702.0, 195963.0, 113703.0, 60517.0, 31773.0, 16495.0, 8736.0, 4844.0, 2580.0, 1449.0, 876.0, 536.0, 305.0, 182.0, 107.0, 78.0, 58.0, 41.0, 28.0, 13.0, 14.0, 7.0, 5.0, 6.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1259765625, -1.0879974365234375, -1.050018310546875, -1.0120391845703125, -0.97406005859375, -0.9360809326171875, -0.898101806640625, -0.8601226806640625, -0.8221435546875, -0.7841644287109375, -0.746185302734375, -0.7082061767578125, -0.67022705078125, -0.6322479248046875, -0.594268798828125, -0.5562896728515625, -0.518310546875, -0.4803314208984375, -0.442352294921875, -0.4043731689453125, -0.36639404296875, -0.3284149169921875, -0.290435791015625, -0.2524566650390625, -0.2144775390625, -0.1764984130859375, -0.138519287109375, -0.1005401611328125, -0.06256103515625, -0.0245819091796875, 0.013397216796875, 0.0513763427734375, 0.08935546875, 0.1273345947265625, 0.165313720703125, 0.2032928466796875, 0.24127197265625, 0.2792510986328125, 0.317230224609375, 0.3552093505859375, 0.3931884765625, 0.4311676025390625, 0.469146728515625, 0.5071258544921875, 0.54510498046875, 0.5830841064453125, 0.621063232421875, 0.6590423583984375, 0.697021484375, 0.7350006103515625, 0.772979736328125, 0.8109588623046875, 0.84893798828125, 0.8869171142578125, 0.924896240234375, 0.9628753662109375, 1.0008544921875, 1.0388336181640625, 1.076812744140625, 1.1147918701171875, 1.15277099609375, 1.1907501220703125, 1.228729248046875, 1.2667083740234375, 1.3046875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 6.0, 10.0, 10.0, 8.0, 16.0, 22.0, 24.0, 24.0, 37.0, 32.0, 36.0, 39.0, 37.0, 54.0, 64.0, 43.0, 62.0, 46.0, 43.0, 56.0, 44.0, 49.0, 34.0, 28.0, 23.0, 36.0, 26.0, 25.0, 10.0, 12.0, 8.0, 7.0, 5.0, 11.0, 5.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1533203125, -1.1158905029296875, -1.078460693359375, -1.0410308837890625, -1.00360107421875, -0.9661712646484375, -0.928741455078125, -0.8913116455078125, -0.8538818359375, -0.8164520263671875, -0.779022216796875, -0.7415924072265625, -0.70416259765625, -0.6667327880859375, -0.629302978515625, -0.5918731689453125, -0.554443359375, -0.5170135498046875, -0.479583740234375, -0.4421539306640625, -0.40472412109375, -0.3672943115234375, -0.329864501953125, -0.2924346923828125, -0.2550048828125, -0.2175750732421875, -0.180145263671875, -0.1427154541015625, -0.10528564453125, -0.0678558349609375, -0.030426025390625, 0.0070037841796875, 0.04443359375, 0.0818634033203125, 0.119293212890625, 0.1567230224609375, 0.19415283203125, 0.2315826416015625, 0.269012451171875, 0.3064422607421875, 0.3438720703125, 0.3813018798828125, 0.418731689453125, 0.4561614990234375, 0.49359130859375, 0.5310211181640625, 0.568450927734375, 0.6058807373046875, 0.643310546875, 0.6807403564453125, 0.718170166015625, 0.7555999755859375, 0.79302978515625, 0.8304595947265625, 0.867889404296875, 0.9053192138671875, 0.9427490234375, 0.9801788330078125, 1.017608642578125, 1.0550384521484375, 1.09246826171875, 1.1298980712890625, 1.167327880859375, 1.2047576904296875, 1.2421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 8.0, 8.0, 12.0, 10.0, 14.0, 22.0, 31.0, 34.0, 71.0, 71.0, 119.0, 159.0, 218.0, 304.0, 489.0, 853.0, 1670.0, 3677.0, 9822.0, 30534.0, 112140.0, 565215.0, 232194.0, 60923.0, 17930.0, 6252.0, 2570.0, 1227.0, 657.0, 377.0, 268.0, 185.0, 124.0, 75.0, 71.0, 42.0, 39.0, 37.0, 21.0, 21.0, 9.0, 11.0, 9.0, 9.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0], "bins": [-2.60546875, -2.525970458984375, -2.44647216796875, -2.366973876953125, -2.2874755859375, -2.207977294921875, -2.12847900390625, -2.048980712890625, -1.969482421875, -1.889984130859375, -1.81048583984375, -1.730987548828125, -1.6514892578125, -1.571990966796875, -1.49249267578125, -1.412994384765625, -1.33349609375, -1.253997802734375, -1.17449951171875, -1.095001220703125, -1.0155029296875, -0.936004638671875, -0.85650634765625, -0.777008056640625, -0.697509765625, -0.618011474609375, -0.53851318359375, -0.459014892578125, -0.3795166015625, -0.300018310546875, -0.22052001953125, -0.141021728515625, -0.0615234375, 0.017974853515625, 0.09747314453125, 0.176971435546875, 0.2564697265625, 0.335968017578125, 0.41546630859375, 0.494964599609375, 0.574462890625, 0.653961181640625, 0.73345947265625, 0.812957763671875, 0.8924560546875, 0.971954345703125, 1.05145263671875, 1.130950927734375, 1.21044921875, 1.289947509765625, 1.36944580078125, 1.448944091796875, 1.5284423828125, 1.607940673828125, 1.68743896484375, 1.766937255859375, 1.846435546875, 1.925933837890625, 2.00543212890625, 2.084930419921875, 2.1644287109375, 2.243927001953125, 2.32342529296875, 2.402923583984375, 2.482421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 7.0, 5.0, 7.0, 20.0, 12.0, 8.0, 18.0, 28.0, 27.0, 32.0, 32.0, 41.0, 55.0, 60.0, 59.0, 58.0, 54.0, 49.0, 57.0, 52.0, 44.0, 42.0, 39.0, 34.0, 28.0, 23.0, 31.0, 17.0, 12.0, 12.0, 11.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75390625, -4.60821533203125, -4.4625244140625, -4.31683349609375, -4.171142578125, -4.02545166015625, -3.8797607421875, -3.73406982421875, -3.58837890625, -3.44268798828125, -3.2969970703125, -3.15130615234375, -3.005615234375, -2.85992431640625, -2.7142333984375, -2.56854248046875, -2.4228515625, -2.27716064453125, -2.1314697265625, -1.98577880859375, -1.840087890625, -1.69439697265625, -1.5487060546875, -1.40301513671875, -1.25732421875, -1.11163330078125, -0.9659423828125, -0.82025146484375, -0.674560546875, -0.52886962890625, -0.3831787109375, -0.23748779296875, -0.091796875, 0.05389404296875, 0.1995849609375, 0.34527587890625, 0.490966796875, 0.63665771484375, 0.7823486328125, 0.92803955078125, 1.07373046875, 1.21942138671875, 1.3651123046875, 1.51080322265625, 1.656494140625, 1.80218505859375, 1.9478759765625, 2.09356689453125, 2.2392578125, 2.38494873046875, 2.5306396484375, 2.67633056640625, 2.822021484375, 2.96771240234375, 3.1134033203125, 3.25909423828125, 3.40478515625, 3.55047607421875, 3.6961669921875, 3.84185791015625, 3.987548828125, 4.13323974609375, 4.2789306640625, 4.42462158203125, 4.5703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 6.0, 1.0, 2.0, 6.0, 3.0, 10.0, 6.0, 16.0, 20.0, 17.0, 21.0, 49.0, 44.0, 70.0, 76.0, 132.0, 175.0, 310.0, 518.0, 996.0, 1900.0, 4213.0, 10508.0, 29379.0, 97141.0, 577568.0, 231069.0, 60680.0, 19753.0, 7206.0, 3063.0, 1476.0, 787.0, 439.0, 286.0, 177.0, 116.0, 91.0, 63.0, 40.0, 28.0, 22.0, 22.0, 5.0, 9.0, 10.0, 12.0, 4.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.765625, -0.74298095703125, -0.7203369140625, -0.69769287109375, -0.675048828125, -0.65240478515625, -0.6297607421875, -0.60711669921875, -0.58447265625, -0.56182861328125, -0.5391845703125, -0.51654052734375, -0.493896484375, -0.47125244140625, -0.4486083984375, -0.42596435546875, -0.4033203125, -0.38067626953125, -0.3580322265625, -0.33538818359375, -0.312744140625, -0.29010009765625, -0.2674560546875, -0.24481201171875, -0.22216796875, -0.19952392578125, -0.1768798828125, -0.15423583984375, -0.131591796875, -0.10894775390625, -0.0863037109375, -0.06365966796875, -0.041015625, -0.01837158203125, 0.0042724609375, 0.02691650390625, 0.049560546875, 0.07220458984375, 0.0948486328125, 0.11749267578125, 0.14013671875, 0.16278076171875, 0.1854248046875, 0.20806884765625, 0.230712890625, 0.25335693359375, 0.2760009765625, 0.29864501953125, 0.3212890625, 0.34393310546875, 0.3665771484375, 0.38922119140625, 0.411865234375, 0.43450927734375, 0.4571533203125, 0.47979736328125, 0.50244140625, 0.52508544921875, 0.5477294921875, 0.57037353515625, 0.593017578125, 0.61566162109375, 0.6383056640625, 0.66094970703125, 0.68359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 10.0, 7.0, 18.0, 24.0, 27.0, 28.0, 40.0, 64.0, 87.0, 124.0, 147.0, 103.0, 75.0, 63.0, 34.0, 30.0, 25.0, 23.0, 12.0, 12.0, 9.0, 8.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003604888916015625, -0.0003499835729598999, -0.0003394782543182373, -0.0003289729356765747, -0.0003184676170349121, -0.0003079622983932495, -0.0002974569797515869, -0.0002869516611099243, -0.0002764463424682617, -0.0002659410238265991, -0.0002554357051849365, -0.0002449303865432739, -0.00023442506790161133, -0.00022391974925994873, -0.00021341443061828613, -0.00020290911197662354, -0.00019240379333496094, -0.00018189847469329834, -0.00017139315605163574, -0.00016088783740997314, -0.00015038251876831055, -0.00013987720012664795, -0.00012937188148498535, -0.00011886656284332275, -0.00010836124420166016, -9.785592555999756e-05, -8.735060691833496e-05, -7.684528827667236e-05, -6.633996963500977e-05, -5.583465099334717e-05, -4.532933235168457e-05, -3.482401371002197e-05, -2.4318695068359375e-05, -1.3813376426696777e-05, -3.3080577850341797e-06, 7.197260856628418e-06, 1.7702579498291016e-05, 2.8207898139953613e-05, 3.871321678161621e-05, 4.921853542327881e-05, 5.9723854064941406e-05, 7.0229172706604e-05, 8.07344913482666e-05, 9.12398099899292e-05, 0.0001017451286315918, 0.0001122504472732544, 0.000122755765914917, 0.0001332610845565796, 0.0001437664031982422, 0.00015427172183990479, 0.00016477704048156738, 0.00017528235912322998, 0.00018578767776489258, 0.00019629299640655518, 0.00020679831504821777, 0.00021730363368988037, 0.00022780895233154297, 0.00023831427097320557, 0.00024881958961486816, 0.00025932490825653076, 0.00026983022689819336, 0.00028033554553985596, 0.00029084086418151855, 0.00030134618282318115, 0.00031185150146484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 2.0, 5.0, 6.0, 3.0, 6.0, 6.0, 6.0, 15.0, 13.0, 25.0, 34.0, 33.0, 74.0, 114.0, 156.0, 284.0, 445.0, 840.0, 1709.0, 3946.0, 10930.0, 35420.0, 148503.0, 652036.0, 141977.0, 34022.0, 10460.0, 3890.0, 1666.0, 766.0, 435.0, 217.0, 149.0, 114.0, 75.0, 58.0, 35.0, 15.0, 17.0, 16.0, 11.0, 4.0, 4.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.7783203125, -0.751922607421875, -0.72552490234375, -0.699127197265625, -0.6727294921875, -0.646331787109375, -0.61993408203125, -0.593536376953125, -0.567138671875, -0.540740966796875, -0.51434326171875, -0.487945556640625, -0.4615478515625, -0.435150146484375, -0.40875244140625, -0.382354736328125, -0.35595703125, -0.329559326171875, -0.30316162109375, -0.276763916015625, -0.2503662109375, -0.223968505859375, -0.19757080078125, -0.171173095703125, -0.144775390625, -0.118377685546875, -0.09197998046875, -0.065582275390625, -0.0391845703125, -0.012786865234375, 0.01361083984375, 0.040008544921875, 0.06640625, 0.092803955078125, 0.11920166015625, 0.145599365234375, 0.1719970703125, 0.198394775390625, 0.22479248046875, 0.251190185546875, 0.277587890625, 0.303985595703125, 0.33038330078125, 0.356781005859375, 0.3831787109375, 0.409576416015625, 0.43597412109375, 0.462371826171875, 0.48876953125, 0.515167236328125, 0.54156494140625, 0.567962646484375, 0.5943603515625, 0.620758056640625, 0.64715576171875, 0.673553466796875, 0.699951171875, 0.726348876953125, 0.75274658203125, 0.779144287109375, 0.8055419921875, 0.831939697265625, 0.85833740234375, 0.884735107421875, 0.9111328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 12.0, 13.0, 11.0, 15.0, 20.0, 25.0, 35.0, 46.0, 49.0, 64.0, 74.0, 85.0, 80.0, 83.0, 75.0, 57.0, 49.0, 39.0, 28.0, 25.0, 18.0, 15.0, 10.0, 19.0, 12.0, 3.0, 3.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1015625, -1.070709228515625, -1.03985595703125, -1.009002685546875, -0.9781494140625, -0.947296142578125, -0.91644287109375, -0.885589599609375, -0.854736328125, -0.823883056640625, -0.79302978515625, -0.762176513671875, -0.7313232421875, -0.700469970703125, -0.66961669921875, -0.638763427734375, -0.60791015625, -0.577056884765625, -0.54620361328125, -0.515350341796875, -0.4844970703125, -0.453643798828125, -0.42279052734375, -0.391937255859375, -0.361083984375, -0.330230712890625, -0.29937744140625, -0.268524169921875, -0.2376708984375, -0.206817626953125, -0.17596435546875, -0.145111083984375, -0.1142578125, -0.083404541015625, -0.05255126953125, -0.021697998046875, 0.0091552734375, 0.040008544921875, 0.07086181640625, 0.101715087890625, 0.132568359375, 0.163421630859375, 0.19427490234375, 0.225128173828125, 0.2559814453125, 0.286834716796875, 0.31768798828125, 0.348541259765625, 0.37939453125, 0.410247802734375, 0.44110107421875, 0.471954345703125, 0.5028076171875, 0.533660888671875, 0.56451416015625, 0.595367431640625, 0.626220703125, 0.657073974609375, 0.68792724609375, 0.718780517578125, 0.7496337890625, 0.780487060546875, 0.81134033203125, 0.842193603515625, 0.873046875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 13.0, 9.0, 12.0, 33.0, 24.0, 61.0, 96.0, 227.0, 209.0, 107.0, 80.0, 53.0, 23.0, 22.0, 10.0, 8.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.340713500976562, -19.66080093383789, -18.98088836669922, -18.300975799560547, -17.621063232421875, -16.941152572631836, -16.261240005493164, -15.581327438354492, -14.90141487121582, -14.221502304077148, -13.541589736938477, -12.861678123474121, -12.18176555633545, -11.501852989196777, -10.821941375732422, -10.14202880859375, -9.462116241455078, -8.782203674316406, -8.102291107177734, -7.422379493713379, -6.742466926574707, -6.062554359436035, -5.3826422691345215, -4.702730178833008, -4.022817611694336, -3.342905282974243, -2.6629929542541504, -1.9830806255340576, -1.3031682968139648, -0.6232559680938721, 0.0566563606262207, 0.7365684509277344, 1.4164810180664062, 2.096393346786499, 2.776305675506592, 3.4562180042266846, 4.136130332946777, 4.816042900085449, 5.495954990386963, 6.175867080688477, 6.855779647827148, 7.53569221496582, 8.215604782104492, 8.895516395568848, 9.57542896270752, 10.255341529846191, 10.935253143310547, 11.615165710449219, 12.29507827758789, 12.974990844726562, 13.654903411865234, 14.33481502532959, 15.014727592468262, 15.694640159606934, 16.37455177307129, 17.05446434020996, 17.734376907348633, 18.414289474487305, 19.094202041625977, 19.77411460876465, 20.454025268554688, 21.13393783569336, 21.81385040283203, 22.493762969970703, 23.173675537109375]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 7.0, 13.0, 13.0, 21.0, 16.0, 27.0, 21.0, 27.0, 31.0, 24.0, 32.0, 48.0, 62.0, 97.0, 138.0, 68.0, 46.0, 43.0, 33.0, 27.0, 36.0, 33.0, 28.0, 14.0, 12.0, 10.0, 12.0, 10.0, 11.0, 6.0, 3.0, 1.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.02457046508789, -19.438522338867188, -18.852474212646484, -18.26642417907715, -17.680376052856445, -17.094327926635742, -16.508277893066406, -15.922229766845703, -15.336181640625, -14.750133514404297, -14.164084434509277, -13.578035354614258, -12.991987228393555, -12.405939102172852, -11.819890022277832, -11.233840942382812, -10.64779281616211, -10.061744689941406, -9.475695610046387, -8.889646530151367, -8.303598403930664, -7.717549800872803, -7.131501197814941, -6.54545259475708, -5.959403991699219, -5.373355388641357, -4.787306785583496, -4.201258182525635, -3.6152095794677734, -3.029160976409912, -2.443112373352051, -1.8570637702941895, -1.2710151672363281, -0.6849665641784668, -0.09891796112060547, 0.48713064193725586, 1.0731792449951172, 1.6592278480529785, 2.24527645111084, 2.831325054168701, 3.4173736572265625, 4.003422260284424, 4.589470863342285, 5.1755194664001465, 5.761568069458008, 6.347616672515869, 6.9336652755737305, 7.519713878631592, 8.105762481689453, 8.691810607910156, 9.277859687805176, 9.863908767700195, 10.449956893920898, 11.036005020141602, 11.622054100036621, 12.20810317993164, 12.794151306152344, 13.380199432373047, 13.966248512268066, 14.552297592163086, 15.138345718383789, 15.724393844604492, 16.310443878173828, 16.89649200439453, 17.482540130615234]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 8.0, 14.0, 29.0, 41.0, 72.0, 111.0, 177.0, 295.0, 506.0, 936.0, 1792.0, 3727.0, 8277.0, 20201.0, 56956.0, 177781.0, 589893.0, 1491019.0, 1224795.0, 424058.0, 125614.0, 40095.0, 14944.0, 6407.0, 3021.0, 1540.0, 771.0, 464.0, 284.0, 177.0, 123.0, 53.0, 35.0, 26.0, 16.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0537109375, -1.024322509765625, -0.99493408203125, -0.965545654296875, -0.9361572265625, -0.906768798828125, -0.87738037109375, -0.847991943359375, -0.818603515625, -0.789215087890625, -0.75982666015625, -0.730438232421875, -0.7010498046875, -0.671661376953125, -0.64227294921875, -0.612884521484375, -0.58349609375, -0.554107666015625, -0.52471923828125, -0.495330810546875, -0.4659423828125, -0.436553955078125, -0.40716552734375, -0.377777099609375, -0.348388671875, -0.319000244140625, -0.28961181640625, -0.260223388671875, -0.2308349609375, -0.201446533203125, -0.17205810546875, -0.142669677734375, -0.11328125, -0.083892822265625, -0.05450439453125, -0.025115966796875, 0.0042724609375, 0.033660888671875, 0.06304931640625, 0.092437744140625, 0.121826171875, 0.151214599609375, 0.18060302734375, 0.209991455078125, 0.2393798828125, 0.268768310546875, 0.29815673828125, 0.327545166015625, 0.35693359375, 0.386322021484375, 0.41571044921875, 0.445098876953125, 0.4744873046875, 0.503875732421875, 0.53326416015625, 0.562652587890625, 0.592041015625, 0.621429443359375, 0.65081787109375, 0.680206298828125, 0.7095947265625, 0.738983154296875, 0.76837158203125, 0.797760009765625, 0.8271484375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 7.0, 0.0, 6.0, 8.0, 9.0, 7.0, 12.0, 17.0, 20.0, 16.0, 22.0, 32.0, 39.0, 34.0, 36.0, 45.0, 48.0, 48.0, 46.0, 53.0, 45.0, 52.0, 51.0, 46.0, 44.0, 46.0, 41.0, 30.0, 20.0, 17.0, 23.0, 14.0, 14.0, 10.0, 9.0, 9.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.015625, -0.9805145263671875, -0.945404052734375, -0.9102935791015625, -0.87518310546875, -0.8400726318359375, -0.804962158203125, -0.7698516845703125, -0.7347412109375, -0.6996307373046875, -0.664520263671875, -0.6294097900390625, -0.59429931640625, -0.5591888427734375, -0.524078369140625, -0.4889678955078125, -0.453857421875, -0.4187469482421875, -0.383636474609375, -0.3485260009765625, -0.31341552734375, -0.2783050537109375, -0.243194580078125, -0.2080841064453125, -0.1729736328125, -0.1378631591796875, -0.102752685546875, -0.0676422119140625, -0.03253173828125, 0.0025787353515625, 0.037689208984375, 0.0727996826171875, 0.10791015625, 0.1430206298828125, 0.178131103515625, 0.2132415771484375, 0.24835205078125, 0.2834625244140625, 0.318572998046875, 0.3536834716796875, 0.3887939453125, 0.4239044189453125, 0.459014892578125, 0.4941253662109375, 0.52923583984375, 0.5643463134765625, 0.599456787109375, 0.6345672607421875, 0.669677734375, 0.7047882080078125, 0.739898681640625, 0.7750091552734375, 0.81011962890625, 0.8452301025390625, 0.880340576171875, 0.9154510498046875, 0.9505615234375, 0.9856719970703125, 1.020782470703125, 1.0558929443359375, 1.09100341796875, 1.1261138916015625, 1.161224365234375, 1.1963348388671875, 1.2314453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 11.0, 13.0, 17.0, 31.0, 47.0, 68.0, 138.0, 272.0, 641.0, 2427.0, 16022.0, 292653.0, 3720221.0, 148473.0, 10315.0, 1837.0, 548.0, 233.0, 110.0, 70.0, 42.0, 27.0, 21.0, 14.0, 9.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.55078125, -3.4300537109375, -3.309326171875, -3.1885986328125, -3.06787109375, -2.9471435546875, -2.826416015625, -2.7056884765625, -2.5849609375, -2.4642333984375, -2.343505859375, -2.2227783203125, -2.10205078125, -1.9813232421875, -1.860595703125, -1.7398681640625, -1.619140625, -1.4984130859375, -1.377685546875, -1.2569580078125, -1.13623046875, -1.0155029296875, -0.894775390625, -0.7740478515625, -0.6533203125, -0.5325927734375, -0.411865234375, -0.2911376953125, -0.17041015625, -0.0496826171875, 0.071044921875, 0.1917724609375, 0.3125, 0.4332275390625, 0.553955078125, 0.6746826171875, 0.79541015625, 0.9161376953125, 1.036865234375, 1.1575927734375, 1.2783203125, 1.3990478515625, 1.519775390625, 1.6405029296875, 1.76123046875, 1.8819580078125, 2.002685546875, 2.1234130859375, 2.244140625, 2.3648681640625, 2.485595703125, 2.6063232421875, 2.72705078125, 2.8477783203125, 2.968505859375, 3.0892333984375, 3.2099609375, 3.3306884765625, 3.451416015625, 3.5721435546875, 3.69287109375, 3.8135986328125, 3.934326171875, 4.0550537109375, 4.17578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 9.0, 8.0, 16.0, 17.0, 27.0, 24.0, 44.0, 43.0, 71.0, 95.0, 155.0, 229.0, 326.0, 483.0, 537.0, 574.0, 442.0, 309.0, 211.0, 131.0, 95.0, 57.0, 43.0, 30.0, 24.0, 16.0, 17.0, 8.0, 10.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.26171875, -2.188629150390625, -2.11553955078125, -2.042449951171875, -1.9693603515625, -1.896270751953125, -1.82318115234375, -1.750091552734375, -1.677001953125, -1.603912353515625, -1.53082275390625, -1.457733154296875, -1.3846435546875, -1.311553955078125, -1.23846435546875, -1.165374755859375, -1.09228515625, -1.019195556640625, -0.94610595703125, -0.873016357421875, -0.7999267578125, -0.726837158203125, -0.65374755859375, -0.580657958984375, -0.507568359375, -0.434478759765625, -0.36138916015625, -0.288299560546875, -0.2152099609375, -0.142120361328125, -0.06903076171875, 0.004058837890625, 0.0771484375, 0.150238037109375, 0.22332763671875, 0.296417236328125, 0.3695068359375, 0.442596435546875, 0.51568603515625, 0.588775634765625, 0.661865234375, 0.734954833984375, 0.80804443359375, 0.881134033203125, 0.9542236328125, 1.027313232421875, 1.10040283203125, 1.173492431640625, 1.24658203125, 1.319671630859375, 1.39276123046875, 1.465850830078125, 1.5389404296875, 1.612030029296875, 1.68511962890625, 1.758209228515625, 1.831298828125, 1.904388427734375, 1.97747802734375, 2.050567626953125, 2.1236572265625, 2.196746826171875, 2.26983642578125, 2.342926025390625, 2.416015625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 1.0, 5.0, 6.0, 27.0, 58.0, 109.0, 195.0, 238.0, 182.0, 110.0, 37.0, 11.0, 11.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.34957504272461, -17.300260543823242, -16.250946044921875, -15.20163345336914, -14.152318954467773, -13.103004455566406, -12.053690910339355, -11.004377365112305, -9.955062866210938, -8.90574836730957, -7.8564348220825195, -6.8071208000183105, -5.757806777954102, -4.708492755889893, -3.6591787338256836, -2.6098647117614746, -1.5605506896972656, -0.5112366676330566, 0.5380773544311523, 1.5873913764953613, 2.6367053985595703, 3.6860194206237793, 4.735333442687988, 5.784647464752197, 6.833961486816406, 7.883275508880615, 8.932589530944824, 9.981903076171875, 11.031217575073242, 12.08053207397461, 13.12984561920166, 14.179159164428711, 15.228477478027344, 16.27779197692871, 17.327106475830078, 18.376419067382812, 19.42573356628418, 20.475048065185547, 21.52436065673828, 22.57367515563965, 23.622989654541016, 24.672304153442383, 25.72161865234375, 26.770931243896484, 27.82024574279785, 28.86956024169922, 29.918872833251953, 30.96818733215332, 32.01750183105469, 33.06681442260742, 34.11613082885742, 35.165443420410156, 36.214759826660156, 37.26407241821289, 38.313385009765625, 39.362701416015625, 40.41201400756836, 41.461326599121094, 42.510643005371094, 43.55995559692383, 44.60926818847656, 45.65858459472656, 46.7078971862793, 47.7572135925293, 48.80652618408203]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 11.0, 5.0, 11.0, 12.0, 17.0, 20.0, 28.0, 24.0, 29.0, 25.0, 30.0, 16.0, 39.0, 41.0, 48.0, 46.0, 35.0, 27.0, 53.0, 37.0, 34.0, 37.0, 49.0, 47.0, 37.0, 25.0, 42.0, 20.0, 34.0, 14.0, 20.0, 17.0, 20.0, 17.0, 11.0, 4.0, 8.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.1329345703125, -11.789010047912598, -11.445085525512695, -11.101161003112793, -10.75723648071289, -10.413312911987305, -10.069388389587402, -9.7254638671875, -9.381539344787598, -9.037614822387695, -8.693690299987793, -8.34976577758789, -8.005842208862305, -7.661917209625244, -7.3179931640625, -6.974068641662598, -6.630144119262695, -6.286219596862793, -5.942295074462891, -5.5983710289001465, -5.254446506500244, -4.910521984100342, -4.566597938537598, -4.222673416137695, -3.878748893737793, -3.5348243713378906, -3.1909000873565674, -2.846975803375244, -2.503051280975342, -2.1591267585754395, -1.8152024745941162, -1.471278190612793, -1.1273527145385742, -0.7834283113479614, -0.43950390815734863, -0.09557950496673584, 0.24834489822387695, 0.5922693014144897, 0.9361937046051025, 1.2801179885864258, 1.6240425109863281, 1.967966914176941, 2.3118913173675537, 2.655815601348877, 2.9997401237487793, 3.3436646461486816, 3.687588930130005, 4.031513214111328, 4.3754377365112305, 4.719362258911133, 5.063286781311035, 5.407210826873779, 5.751135349273682, 6.095059871673584, 6.438983917236328, 6.7829084396362305, 7.126832962036133, 7.470757484436035, 7.8146820068359375, 8.15860652923584, 8.502531051635742, 8.846454620361328, 9.19037914276123, 9.534303665161133, 9.878228187561035]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 11.0, 7.0, 12.0, 15.0, 13.0, 27.0, 50.0, 84.0, 135.0, 159.0, 288.0, 422.0, 610.0, 1056.0, 1584.0, 2684.0, 4443.0, 7769.0, 14268.0, 26968.0, 52934.0, 110498.0, 225874.0, 280177.0, 160509.0, 75955.0, 37132.0, 19454.0, 10408.0, 5796.0, 3587.0, 2031.0, 1258.0, 820.0, 517.0, 336.0, 204.0, 147.0, 104.0, 73.0, 57.0, 30.0, 20.0, 5.0, 5.0, 3.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0], "bins": [-1.8017578125, -1.750640869140625, -1.69952392578125, -1.648406982421875, -1.5972900390625, -1.546173095703125, -1.49505615234375, -1.443939208984375, -1.392822265625, -1.341705322265625, -1.29058837890625, -1.239471435546875, -1.1883544921875, -1.137237548828125, -1.08612060546875, -1.035003662109375, -0.98388671875, -0.932769775390625, -0.88165283203125, -0.830535888671875, -0.7794189453125, -0.728302001953125, -0.67718505859375, -0.626068115234375, -0.574951171875, -0.523834228515625, -0.47271728515625, -0.421600341796875, -0.3704833984375, -0.319366455078125, -0.26824951171875, -0.217132568359375, -0.166015625, -0.114898681640625, -0.06378173828125, -0.012664794921875, 0.0384521484375, 0.089569091796875, 0.14068603515625, 0.191802978515625, 0.242919921875, 0.294036865234375, 0.34515380859375, 0.396270751953125, 0.4473876953125, 0.498504638671875, 0.54962158203125, 0.600738525390625, 0.65185546875, 0.702972412109375, 0.75408935546875, 0.805206298828125, 0.8563232421875, 0.907440185546875, 0.95855712890625, 1.009674072265625, 1.060791015625, 1.111907958984375, 1.16302490234375, 1.214141845703125, 1.2652587890625, 1.316375732421875, 1.36749267578125, 1.418609619140625, 1.4697265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 4.0, 10.0, 3.0, 6.0, 7.0, 8.0, 8.0, 11.0, 21.0, 13.0, 30.0, 22.0, 26.0, 23.0, 33.0, 38.0, 22.0, 23.0, 42.0, 38.0, 46.0, 52.0, 50.0, 47.0, 36.0, 38.0, 27.0, 44.0, 30.0, 27.0, 22.0, 32.0, 20.0, 20.0, 19.0, 12.0, 12.0, 13.0, 10.0, 7.0, 9.0, 6.0, 4.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.93603515625, -0.9051132202148438, -0.8741912841796875, -0.8432693481445312, -0.812347412109375, -0.7814254760742188, -0.7505035400390625, -0.7195816040039062, -0.68865966796875, -0.6577377319335938, -0.6268157958984375, -0.5958938598632812, -0.564971923828125, -0.5340499877929688, -0.5031280517578125, -0.47220611572265625, -0.4412841796875, -0.41036224365234375, -0.3794403076171875, -0.34851837158203125, -0.317596435546875, -0.28667449951171875, -0.2557525634765625, -0.22483062744140625, -0.19390869140625, -0.16298675537109375, -0.1320648193359375, -0.10114288330078125, -0.070220947265625, -0.03929901123046875, -0.0083770751953125, 0.02254486083984375, 0.053466796875, 0.08438873291015625, 0.1153106689453125, 0.14623260498046875, 0.177154541015625, 0.20807647705078125, 0.2389984130859375, 0.26992034912109375, 0.30084228515625, 0.33176422119140625, 0.3626861572265625, 0.39360809326171875, 0.424530029296875, 0.45545196533203125, 0.4863739013671875, 0.5172958374023438, 0.5482177734375, 0.5791397094726562, 0.6100616455078125, 0.6409835815429688, 0.671905517578125, 0.7028274536132812, 0.7337493896484375, 0.7646713256835938, 0.79559326171875, 0.8265151977539062, 0.8574371337890625, 0.8883590698242188, 0.919281005859375, 0.9502029418945312, 0.9811248779296875, 1.0120468139648438, 1.04296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 4.0, 11.0, 12.0, 11.0, 13.0, 31.0, 33.0, 34.0, 63.0, 61.0, 108.0, 156.0, 212.0, 316.0, 490.0, 857.0, 1684.0, 4142.0, 13515.0, 68983.0, 684425.0, 224801.0, 34384.0, 8044.0, 2886.0, 1265.0, 688.0, 404.0, 271.0, 176.0, 119.0, 101.0, 66.0, 36.0, 46.0, 30.0, 15.0, 21.0, 4.0, 10.0, 6.0, 5.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0], "bins": [-4.1484375, -4.03570556640625, -3.9229736328125, -3.81024169921875, -3.697509765625, -3.58477783203125, -3.4720458984375, -3.35931396484375, -3.24658203125, -3.13385009765625, -3.0211181640625, -2.90838623046875, -2.795654296875, -2.68292236328125, -2.5701904296875, -2.45745849609375, -2.3447265625, -2.23199462890625, -2.1192626953125, -2.00653076171875, -1.893798828125, -1.78106689453125, -1.6683349609375, -1.55560302734375, -1.44287109375, -1.33013916015625, -1.2174072265625, -1.10467529296875, -0.991943359375, -0.87921142578125, -0.7664794921875, -0.65374755859375, -0.541015625, -0.42828369140625, -0.3155517578125, -0.20281982421875, -0.090087890625, 0.02264404296875, 0.1353759765625, 0.24810791015625, 0.36083984375, 0.47357177734375, 0.5863037109375, 0.69903564453125, 0.811767578125, 0.92449951171875, 1.0372314453125, 1.14996337890625, 1.2626953125, 1.37542724609375, 1.4881591796875, 1.60089111328125, 1.713623046875, 1.82635498046875, 1.9390869140625, 2.05181884765625, 2.16455078125, 2.27728271484375, 2.3900146484375, 2.50274658203125, 2.615478515625, 2.72821044921875, 2.8409423828125, 2.95367431640625, 3.06640625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 9.0, 13.0, 11.0, 13.0, 14.0, 23.0, 19.0, 36.0, 36.0, 38.0, 52.0, 60.0, 73.0, 77.0, 73.0, 61.0, 64.0, 66.0, 52.0, 36.0, 39.0, 32.0, 23.0, 21.0, 11.0, 15.0, 8.0, 7.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.95703125, -5.783447265625, -5.60986328125, -5.436279296875, -5.2626953125, -5.089111328125, -4.91552734375, -4.741943359375, -4.568359375, -4.394775390625, -4.22119140625, -4.047607421875, -3.8740234375, -3.700439453125, -3.52685546875, -3.353271484375, -3.1796875, -3.006103515625, -2.83251953125, -2.658935546875, -2.4853515625, -2.311767578125, -2.13818359375, -1.964599609375, -1.791015625, -1.617431640625, -1.44384765625, -1.270263671875, -1.0966796875, -0.923095703125, -0.74951171875, -0.575927734375, -0.40234375, -0.228759765625, -0.05517578125, 0.118408203125, 0.2919921875, 0.465576171875, 0.63916015625, 0.812744140625, 0.986328125, 1.159912109375, 1.33349609375, 1.507080078125, 1.6806640625, 1.854248046875, 2.02783203125, 2.201416015625, 2.375, 2.548583984375, 2.72216796875, 2.895751953125, 3.0693359375, 3.242919921875, 3.41650390625, 3.590087890625, 3.763671875, 3.937255859375, 4.11083984375, 4.284423828125, 4.4580078125, 4.631591796875, 4.80517578125, 4.978759765625, 5.15234375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 11.0, 14.0, 21.0, 32.0, 40.0, 43.0, 77.0, 114.0, 209.0, 293.0, 616.0, 1152.0, 2633.0, 7276.0, 24870.0, 100615.0, 666028.0, 183734.0, 42228.0, 11495.0, 3657.0, 1557.0, 752.0, 418.0, 222.0, 130.0, 109.0, 51.0, 44.0, 22.0, 19.0, 13.0, 12.0, 10.0, 7.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6064453125, -0.5845489501953125, -0.562652587890625, -0.5407562255859375, -0.51885986328125, -0.4969635009765625, -0.475067138671875, -0.4531707763671875, -0.4312744140625, -0.4093780517578125, -0.387481689453125, -0.3655853271484375, -0.34368896484375, -0.3217926025390625, -0.299896240234375, -0.2779998779296875, -0.256103515625, -0.2342071533203125, -0.212310791015625, -0.1904144287109375, -0.16851806640625, -0.1466217041015625, -0.124725341796875, -0.1028289794921875, -0.0809326171875, -0.0590362548828125, -0.037139892578125, -0.0152435302734375, 0.00665283203125, 0.0285491943359375, 0.050445556640625, 0.0723419189453125, 0.09423828125, 0.1161346435546875, 0.138031005859375, 0.1599273681640625, 0.18182373046875, 0.2037200927734375, 0.225616455078125, 0.2475128173828125, 0.2694091796875, 0.2913055419921875, 0.313201904296875, 0.3350982666015625, 0.35699462890625, 0.3788909912109375, 0.400787353515625, 0.4226837158203125, 0.444580078125, 0.4664764404296875, 0.488372802734375, 0.5102691650390625, 0.53216552734375, 0.5540618896484375, 0.575958251953125, 0.5978546142578125, 0.6197509765625, 0.6416473388671875, 0.663543701171875, 0.6854400634765625, 0.70733642578125, 0.7292327880859375, 0.751129150390625, 0.7730255126953125, 0.794921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 8.0, 13.0, 19.0, 28.0, 35.0, 39.0, 59.0, 72.0, 100.0, 129.0, 117.0, 108.0, 75.0, 50.0, 37.0, 33.0, 23.0, 15.0, 7.0, 6.0, 6.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027680397033691406, -0.0002661310136318207, -0.0002554580569267273, -0.0002447851002216339, -0.00023411214351654053, -0.00022343918681144714, -0.00021276623010635376, -0.00020209327340126038, -0.000191420316696167, -0.0001807473599910736, -0.00017007440328598022, -0.00015940144658088684, -0.00014872848987579346, -0.00013805553317070007, -0.0001273825764656067, -0.0001167096197605133, -0.00010603666305541992, -9.536370635032654e-05, -8.469074964523315e-05, -7.401779294013977e-05, -6.334483623504639e-05, -5.2671879529953e-05, -4.199892282485962e-05, -3.1325966119766235e-05, -2.065300941467285e-05, -9.980052709579468e-06, 6.92903995513916e-07, 1.13658607006073e-05, 2.2038817405700684e-05, 3.271177411079407e-05, 4.338473081588745e-05, 5.4057687520980835e-05, 6.473064422607422e-05, 7.54036009311676e-05, 8.607655763626099e-05, 9.674951434135437e-05, 0.00010742247104644775, 0.00011809542775154114, 0.00012876838445663452, 0.0001394413411617279, 0.0001501142978668213, 0.00016078725457191467, 0.00017146021127700806, 0.00018213316798210144, 0.00019280612468719482, 0.0002034790813922882, 0.0002141520380973816, 0.00022482499480247498, 0.00023549795150756836, 0.00024617090821266174, 0.0002568438649177551, 0.0002675168216228485, 0.0002781897783279419, 0.0002888627350330353, 0.00029953569173812866, 0.00031020864844322205, 0.00032088160514831543, 0.0003315545618534088, 0.0003422275185585022, 0.0003529004752635956, 0.00036357343196868896, 0.00037424638867378235, 0.00038491934537887573, 0.0003955923020839691, 0.0004062652587890625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 10.0, 15.0, 12.0, 29.0, 26.0, 43.0, 54.0, 99.0, 153.0, 256.0, 453.0, 944.0, 2116.0, 6334.0, 26309.0, 160875.0, 725179.0, 99818.0, 17563.0, 4734.0, 1693.0, 806.0, 391.0, 212.0, 133.0, 97.0, 45.0, 36.0, 26.0, 27.0, 11.0, 11.0, 8.0, 8.0, 6.0, 7.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.82080078125, -0.7946395874023438, -0.7684783935546875, -0.7423171997070312, -0.716156005859375, -0.6899948120117188, -0.6638336181640625, -0.6376724243164062, -0.61151123046875, -0.5853500366210938, -0.5591888427734375, -0.5330276489257812, -0.506866455078125, -0.48070526123046875, -0.4545440673828125, -0.42838287353515625, -0.4022216796875, -0.37606048583984375, -0.3498992919921875, -0.32373809814453125, -0.297576904296875, -0.27141571044921875, -0.2452545166015625, -0.21909332275390625, -0.19293212890625, -0.16677093505859375, -0.1406097412109375, -0.11444854736328125, -0.088287353515625, -0.06212615966796875, -0.0359649658203125, -0.00980377197265625, 0.016357421875, 0.04251861572265625, 0.0686798095703125, 0.09484100341796875, 0.121002197265625, 0.14716339111328125, 0.1733245849609375, 0.19948577880859375, 0.22564697265625, 0.25180816650390625, 0.2779693603515625, 0.30413055419921875, 0.330291748046875, 0.35645294189453125, 0.3826141357421875, 0.40877532958984375, 0.4349365234375, 0.46109771728515625, 0.4872589111328125, 0.5134201049804688, 0.539581298828125, 0.5657424926757812, 0.5919036865234375, 0.6180648803710938, 0.64422607421875, 0.6703872680664062, 0.6965484619140625, 0.7227096557617188, 0.748870849609375, 0.7750320434570312, 0.8011932373046875, 0.8273544311523438, 0.853515625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 6.0, 5.0, 8.0, 15.0, 7.0, 20.0, 19.0, 22.0, 16.0, 37.0, 55.0, 51.0, 60.0, 71.0, 54.0, 74.0, 59.0, 63.0, 74.0, 57.0, 42.0, 34.0, 36.0, 19.0, 21.0, 16.0, 9.0, 11.0, 10.0, 4.0, 7.0, 7.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59130859375, -0.5698623657226562, -0.5484161376953125, -0.5269699096679688, -0.505523681640625, -0.48407745361328125, -0.4626312255859375, -0.44118499755859375, -0.41973876953125, -0.39829254150390625, -0.3768463134765625, -0.35540008544921875, -0.333953857421875, -0.31250762939453125, -0.2910614013671875, -0.26961517333984375, -0.2481689453125, -0.22672271728515625, -0.2052764892578125, -0.18383026123046875, -0.162384033203125, -0.14093780517578125, -0.1194915771484375, -0.09804534912109375, -0.07659912109375, -0.05515289306640625, -0.0337066650390625, -0.01226043701171875, 0.009185791015625, 0.03063201904296875, 0.0520782470703125, 0.07352447509765625, 0.094970703125, 0.11641693115234375, 0.1378631591796875, 0.15930938720703125, 0.180755615234375, 0.20220184326171875, 0.2236480712890625, 0.24509429931640625, 0.26654052734375, 0.28798675537109375, 0.3094329833984375, 0.33087921142578125, 0.352325439453125, 0.37377166748046875, 0.3952178955078125, 0.41666412353515625, 0.4381103515625, 0.45955657958984375, 0.4810028076171875, 0.5024490356445312, 0.523895263671875, 0.5453414916992188, 0.5667877197265625, 0.5882339477539062, 0.60968017578125, 0.6311264038085938, 0.6525726318359375, 0.6740188598632812, 0.695465087890625, 0.7169113159179688, 0.7383575439453125, 0.7598037719726562, 0.78125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 16.0, 18.0, 56.0, 117.0, 362.0, 223.0, 101.0, 50.0, 19.0, 16.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.81583786010742, -43.74491882324219, -42.67399597167969, -41.60307693481445, -40.53215789794922, -39.46123504638672, -38.390316009521484, -37.31939697265625, -36.24847412109375, -35.177555084228516, -34.106632232666016, -33.03571319580078, -31.964794158935547, -30.89387321472168, -29.822952270507812, -28.752033233642578, -27.681114196777344, -26.610193252563477, -25.539274215698242, -24.468353271484375, -23.39743423461914, -22.326513290405273, -21.255592346191406, -20.184673309326172, -19.113752365112305, -18.042831420898438, -16.971912384033203, -15.900991439819336, -14.830071449279785, -13.759151458740234, -12.688230514526367, -11.617310523986816, -10.546388626098633, -9.475468635559082, -8.404548645019531, -7.333627700805664, -6.262707710266113, -5.1917877197265625, -4.1208672523498535, -3.0499467849731445, -1.9790267944335938, -0.9081065654754639, 0.16281366348266602, 1.233733892440796, 2.304654121398926, 3.3755741119384766, 4.4464945793151855, 5.5174150466918945, 6.588335037231445, 7.659255027770996, 8.730175018310547, 9.801095962524414, 10.872015953063965, 11.942935943603516, 13.013856887817383, 14.084776878356934, 15.155696868896484, 16.22661781311035, 17.297536849975586, 18.368457794189453, 19.439376831054688, 20.510297775268555, 21.581218719482422, 22.652137756347656, 23.723058700561523]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 5.0, 0.0, 6.0, 6.0, 6.0, 8.0, 7.0, 8.0, 10.0, 9.0, 16.0, 12.0, 26.0, 21.0, 29.0, 23.0, 27.0, 27.0, 36.0, 97.0, 178.0, 86.0, 44.0, 30.0, 36.0, 17.0, 38.0, 24.0, 19.0, 25.0, 21.0, 19.0, 13.0, 11.0, 10.0, 11.0, 9.0, 5.0, 10.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-18.386028289794922, -17.867717742919922, -17.349407196044922, -16.831098556518555, -16.312788009643555, -15.794477462768555, -15.276167869567871, -14.757858276367188, -14.239547729492188, -13.721237182617188, -13.202927589416504, -12.68461799621582, -12.16630744934082, -11.64799690246582, -11.129687309265137, -10.611377716064453, -10.093067169189453, -9.574756622314453, -9.05644702911377, -8.538137435913086, -8.019826889038086, -7.501516819000244, -6.983206748962402, -6.4648966789245605, -5.946586608886719, -5.428276538848877, -4.909966468811035, -4.391656398773193, -3.8733463287353516, -3.3550362586975098, -2.836726188659668, -2.318416118621826, -1.8001060485839844, -1.2817959785461426, -0.7634859085083008, -0.24517583847045898, 0.2731342315673828, 0.7914443016052246, 1.3097543716430664, 1.8280644416809082, 2.34637451171875, 2.864684581756592, 3.3829946517944336, 3.9013047218322754, 4.419614791870117, 4.937924861907959, 5.456234931945801, 5.974545001983643, 6.492855072021484, 7.011165142059326, 7.529475212097168, 8.047784805297852, 8.566095352172852, 9.084405899047852, 9.602715492248535, 10.121025085449219, 10.639335632324219, 11.157646179199219, 11.675955772399902, 12.194265365600586, 12.712575912475586, 13.230886459350586, 13.74919605255127, 14.267505645751953, 14.785816192626953]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 13.0, 16.0, 20.0, 25.0, 53.0, 55.0, 111.0, 176.0, 240.0, 347.0, 545.0, 890.0, 1519.0, 2787.0, 5194.0, 11384.0, 29011.0, 88355.0, 283939.0, 835597.0, 1530565.0, 927123.0, 321501.0, 97700.0, 32116.0, 12242.0, 5642.0, 2848.0, 1609.0, 939.0, 605.0, 379.0, 234.0, 145.0, 118.0, 75.0, 36.0, 42.0, 26.0, 15.0, 4.0, 9.0, 10.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1953125, -1.15618896484375, -1.1170654296875, -1.07794189453125, -1.038818359375, -0.99969482421875, -0.9605712890625, -0.92144775390625, -0.88232421875, -0.84320068359375, -0.8040771484375, -0.76495361328125, -0.725830078125, -0.68670654296875, -0.6475830078125, -0.60845947265625, -0.5693359375, -0.53021240234375, -0.4910888671875, -0.45196533203125, -0.412841796875, -0.37371826171875, -0.3345947265625, -0.29547119140625, -0.25634765625, -0.21722412109375, -0.1781005859375, -0.13897705078125, -0.099853515625, -0.06072998046875, -0.0216064453125, 0.01751708984375, 0.056640625, 0.09576416015625, 0.1348876953125, 0.17401123046875, 0.213134765625, 0.25225830078125, 0.2913818359375, 0.33050537109375, 0.36962890625, 0.40875244140625, 0.4478759765625, 0.48699951171875, 0.526123046875, 0.56524658203125, 0.6043701171875, 0.64349365234375, 0.6826171875, 0.72174072265625, 0.7608642578125, 0.79998779296875, 0.839111328125, 0.87823486328125, 0.9173583984375, 0.95648193359375, 0.99560546875, 1.03472900390625, 1.0738525390625, 1.11297607421875, 1.152099609375, 1.19122314453125, 1.2303466796875, 1.26947021484375, 1.30859375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 7.0, 6.0, 16.0, 11.0, 10.0, 13.0, 18.0, 21.0, 18.0, 21.0, 48.0, 37.0, 35.0, 46.0, 49.0, 60.0, 59.0, 43.0, 52.0, 44.0, 40.0, 30.0, 24.0, 34.0, 37.0, 36.0, 17.0, 31.0, 26.0, 12.0, 21.0, 15.0, 9.0, 11.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.0224609375, -0.9902801513671875, -0.958099365234375, -0.9259185791015625, -0.89373779296875, -0.8615570068359375, -0.829376220703125, -0.7971954345703125, -0.7650146484375, -0.7328338623046875, -0.700653076171875, -0.6684722900390625, -0.63629150390625, -0.6041107177734375, -0.571929931640625, -0.5397491455078125, -0.507568359375, -0.4753875732421875, -0.443206787109375, -0.4110260009765625, -0.37884521484375, -0.3466644287109375, -0.314483642578125, -0.2823028564453125, -0.2501220703125, -0.2179412841796875, -0.185760498046875, -0.1535797119140625, -0.12139892578125, -0.0892181396484375, -0.057037353515625, -0.0248565673828125, 0.00732421875, 0.0395050048828125, 0.071685791015625, 0.1038665771484375, 0.13604736328125, 0.1682281494140625, 0.200408935546875, 0.2325897216796875, 0.2647705078125, 0.2969512939453125, 0.329132080078125, 0.3613128662109375, 0.39349365234375, 0.4256744384765625, 0.457855224609375, 0.4900360107421875, 0.522216796875, 0.5543975830078125, 0.586578369140625, 0.6187591552734375, 0.65093994140625, 0.6831207275390625, 0.715301513671875, 0.7474822998046875, 0.7796630859375, 0.8118438720703125, 0.844024658203125, 0.8762054443359375, 0.90838623046875, 0.9405670166015625, 0.972747802734375, 1.0049285888671875, 1.037109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 4.0, 5.0, 6.0, 22.0, 24.0, 52.0, 67.0, 121.0, 256.0, 483.0, 1132.0, 3280.0, 23887.0, 3600322.0, 551327.0, 9640.0, 2082.0, 766.0, 367.0, 178.0, 96.0, 67.0, 34.0, 21.0, 13.0, 9.0, 10.0, 2.0, 9.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.3160400390625, -6.089111328125, -5.8621826171875, -5.63525390625, -5.4083251953125, -5.181396484375, -4.9544677734375, -4.7275390625, -4.5006103515625, -4.273681640625, -4.0467529296875, -3.81982421875, -3.5928955078125, -3.365966796875, -3.1390380859375, -2.912109375, -2.6851806640625, -2.458251953125, -2.2313232421875, -2.00439453125, -1.7774658203125, -1.550537109375, -1.3236083984375, -1.0966796875, -0.8697509765625, -0.642822265625, -0.4158935546875, -0.18896484375, 0.0379638671875, 0.264892578125, 0.4918212890625, 0.71875, 0.9456787109375, 1.172607421875, 1.3995361328125, 1.62646484375, 1.8533935546875, 2.080322265625, 2.3072509765625, 2.5341796875, 2.7611083984375, 2.988037109375, 3.2149658203125, 3.44189453125, 3.6688232421875, 3.895751953125, 4.1226806640625, 4.349609375, 4.5765380859375, 4.803466796875, 5.0303955078125, 5.25732421875, 5.4842529296875, 5.711181640625, 5.9381103515625, 6.1650390625, 6.3919677734375, 6.618896484375, 6.8458251953125, 7.07275390625, 7.2996826171875, 7.526611328125, 7.7535400390625, 7.98046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 6.0, 3.0, 10.0, 13.0, 19.0, 39.0, 42.0, 85.0, 122.0, 148.0, 242.0, 352.0, 501.0, 656.0, 622.0, 408.0, 310.0, 176.0, 117.0, 72.0, 50.0, 27.0, 16.0, 8.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.046875, -4.916473388671875, -4.78607177734375, -4.655670166015625, -4.5252685546875, -4.394866943359375, -4.26446533203125, -4.134063720703125, -4.003662109375, -3.873260498046875, -3.74285888671875, -3.612457275390625, -3.4820556640625, -3.351654052734375, -3.22125244140625, -3.090850830078125, -2.96044921875, -2.830047607421875, -2.69964599609375, -2.569244384765625, -2.4388427734375, -2.308441162109375, -2.17803955078125, -2.047637939453125, -1.917236328125, -1.786834716796875, -1.65643310546875, -1.526031494140625, -1.3956298828125, -1.265228271484375, -1.13482666015625, -1.004425048828125, -0.8740234375, -0.743621826171875, -0.61322021484375, -0.482818603515625, -0.3524169921875, -0.222015380859375, -0.09161376953125, 0.038787841796875, 0.169189453125, 0.299591064453125, 0.42999267578125, 0.560394287109375, 0.6907958984375, 0.821197509765625, 0.95159912109375, 1.082000732421875, 1.21240234375, 1.342803955078125, 1.47320556640625, 1.603607177734375, 1.7340087890625, 1.864410400390625, 1.99481201171875, 2.125213623046875, 2.255615234375, 2.386016845703125, 2.51641845703125, 2.646820068359375, 2.7772216796875, 2.907623291015625, 3.03802490234375, 3.168426513671875, 3.298828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 11.0, 13.0, 30.0, 66.0, 115.0, 216.0, 230.0, 144.0, 82.0, 39.0, 20.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-76.03483581542969, -74.31876373291016, -72.6026840209961, -70.88661193847656, -69.17053985595703, -67.45446014404297, -65.73838806152344, -64.0223159790039, -62.30624008178711, -60.59016418457031, -58.87409210205078, -57.158016204833984, -55.44194030761719, -53.725868225097656, -52.00979232788086, -50.29371643066406, -48.57764434814453, -46.861568450927734, -45.1454963684082, -43.429420471191406, -41.71334457397461, -39.99727249145508, -38.28119659423828, -36.56512451171875, -34.84904479980469, -33.13296890258789, -31.416894912719727, -29.700820922851562, -27.9847469329834, -26.268672943115234, -24.552597045898438, -22.836523056030273, -21.12044906616211, -19.404375076293945, -17.68829917907715, -15.972225189208984, -14.25615119934082, -12.54007625579834, -10.82400131225586, -9.107927322387695, -7.391852378845215, -5.675777912139893, -3.959703207015991, -2.24362850189209, -0.5275540351867676, 1.1885204315185547, 2.904595375061035, 4.620669364929199, 6.33674430847168, 8.05281925201416, 9.768893241882324, 11.484968185424805, 13.201042175292969, 14.91711711883545, 16.63319206237793, 18.349266052246094, 20.06534194946289, 21.781415939331055, 23.49749183654785, 25.213565826416016, 26.92963981628418, 28.645713806152344, 30.36178970336914, 32.07786560058594, 33.79393768310547]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 5.0, 2.0, 7.0, 3.0, 10.0, 7.0, 11.0, 10.0, 15.0, 16.0, 31.0, 33.0, 25.0, 35.0, 26.0, 38.0, 45.0, 63.0, 61.0, 59.0, 52.0, 54.0, 52.0, 52.0, 49.0, 36.0, 31.0, 42.0, 25.0, 20.0, 24.0, 14.0, 12.0, 10.0, 9.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.1195068359375, -21.467880249023438, -20.816253662109375, -20.164628982543945, -19.513002395629883, -18.86137580871582, -18.20975112915039, -17.558124542236328, -16.906497955322266, -16.254871368408203, -15.603245735168457, -14.951620101928711, -14.299993515014648, -13.648366928100586, -12.99674129486084, -12.345115661621094, -11.693489074707031, -11.041862487792969, -10.390236854553223, -9.738611221313477, -9.086984634399414, -8.435358047485352, -7.7837324142456055, -7.132106304168701, -6.480480194091797, -5.828854084014893, -5.177227973937988, -4.525601863861084, -3.8739757537841797, -3.2223496437072754, -2.570723533630371, -1.9190974235534668, -1.2674713134765625, -0.6158452033996582, 0.035780906677246094, 0.6874070167541504, 1.3390331268310547, 1.990659236907959, 2.6422853469848633, 3.2939114570617676, 3.945537567138672, 4.597163677215576, 5.2487897872924805, 5.900415897369385, 6.552042007446289, 7.203668117523193, 7.855294227600098, 8.506919860839844, 9.158546447753906, 9.810173034667969, 10.461798667907715, 11.113424301147461, 11.765050888061523, 12.416677474975586, 13.068303108215332, 13.719928741455078, 14.37155532836914, 15.023181915283203, 15.67480754852295, 16.326433181762695, 16.978059768676758, 17.62968635559082, 18.28131103515625, 18.932937622070312, 19.584564208984375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 9.0, 1.0, 7.0, 16.0, 30.0, 33.0, 49.0, 77.0, 111.0, 215.0, 340.0, 584.0, 970.0, 1694.0, 3114.0, 5913.0, 12459.0, 28790.0, 74236.0, 239478.0, 474323.0, 124469.0, 45085.0, 18604.0, 8444.0, 4085.0, 2311.0, 1235.0, 740.0, 429.0, 258.0, 153.0, 114.0, 66.0, 34.0, 28.0, 19.0, 17.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.22265625, -2.1595916748046875, -2.096527099609375, -2.0334625244140625, -1.97039794921875, -1.9073333740234375, -1.844268798828125, -1.7812042236328125, -1.7181396484375, -1.6550750732421875, -1.592010498046875, -1.5289459228515625, -1.46588134765625, -1.4028167724609375, -1.339752197265625, -1.2766876220703125, -1.213623046875, -1.1505584716796875, -1.087493896484375, -1.0244293212890625, -0.96136474609375, -0.8983001708984375, -0.835235595703125, -0.7721710205078125, -0.7091064453125, -0.6460418701171875, -0.582977294921875, -0.5199127197265625, -0.45684814453125, -0.3937835693359375, -0.330718994140625, -0.2676544189453125, -0.20458984375, -0.1415252685546875, -0.078460693359375, -0.0153961181640625, 0.04766845703125, 0.1107330322265625, 0.173797607421875, 0.2368621826171875, 0.2999267578125, 0.3629913330078125, 0.426055908203125, 0.4891204833984375, 0.55218505859375, 0.6152496337890625, 0.678314208984375, 0.7413787841796875, 0.804443359375, 0.8675079345703125, 0.930572509765625, 0.9936370849609375, 1.05670166015625, 1.1197662353515625, 1.182830810546875, 1.2458953857421875, 1.3089599609375, 1.3720245361328125, 1.435089111328125, 1.4981536865234375, 1.56121826171875, 1.6242828369140625, 1.687347412109375, 1.7504119873046875, 1.8134765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 11.0, 5.0, 6.0, 9.0, 15.0, 19.0, 5.0, 19.0, 21.0, 27.0, 23.0, 26.0, 31.0, 39.0, 38.0, 58.0, 38.0, 54.0, 51.0, 48.0, 50.0, 48.0, 45.0, 44.0, 37.0, 34.0, 33.0, 33.0, 27.0, 13.0, 17.0, 12.0, 8.0, 15.0, 10.0, 7.0, 5.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3623046875, -1.3222808837890625, -1.282257080078125, -1.2422332763671875, -1.20220947265625, -1.1621856689453125, -1.122161865234375, -1.0821380615234375, -1.0421142578125, -1.0020904541015625, -0.962066650390625, -0.9220428466796875, -0.88201904296875, -0.8419952392578125, -0.801971435546875, -0.7619476318359375, -0.721923828125, -0.6819000244140625, -0.641876220703125, -0.6018524169921875, -0.56182861328125, -0.5218048095703125, -0.481781005859375, -0.4417572021484375, -0.4017333984375, -0.3617095947265625, -0.321685791015625, -0.2816619873046875, -0.24163818359375, -0.2016143798828125, -0.161590576171875, -0.1215667724609375, -0.08154296875, -0.0415191650390625, -0.001495361328125, 0.0385284423828125, 0.07855224609375, 0.1185760498046875, 0.158599853515625, 0.1986236572265625, 0.2386474609375, 0.2786712646484375, 0.318695068359375, 0.3587188720703125, 0.39874267578125, 0.4387664794921875, 0.478790283203125, 0.5188140869140625, 0.558837890625, 0.5988616943359375, 0.638885498046875, 0.6789093017578125, 0.71893310546875, 0.7589569091796875, 0.798980712890625, 0.8390045166015625, 0.8790283203125, 0.9190521240234375, 0.959075927734375, 0.9990997314453125, 1.03912353515625, 1.0791473388671875, 1.119171142578125, 1.1591949462890625, 1.19921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 11.0, 23.0, 18.0, 12.0, 21.0, 45.0, 63.0, 94.0, 135.0, 253.0, 394.0, 774.0, 1854.0, 5520.0, 26653.0, 593985.0, 383695.0, 25842.0, 5566.0, 1860.0, 714.0, 374.0, 240.0, 119.0, 68.0, 57.0, 48.0, 31.0, 17.0, 18.0, 9.0, 6.0, 4.0, 2.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.884765625, -3.76702880859375, -3.6492919921875, -3.53155517578125, -3.413818359375, -3.29608154296875, -3.1783447265625, -3.06060791015625, -2.94287109375, -2.82513427734375, -2.7073974609375, -2.58966064453125, -2.471923828125, -2.35418701171875, -2.2364501953125, -2.11871337890625, -2.0009765625, -1.88323974609375, -1.7655029296875, -1.64776611328125, -1.530029296875, -1.41229248046875, -1.2945556640625, -1.17681884765625, -1.05908203125, -0.94134521484375, -0.8236083984375, -0.70587158203125, -0.588134765625, -0.47039794921875, -0.3526611328125, -0.23492431640625, -0.1171875, 0.00054931640625, 0.1182861328125, 0.23602294921875, 0.353759765625, 0.47149658203125, 0.5892333984375, 0.70697021484375, 0.82470703125, 0.94244384765625, 1.0601806640625, 1.17791748046875, 1.295654296875, 1.41339111328125, 1.5311279296875, 1.64886474609375, 1.7666015625, 1.88433837890625, 2.0020751953125, 2.11981201171875, 2.237548828125, 2.35528564453125, 2.4730224609375, 2.59075927734375, 2.70849609375, 2.82623291015625, 2.9439697265625, 3.06170654296875, 3.179443359375, 3.29718017578125, 3.4149169921875, 3.53265380859375, 3.650390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 4.0, 9.0, 8.0, 10.0, 10.0, 13.0, 19.0, 20.0, 26.0, 28.0, 37.0, 29.0, 58.0, 56.0, 74.0, 86.0, 77.0, 74.0, 68.0, 56.0, 37.0, 34.0, 22.0, 20.0, 25.0, 11.0, 11.0, 9.0, 17.0, 13.0, 6.0, 6.0, 9.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6796875, -5.5029296875, -5.326171875, -5.1494140625, -4.97265625, -4.7958984375, -4.619140625, -4.4423828125, -4.265625, -4.0888671875, -3.912109375, -3.7353515625, -3.55859375, -3.3818359375, -3.205078125, -3.0283203125, -2.8515625, -2.6748046875, -2.498046875, -2.3212890625, -2.14453125, -1.9677734375, -1.791015625, -1.6142578125, -1.4375, -1.2607421875, -1.083984375, -0.9072265625, -0.73046875, -0.5537109375, -0.376953125, -0.2001953125, -0.0234375, 0.1533203125, 0.330078125, 0.5068359375, 0.68359375, 0.8603515625, 1.037109375, 1.2138671875, 1.390625, 1.5673828125, 1.744140625, 1.9208984375, 2.09765625, 2.2744140625, 2.451171875, 2.6279296875, 2.8046875, 2.9814453125, 3.158203125, 3.3349609375, 3.51171875, 3.6884765625, 3.865234375, 4.0419921875, 4.21875, 4.3955078125, 4.572265625, 4.7490234375, 4.92578125, 5.1025390625, 5.279296875, 5.4560546875, 5.6328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 6.0, 6.0, 7.0, 11.0, 11.0, 12.0, 30.0, 29.0, 31.0, 58.0, 86.0, 128.0, 215.0, 428.0, 864.0, 1871.0, 4669.0, 13846.0, 59549.0, 841393.0, 96217.0, 18551.0, 5956.0, 2352.0, 1046.0, 508.0, 239.0, 139.0, 87.0, 51.0, 39.0, 32.0, 20.0, 14.0, 21.0, 18.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.79150390625, -0.7698898315429688, -0.7482757568359375, -0.7266616821289062, -0.705047607421875, -0.6834335327148438, -0.6618194580078125, -0.6402053833007812, -0.61859130859375, -0.5969772338867188, -0.5753631591796875, -0.5537490844726562, -0.532135009765625, -0.5105209350585938, -0.4889068603515625, -0.46729278564453125, -0.4456787109375, -0.42406463623046875, -0.4024505615234375, -0.38083648681640625, -0.359222412109375, -0.33760833740234375, -0.3159942626953125, -0.29438018798828125, -0.27276611328125, -0.25115203857421875, -0.2295379638671875, -0.20792388916015625, -0.186309814453125, -0.16469573974609375, -0.1430816650390625, -0.12146759033203125, -0.099853515625, -0.07823944091796875, -0.0566253662109375, -0.03501129150390625, -0.013397216796875, 0.00821685791015625, 0.0298309326171875, 0.05144500732421875, 0.07305908203125, 0.09467315673828125, 0.1162872314453125, 0.13790130615234375, 0.159515380859375, 0.18112945556640625, 0.2027435302734375, 0.22435760498046875, 0.2459716796875, 0.26758575439453125, 0.2891998291015625, 0.31081390380859375, 0.332427978515625, 0.35404205322265625, 0.3756561279296875, 0.39727020263671875, 0.41888427734375, 0.44049835205078125, 0.4621124267578125, 0.48372650146484375, 0.505340576171875, 0.5269546508789062, 0.5485687255859375, 0.5701828002929688, 0.591796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 3.0, 5.0, 11.0, 9.0, 18.0, 13.0, 15.0, 27.0, 31.0, 34.0, 47.0, 73.0, 120.0, 120.0, 110.0, 94.0, 69.0, 28.0, 43.0, 26.0, 27.0, 12.0, 7.0, 9.0, 11.0, 7.0, 11.0, 3.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002486705780029297, -0.00024131685495376587, -0.00023396313190460205, -0.00022660940885543823, -0.00021925568580627441, -0.0002119019627571106, -0.00020454823970794678, -0.00019719451665878296, -0.00018984079360961914, -0.00018248707056045532, -0.0001751333475112915, -0.00016777962446212769, -0.00016042590141296387, -0.00015307217836380005, -0.00014571845531463623, -0.0001383647322654724, -0.0001310110092163086, -0.00012365728616714478, -0.00011630356311798096, -0.00010894984006881714, -0.00010159611701965332, -9.42423939704895e-05, -8.688867092132568e-05, -7.953494787216187e-05, -7.218122482299805e-05, -6.482750177383423e-05, -5.747377872467041e-05, -5.012005567550659e-05, -4.2766332626342773e-05, -3.5412609577178955e-05, -2.8058886528015137e-05, -2.070516347885132e-05, -1.33514404296875e-05, -5.997717380523682e-06, 1.3560056686401367e-06, 8.709728717803955e-06, 1.6063451766967773e-05, 2.3417174816131592e-05, 3.077089786529541e-05, 3.812462091445923e-05, 4.547834396362305e-05, 5.2832067012786865e-05, 6.0185790061950684e-05, 6.75395131111145e-05, 7.489323616027832e-05, 8.224695920944214e-05, 8.960068225860596e-05, 9.695440530776978e-05, 0.0001043081283569336, 0.00011166185140609741, 0.00011901557445526123, 0.00012636929750442505, 0.00013372302055358887, 0.00014107674360275269, 0.0001484304666519165, 0.00015578418970108032, 0.00016313791275024414, 0.00017049163579940796, 0.00017784535884857178, 0.0001851990818977356, 0.00019255280494689941, 0.00019990652799606323, 0.00020726025104522705, 0.00021461397409439087, 0.0002219676971435547]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 6.0, 12.0, 11.0, 15.0, 35.0, 35.0, 67.0, 85.0, 131.0, 241.0, 420.0, 795.0, 1702.0, 3906.0, 10603.0, 36027.0, 242603.0, 692884.0, 39414.0, 11563.0, 4323.0, 1700.0, 887.0, 411.0, 240.0, 138.0, 97.0, 54.0, 42.0, 32.0, 16.0, 14.0, 8.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5478515625, -0.5322151184082031, -0.5165786743164062, -0.5009422302246094, -0.4853057861328125, -0.4696693420410156, -0.45403289794921875, -0.4383964538574219, -0.422760009765625, -0.4071235656738281, -0.39148712158203125, -0.3758506774902344, -0.3602142333984375, -0.3445777893066406, -0.32894134521484375, -0.3133049011230469, -0.29766845703125, -0.2820320129394531, -0.26639556884765625, -0.2507591247558594, -0.2351226806640625, -0.21948623657226562, -0.20384979248046875, -0.18821334838867188, -0.172576904296875, -0.15694046020507812, -0.14130401611328125, -0.12566757202148438, -0.1100311279296875, -0.09439468383789062, -0.07875823974609375, -0.06312179565429688, -0.0474853515625, -0.031848907470703125, -0.01621246337890625, -0.000576019287109375, 0.0150604248046875, 0.030696868896484375, 0.04633331298828125, 0.061969757080078125, 0.077606201171875, 0.09324264526367188, 0.10887908935546875, 0.12451553344726562, 0.1401519775390625, 0.15578842163085938, 0.17142486572265625, 0.18706130981445312, 0.20269775390625, 0.21833419799804688, 0.23397064208984375, 0.24960708618164062, 0.2652435302734375, 0.2808799743652344, 0.29651641845703125, 0.3121528625488281, 0.327789306640625, 0.3434257507324219, 0.35906219482421875, 0.3746986389160156, 0.3903350830078125, 0.4059715270996094, 0.42160797119140625, 0.4372444152832031, 0.452880859375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 3.0, 1.0, 10.0, 9.0, 16.0, 14.0, 17.0, 33.0, 30.0, 31.0, 56.0, 82.0, 97.0, 116.0, 100.0, 97.0, 71.0, 43.0, 39.0, 29.0, 15.0, 17.0, 17.0, 6.0, 8.0, 5.0, 9.0, 1.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.72705078125, -0.7056045532226562, -0.6841583251953125, -0.6627120971679688, -0.641265869140625, -0.6198196411132812, -0.5983734130859375, -0.5769271850585938, -0.55548095703125, -0.5340347290039062, -0.5125885009765625, -0.49114227294921875, -0.469696044921875, -0.44824981689453125, -0.4268035888671875, -0.40535736083984375, -0.3839111328125, -0.36246490478515625, -0.3410186767578125, -0.31957244873046875, -0.298126220703125, -0.27667999267578125, -0.2552337646484375, -0.23378753662109375, -0.21234130859375, -0.19089508056640625, -0.1694488525390625, -0.14800262451171875, -0.126556396484375, -0.10511016845703125, -0.0836639404296875, -0.06221771240234375, -0.040771484375, -0.01932525634765625, 0.0021209716796875, 0.02356719970703125, 0.045013427734375, 0.06645965576171875, 0.0879058837890625, 0.10935211181640625, 0.13079833984375, 0.15224456787109375, 0.1736907958984375, 0.19513702392578125, 0.216583251953125, 0.23802947998046875, 0.2594757080078125, 0.28092193603515625, 0.3023681640625, 0.32381439208984375, 0.3452606201171875, 0.36670684814453125, 0.388153076171875, 0.40959930419921875, 0.4310455322265625, 0.45249176025390625, 0.47393798828125, 0.49538421630859375, 0.5168304443359375, 0.5382766723632812, 0.559722900390625, 0.5811691284179688, 0.6026153564453125, 0.6240615844726562, 0.6455078125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 15.0, 32.0, 66.0, 87.0, 510.0, 127.0, 67.0, 42.0, 22.0, 11.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.34033966064453, -40.39403533935547, -39.44772720336914, -38.50142288208008, -37.555118560791016, -36.60881042480469, -35.662506103515625, -34.71620178222656, -33.769893646240234, -32.82358932495117, -31.877283096313477, -30.93097686767578, -29.984670639038086, -29.03836441040039, -28.092060089111328, -27.145753860473633, -26.19944953918457, -25.253143310546875, -24.306838989257812, -23.360532760620117, -22.414226531982422, -21.46792221069336, -20.521615982055664, -19.57530975341797, -18.629005432128906, -17.68269920349121, -16.73639488220215, -15.790088653564453, -14.843782424926758, -13.897477149963379, -12.951171875, -12.004865646362305, -11.05855941772461, -10.11225414276123, -9.165947914123535, -8.219642639160156, -7.273336887359619, -6.327031135559082, -5.380725860595703, -4.434420108795166, -3.488114356994629, -2.541808605194092, -1.5955030918121338, -0.6491975784301758, 0.29710817337036133, 1.2434139251708984, 2.1897192001342773, 3.1360249519348145, 4.082330703735352, 5.028636455535889, 5.974942207336426, 6.921247482299805, 7.867553234100342, 8.813858985900879, 9.760164260864258, 10.706470489501953, 11.652775764465332, 12.599081039428711, 13.545387268066406, 14.491692543029785, 15.437997817993164, 16.38430404663086, 17.330608367919922, 18.276914596557617, 19.223220825195312]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 6.0, 2.0, 3.0, 6.0, 5.0, 12.0, 15.0, 9.0, 18.0, 8.0, 18.0, 18.0, 27.0, 42.0, 28.0, 32.0, 94.0, 325.0, 100.0, 37.0, 29.0, 20.0, 17.0, 16.0, 20.0, 17.0, 10.0, 18.0, 11.0, 9.0, 10.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-18.823379516601562, -18.32134246826172, -17.819303512573242, -17.3172664642334, -16.815227508544922, -16.313190460205078, -15.811152458190918, -15.309114456176758, -14.807076454162598, -14.305038452148438, -13.803000450134277, -13.300962448120117, -12.798925399780273, -12.296886444091797, -11.794849395751953, -11.292811393737793, -10.790773391723633, -10.288735389709473, -9.786697387695312, -9.284659385681152, -8.782621383666992, -8.280584335327148, -7.778546333312988, -7.276508331298828, -6.774470329284668, -6.272432327270508, -5.770394325256348, -5.268356800079346, -4.7663187980651855, -4.264280796051025, -3.7622430324554443, -3.2602052688598633, -2.7581663131713867, -2.2561283111572266, -1.7540905475616455, -1.252052664756775, -0.7500147819519043, -0.24797677993774414, 0.2540609836578369, 0.756098747253418, 1.2581367492675781, 1.7601746320724487, 2.2622125148773193, 2.7642502784729004, 3.2662882804870605, 3.7683262825012207, 4.270363807678223, 4.772401809692383, 5.274439811706543, 5.776477813720703, 6.278515815734863, 6.780553340911865, 7.282591342926025, 7.7846293449401855, 8.286666870117188, 8.788704872131348, 9.290742874145508, 9.792780876159668, 10.294818878173828, 10.796856880187988, 11.298894882202148, 11.800931930541992, 12.302969932556152, 12.805007934570312, 13.307045936584473]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 8.0, 13.0, 7.0, 10.0, 7.0, 9.0, 6.0, 22.0, 12.0, 14.0, 15.0, 24.0, 20.0, 33.0, 41.0, 38.0, 82.0, 184.0, 108.0, 55.0, 28.0, 32.0, 40.0, 23.0, 24.0, 17.0, 14.0, 18.0, 15.0, 9.0, 10.0, 10.0, 10.0, 6.0, 4.0, 5.0, 7.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9736328125, -0.9417266845703125, -0.909820556640625, -0.8779144287109375, -0.84600830078125, -0.8141021728515625, -0.782196044921875, -0.7502899169921875, -0.7183837890625, -0.6864776611328125, -0.654571533203125, -0.6226654052734375, -0.59075927734375, -0.5588531494140625, -0.526947021484375, -0.4950408935546875, -0.463134765625, -0.4312286376953125, -0.399322509765625, -0.3674163818359375, -0.33551025390625, -0.3036041259765625, -0.271697998046875, -0.2397918701171875, -0.2078857421875, -0.1759796142578125, -0.144073486328125, -0.1121673583984375, -0.08026123046875, -0.0483551025390625, -0.016448974609375, 0.0154571533203125, 0.04736328125, 0.0792694091796875, 0.111175537109375, 0.1430816650390625, 0.17498779296875, 0.2068939208984375, 0.238800048828125, 0.2707061767578125, 0.3026123046875, 0.3345184326171875, 0.366424560546875, 0.3983306884765625, 0.43023681640625, 0.4621429443359375, 0.494049072265625, 0.5259552001953125, 0.557861328125, 0.5897674560546875, 0.621673583984375, 0.6535797119140625, 0.68548583984375, 0.7173919677734375, 0.749298095703125, 0.7812042236328125, 0.8131103515625, 0.8450164794921875, 0.876922607421875, 0.9088287353515625, 0.94073486328125, 0.9726409912109375, 1.004547119140625, 1.0364532470703125, 1.068359375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 5.0, 2.0, 0.0, 7.0, 0.0, 8.0, 4.0, 9.0, 6.0, 4.0, 15.0, 21.0, 23.0, 45.0, 90.0, 156.0, 321.0, 1052.0, 4136.0, 39021.0, 8331728.0, 8890.0, 1930.0, 564.0, 220.0, 108.0, 63.0, 23.0, 26.0, 22.0, 26.0, 2.0, 7.0, 9.0, 6.0, 4.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 5.0, 4.0], "bins": [-13.309447288513184, -12.883353233337402, -12.457258224487305, -12.031164169311523, -11.605069160461426, -11.178975105285645, -10.752880096435547, -10.326786041259766, -9.900691032409668, -9.474596977233887, -9.048501968383789, -8.622407913208008, -8.19631290435791, -7.770218849182129, -7.344123840332031, -6.91802978515625, -6.4919352531433105, -6.065840721130371, -5.639746189117432, -5.213651657104492, -4.787557125091553, -4.361462593078613, -3.935368299484253, -3.5092737674713135, -3.083179235458374, -2.6570847034454346, -2.230990171432495, -1.8048957586288452, -1.3788012266159058, -0.9527068138122559, -0.5266122817993164, -0.10051774978637695, 0.3255767822265625, 0.751671314239502, 1.1777658462524414, 1.6038602590560913, 2.0299549102783203, 2.4560492038726807, 2.88214373588562, 3.3082382678985596, 3.734332799911499, 4.160427093505859, 4.586521625518799, 5.012616157531738, 5.438710689544678, 5.864805221557617, 6.290899753570557, 6.716994285583496, 7.1430888175964355, 7.569183349609375, 7.9952778816223145, 8.421372413635254, 8.847466468811035, 9.273561477661133, 9.699655532836914, 10.125750541687012, 10.551844596862793, 10.977938652038574, 11.404033660888672, 11.830127716064453, 12.25622272491455, 12.682316780090332, 13.10841178894043, 13.534505844116211, 13.960600852966309]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 7.0, 5.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 1.0, 6.0, 4.0, 3.0, 6.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.521769523620605, -11.245092391967773, -10.968414306640625, -10.691737174987793, -10.415060043334961, -10.138382911682129, -9.86170482635498, -9.585027694702148, -9.308350563049316, -9.031673431396484, -8.754995346069336, -8.478318214416504, -8.201641082763672, -7.924963474273682, -7.648285865783691, -7.371608734130859, -7.094931125640869, -6.818253517150879, -6.541576385498047, -6.264898777008057, -5.988221645355225, -5.711544036865234, -5.434866905212402, -5.158189296722412, -4.881511688232422, -4.604834079742432, -4.3281569480896, -4.051479339599609, -3.7748022079467773, -3.498124599456787, -3.221447229385376, -2.944769859313965, -2.6680922508239746, -2.3914148807525635, -2.1147375106811523, -1.8380600214004517, -1.5613826513290405, -1.2847052812576294, -1.0080277919769287, -0.7313504219055176, -0.45467305183410645, -0.17799565196037292, 0.0986817479133606, 0.3753591775894165, 0.6520365476608276, 0.9287139177322388, 1.2053914070129395, 1.4820687770843506, 1.7587461471557617, 2.035423517227173, 2.312100887298584, 2.588778495788574, 2.8654556274414062, 3.1421332359313965, 3.4188106060028076, 3.6954879760742188, 3.97216534614563, 4.248842716217041, 4.525520324707031, 4.802197456359863, 5.0788750648498535, 5.3555521965026855, 5.632229804992676, 5.908906936645508, 6.185584545135498]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 1.0, 7.0, 12.0, 20.0, 20.0, 31.0, 46.0, 55.0, 91.0, 148.0, 253.0, 481.0, 949.0, 2207.0, 5936.0, 16898.0, 51651.0, 158694.0, 189592.0, 64860.0, 20375.0, 7079.0, 2688.0, 991.0, 487.0, 248.0, 144.0, 88.0, 62.0, 40.0, 30.0, 23.0, 10.0, 13.0, 11.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-12.6015625, -12.2525634765625, -11.903564453125, -11.5545654296875, -11.20556640625, -10.8565673828125, -10.507568359375, -10.1585693359375, -9.8095703125, -9.4605712890625, -9.111572265625, -8.7625732421875, -8.41357421875, -8.0645751953125, -7.715576171875, -7.3665771484375, -7.017578125, -6.6685791015625, -6.319580078125, -5.9705810546875, -5.62158203125, -5.2725830078125, -4.923583984375, -4.5745849609375, -4.2255859375, -3.8765869140625, -3.527587890625, -3.1785888671875, -2.82958984375, -2.4805908203125, -2.131591796875, -1.7825927734375, -1.43359375, -1.0845947265625, -0.735595703125, -0.3865966796875, -0.03759765625, 0.3114013671875, 0.660400390625, 1.0093994140625, 1.3583984375, 1.7073974609375, 2.056396484375, 2.4053955078125, 2.75439453125, 3.1033935546875, 3.452392578125, 3.8013916015625, 4.150390625, 4.4993896484375, 4.848388671875, 5.1973876953125, 5.54638671875, 5.8953857421875, 6.244384765625, 6.5933837890625, 6.9423828125, 7.2913818359375, 7.640380859375, 7.9893798828125, 8.33837890625, 8.6873779296875, 9.036376953125, 9.3853759765625, 9.734375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 7.0, 6.0, 10.0, 15.0, 12.0, 15.0, 18.0, 21.0, 33.0, 30.0, 48.0, 53.0, 68.0, 72.0, 71.0, 69.0, 60.0, 56.0, 54.0, 59.0, 32.0, 35.0, 33.0, 29.0, 9.0, 12.0, 17.0, 6.0, 8.0, 7.0, 9.0, 5.0, 1.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.818359375, -1.7715301513671875, -1.724700927734375, -1.6778717041015625, -1.63104248046875, -1.5842132568359375, -1.537384033203125, -1.4905548095703125, -1.4437255859375, -1.3968963623046875, -1.350067138671875, -1.3032379150390625, -1.25640869140625, -1.2095794677734375, -1.162750244140625, -1.1159210205078125, -1.069091796875, -1.0222625732421875, -0.975433349609375, -0.9286041259765625, -0.88177490234375, -0.8349456787109375, -0.788116455078125, -0.7412872314453125, -0.6944580078125, -0.6476287841796875, -0.600799560546875, -0.5539703369140625, -0.50714111328125, -0.4603118896484375, -0.413482666015625, -0.3666534423828125, -0.31982421875, -0.2729949951171875, -0.226165771484375, -0.1793365478515625, -0.13250732421875, -0.0856781005859375, -0.038848876953125, 0.0079803466796875, 0.0548095703125, 0.1016387939453125, 0.148468017578125, 0.1952972412109375, 0.24212646484375, 0.2889556884765625, 0.335784912109375, 0.3826141357421875, 0.429443359375, 0.4762725830078125, 0.523101806640625, 0.5699310302734375, 0.61676025390625, 0.6635894775390625, 0.710418701171875, 0.7572479248046875, 0.8040771484375, 0.8509063720703125, 0.897735595703125, 0.9445648193359375, 0.99139404296875, 1.0382232666015625, 1.085052490234375, 1.1318817138671875, 1.1787109375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 8.0, 2.0, 6.0, 11.0, 13.0, 29.0, 49.0, 83.0, 117.0, 75.0, 39.0, 18.0, 7.0, 6.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.193470001220703, -8.796862602233887, -8.400256156921387, -8.00364875793457, -7.607041835784912, -7.210434913635254, -6.813827991485596, -6.4172210693359375, -6.020613670349121, -5.624006748199463, -5.227399826049805, -4.830792427062988, -4.43418550491333, -4.037578582763672, -3.6409716606140137, -3.2443645000457764, -2.8477578163146973, -2.451150894165039, -2.0545437335968018, -1.6579368114471436, -1.2613297700881958, -0.864722728729248, -0.46811580657958984, -0.07150864601135254, 0.32509827613830566, 0.7217053174972534, 1.1183123588562012, 1.5149192810058594, 1.9115263223648071, 2.308133363723755, 2.704740285873413, 3.1013474464416504, 3.4979543685913086, 3.894561290740967, 4.291168212890625, 4.687775611877441, 5.0843825340271, 5.480989456176758, 5.877596378326416, 6.274203300476074, 6.670810699462891, 7.067417621612549, 7.464024543762207, 7.860631942749023, 8.257238388061523, 8.65384578704834, 9.050453186035156, 9.447059631347656, 9.843666076660156, 10.240273475646973, 10.636879920959473, 11.033487319946289, 11.430093765258789, 11.826701164245605, 12.223308563232422, 12.619915008544922, 13.016522407531738, 13.413129806518555, 13.809736251831055, 14.206343650817871, 14.602950096130371, 14.999557495117188, 15.396163940429688, 15.792771339416504, 16.18937873840332]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 2.0, 5.0, 11.0, 10.0, 23.0, 47.0, 64.0, 75.0, 73.0, 59.0, 33.0, 20.0, 9.0, 6.0, 7.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.668726921081543, -6.446429252624512, -6.224132061004639, -6.001834392547607, -5.779537200927734, -5.557239532470703, -5.334941864013672, -5.112644195556641, -4.890347003936768, -4.668049335479736, -4.445752143859863, -4.223454475402832, -4.001156806945801, -3.7788596153259277, -3.5565619468688965, -3.3342645168304443, -3.111967086791992, -2.88966965675354, -2.667372226715088, -2.4450745582580566, -2.2227771282196045, -2.0004796981811523, -1.7781821489334106, -1.555884599685669, -1.3335871696472168, -1.1112897396087646, -0.888992190361023, -0.666694700717926, -0.4443972110748291, -0.22209978103637695, 0.0001977682113647461, 0.22249531745910645, 0.4447932243347168, 0.6670907139778137, 0.8893882036209106, 1.1116857528686523, 1.3339831829071045, 1.5562806129455566, 1.7785781621932983, 2.00087571144104, 2.223173141479492, 2.4454705715179443, 2.6677680015563965, 2.8900656700134277, 3.11236310005188, 3.334660530090332, 3.5569581985473633, 3.7792556285858154, 4.001553058624268, 4.223850727081299, 4.446147918701172, 4.668445587158203, 4.890743255615234, 5.113040447235107, 5.335338115692139, 5.557635307312012, 5.779932975769043, 6.002230644226074, 6.224527835845947, 6.4468255043029785, 6.669122695922852, 6.891420364379883, 7.113718032836914, 7.336015701293945, 7.558312892913818]}, "eval/loss": 4.172859191894531, "eval/wer": 2.3791352637842125, "eval/runtime": 933.3183, "eval/samples_per_second": 2.831, "eval/steps_per_second": 0.237, "train/train_runtime": 6714.5583, "train/train_samples_per_second": 4.25, "train/train_steps_per_second": 0.177, "train/total_flos": 0.0, "train/train_loss": 4.242165094268132} \ No newline at end of file