diff --git "a/wandb/run-20220310_205608-mf17w61i/files/wandb-summary.json" "b/wandb/run-20220310_205608-mf17w61i/files/wandb-summary.json" --- "a/wandb/run-20220310_205608-mf17w61i/files/wandb-summary.json" +++ "b/wandb/run-20220310_205608-mf17w61i/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 5.844, "train/learning_rate": 2.1101543942992875e-05, "train/epoch": 6.73, "train/global_step": 6000, "_runtime": 40115, "_timestamp": 1646985883, "_step": 6003, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 38.0, 7.0, 6.0, 5.0, 1.0, 2.0, 2.0, 4.0, 1.0, 30272.0, 111.0, 35.0, 9.0, 6.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-101.9375, -99.916259765625, -97.89501953125, -95.873779296875, -93.8525390625, -91.831298828125, -89.81005859375, -87.788818359375, -85.767578125, -83.746337890625, -81.72509765625, -79.703857421875, -77.6826171875, -75.661376953125, -73.64013671875, -71.618896484375, -69.59765625, -67.576416015625, -65.55517578125, -63.533935546875, -61.5126953125, -59.491455078125, -57.47021484375, -55.448974609375, -53.427734375, -51.406494140625, -49.38525390625, -47.364013671875, -45.3427734375, -43.321533203125, -41.30029296875, -39.279052734375, -37.2578125, -35.236572265625, -33.21533203125, -31.194091796875, -29.1728515625, -27.151611328125, -25.13037109375, -23.109130859375, -21.087890625, -19.066650390625, -17.04541015625, -15.024169921875, -13.0029296875, -10.981689453125, -8.96044921875, -6.939208984375, -4.91796875, -2.896728515625, -0.87548828125, 1.145751953125, 3.1669921875, 5.188232421875, 7.20947265625, 9.230712890625, 11.251953125, 13.273193359375, 15.29443359375, 17.315673828125, 19.3369140625, 21.358154296875, 23.37939453125, 25.400634765625, 27.421875]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 48.0, 532.0, 374.0, 45.0, 14.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.6417236328125, -49.66939926147461, -44.69707489013672, -39.72474670410156, -34.75242614746094, -29.780099868774414, -24.80777359008789, -19.83544921875, -14.86312484741211, -9.890800476074219, -4.918475151062012, 0.05385017395019531, 5.026174545288086, 9.998498916625977, 14.9708251953125, 19.94314956665039, 24.91547393798828, 29.887798309326172, 34.86012268066406, 39.83245086669922, 44.804771423339844, 49.777099609375, 54.74942398071289, 59.72174835205078, 64.69407653808594, 69.6664047241211, 74.63872528076172, 79.61105346679688, 84.5833740234375, 89.55570220947266, 94.52803039550781, 99.50035095214844, 104.47267150878906, 109.44499969482422, 114.41732025146484, 119.3896484375, 124.36196899414062, 129.33428955078125, 134.30662536621094, 139.27894592285156, 144.2512664794922, 149.2235870361328, 154.1959228515625, 159.16824340820312, 164.14056396484375, 169.11288452148438, 174.08522033691406, 179.0575408935547, 184.02987670898438, 189.002197265625, 193.9745330810547, 198.9468536376953, 203.91917419433594, 208.89149475097656, 213.86383056640625, 218.83615112304688, 223.8084716796875, 228.78079223632812, 233.7531280517578, 238.72544860839844, 243.69776916503906, 248.6700897216797, 253.64242553710938, 258.61474609375, 263.5870666503906]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 4.0, 3.0, 6.0, 6.0, 10.0, 8.0, 26.0, 33.0, 31.0, 33.0, 28.0, 59.0, 47.0, 55.0, 62.0, 74.0, 80.0, 63.0, 63.0, 55.0, 50.0, 50.0, 20.0, 20.0, 28.0, 21.0, 16.0, 20.0, 14.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.506927490234375, -40.40613555908203, -39.30533981323242, -38.20454788208008, -37.10375213623047, -36.002960205078125, -34.902164459228516, -33.80137252807617, -32.70057678222656, -31.599782943725586, -30.49898910522461, -29.398195266723633, -28.297401428222656, -27.19660758972168, -26.095813751220703, -24.99502182006836, -23.894227981567383, -22.793434143066406, -21.69264030456543, -20.591846466064453, -19.491052627563477, -18.3902587890625, -17.289466857910156, -16.188671112060547, -15.087878227233887, -13.98708438873291, -12.886290550231934, -11.785497665405273, -10.684703826904297, -9.58390998840332, -8.483116149902344, -7.382322311401367, -6.281528472900391, -5.180734634399414, -4.0799407958984375, -2.979147434234619, -1.8783535957336426, -0.777559757232666, 0.32323360443115234, 1.424027442932129, 2.5248212814331055, 3.625615119934082, 4.726408958435059, 5.827202320098877, 6.9279961585998535, 8.028789520263672, 9.129583358764648, 10.230377197265625, 11.331171035766602, 12.431964874267578, 13.532758712768555, 14.633552551269531, 15.734346389770508, 16.835140228271484, 17.935932159423828, 19.036727905273438, 20.13751983642578, 21.238313674926758, 22.339107513427734, 23.43990135192871, 24.540695190429688, 25.641489028930664, 26.74228286743164, 27.843074798583984, 28.943870544433594]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 7.0, 12.0, 20.0, 24.0, 27.0, 40.0, 106.0, 169.0, 313.0, 591.0, 1295.0, 2823.0, 7122.0, 19642.0, 60216.0, 184116.0, 427858.0, 227193.0, 76924.0, 24721.0, 8839.0, 3467.0, 1500.0, 723.0, 353.0, 169.0, 108.0, 62.0, 48.0, 26.0, 11.0, 11.0, 9.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-73.875, -71.85693359375, -69.8388671875, -67.82080078125, -65.802734375, -63.78466796875, -61.7666015625, -59.74853515625, -57.73046875, -55.71240234375, -53.6943359375, -51.67626953125, -49.658203125, -47.64013671875, -45.6220703125, -43.60400390625, -41.5859375, -39.56787109375, -37.5498046875, -35.53173828125, -33.513671875, -31.49560546875, -29.4775390625, -27.45947265625, -25.44140625, -23.42333984375, -21.4052734375, -19.38720703125, -17.369140625, -15.35107421875, -13.3330078125, -11.31494140625, -9.296875, -7.27880859375, -5.2607421875, -3.24267578125, -1.224609375, 0.79345703125, 2.8115234375, 4.82958984375, 6.84765625, 8.86572265625, 10.8837890625, 12.90185546875, 14.919921875, 16.93798828125, 18.9560546875, 20.97412109375, 22.9921875, 25.01025390625, 27.0283203125, 29.04638671875, 31.064453125, 33.08251953125, 35.1005859375, 37.11865234375, 39.13671875, 41.15478515625, 43.1728515625, 45.19091796875, 47.208984375, 49.22705078125, 51.2451171875, 53.26318359375, 55.28125]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 11.0, 19.0, 33.0, 25.0, 25.0, 32.0, 49.0, 43.0, 55.0, 68.0, 91.0, 113.0, 61.0, 60.0, 61.0, 47.0, 42.0, 31.0, 20.0, 18.0, 24.0, 14.0, 14.0, 12.0, 7.0, 8.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.96875, -27.271240234375, -26.57373046875, -25.876220703125, -25.1787109375, -24.481201171875, -23.78369140625, -23.086181640625, -22.388671875, -21.691162109375, -20.99365234375, -20.296142578125, -19.5986328125, -18.901123046875, -18.20361328125, -17.506103515625, -16.80859375, -16.111083984375, -15.41357421875, -14.716064453125, -14.0185546875, -13.321044921875, -12.62353515625, -11.926025390625, -11.228515625, -10.531005859375, -9.83349609375, -9.135986328125, -8.4384765625, -7.740966796875, -7.04345703125, -6.345947265625, -5.6484375, -4.950927734375, -4.25341796875, -3.555908203125, -2.8583984375, -2.160888671875, -1.46337890625, -0.765869140625, -0.068359375, 0.629150390625, 1.32666015625, 2.024169921875, 2.7216796875, 3.419189453125, 4.11669921875, 4.814208984375, 5.51171875, 6.209228515625, 6.90673828125, 7.604248046875, 8.3017578125, 8.999267578125, 9.69677734375, 10.394287109375, 11.091796875, 11.789306640625, 12.48681640625, 13.184326171875, 13.8818359375, 14.579345703125, 15.27685546875, 15.974365234375, 16.671875]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 8.0, 6.0, 9.0, 9.0, 15.0, 30.0, 37.0, 36.0, 60.0, 66.0, 78.0, 92.0, 96.0, 87.0, 88.0, 69.0, 68.0, 43.0, 21.0, 27.0, 17.0, 18.0, 9.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.93404197692871, -17.926294326782227, -16.91854476928711, -15.910797119140625, -14.903048515319824, -13.895299911499023, -12.887552261352539, -11.879803657531738, -10.872055053710938, -9.864306449890137, -8.856557846069336, -7.848810195922852, -6.841061592102051, -5.83331298828125, -4.825564861297607, -3.817816734313965, -2.810068130493164, -1.8023197650909424, -0.7945713996887207, 0.21317696571350098, 1.2209253311157227, 2.2286739349365234, 3.236422061920166, 4.244170188903809, 5.251918792724609, 6.25966739654541, 7.267415523529053, 8.275163650512695, 9.282912254333496, 10.290660858154297, 11.298408508300781, 12.306157112121582, 13.31390380859375, 14.32165241241455, 15.329401016235352, 16.337148666381836, 17.344898223876953, 18.352645874023438, 19.360393524169922, 20.368141174316406, 21.375890731811523, 22.383638381958008, 23.391387939453125, 24.39913558959961, 25.406883239746094, 26.41463279724121, 27.422380447387695, 28.430130004882812, 29.437877655029297, 30.44562530517578, 31.4533748626709, 32.461124420166016, 33.4688720703125, 34.476619720458984, 35.48436737060547, 36.49211502075195, 37.49986267089844, 38.50761032104492, 39.515357971191406, 40.523109436035156, 41.53085708618164, 42.538604736328125, 43.54635238647461, 44.554100036621094, 45.561851501464844]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 0.0, 13.0, 8.0, 13.0, 15.0, 13.0, 18.0, 12.0, 19.0, 27.0, 30.0, 34.0, 34.0, 41.0, 36.0, 35.0, 36.0, 42.0, 43.0, 43.0, 41.0, 41.0, 34.0, 40.0, 36.0, 50.0, 29.0, 28.0, 26.0, 19.0, 33.0, 18.0, 18.0, 12.0, 16.0, 7.0, 8.0, 8.0, 5.0, 1.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.63519287109375, -21.97650718688965, -21.31782341003418, -20.659137725830078, -20.000452041625977, -19.341766357421875, -18.683082580566406, -18.024396896362305, -17.365711212158203, -16.7070255279541, -16.048341751098633, -15.389656066894531, -14.73097038269043, -14.072285652160645, -13.41360092163086, -12.754915237426758, -12.096231460571289, -11.437546730041504, -10.778861045837402, -10.120176315307617, -9.461490631103516, -8.80280590057373, -8.144121170043945, -7.485435962677002, -6.826750755310059, -6.168065547943115, -5.509380340576172, -4.850695610046387, -4.192010402679443, -3.5333251953125, -2.8746402263641357, -2.2159552574157715, -1.5572700500488281, -0.8985849618911743, -0.2398998737335205, 0.4187852144241333, 1.077470302581787, 1.7361555099487305, 2.3948404788970947, 3.053525447845459, 3.7122106552124023, 4.370895862579346, 5.029581069946289, 5.688265800476074, 6.346951007843018, 7.005636215209961, 7.664320945739746, 8.323005676269531, 8.981691360473633, 9.640376091003418, 10.29906177520752, 10.957746505737305, 11.616432189941406, 12.275116920471191, 12.933801651000977, 13.592487335205078, 14.251172065734863, 14.909856796264648, 15.56854248046875, 16.22722816467285, 16.88591194152832, 17.544597625732422, 18.203283309936523, 18.861967086791992, 19.520652770996094]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 8.0, 9.0, 13.0, 17.0, 25.0, 28.0, 44.0, 72.0, 99.0, 141.0, 254.0, 332.0, 486.0, 812.0, 1197.0, 1857.0, 2986.0, 4970.0, 8406.0, 14815.0, 28106.0, 69240.0, 1156428.0, 2733712.0, 96356.0, 33042.0, 16867.0, 9573.0, 5426.0, 3283.0, 2034.0, 1288.0, 804.0, 527.0, 347.0, 207.0, 155.0, 89.0, 64.0, 58.0, 34.0, 29.0, 12.0, 13.0, 8.0, 8.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-26.96875, -26.128662109375, -25.28857421875, -24.448486328125, -23.6083984375, -22.768310546875, -21.92822265625, -21.088134765625, -20.248046875, -19.407958984375, -18.56787109375, -17.727783203125, -16.8876953125, -16.047607421875, -15.20751953125, -14.367431640625, -13.52734375, -12.687255859375, -11.84716796875, -11.007080078125, -10.1669921875, -9.326904296875, -8.48681640625, -7.646728515625, -6.806640625, -5.966552734375, -5.12646484375, -4.286376953125, -3.4462890625, -2.606201171875, -1.76611328125, -0.926025390625, -0.0859375, 0.754150390625, 1.59423828125, 2.434326171875, 3.2744140625, 4.114501953125, 4.95458984375, 5.794677734375, 6.634765625, 7.474853515625, 8.31494140625, 9.155029296875, 9.9951171875, 10.835205078125, 11.67529296875, 12.515380859375, 13.35546875, 14.195556640625, 15.03564453125, 15.875732421875, 16.7158203125, 17.555908203125, 18.39599609375, 19.236083984375, 20.076171875, 20.916259765625, 21.75634765625, 22.596435546875, 23.4365234375, 24.276611328125, 25.11669921875, 25.956787109375, 26.796875]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 3.0, 5.0, 9.0, 9.0, 8.0, 7.0, 14.0, 13.0, 20.0, 15.0, 18.0, 24.0, 26.0, 32.0, 31.0, 35.0, 25.0, 32.0, 27.0, 44.0, 37.0, 29.0, 26.0, 47.0, 44.0, 38.0, 42.0, 43.0, 46.0, 29.0, 32.0, 29.0, 16.0, 21.0, 18.0, 13.0, 21.0, 14.0, 13.0, 11.0, 6.0, 3.0, 7.0, 7.0, 4.0, 4.0, 0.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.7734375, -10.4317626953125, -10.090087890625, -9.7484130859375, -9.40673828125, -9.0650634765625, -8.723388671875, -8.3817138671875, -8.0400390625, -7.6983642578125, -7.356689453125, -7.0150146484375, -6.67333984375, -6.3316650390625, -5.989990234375, -5.6483154296875, -5.306640625, -4.9649658203125, -4.623291015625, -4.2816162109375, -3.93994140625, -3.5982666015625, -3.256591796875, -2.9149169921875, -2.5732421875, -2.2315673828125, -1.889892578125, -1.5482177734375, -1.20654296875, -0.8648681640625, -0.523193359375, -0.1815185546875, 0.16015625, 0.5018310546875, 0.843505859375, 1.1851806640625, 1.52685546875, 1.8685302734375, 2.210205078125, 2.5518798828125, 2.8935546875, 3.2352294921875, 3.576904296875, 3.9185791015625, 4.26025390625, 4.6019287109375, 4.943603515625, 5.2852783203125, 5.626953125, 5.9686279296875, 6.310302734375, 6.6519775390625, 6.99365234375, 7.3353271484375, 7.677001953125, 8.0186767578125, 8.3603515625, 8.7020263671875, 9.043701171875, 9.3853759765625, 9.72705078125, 10.0687255859375, 10.410400390625, 10.7520751953125, 11.09375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 8.0, 3.0, 8.0, 11.0, 19.0, 23.0, 21.0, 49.0, 90.0, 279.0, 1201.0, 15369.0, 3982112.0, 189130.0, 4984.0, 654.0, 156.0, 53.0, 29.0, 26.0, 14.0, 18.0, 6.0, 7.0, 6.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.875, -123.435546875, -118.99609375, -114.556640625, -110.1171875, -105.677734375, -101.23828125, -96.798828125, -92.359375, -87.919921875, -83.48046875, -79.041015625, -74.6015625, -70.162109375, -65.72265625, -61.283203125, -56.84375, -52.404296875, -47.96484375, -43.525390625, -39.0859375, -34.646484375, -30.20703125, -25.767578125, -21.328125, -16.888671875, -12.44921875, -8.009765625, -3.5703125, 0.869140625, 5.30859375, 9.748046875, 14.1875, 18.626953125, 23.06640625, 27.505859375, 31.9453125, 36.384765625, 40.82421875, 45.263671875, 49.703125, 54.142578125, 58.58203125, 63.021484375, 67.4609375, 71.900390625, 76.33984375, 80.779296875, 85.21875, 89.658203125, 94.09765625, 98.537109375, 102.9765625, 107.416015625, 111.85546875, 116.294921875, 120.734375, 125.173828125, 129.61328125, 134.052734375, 138.4921875, 142.931640625, 147.37109375, 151.810546875, 156.25]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 8.0, 12.0, 8.0, 14.0, 20.0, 29.0, 28.0, 47.0, 67.0, 86.0, 203.0, 561.0, 1617.0, 772.0, 267.0, 112.0, 68.0, 41.0, 18.0, 26.0, 26.0, 14.0, 8.0, 5.0, 8.0, 6.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5625, -8.2830810546875, -8.003662109375, -7.7242431640625, -7.44482421875, -7.1654052734375, -6.885986328125, -6.6065673828125, -6.3271484375, -6.0477294921875, -5.768310546875, -5.4888916015625, -5.20947265625, -4.9300537109375, -4.650634765625, -4.3712158203125, -4.091796875, -3.8123779296875, -3.532958984375, -3.2535400390625, -2.97412109375, -2.6947021484375, -2.415283203125, -2.1358642578125, -1.8564453125, -1.5770263671875, -1.297607421875, -1.0181884765625, -0.73876953125, -0.4593505859375, -0.179931640625, 0.0994873046875, 0.37890625, 0.6583251953125, 0.937744140625, 1.2171630859375, 1.49658203125, 1.7760009765625, 2.055419921875, 2.3348388671875, 2.6142578125, 2.8936767578125, 3.173095703125, 3.4525146484375, 3.73193359375, 4.0113525390625, 4.290771484375, 4.5701904296875, 4.849609375, 5.1290283203125, 5.408447265625, 5.6878662109375, 5.96728515625, 6.2467041015625, 6.526123046875, 6.8055419921875, 7.0849609375, 7.3643798828125, 7.643798828125, 7.9232177734375, 8.20263671875, 8.4820556640625, 8.761474609375, 9.0408935546875, 9.3203125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 6.0, 8.0, 9.0, 13.0, 16.0, 33.0, 34.0, 52.0, 48.0, 72.0, 84.0, 105.0, 99.0, 103.0, 63.0, 66.0, 48.0, 38.0, 28.0, 21.0, 15.0, 10.0, 12.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.041411399841309, -11.452208518981934, -10.863005638122559, -10.273802757263184, -9.684599876403809, -9.095396995544434, -8.506195068359375, -7.916991710662842, -7.327788829803467, -6.738585948944092, -6.149383068084717, -5.5601806640625, -4.970977783203125, -4.38177490234375, -3.792572021484375, -3.203369140625, -2.614166259765625, -2.02496337890625, -1.4357606172561646, -0.8465578556060791, -0.2573549747467041, 0.3318479061126709, 0.9210505485534668, 1.5102534294128418, 2.099456310272217, 2.688659191131592, 3.277862071990967, 3.8670647144317627, 4.456267356872559, 5.045470237731934, 5.634673118591309, 6.223875999450684, 6.813079833984375, 7.40228271484375, 7.991485595703125, 8.5806884765625, 9.169891357421875, 9.75909423828125, 10.348297119140625, 10.9375, 11.526702880859375, 12.11590576171875, 12.705108642578125, 13.2943115234375, 13.883514404296875, 14.47271728515625, 15.061920166015625, 15.651123046875, 16.240325927734375, 16.82952880859375, 17.418731689453125, 18.0079345703125, 18.597137451171875, 19.18634033203125, 19.775543212890625, 20.36474609375, 20.953947067260742, 21.543149948120117, 22.132352828979492, 22.721555709838867, 23.310758590698242, 23.899961471557617, 24.489164352416992, 25.078367233276367, 25.667570114135742]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 4.0, 4.0, 8.0, 10.0, 12.0, 16.0, 18.0, 16.0, 12.0, 23.0, 17.0, 29.0, 26.0, 30.0, 34.0, 25.0, 30.0, 30.0, 47.0, 41.0, 31.0, 38.0, 40.0, 43.0, 47.0, 40.0, 29.0, 35.0, 26.0, 36.0, 27.0, 31.0, 19.0, 19.0, 23.0, 15.0, 14.0, 10.0, 6.0, 6.0, 3.0, 10.0, 7.0, 6.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.75975513458252, -11.386200904846191, -11.01264762878418, -10.639093399047852, -10.265539169311523, -9.891984939575195, -9.518431663513184, -9.144877433776855, -8.771323204040527, -8.3977689743042, -8.024215698242188, -7.650661468505859, -7.277107238769531, -6.903553485870361, -6.529999732971191, -6.156445503234863, -5.782891750335693, -5.409337997436523, -5.035783767700195, -4.662230014801025, -4.288675785064697, -3.9151220321655273, -3.5415680408477783, -3.1680140495300293, -2.7944600582122803, -2.4209060668945312, -2.0473520755767822, -1.6737982034683228, -1.3002442121505737, -0.9266902208328247, -0.5531363487243652, -0.1795823574066162, 0.1939716339111328, 0.5675256252288818, 0.9410795569419861, 1.3146334886550903, 1.6881874799728394, 2.061741352081299, 2.435295343399048, 2.808849334716797, 3.182403326034546, 3.555957317352295, 3.929511308670044, 4.303065299987793, 4.676619052886963, 5.050173282623291, 5.423727035522461, 5.797281265258789, 6.170835018157959, 6.544388771057129, 6.917943000793457, 7.291496753692627, 7.665050983428955, 8.038604736328125, 8.412158966064453, 8.785713195800781, 9.159266471862793, 9.532820701599121, 9.906373977661133, 10.279928207397461, 10.653482437133789, 11.027036666870117, 11.400589942932129, 11.774144172668457, 12.147698402404785]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 9.0, 9.0, 4.0, 13.0, 25.0, 25.0, 41.0, 59.0, 102.0, 118.0, 187.0, 299.0, 456.0, 784.0, 1090.0, 1840.0, 2999.0, 5038.0, 8273.0, 14869.0, 28351.0, 54617.0, 111366.0, 233391.0, 286295.0, 146797.0, 70753.0, 36022.0, 18917.0, 10155.0, 6034.0, 3537.0, 2138.0, 1447.0, 886.0, 564.0, 348.0, 227.0, 138.0, 109.0, 70.0, 52.0, 37.0, 20.0, 21.0, 8.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-17.28125, -16.760498046875, -16.23974609375, -15.718994140625, -15.1982421875, -14.677490234375, -14.15673828125, -13.635986328125, -13.115234375, -12.594482421875, -12.07373046875, -11.552978515625, -11.0322265625, -10.511474609375, -9.99072265625, -9.469970703125, -8.94921875, -8.428466796875, -7.90771484375, -7.386962890625, -6.8662109375, -6.345458984375, -5.82470703125, -5.303955078125, -4.783203125, -4.262451171875, -3.74169921875, -3.220947265625, -2.7001953125, -2.179443359375, -1.65869140625, -1.137939453125, -0.6171875, -0.096435546875, 0.42431640625, 0.945068359375, 1.4658203125, 1.986572265625, 2.50732421875, 3.028076171875, 3.548828125, 4.069580078125, 4.59033203125, 5.111083984375, 5.6318359375, 6.152587890625, 6.67333984375, 7.194091796875, 7.71484375, 8.235595703125, 8.75634765625, 9.277099609375, 9.7978515625, 10.318603515625, 10.83935546875, 11.360107421875, 11.880859375, 12.401611328125, 12.92236328125, 13.443115234375, 13.9638671875, 14.484619140625, 15.00537109375, 15.526123046875, 16.046875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 9.0, 11.0, 10.0, 12.0, 20.0, 13.0, 18.0, 23.0, 27.0, 19.0, 27.0, 34.0, 33.0, 35.0, 35.0, 39.0, 34.0, 39.0, 39.0, 37.0, 50.0, 30.0, 40.0, 39.0, 32.0, 32.0, 30.0, 31.0, 28.0, 23.0, 27.0, 18.0, 21.0, 15.0, 17.0, 9.0, 10.0, 10.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.671875, -9.3643798828125, -9.056884765625, -8.7493896484375, -8.44189453125, -8.1343994140625, -7.826904296875, -7.5194091796875, -7.2119140625, -6.9044189453125, -6.596923828125, -6.2894287109375, -5.98193359375, -5.6744384765625, -5.366943359375, -5.0594482421875, -4.751953125, -4.4444580078125, -4.136962890625, -3.8294677734375, -3.52197265625, -3.2144775390625, -2.906982421875, -2.5994873046875, -2.2919921875, -1.9844970703125, -1.677001953125, -1.3695068359375, -1.06201171875, -0.7545166015625, -0.447021484375, -0.1395263671875, 0.16796875, 0.4754638671875, 0.782958984375, 1.0904541015625, 1.39794921875, 1.7054443359375, 2.012939453125, 2.3204345703125, 2.6279296875, 2.9354248046875, 3.242919921875, 3.5504150390625, 3.85791015625, 4.1654052734375, 4.472900390625, 4.7803955078125, 5.087890625, 5.3953857421875, 5.702880859375, 6.0103759765625, 6.31787109375, 6.6253662109375, 6.932861328125, 7.2403564453125, 7.5478515625, 7.8553466796875, 8.162841796875, 8.4703369140625, 8.77783203125, 9.0853271484375, 9.392822265625, 9.7003173828125, 10.0078125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 6.0, 3.0, 11.0, 6.0, 11.0, 18.0, 25.0, 26.0, 61.0, 76.0, 103.0, 136.0, 180.0, 327.0, 442.0, 779.0, 1325.0, 2510.0, 5059.0, 11168.0, 26643.0, 81331.0, 394080.0, 394441.0, 80612.0, 27090.0, 10865.0, 5132.0, 2545.0, 1330.0, 740.0, 487.0, 299.0, 188.0, 147.0, 109.0, 62.0, 52.0, 33.0, 26.0, 26.0, 14.0, 13.0, 8.0, 5.0, 2.0, 5.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.1875, -12.7479248046875, -12.308349609375, -11.8687744140625, -11.42919921875, -10.9896240234375, -10.550048828125, -10.1104736328125, -9.6708984375, -9.2313232421875, -8.791748046875, -8.3521728515625, -7.91259765625, -7.4730224609375, -7.033447265625, -6.5938720703125, -6.154296875, -5.7147216796875, -5.275146484375, -4.8355712890625, -4.39599609375, -3.9564208984375, -3.516845703125, -3.0772705078125, -2.6376953125, -2.1981201171875, -1.758544921875, -1.3189697265625, -0.87939453125, -0.4398193359375, -0.000244140625, 0.4393310546875, 0.87890625, 1.3184814453125, 1.758056640625, 2.1976318359375, 2.63720703125, 3.0767822265625, 3.516357421875, 3.9559326171875, 4.3955078125, 4.8350830078125, 5.274658203125, 5.7142333984375, 6.15380859375, 6.5933837890625, 7.032958984375, 7.4725341796875, 7.912109375, 8.3516845703125, 8.791259765625, 9.2308349609375, 9.67041015625, 10.1099853515625, 10.549560546875, 10.9891357421875, 11.4287109375, 11.8682861328125, 12.307861328125, 12.7474365234375, 13.18701171875, 13.6265869140625, 14.066162109375, 14.5057373046875, 14.9453125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 6.0, 7.0, 6.0, 12.0, 16.0, 19.0, 15.0, 15.0, 22.0, 29.0, 22.0, 30.0, 18.0, 39.0, 36.0, 34.0, 27.0, 40.0, 37.0, 34.0, 36.0, 34.0, 41.0, 48.0, 34.0, 41.0, 28.0, 34.0, 26.0, 36.0, 27.0, 21.0, 20.0, 23.0, 13.0, 14.0, 17.0, 8.0, 7.0, 10.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.34765625, -6.15020751953125, -5.9527587890625, -5.75531005859375, -5.557861328125, -5.36041259765625, -5.1629638671875, -4.96551513671875, -4.76806640625, -4.57061767578125, -4.3731689453125, -4.17572021484375, -3.978271484375, -3.78082275390625, -3.5833740234375, -3.38592529296875, -3.1884765625, -2.99102783203125, -2.7935791015625, -2.59613037109375, -2.398681640625, -2.20123291015625, -2.0037841796875, -1.80633544921875, -1.60888671875, -1.41143798828125, -1.2139892578125, -1.01654052734375, -0.819091796875, -0.62164306640625, -0.4241943359375, -0.22674560546875, -0.029296875, 0.16815185546875, 0.3656005859375, 0.56304931640625, 0.760498046875, 0.95794677734375, 1.1553955078125, 1.35284423828125, 1.55029296875, 1.74774169921875, 1.9451904296875, 2.14263916015625, 2.340087890625, 2.53753662109375, 2.7349853515625, 2.93243408203125, 3.1298828125, 3.32733154296875, 3.5247802734375, 3.72222900390625, 3.919677734375, 4.11712646484375, 4.3145751953125, 4.51202392578125, 4.70947265625, 4.90692138671875, 5.1043701171875, 5.30181884765625, 5.499267578125, 5.69671630859375, 5.8941650390625, 6.09161376953125, 6.2890625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 0.0, 3.0, 5.0, 9.0, 11.0, 15.0, 16.0, 30.0, 44.0, 60.0, 95.0, 156.0, 202.0, 330.0, 562.0, 783.0, 1445.0, 2739.0, 5470.0, 13049.0, 41022.0, 272887.0, 618800.0, 59504.0, 17113.0, 6873.0, 3142.0, 1687.0, 964.0, 490.0, 344.0, 219.0, 153.0, 90.0, 59.0, 54.0, 35.0, 30.0, 22.0, 7.0, 9.0, 10.0, 6.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8515625, -5.66357421875, -5.4755859375, -5.28759765625, -5.099609375, -4.91162109375, -4.7236328125, -4.53564453125, -4.34765625, -4.15966796875, -3.9716796875, -3.78369140625, -3.595703125, -3.40771484375, -3.2197265625, -3.03173828125, -2.84375, -2.65576171875, -2.4677734375, -2.27978515625, -2.091796875, -1.90380859375, -1.7158203125, -1.52783203125, -1.33984375, -1.15185546875, -0.9638671875, -0.77587890625, -0.587890625, -0.39990234375, -0.2119140625, -0.02392578125, 0.1640625, 0.35205078125, 0.5400390625, 0.72802734375, 0.916015625, 1.10400390625, 1.2919921875, 1.47998046875, 1.66796875, 1.85595703125, 2.0439453125, 2.23193359375, 2.419921875, 2.60791015625, 2.7958984375, 2.98388671875, 3.171875, 3.35986328125, 3.5478515625, 3.73583984375, 3.923828125, 4.11181640625, 4.2998046875, 4.48779296875, 4.67578125, 4.86376953125, 5.0517578125, 5.23974609375, 5.427734375, 5.61572265625, 5.8037109375, 5.99169921875, 6.1796875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 1.0, 13.0, 9.0, 17.0, 24.0, 50.0, 67.0, 81.0, 113.0, 148.0, 128.0, 114.0, 70.0, 43.0, 38.0, 27.0, 13.0, 7.0, 10.0, 6.0, 4.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006227493286132812, -0.0006043165922164917, -0.0005858838558197021, -0.0005674511194229126, -0.000549018383026123, -0.0005305856466293335, -0.0005121529102325439, -0.0004937201738357544, -0.00047528743743896484, -0.0004568547010421753, -0.00043842196464538574, -0.0004199892282485962, -0.00040155649185180664, -0.0003831237554550171, -0.00036469101905822754, -0.000346258282661438, -0.00032782554626464844, -0.0003093928098678589, -0.00029096007347106934, -0.0002725273370742798, -0.00025409460067749023, -0.00023566186428070068, -0.00021722912788391113, -0.00019879639148712158, -0.00018036365509033203, -0.00016193091869354248, -0.00014349818229675293, -0.00012506544589996338, -0.00010663270950317383, -8.819997310638428e-05, -6.976723670959473e-05, -5.1334500312805176e-05, -3.2901763916015625e-05, -1.4469027519226074e-05, 3.9637088775634766e-06, 2.2396445274353027e-05, 4.082918167114258e-05, 5.926191806793213e-05, 7.769465446472168e-05, 9.612739086151123e-05, 0.00011456012725830078, 0.00013299286365509033, 0.00015142560005187988, 0.00016985833644866943, 0.00018829107284545898, 0.00020672380924224854, 0.00022515654563903809, 0.00024358928203582764, 0.0002620220184326172, 0.00028045475482940674, 0.0002988874912261963, 0.00031732022762298584, 0.0003357529640197754, 0.00035418570041656494, 0.0003726184368133545, 0.00039105117321014404, 0.0004094839096069336, 0.00042791664600372314, 0.0004463493824005127, 0.00046478211879730225, 0.0004832148551940918, 0.0005016475915908813, 0.0005200803279876709, 0.0005385130643844604, 0.00055694580078125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 6.0, 9.0, 11.0, 15.0, 10.0, 27.0, 44.0, 93.0, 359.0, 2653.0, 55818.0, 961088.0, 26313.0, 1629.0, 267.0, 70.0, 35.0, 16.0, 13.0, 13.0, 8.0, 13.0, 10.0, 2.0, 4.0, 6.0, 3.0, 0.0, 2.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.703125, -16.093505859375, -15.48388671875, -14.874267578125, -14.2646484375, -13.655029296875, -13.04541015625, -12.435791015625, -11.826171875, -11.216552734375, -10.60693359375, -9.997314453125, -9.3876953125, -8.778076171875, -8.16845703125, -7.558837890625, -6.94921875, -6.339599609375, -5.72998046875, -5.120361328125, -4.5107421875, -3.901123046875, -3.29150390625, -2.681884765625, -2.072265625, -1.462646484375, -0.85302734375, -0.243408203125, 0.3662109375, 0.975830078125, 1.58544921875, 2.195068359375, 2.8046875, 3.414306640625, 4.02392578125, 4.633544921875, 5.2431640625, 5.852783203125, 6.46240234375, 7.072021484375, 7.681640625, 8.291259765625, 8.90087890625, 9.510498046875, 10.1201171875, 10.729736328125, 11.33935546875, 11.948974609375, 12.55859375, 13.168212890625, 13.77783203125, 14.387451171875, 14.9970703125, 15.606689453125, 16.21630859375, 16.825927734375, 17.435546875, 18.045166015625, 18.65478515625, 19.264404296875, 19.8740234375, 20.483642578125, 21.09326171875, 21.702880859375, 22.3125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 3.0, 11.0, 8.0, 16.0, 18.0, 15.0, 28.0, 31.0, 63.0, 51.0, 118.0, 128.0, 153.0, 95.0, 66.0, 52.0, 31.0, 20.0, 15.0, 9.0, 9.0, 7.0, 8.0, 8.0, 6.0, 2.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0712890625, -1.0355072021484375, -0.999725341796875, -0.9639434814453125, -0.92816162109375, -0.8923797607421875, -0.856597900390625, -0.8208160400390625, -0.7850341796875, -0.7492523193359375, -0.713470458984375, -0.6776885986328125, -0.64190673828125, -0.6061248779296875, -0.570343017578125, -0.5345611572265625, -0.498779296875, -0.4629974365234375, -0.427215576171875, -0.3914337158203125, -0.35565185546875, -0.3198699951171875, -0.284088134765625, -0.2483062744140625, -0.2125244140625, -0.1767425537109375, -0.140960693359375, -0.1051788330078125, -0.06939697265625, -0.0336151123046875, 0.002166748046875, 0.0379486083984375, 0.07373046875, 0.1095123291015625, 0.145294189453125, 0.1810760498046875, 0.21685791015625, 0.2526397705078125, 0.288421630859375, 0.3242034912109375, 0.3599853515625, 0.3957672119140625, 0.431549072265625, 0.4673309326171875, 0.50311279296875, 0.5388946533203125, 0.574676513671875, 0.6104583740234375, 0.646240234375, 0.6820220947265625, 0.717803955078125, 0.7535858154296875, 0.78936767578125, 0.8251495361328125, 0.860931396484375, 0.8967132568359375, 0.9324951171875, 0.9682769775390625, 1.004058837890625, 1.0398406982421875, 1.07562255859375, 1.1114044189453125, 1.147186279296875, 1.1829681396484375, 1.21875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 6.0, 9.0, 12.0, 14.0, 23.0, 19.0, 33.0, 29.0, 40.0, 50.0, 48.0, 64.0, 85.0, 82.0, 79.0, 66.0, 68.0, 49.0, 49.0, 36.0, 25.0, 39.0, 20.0, 20.0, 7.0, 11.0, 6.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.824517250061035, -10.424786567687988, -10.025054931640625, -9.625324249267578, -9.225592613220215, -8.825861930847168, -8.426130294799805, -8.026399612426758, -7.6266679763793945, -7.2269368171691895, -6.827205657958984, -6.427474498748779, -6.027743339538574, -5.628012180328369, -5.228281021118164, -4.828550338745117, -4.428819179534912, -4.029088020324707, -3.629356861114502, -3.229625701904297, -2.829894542694092, -2.4301633834838867, -2.0304324626922607, -1.6307013034820557, -1.2309701442718506, -0.8312389850616455, -0.4315078854560852, -0.0317767858505249, 0.3679543733596802, 0.7676855325698853, 1.1674165725708008, 1.5671477317810059, 1.966878890991211, 2.366610050201416, 2.766341209411621, 3.166072368621826, 3.5658035278320312, 3.9655346870422363, 4.365265846252441, 4.764996528625488, 5.164728164672852, 5.564459323883057, 5.964190483093262, 6.363921642303467, 6.763652801513672, 7.163383960723877, 7.563115119934082, 7.962845802307129, 8.362577438354492, 8.762308120727539, 9.162039756774902, 9.56177043914795, 9.961502075195312, 10.36123275756836, 10.760964393615723, 11.16069507598877, 11.560425758361816, 11.960156440734863, 12.359888076782227, 12.759618759155273, 13.159350395202637, 13.559081077575684, 13.958812713623047, 14.358543395996094, 14.758275032043457]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 7.0, 7.0, 7.0, 11.0, 14.0, 25.0, 10.0, 15.0, 18.0, 20.0, 24.0, 28.0, 32.0, 34.0, 26.0, 30.0, 34.0, 37.0, 39.0, 32.0, 37.0, 37.0, 39.0, 48.0, 39.0, 38.0, 30.0, 31.0, 27.0, 32.0, 27.0, 27.0, 17.0, 23.0, 15.0, 16.0, 11.0, 9.0, 6.0, 9.0, 3.0, 8.0, 8.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.740001678466797, -8.457123756408691, -8.174246788024902, -7.891368865966797, -7.608490943908691, -7.325613498687744, -7.042736053466797, -6.759858131408691, -6.476980686187744, -6.194103240966797, -5.911225318908691, -5.628347873687744, -5.345470428466797, -5.062592506408691, -4.779715061187744, -4.496837615966797, -4.213959693908691, -3.931082010269165, -3.6482043266296387, -3.3653268814086914, -3.082449197769165, -2.7995715141296387, -2.5166940689086914, -2.233816385269165, -1.9509387016296387, -1.6680610179901123, -1.3851834535598755, -1.1023058891296387, -0.8194282054901123, -0.5365505218505859, -0.2536729574203491, 0.029204607009887695, 0.31208324432373047, 0.5949608683586121, 0.8778384923934937, 1.1607160568237305, 1.4435937404632568, 1.7264714241027832, 2.0093488693237305, 2.292226552963257, 2.575104236602783, 2.8579819202423096, 3.140859603881836, 3.423737049102783, 3.7066147327423096, 3.989492416381836, 4.272369861602783, 4.5552473068237305, 4.838125228881836, 5.121002674102783, 5.403880596160889, 5.686758041381836, 5.969635963439941, 6.252513408660889, 6.535390853881836, 6.818268775939941, 7.101146221160889, 7.384023666381836, 7.666901588439941, 7.949779033660889, 8.232656478881836, 8.515534400939941, 8.798412322998047, 9.081289291381836, 9.364167213439941]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 6.0, 9.0, 11.0, 10.0, 16.0, 13.0, 14.0, 34.0, 47.0, 62.0, 74.0, 126.0, 208.0, 298.0, 463.0, 674.0, 1201.0, 1923.0, 3512.0, 5849.0, 10363.0, 18115.0, 31638.0, 53430.0, 87818.0, 130231.0, 165043.0, 168356.0, 136335.0, 93220.0, 58230.0, 34371.0, 19864.0, 11227.0, 6431.0, 3682.0, 2145.0, 1263.0, 793.0, 449.0, 319.0, 209.0, 125.0, 96.0, 77.0, 43.0, 40.0, 33.0, 23.0, 13.0, 8.0, 5.0, 6.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-10.5625, -10.2113037109375, -9.860107421875, -9.5089111328125, -9.15771484375, -8.8065185546875, -8.455322265625, -8.1041259765625, -7.7529296875, -7.4017333984375, -7.050537109375, -6.6993408203125, -6.34814453125, -5.9969482421875, -5.645751953125, -5.2945556640625, -4.943359375, -4.5921630859375, -4.240966796875, -3.8897705078125, -3.53857421875, -3.1873779296875, -2.836181640625, -2.4849853515625, -2.1337890625, -1.7825927734375, -1.431396484375, -1.0802001953125, -0.72900390625, -0.3778076171875, -0.026611328125, 0.3245849609375, 0.67578125, 1.0269775390625, 1.378173828125, 1.7293701171875, 2.08056640625, 2.4317626953125, 2.782958984375, 3.1341552734375, 3.4853515625, 3.8365478515625, 4.187744140625, 4.5389404296875, 4.89013671875, 5.2413330078125, 5.592529296875, 5.9437255859375, 6.294921875, 6.6461181640625, 6.997314453125, 7.3485107421875, 7.69970703125, 8.0509033203125, 8.402099609375, 8.7532958984375, 9.1044921875, 9.4556884765625, 9.806884765625, 10.1580810546875, 10.50927734375, 10.8604736328125, 11.211669921875, 11.5628662109375, 11.9140625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 5.0, 4.0, 9.0, 14.0, 17.0, 17.0, 23.0, 20.0, 17.0, 22.0, 26.0, 42.0, 34.0, 33.0, 30.0, 40.0, 36.0, 43.0, 54.0, 47.0, 45.0, 36.0, 40.0, 43.0, 33.0, 31.0, 38.0, 39.0, 33.0, 20.0, 18.0, 16.0, 12.0, 12.0, 7.0, 6.0, 10.0, 5.0, 6.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.14453125, -3.99163818359375, -3.8387451171875, -3.68585205078125, -3.532958984375, -3.38006591796875, -3.2271728515625, -3.07427978515625, -2.92138671875, -2.76849365234375, -2.6156005859375, -2.46270751953125, -2.309814453125, -2.15692138671875, -2.0040283203125, -1.85113525390625, -1.6982421875, -1.54534912109375, -1.3924560546875, -1.23956298828125, -1.086669921875, -0.93377685546875, -0.7808837890625, -0.62799072265625, -0.47509765625, -0.32220458984375, -0.1693115234375, -0.01641845703125, 0.136474609375, 0.28936767578125, 0.4422607421875, 0.59515380859375, 0.748046875, 0.90093994140625, 1.0538330078125, 1.20672607421875, 1.359619140625, 1.51251220703125, 1.6654052734375, 1.81829833984375, 1.97119140625, 2.12408447265625, 2.2769775390625, 2.42987060546875, 2.582763671875, 2.73565673828125, 2.8885498046875, 3.04144287109375, 3.1943359375, 3.34722900390625, 3.5001220703125, 3.65301513671875, 3.805908203125, 3.95880126953125, 4.1116943359375, 4.26458740234375, 4.41748046875, 4.57037353515625, 4.7232666015625, 4.87615966796875, 5.029052734375, 5.18194580078125, 5.3348388671875, 5.48773193359375, 5.640625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 9.0, 9.0, 10.0, 18.0, 22.0, 18.0, 19.0, 22.0, 19.0, 34.0, 44.0, 48.0, 35.0, 65.0, 843.0, 47058.0, 878644.0, 119368.0, 1808.0, 87.0, 38.0, 40.0, 42.0, 42.0, 27.0, 32.0, 22.0, 18.0, 14.0, 20.0, 14.0, 8.0, 12.0, 6.0, 2.0, 7.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.5625, -75.0283203125, -72.494140625, -69.9599609375, -67.42578125, -64.8916015625, -62.357421875, -59.8232421875, -57.2890625, -54.7548828125, -52.220703125, -49.6865234375, -47.15234375, -44.6181640625, -42.083984375, -39.5498046875, -37.015625, -34.4814453125, -31.947265625, -29.4130859375, -26.87890625, -24.3447265625, -21.810546875, -19.2763671875, -16.7421875, -14.2080078125, -11.673828125, -9.1396484375, -6.60546875, -4.0712890625, -1.537109375, 0.9970703125, 3.53125, 6.0654296875, 8.599609375, 11.1337890625, 13.66796875, 16.2021484375, 18.736328125, 21.2705078125, 23.8046875, 26.3388671875, 28.873046875, 31.4072265625, 33.94140625, 36.4755859375, 39.009765625, 41.5439453125, 44.078125, 46.6123046875, 49.146484375, 51.6806640625, 54.21484375, 56.7490234375, 59.283203125, 61.8173828125, 64.3515625, 66.8857421875, 69.419921875, 71.9541015625, 74.48828125, 77.0224609375, 79.556640625, 82.0908203125, 84.625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 9.0, 13.0, 13.0, 11.0, 11.0, 21.0, 22.0, 22.0, 27.0, 23.0, 30.0, 34.0, 30.0, 44.0, 44.0, 43.0, 42.0, 51.0, 48.0, 41.0, 38.0, 42.0, 27.0, 30.0, 31.0, 26.0, 30.0, 32.0, 30.0, 16.0, 24.0, 14.0, 7.0, 10.0, 12.0, 6.0, 5.0, 8.0, 5.0, 2.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62890625, -5.45513916015625, -5.2813720703125, -5.10760498046875, -4.933837890625, -4.76007080078125, -4.5863037109375, -4.41253662109375, -4.23876953125, -4.06500244140625, -3.8912353515625, -3.71746826171875, -3.543701171875, -3.36993408203125, -3.1961669921875, -3.02239990234375, -2.8486328125, -2.67486572265625, -2.5010986328125, -2.32733154296875, -2.153564453125, -1.97979736328125, -1.8060302734375, -1.63226318359375, -1.45849609375, -1.28472900390625, -1.1109619140625, -0.93719482421875, -0.763427734375, -0.58966064453125, -0.4158935546875, -0.24212646484375, -0.068359375, 0.10540771484375, 0.2791748046875, 0.45294189453125, 0.626708984375, 0.80047607421875, 0.9742431640625, 1.14801025390625, 1.32177734375, 1.49554443359375, 1.6693115234375, 1.84307861328125, 2.016845703125, 2.19061279296875, 2.3643798828125, 2.53814697265625, 2.7119140625, 2.88568115234375, 3.0594482421875, 3.23321533203125, 3.406982421875, 3.58074951171875, 3.7545166015625, 3.92828369140625, 4.10205078125, 4.27581787109375, 4.4495849609375, 4.62335205078125, 4.797119140625, 4.97088623046875, 5.1446533203125, 5.31842041015625, 5.4921875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 13.0, 15.0, 27.0, 52.0, 76.0, 175.0, 346.0, 772.0, 1986.0, 6762.0, 36870.0, 402109.0, 537613.0, 49407.0, 8391.0, 2305.0, 869.0, 400.0, 198.0, 73.0, 35.0, 25.0, 12.0, 11.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.28515625, -3.172149658203125, -3.05914306640625, -2.946136474609375, -2.8331298828125, -2.720123291015625, -2.60711669921875, -2.494110107421875, -2.381103515625, -2.268096923828125, -2.15509033203125, -2.042083740234375, -1.9290771484375, -1.816070556640625, -1.70306396484375, -1.590057373046875, -1.47705078125, -1.364044189453125, -1.25103759765625, -1.138031005859375, -1.0250244140625, -0.912017822265625, -0.79901123046875, -0.686004638671875, -0.572998046875, -0.459991455078125, -0.34698486328125, -0.233978271484375, -0.1209716796875, -0.007965087890625, 0.10504150390625, 0.218048095703125, 0.3310546875, 0.444061279296875, 0.55706787109375, 0.670074462890625, 0.7830810546875, 0.896087646484375, 1.00909423828125, 1.122100830078125, 1.235107421875, 1.348114013671875, 1.46112060546875, 1.574127197265625, 1.6871337890625, 1.800140380859375, 1.91314697265625, 2.026153564453125, 2.13916015625, 2.252166748046875, 2.36517333984375, 2.478179931640625, 2.5911865234375, 2.704193115234375, 2.81719970703125, 2.930206298828125, 3.043212890625, 3.156219482421875, 3.26922607421875, 3.382232666015625, 3.4952392578125, 3.608245849609375, 3.72125244140625, 3.834259033203125, 3.947265625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 6.0, 5.0, 9.0, 12.0, 10.0, 27.0, 56.0, 52.0, 100.0, 134.0, 140.0, 149.0, 100.0, 64.0, 46.0, 35.0, 23.0, 15.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00066375732421875, -0.000647813081741333, -0.000631868839263916, -0.000615924596786499, -0.000599980354309082, -0.000584036111831665, -0.000568091869354248, -0.0005521476268768311, -0.0005362033843994141, -0.0005202591419219971, -0.0005043148994445801, -0.0004883706569671631, -0.0004724264144897461, -0.0004564821720123291, -0.0004405379295349121, -0.0004245936870574951, -0.0004086494445800781, -0.00039270520210266113, -0.00037676095962524414, -0.00036081671714782715, -0.00034487247467041016, -0.00032892823219299316, -0.00031298398971557617, -0.0002970397472381592, -0.0002810955047607422, -0.0002651512622833252, -0.0002492070198059082, -0.0002332627773284912, -0.00021731853485107422, -0.00020137429237365723, -0.00018543004989624023, -0.00016948580741882324, -0.00015354156494140625, -0.00013759732246398926, -0.00012165307998657227, -0.00010570883750915527, -8.976459503173828e-05, -7.382035255432129e-05, -5.78761100769043e-05, -4.1931867599487305e-05, -2.5987625122070312e-05, -1.004338264465332e-05, 5.900859832763672e-06, 2.1845102310180664e-05, 3.7789344787597656e-05, 5.373358726501465e-05, 6.967782974243164e-05, 8.562207221984863e-05, 0.00010156631469726562, 0.00011751055717468262, 0.0001334547996520996, 0.0001493990421295166, 0.0001653432846069336, 0.00018128752708435059, 0.00019723176956176758, 0.00021317601203918457, 0.00022912025451660156, 0.00024506449699401855, 0.00026100873947143555, 0.00027695298194885254, 0.00029289722442626953, 0.0003088414669036865, 0.0003247857093811035, 0.0003407299518585205, 0.0003566741943359375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 6.0, 8.0, 9.0, 22.0, 11.0, 20.0, 35.0, 61.0, 120.0, 961.0, 233421.0, 811756.0, 1755.0, 169.0, 51.0, 37.0, 20.0, 16.0, 15.0, 12.0, 6.0, 4.0, 6.0, 2.0, 5.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.2421875, -10.891845703125, -10.54150390625, -10.191162109375, -9.8408203125, -9.490478515625, -9.14013671875, -8.789794921875, -8.439453125, -8.089111328125, -7.73876953125, -7.388427734375, -7.0380859375, -6.687744140625, -6.33740234375, -5.987060546875, -5.63671875, -5.286376953125, -4.93603515625, -4.585693359375, -4.2353515625, -3.885009765625, -3.53466796875, -3.184326171875, -2.833984375, -2.483642578125, -2.13330078125, -1.782958984375, -1.4326171875, -1.082275390625, -0.73193359375, -0.381591796875, -0.03125, 0.319091796875, 0.66943359375, 1.019775390625, 1.3701171875, 1.720458984375, 2.07080078125, 2.421142578125, 2.771484375, 3.121826171875, 3.47216796875, 3.822509765625, 4.1728515625, 4.523193359375, 4.87353515625, 5.223876953125, 5.57421875, 5.924560546875, 6.27490234375, 6.625244140625, 6.9755859375, 7.325927734375, 7.67626953125, 8.026611328125, 8.376953125, 8.727294921875, 9.07763671875, 9.427978515625, 9.7783203125, 10.128662109375, 10.47900390625, 10.829345703125, 11.1796875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 9.0, 10.0, 10.0, 12.0, 9.0, 14.0, 18.0, 34.0, 49.0, 41.0, 63.0, 90.0, 96.0, 97.0, 97.0, 88.0, 50.0, 50.0, 46.0, 29.0, 23.0, 12.0, 11.0, 6.0, 13.0, 3.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.64453125, -0.6246719360351562, -0.6048126220703125, -0.5849533081054688, -0.565093994140625, -0.5452346801757812, -0.5253753662109375, -0.5055160522460938, -0.48565673828125, -0.46579742431640625, -0.4459381103515625, -0.42607879638671875, -0.406219482421875, -0.38636016845703125, -0.3665008544921875, -0.34664154052734375, -0.3267822265625, -0.30692291259765625, -0.2870635986328125, -0.26720428466796875, -0.247344970703125, -0.22748565673828125, -0.2076263427734375, -0.18776702880859375, -0.16790771484375, -0.14804840087890625, -0.1281890869140625, -0.10832977294921875, -0.088470458984375, -0.06861114501953125, -0.0487518310546875, -0.02889251708984375, -0.009033203125, 0.01082611083984375, 0.0306854248046875, 0.05054473876953125, 0.070404052734375, 0.09026336669921875, 0.1101226806640625, 0.12998199462890625, 0.14984130859375, 0.16970062255859375, 0.1895599365234375, 0.20941925048828125, 0.229278564453125, 0.24913787841796875, 0.2689971923828125, 0.28885650634765625, 0.3087158203125, 0.32857513427734375, 0.3484344482421875, 0.36829376220703125, 0.388153076171875, 0.40801239013671875, 0.4278717041015625, 0.44773101806640625, 0.46759033203125, 0.48744964599609375, 0.5073089599609375, 0.5271682739257812, 0.547027587890625, 0.5668869018554688, 0.5867462158203125, 0.6066055297851562, 0.62646484375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 7.0, 13.0, 17.0, 34.0, 61.0, 143.0, 183.0, 202.0, 150.0, 106.0, 45.0, 26.0, 21.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.737106800079346, -5.049020290374756, -4.360934257507324, -3.6728477478027344, -2.9847614765167236, -2.296675205230713, -1.608588695526123, -0.9205026626586914, -0.23241615295410156, 0.45567017793655396, 1.1437565088272095, 1.8318428993225098, 2.5199291706085205, 3.2080154418945312, 3.896101951599121, 4.584187984466553, 5.272274494171143, 5.960361003875732, 6.648447036743164, 7.336533546447754, 8.024620056152344, 8.712705612182617, 9.400793075561523, 10.088878631591797, 10.776965141296387, 11.465051651000977, 12.153138160705566, 12.841224670410156, 13.52931022644043, 14.21739673614502, 14.90548324584961, 15.593568801879883, 16.28165626525879, 16.969741821289062, 17.65782928466797, 18.345914840698242, 19.03400230407715, 19.722087860107422, 20.410175323486328, 21.0982608795166, 21.786346435546875, 22.47443199157715, 23.162519454956055, 23.850605010986328, 24.538692474365234, 25.226778030395508, 25.91486358642578, 26.602951049804688, 27.291038513183594, 27.979124069213867, 28.667211532592773, 29.355297088623047, 30.043384552001953, 30.731470108032227, 31.4195556640625, 32.107643127441406, 32.79572677612305, 33.48381423950195, 34.171897888183594, 34.8599853515625, 35.548072814941406, 36.23616027832031, 36.92424392700195, 37.61233139038086, 38.300418853759766]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 7.0, 5.0, 10.0, 7.0, 20.0, 11.0, 15.0, 21.0, 28.0, 28.0, 30.0, 31.0, 31.0, 37.0, 53.0, 42.0, 29.0, 36.0, 51.0, 31.0, 42.0, 46.0, 38.0, 29.0, 28.0, 36.0, 34.0, 35.0, 28.0, 25.0, 16.0, 33.0, 15.0, 9.0, 7.0, 16.0, 8.0, 4.0, 7.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-9.709304809570312, -9.4174222946167, -9.125539779663086, -8.833657264709473, -8.54177474975586, -8.24989128112793, -7.958008766174316, -7.666126251220703, -7.37424373626709, -7.082361221313477, -6.790478706359863, -6.498595714569092, -6.2067131996154785, -5.914830684661865, -5.622947692871094, -5.3310651779174805, -5.039182662963867, -4.747300148010254, -4.455417633056641, -4.163534641265869, -3.871652126312256, -3.5797696113586426, -3.28788685798645, -2.996004104614258, -2.7041215896606445, -2.4122390747070312, -2.120356321334839, -1.828473687171936, -1.5365910530090332, -1.2447084188461304, -0.9528257846832275, -0.6609430313110352, -0.36905956268310547, -0.07717692852020264, 0.2147057056427002, 0.506588339805603, 0.7984709739685059, 1.0903536081314087, 1.3822362422943115, 1.674118995666504, 1.9660015106201172, 2.2578840255737305, 2.549766778945923, 2.8416495323181152, 3.1335320472717285, 3.425414562225342, 3.717297315597534, 4.009180068969727, 4.30106258392334, 4.592945098876953, 4.884827613830566, 5.176710605621338, 5.468593120574951, 5.7604756355285645, 6.052358627319336, 6.344241142272949, 6.6361236572265625, 6.928006172180176, 7.219888687133789, 7.5117716789245605, 7.803654193878174, 8.095537185668945, 8.387419700622559, 8.679302215576172, 8.971184730529785]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 9.0, 11.0, 15.0, 21.0, 36.0, 61.0, 69.0, 95.0, 179.0, 234.0, 275.0, 494.0, 661.0, 946.0, 1403.0, 2033.0, 3027.0, 4551.0, 7285.0, 11599.0, 20069.0, 36957.0, 82513.0, 490588.0, 2910922.0, 452725.0, 78569.0, 35812.0, 19511.0, 11757.0, 7221.0, 4616.0, 3100.0, 2141.0, 1425.0, 997.0, 659.0, 520.0, 331.0, 269.0, 167.0, 131.0, 86.0, 73.0, 38.0, 27.0, 21.0, 13.0, 12.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.515625, -10.181640625, -9.84765625, -9.513671875, -9.1796875, -8.845703125, -8.51171875, -8.177734375, -7.84375, -7.509765625, -7.17578125, -6.841796875, -6.5078125, -6.173828125, -5.83984375, -5.505859375, -5.171875, -4.837890625, -4.50390625, -4.169921875, -3.8359375, -3.501953125, -3.16796875, -2.833984375, -2.5, -2.166015625, -1.83203125, -1.498046875, -1.1640625, -0.830078125, -0.49609375, -0.162109375, 0.171875, 0.505859375, 0.83984375, 1.173828125, 1.5078125, 1.841796875, 2.17578125, 2.509765625, 2.84375, 3.177734375, 3.51171875, 3.845703125, 4.1796875, 4.513671875, 4.84765625, 5.181640625, 5.515625, 5.849609375, 6.18359375, 6.517578125, 6.8515625, 7.185546875, 7.51953125, 7.853515625, 8.1875, 8.521484375, 8.85546875, 9.189453125, 9.5234375, 9.857421875, 10.19140625, 10.525390625, 10.859375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 7.0, 4.0, 11.0, 14.0, 13.0, 10.0, 13.0, 21.0, 23.0, 22.0, 21.0, 26.0, 36.0, 43.0, 41.0, 33.0, 34.0, 34.0, 34.0, 36.0, 39.0, 43.0, 50.0, 35.0, 27.0, 36.0, 36.0, 33.0, 21.0, 29.0, 20.0, 33.0, 25.0, 14.0, 17.0, 12.0, 13.0, 7.0, 6.0, 5.0, 5.0, 5.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.64453125, -5.47540283203125, -5.3062744140625, -5.13714599609375, -4.968017578125, -4.79888916015625, -4.6297607421875, -4.46063232421875, -4.29150390625, -4.12237548828125, -3.9532470703125, -3.78411865234375, -3.614990234375, -3.44586181640625, -3.2767333984375, -3.10760498046875, -2.9384765625, -2.76934814453125, -2.6002197265625, -2.43109130859375, -2.261962890625, -2.09283447265625, -1.9237060546875, -1.75457763671875, -1.58544921875, -1.41632080078125, -1.2471923828125, -1.07806396484375, -0.908935546875, -0.73980712890625, -0.5706787109375, -0.40155029296875, -0.232421875, -0.06329345703125, 0.1058349609375, 0.27496337890625, 0.444091796875, 0.61322021484375, 0.7823486328125, 0.95147705078125, 1.12060546875, 1.28973388671875, 1.4588623046875, 1.62799072265625, 1.797119140625, 1.96624755859375, 2.1353759765625, 2.30450439453125, 2.4736328125, 2.64276123046875, 2.8118896484375, 2.98101806640625, 3.150146484375, 3.31927490234375, 3.4884033203125, 3.65753173828125, 3.82666015625, 3.99578857421875, 4.1649169921875, 4.33404541015625, 4.503173828125, 4.67230224609375, 4.8414306640625, 5.01055908203125, 5.1796875]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 20.0, 16.0, 30.0, 47.0, 50.0, 118.0, 476.0, 14340.0, 4162847.0, 15491.0, 465.0, 127.0, 66.0, 48.0, 23.0, 23.0, 19.0, 16.0, 8.0, 7.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.8125, -56.5810546875, -53.349609375, -50.1181640625, -46.88671875, -43.6552734375, -40.423828125, -37.1923828125, -33.9609375, -30.7294921875, -27.498046875, -24.2666015625, -21.03515625, -17.8037109375, -14.572265625, -11.3408203125, -8.109375, -4.8779296875, -1.646484375, 1.5849609375, 4.81640625, 8.0478515625, 11.279296875, 14.5107421875, 17.7421875, 20.9736328125, 24.205078125, 27.4365234375, 30.66796875, 33.8994140625, 37.130859375, 40.3623046875, 43.59375, 46.8251953125, 50.056640625, 53.2880859375, 56.51953125, 59.7509765625, 62.982421875, 66.2138671875, 69.4453125, 72.6767578125, 75.908203125, 79.1396484375, 82.37109375, 85.6025390625, 88.833984375, 92.0654296875, 95.296875, 98.5283203125, 101.759765625, 104.9912109375, 108.22265625, 111.4541015625, 114.685546875, 117.9169921875, 121.1484375, 124.3798828125, 127.611328125, 130.8427734375, 134.07421875, 137.3056640625, 140.537109375, 143.7685546875, 147.0]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 8.0, 12.0, 23.0, 15.0, 30.0, 51.0, 73.0, 100.0, 233.0, 672.0, 1437.0, 745.0, 268.0, 128.0, 78.0, 52.0, 32.0, 25.0, 27.0, 18.0, 12.0, 8.0, 4.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0234375, -2.86871337890625, -2.7139892578125, -2.55926513671875, -2.404541015625, -2.24981689453125, -2.0950927734375, -1.94036865234375, -1.78564453125, -1.63092041015625, -1.4761962890625, -1.32147216796875, -1.166748046875, -1.01202392578125, -0.8572998046875, -0.70257568359375, -0.5478515625, -0.39312744140625, -0.2384033203125, -0.08367919921875, 0.071044921875, 0.22576904296875, 0.3804931640625, 0.53521728515625, 0.68994140625, 0.84466552734375, 0.9993896484375, 1.15411376953125, 1.308837890625, 1.46356201171875, 1.6182861328125, 1.77301025390625, 1.927734375, 2.08245849609375, 2.2371826171875, 2.39190673828125, 2.546630859375, 2.70135498046875, 2.8560791015625, 3.01080322265625, 3.16552734375, 3.32025146484375, 3.4749755859375, 3.62969970703125, 3.784423828125, 3.93914794921875, 4.0938720703125, 4.24859619140625, 4.4033203125, 4.55804443359375, 4.7127685546875, 4.86749267578125, 5.022216796875, 5.17694091796875, 5.3316650390625, 5.48638916015625, 5.64111328125, 5.79583740234375, 5.9505615234375, 6.10528564453125, 6.260009765625, 6.41473388671875, 6.5694580078125, 6.72418212890625, 6.87890625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 10.0, 13.0, 15.0, 20.0, 17.0, 23.0, 36.0, 36.0, 69.0, 82.0, 111.0, 95.0, 94.0, 80.0, 54.0, 52.0, 36.0, 37.0, 27.0, 23.0, 18.0, 12.0, 7.0, 9.0, 6.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.734691143035889, -6.492444038391113, -6.250197410583496, -6.007950305938721, -5.765703201293945, -5.523456573486328, -5.281209468841553, -5.038962364196777, -4.79671573638916, -4.554468631744385, -4.312222003936768, -4.069974899291992, -3.827728033065796, -3.5854811668395996, -3.343234062194824, -3.100987195968628, -2.8587403297424316, -2.6164934635162354, -2.374246597290039, -2.1319994926452637, -1.8897526264190674, -1.647505760192871, -1.4052587747573853, -1.1630117893218994, -0.9207649230957031, -0.6785179972648621, -0.436271071434021, -0.19402414560317993, 0.04822278022766113, 0.2904696464538574, 0.5327166318893433, 0.7749636173248291, 1.0172100067138672, 1.2594568729400635, 1.5017038583755493, 1.7439508438110352, 1.9861977100372314, 2.2284445762634277, 2.470691680908203, 2.7129385471343994, 2.9551854133605957, 3.197432279586792, 3.4396791458129883, 3.6819262504577637, 3.92417311668396, 4.166419982910156, 4.408667087554932, 4.650914192199707, 4.893160820007324, 5.1354079246521, 5.377654552459717, 5.619901657104492, 5.862148284912109, 6.104395389556885, 6.34664249420166, 6.588889122009277, 6.831136226654053, 7.073383331298828, 7.315629959106445, 7.557877063751221, 7.800124168395996, 8.042370796203613, 8.28461742401123, 8.526865005493164, 8.769111633300781]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 3.0, 6.0, 11.0, 7.0, 10.0, 13.0, 17.0, 16.0, 22.0, 26.0, 27.0, 36.0, 31.0, 36.0, 37.0, 42.0, 46.0, 46.0, 43.0, 42.0, 50.0, 32.0, 32.0, 50.0, 44.0, 41.0, 34.0, 35.0, 30.0, 28.0, 15.0, 10.0, 13.0, 9.0, 7.0, 12.0, 13.0, 7.0, 7.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.025304794311523, -7.784073829650879, -7.542843341827393, -7.301612377166748, -7.0603814125061035, -6.819150924682617, -6.577919960021973, -6.336688995361328, -6.095458030700684, -5.854227066040039, -5.612996578216553, -5.371765613555908, -5.130534648895264, -4.889304161071777, -4.648073196411133, -4.406842231750488, -4.165611267089844, -3.9243805408477783, -3.683149576187134, -3.4419188499450684, -3.200687885284424, -2.9594571590423584, -2.718226432800293, -2.4769954681396484, -2.235764980316162, -1.9945341348648071, -1.7533032894134521, -1.5120725631713867, -1.2708415985107422, -1.0296108722686768, -0.7883800268173218, -0.5471491813659668, -0.30591821670532227, -0.06468738615512848, 0.1765434443950653, 0.4177742600440979, 0.6590051054954529, 0.9002358913421631, 1.141466736793518, 1.382697582244873, 1.623928427696228, 1.865159273147583, 2.1063899993896484, 2.347620964050293, 2.5888516902923584, 2.830082416534424, 3.0713133811950684, 3.312544345855713, 3.5537750720977783, 3.7950057983398438, 4.036236763000488, 4.277467727661133, 4.518698215484619, 4.759929180145264, 5.001160144805908, 5.2423906326293945, 5.483621597290039, 5.724852561950684, 5.96608304977417, 6.2073140144348145, 6.448544979095459, 6.689775466918945, 6.93100643157959, 7.172237396240234, 7.413468360900879]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 13.0, 34.0, 21.0, 41.0, 71.0, 76.0, 103.0, 168.0, 238.0, 316.0, 555.0, 829.0, 1508.0, 2781.0, 5494.0, 11301.0, 25188.0, 58540.0, 147188.0, 358998.0, 259828.0, 98889.0, 40712.0, 17804.0, 8234.0, 4120.0, 2153.0, 1224.0, 721.0, 445.0, 278.0, 184.0, 145.0, 94.0, 75.0, 43.0, 37.0, 24.0, 23.0, 12.0, 12.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.625, -10.290771484375, -9.95654296875, -9.622314453125, -9.2880859375, -8.953857421875, -8.61962890625, -8.285400390625, -7.951171875, -7.616943359375, -7.28271484375, -6.948486328125, -6.6142578125, -6.280029296875, -5.94580078125, -5.611572265625, -5.27734375, -4.943115234375, -4.60888671875, -4.274658203125, -3.9404296875, -3.606201171875, -3.27197265625, -2.937744140625, -2.603515625, -2.269287109375, -1.93505859375, -1.600830078125, -1.2666015625, -0.932373046875, -0.59814453125, -0.263916015625, 0.0703125, 0.404541015625, 0.73876953125, 1.072998046875, 1.4072265625, 1.741455078125, 2.07568359375, 2.409912109375, 2.744140625, 3.078369140625, 3.41259765625, 3.746826171875, 4.0810546875, 4.415283203125, 4.74951171875, 5.083740234375, 5.41796875, 5.752197265625, 6.08642578125, 6.420654296875, 6.7548828125, 7.089111328125, 7.42333984375, 7.757568359375, 8.091796875, 8.426025390625, 8.76025390625, 9.094482421875, 9.4287109375, 9.762939453125, 10.09716796875, 10.431396484375, 10.765625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 8.0, 9.0, 4.0, 14.0, 18.0, 12.0, 17.0, 20.0, 26.0, 32.0, 35.0, 30.0, 38.0, 30.0, 31.0, 39.0, 49.0, 51.0, 36.0, 48.0, 48.0, 47.0, 33.0, 40.0, 39.0, 42.0, 30.0, 22.0, 28.0, 19.0, 13.0, 11.0, 15.0, 10.0, 4.0, 8.0, 11.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.01953125, -5.8394775390625, -5.659423828125, -5.4793701171875, -5.29931640625, -5.1192626953125, -4.939208984375, -4.7591552734375, -4.5791015625, -4.3990478515625, -4.218994140625, -4.0389404296875, -3.85888671875, -3.6788330078125, -3.498779296875, -3.3187255859375, -3.138671875, -2.9586181640625, -2.778564453125, -2.5985107421875, -2.41845703125, -2.2384033203125, -2.058349609375, -1.8782958984375, -1.6982421875, -1.5181884765625, -1.338134765625, -1.1580810546875, -0.97802734375, -0.7979736328125, -0.617919921875, -0.4378662109375, -0.2578125, -0.0777587890625, 0.102294921875, 0.2823486328125, 0.46240234375, 0.6424560546875, 0.822509765625, 1.0025634765625, 1.1826171875, 1.3626708984375, 1.542724609375, 1.7227783203125, 1.90283203125, 2.0828857421875, 2.262939453125, 2.4429931640625, 2.623046875, 2.8031005859375, 2.983154296875, 3.1632080078125, 3.34326171875, 3.5233154296875, 3.703369140625, 3.8834228515625, 4.0634765625, 4.2435302734375, 4.423583984375, 4.6036376953125, 4.78369140625, 4.9637451171875, 5.143798828125, 5.3238525390625, 5.50390625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 10.0, 7.0, 7.0, 12.0, 28.0, 41.0, 41.0, 62.0, 85.0, 220.0, 326.0, 593.0, 1273.0, 2560.0, 5635.0, 13549.0, 36184.0, 120672.0, 559213.0, 218679.0, 55264.0, 19360.0, 7863.0, 3432.0, 1590.0, 806.0, 418.0, 217.0, 130.0, 94.0, 50.0, 34.0, 17.0, 20.0, 18.0, 13.0, 6.0, 3.0, 3.0, 1.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.3515625, -8.0703125, -7.7890625, -7.5078125, -7.2265625, -6.9453125, -6.6640625, -6.3828125, -6.1015625, -5.8203125, -5.5390625, -5.2578125, -4.9765625, -4.6953125, -4.4140625, -4.1328125, -3.8515625, -3.5703125, -3.2890625, -3.0078125, -2.7265625, -2.4453125, -2.1640625, -1.8828125, -1.6015625, -1.3203125, -1.0390625, -0.7578125, -0.4765625, -0.1953125, 0.0859375, 0.3671875, 0.6484375, 0.9296875, 1.2109375, 1.4921875, 1.7734375, 2.0546875, 2.3359375, 2.6171875, 2.8984375, 3.1796875, 3.4609375, 3.7421875, 4.0234375, 4.3046875, 4.5859375, 4.8671875, 5.1484375, 5.4296875, 5.7109375, 5.9921875, 6.2734375, 6.5546875, 6.8359375, 7.1171875, 7.3984375, 7.6796875, 7.9609375, 8.2421875, 8.5234375, 8.8046875, 9.0859375, 9.3671875, 9.6484375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 5.0, 11.0, 9.0, 9.0, 13.0, 16.0, 17.0, 25.0, 23.0, 27.0, 29.0, 25.0, 29.0, 29.0, 45.0, 42.0, 27.0, 50.0, 48.0, 51.0, 47.0, 42.0, 39.0, 43.0, 38.0, 39.0, 35.0, 26.0, 32.0, 19.0, 13.0, 22.0, 17.0, 11.0, 8.0, 11.0, 6.0, 7.0, 4.0, 4.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.3984375, -4.26080322265625, -4.1231689453125, -3.98553466796875, -3.847900390625, -3.71026611328125, -3.5726318359375, -3.43499755859375, -3.29736328125, -3.15972900390625, -3.0220947265625, -2.88446044921875, -2.746826171875, -2.60919189453125, -2.4715576171875, -2.33392333984375, -2.1962890625, -2.05865478515625, -1.9210205078125, -1.78338623046875, -1.645751953125, -1.50811767578125, -1.3704833984375, -1.23284912109375, -1.09521484375, -0.95758056640625, -0.8199462890625, -0.68231201171875, -0.544677734375, -0.40704345703125, -0.2694091796875, -0.13177490234375, 0.005859375, 0.14349365234375, 0.2811279296875, 0.41876220703125, 0.556396484375, 0.69403076171875, 0.8316650390625, 0.96929931640625, 1.10693359375, 1.24456787109375, 1.3822021484375, 1.51983642578125, 1.657470703125, 1.79510498046875, 1.9327392578125, 2.07037353515625, 2.2080078125, 2.34564208984375, 2.4832763671875, 2.62091064453125, 2.758544921875, 2.89617919921875, 3.0338134765625, 3.17144775390625, 3.30908203125, 3.44671630859375, 3.5843505859375, 3.72198486328125, 3.859619140625, 3.99725341796875, 4.1348876953125, 4.27252197265625, 4.41015625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 8.0, 5.0, 7.0, 13.0, 13.0, 21.0, 33.0, 52.0, 86.0, 97.0, 117.0, 181.0, 291.0, 403.0, 569.0, 908.0, 1316.0, 2148.0, 3629.0, 6583.0, 12266.0, 25842.0, 67139.0, 341116.0, 450585.0, 76557.0, 28031.0, 13039.0, 6797.0, 4033.0, 2382.0, 1447.0, 976.0, 566.0, 402.0, 283.0, 173.0, 136.0, 96.0, 71.0, 47.0, 26.0, 28.0, 11.0, 12.0, 6.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.701171875, -3.585693359375, -3.47021484375, -3.354736328125, -3.2392578125, -3.123779296875, -3.00830078125, -2.892822265625, -2.77734375, -2.661865234375, -2.54638671875, -2.430908203125, -2.3154296875, -2.199951171875, -2.08447265625, -1.968994140625, -1.853515625, -1.738037109375, -1.62255859375, -1.507080078125, -1.3916015625, -1.276123046875, -1.16064453125, -1.045166015625, -0.9296875, -0.814208984375, -0.69873046875, -0.583251953125, -0.4677734375, -0.352294921875, -0.23681640625, -0.121337890625, -0.005859375, 0.109619140625, 0.22509765625, 0.340576171875, 0.4560546875, 0.571533203125, 0.68701171875, 0.802490234375, 0.91796875, 1.033447265625, 1.14892578125, 1.264404296875, 1.3798828125, 1.495361328125, 1.61083984375, 1.726318359375, 1.841796875, 1.957275390625, 2.07275390625, 2.188232421875, 2.3037109375, 2.419189453125, 2.53466796875, 2.650146484375, 2.765625, 2.881103515625, 2.99658203125, 3.112060546875, 3.2275390625, 3.343017578125, 3.45849609375, 3.573974609375, 3.689453125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 3.0, 5.0, 12.0, 6.0, 11.0, 16.0, 16.0, 25.0, 46.0, 76.0, 149.0, 202.0, 161.0, 104.0, 66.0, 31.0, 20.0, 13.0, 17.0, 9.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00049591064453125, -0.00047863274812698364, -0.0004613548517227173, -0.00044407695531845093, -0.00042679905891418457, -0.0004095211625099182, -0.00039224326610565186, -0.0003749653697013855, -0.00035768747329711914, -0.0003404095768928528, -0.0003231316804885864, -0.00030585378408432007, -0.0002885758876800537, -0.00027129799127578735, -0.000254020094871521, -0.00023674219846725464, -0.00021946430206298828, -0.00020218640565872192, -0.00018490850925445557, -0.0001676306128501892, -0.00015035271644592285, -0.0001330748200416565, -0.00011579692363739014, -9.851902723312378e-05, -8.124113082885742e-05, -6.396323442459106e-05, -4.668533802032471e-05, -2.940744161605835e-05, -1.2129545211791992e-05, 5.148351192474365e-06, 2.2426247596740723e-05, 3.970414400100708e-05, 5.698204040527344e-05, 7.42599368095398e-05, 9.153783321380615e-05, 0.00010881572961807251, 0.00012609362602233887, 0.00014337152242660522, 0.00016064941883087158, 0.00017792731523513794, 0.0001952052116394043, 0.00021248310804367065, 0.000229761004447937, 0.00024703890085220337, 0.0002643167972564697, 0.0002815946936607361, 0.00029887259006500244, 0.0003161504864692688, 0.00033342838287353516, 0.0003507062792778015, 0.00036798417568206787, 0.00038526207208633423, 0.0004025399684906006, 0.00041981786489486694, 0.0004370957612991333, 0.00045437365770339966, 0.000471651554107666, 0.0004889294505119324, 0.0005062073469161987, 0.0005234852433204651, 0.0005407631397247314, 0.0005580410361289978, 0.0005753189325332642, 0.0005925968289375305, 0.0006098747253417969]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 10.0, 13.0, 8.0, 5.0, 11.0, 16.0, 15.0, 19.0, 20.0, 30.0, 41.0, 76.0, 396.0, 3331.0, 85453.0, 938905.0, 18441.0, 1304.0, 200.0, 47.0, 40.0, 24.0, 27.0, 17.0, 17.0, 15.0, 12.0, 9.0, 6.0, 9.0, 5.0, 9.0, 3.0, 0.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.265625, -20.607177734375, -19.94873046875, -19.290283203125, -18.6318359375, -17.973388671875, -17.31494140625, -16.656494140625, -15.998046875, -15.339599609375, -14.68115234375, -14.022705078125, -13.3642578125, -12.705810546875, -12.04736328125, -11.388916015625, -10.73046875, -10.072021484375, -9.41357421875, -8.755126953125, -8.0966796875, -7.438232421875, -6.77978515625, -6.121337890625, -5.462890625, -4.804443359375, -4.14599609375, -3.487548828125, -2.8291015625, -2.170654296875, -1.51220703125, -0.853759765625, -0.1953125, 0.463134765625, 1.12158203125, 1.780029296875, 2.4384765625, 3.096923828125, 3.75537109375, 4.413818359375, 5.072265625, 5.730712890625, 6.38916015625, 7.047607421875, 7.7060546875, 8.364501953125, 9.02294921875, 9.681396484375, 10.33984375, 10.998291015625, 11.65673828125, 12.315185546875, 12.9736328125, 13.632080078125, 14.29052734375, 14.948974609375, 15.607421875, 16.265869140625, 16.92431640625, 17.582763671875, 18.2412109375, 18.899658203125, 19.55810546875, 20.216552734375, 20.875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 3.0, 3.0, 5.0, 13.0, 17.0, 10.0, 14.0, 29.0, 24.0, 40.0, 50.0, 62.0, 88.0, 125.0, 115.0, 91.0, 68.0, 47.0, 44.0, 28.0, 26.0, 21.0, 15.0, 14.0, 13.0, 12.0, 3.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.146484375, -1.1095123291015625, -1.072540283203125, -1.0355682373046875, -0.99859619140625, -0.9616241455078125, -0.924652099609375, -0.8876800537109375, -0.8507080078125, -0.8137359619140625, -0.776763916015625, -0.7397918701171875, -0.70281982421875, -0.6658477783203125, -0.628875732421875, -0.5919036865234375, -0.554931640625, -0.5179595947265625, -0.480987548828125, -0.4440155029296875, -0.40704345703125, -0.3700714111328125, -0.333099365234375, -0.2961273193359375, -0.2591552734375, -0.2221832275390625, -0.185211181640625, -0.1482391357421875, -0.11126708984375, -0.0742950439453125, -0.037322998046875, -0.0003509521484375, 0.03662109375, 0.0735931396484375, 0.110565185546875, 0.1475372314453125, 0.18450927734375, 0.2214813232421875, 0.258453369140625, 0.2954254150390625, 0.3323974609375, 0.3693695068359375, 0.406341552734375, 0.4433135986328125, 0.48028564453125, 0.5172576904296875, 0.554229736328125, 0.5912017822265625, 0.628173828125, 0.6651458740234375, 0.702117919921875, 0.7390899658203125, 0.77606201171875, 0.8130340576171875, 0.850006103515625, 0.8869781494140625, 0.9239501953125, 0.9609222412109375, 0.997894287109375, 1.0348663330078125, 1.07183837890625, 1.1088104248046875, 1.145782470703125, 1.1827545166015625, 1.2197265625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 14.0, 4.0, 14.0, 34.0, 48.0, 89.0, 113.0, 165.0, 170.0, 134.0, 71.0, 54.0, 41.0, 16.0, 13.0, 13.0, 9.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.942188262939453, -16.557514190673828, -16.172842025756836, -15.788168907165527, -15.403495788574219, -15.01882266998291, -14.634149551391602, -14.249476432800293, -13.864803314208984, -13.480130195617676, -13.095457077026367, -12.710783958435059, -12.32611083984375, -11.941437721252441, -11.556764602661133, -11.172091484069824, -10.787418365478516, -10.402745246887207, -10.018072128295898, -9.63339900970459, -9.248725891113281, -8.864052772521973, -8.479379653930664, -8.094706535339355, -7.710033416748047, -7.325360298156738, -6.94068717956543, -6.556014060974121, -6.1713409423828125, -5.786667823791504, -5.401994705200195, -5.017321586608887, -4.632648944854736, -4.247975826263428, -3.863302707672119, -3.4786295890808105, -3.093956470489502, -2.7092833518981934, -2.3246102333068848, -1.9399371147155762, -1.5552639961242676, -1.170590877532959, -0.7859177589416504, -0.4012446403503418, -0.016571521759033203, 0.3681015968322754, 0.752774715423584, 1.1374478340148926, 1.5221209526062012, 1.9067940711975098, 2.2914671897888184, 2.676140308380127, 3.0608134269714355, 3.445486545562744, 3.8301596641540527, 4.214832782745361, 4.59950590133667, 4.9841790199279785, 5.368852138519287, 5.753525257110596, 6.138198375701904, 6.522871494293213, 6.9075446128845215, 7.29221773147583, 7.676890850067139]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 7.0, 4.0, 7.0, 9.0, 12.0, 14.0, 17.0, 23.0, 17.0, 25.0, 35.0, 32.0, 35.0, 47.0, 48.0, 48.0, 42.0, 45.0, 36.0, 31.0, 45.0, 37.0, 39.0, 42.0, 48.0, 41.0, 31.0, 32.0, 26.0, 19.0, 21.0, 16.0, 10.0, 5.0, 13.0, 9.0, 6.0, 10.0, 5.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.088141918182373, -6.8908891677856445, -6.693635940551758, -6.496382713317871, -6.299129962921143, -6.101877212524414, -5.904623985290527, -5.707370758056641, -5.510118007659912, -5.312865257263184, -5.115612030029297, -4.91835880279541, -4.721106052398682, -4.523853302001953, -4.326600074768066, -4.12934684753418, -3.932094097137451, -3.7348411083221436, -3.537588119506836, -3.3403351306915283, -3.1430821418762207, -2.945829153060913, -2.7485761642456055, -2.551323175430298, -2.3540701866149902, -2.1568171977996826, -1.959564208984375, -1.7623112201690674, -1.5650582313537598, -1.3678052425384521, -1.1705522537231445, -0.9732992649078369, -0.7760462760925293, -0.5787932872772217, -0.38154029846191406, -0.18428730964660645, 0.012965679168701172, 0.2102186679840088, 0.4074716567993164, 0.604724645614624, 0.8019776344299316, 0.9992306232452393, 1.1964836120605469, 1.3937366008758545, 1.590989589691162, 1.7882425785064697, 1.9854955673217773, 2.182748556137085, 2.3800015449523926, 2.5772545337677, 2.774507522583008, 2.9717605113983154, 3.169013500213623, 3.3662664890289307, 3.5635194778442383, 3.760772466659546, 3.9580254554748535, 4.155278205871582, 4.352531433105469, 4.5497846603393555, 4.747037410736084, 4.9442901611328125, 5.141543388366699, 5.338796615600586, 5.5360493659973145]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 19.0, 18.0, 42.0, 42.0, 58.0, 77.0, 132.0, 160.0, 271.0, 363.0, 529.0, 797.0, 1248.0, 2017.0, 3772.0, 7849.0, 18245.0, 47869.0, 139086.0, 333440.0, 303466.0, 116829.0, 40592.0, 15969.0, 6794.0, 3433.0, 1885.0, 1167.0, 760.0, 479.0, 348.0, 216.0, 183.0, 120.0, 71.0, 54.0, 43.0, 35.0, 16.0, 19.0, 10.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-12.578125, -12.196044921875, -11.81396484375, -11.431884765625, -11.0498046875, -10.667724609375, -10.28564453125, -9.903564453125, -9.521484375, -9.139404296875, -8.75732421875, -8.375244140625, -7.9931640625, -7.611083984375, -7.22900390625, -6.846923828125, -6.46484375, -6.082763671875, -5.70068359375, -5.318603515625, -4.9365234375, -4.554443359375, -4.17236328125, -3.790283203125, -3.408203125, -3.026123046875, -2.64404296875, -2.261962890625, -1.8798828125, -1.497802734375, -1.11572265625, -0.733642578125, -0.3515625, 0.030517578125, 0.41259765625, 0.794677734375, 1.1767578125, 1.558837890625, 1.94091796875, 2.322998046875, 2.705078125, 3.087158203125, 3.46923828125, 3.851318359375, 4.2333984375, 4.615478515625, 4.99755859375, 5.379638671875, 5.76171875, 6.143798828125, 6.52587890625, 6.907958984375, 7.2900390625, 7.672119140625, 8.05419921875, 8.436279296875, 8.818359375, 9.200439453125, 9.58251953125, 9.964599609375, 10.3466796875, 10.728759765625, 11.11083984375, 11.492919921875, 11.875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 5.0, 13.0, 6.0, 9.0, 17.0, 22.0, 17.0, 20.0, 31.0, 27.0, 45.0, 36.0, 45.0, 42.0, 51.0, 43.0, 36.0, 52.0, 35.0, 47.0, 46.0, 49.0, 30.0, 44.0, 36.0, 29.0, 21.0, 27.0, 25.0, 10.0, 13.0, 11.0, 13.0, 8.0, 7.0, 12.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.04296875, -4.90032958984375, -4.7576904296875, -4.61505126953125, -4.472412109375, -4.32977294921875, -4.1871337890625, -4.04449462890625, -3.90185546875, -3.75921630859375, -3.6165771484375, -3.47393798828125, -3.331298828125, -3.18865966796875, -3.0460205078125, -2.90338134765625, -2.7607421875, -2.61810302734375, -2.4754638671875, -2.33282470703125, -2.190185546875, -2.04754638671875, -1.9049072265625, -1.76226806640625, -1.61962890625, -1.47698974609375, -1.3343505859375, -1.19171142578125, -1.049072265625, -0.90643310546875, -0.7637939453125, -0.62115478515625, -0.478515625, -0.33587646484375, -0.1932373046875, -0.05059814453125, 0.092041015625, 0.23468017578125, 0.3773193359375, 0.51995849609375, 0.66259765625, 0.80523681640625, 0.9478759765625, 1.09051513671875, 1.233154296875, 1.37579345703125, 1.5184326171875, 1.66107177734375, 1.8037109375, 1.94635009765625, 2.0889892578125, 2.23162841796875, 2.374267578125, 2.51690673828125, 2.6595458984375, 2.80218505859375, 2.94482421875, 3.08746337890625, 3.2301025390625, 3.37274169921875, 3.515380859375, 3.65802001953125, 3.8006591796875, 3.94329833984375, 4.0859375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 2.0, 12.0, 16.0, 16.0, 16.0, 13.0, 34.0, 24.0, 27.0, 27.0, 39.0, 44.0, 40.0, 90.0, 503.0, 9536.0, 1002383.0, 34349.0, 914.0, 115.0, 55.0, 38.0, 47.0, 35.0, 34.0, 22.0, 16.0, 11.0, 22.0, 16.0, 13.0, 8.0, 8.0, 4.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.5625, -96.5107421875, -93.458984375, -90.4072265625, -87.35546875, -84.3037109375, -81.251953125, -78.2001953125, -75.1484375, -72.0966796875, -69.044921875, -65.9931640625, -62.94140625, -59.8896484375, -56.837890625, -53.7861328125, -50.734375, -47.6826171875, -44.630859375, -41.5791015625, -38.52734375, -35.4755859375, -32.423828125, -29.3720703125, -26.3203125, -23.2685546875, -20.216796875, -17.1650390625, -14.11328125, -11.0615234375, -8.009765625, -4.9580078125, -1.90625, 1.1455078125, 4.197265625, 7.2490234375, 10.30078125, 13.3525390625, 16.404296875, 19.4560546875, 22.5078125, 25.5595703125, 28.611328125, 31.6630859375, 34.71484375, 37.7666015625, 40.818359375, 43.8701171875, 46.921875, 49.9736328125, 53.025390625, 56.0771484375, 59.12890625, 62.1806640625, 65.232421875, 68.2841796875, 71.3359375, 74.3876953125, 77.439453125, 80.4912109375, 83.54296875, 86.5947265625, 89.646484375, 92.6982421875, 95.75]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 8.0, 4.0, 9.0, 9.0, 13.0, 18.0, 19.0, 23.0, 29.0, 41.0, 31.0, 36.0, 45.0, 55.0, 46.0, 65.0, 55.0, 52.0, 61.0, 46.0, 47.0, 48.0, 50.0, 49.0, 23.0, 21.0, 25.0, 13.0, 15.0, 8.0, 8.0, 8.0, 6.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.015625, -7.77325439453125, -7.5308837890625, -7.28851318359375, -7.046142578125, -6.80377197265625, -6.5614013671875, -6.31903076171875, -6.07666015625, -5.83428955078125, -5.5919189453125, -5.34954833984375, -5.107177734375, -4.86480712890625, -4.6224365234375, -4.38006591796875, -4.1376953125, -3.89532470703125, -3.6529541015625, -3.41058349609375, -3.168212890625, -2.92584228515625, -2.6834716796875, -2.44110107421875, -2.19873046875, -1.95635986328125, -1.7139892578125, -1.47161865234375, -1.229248046875, -0.98687744140625, -0.7445068359375, -0.50213623046875, -0.259765625, -0.01739501953125, 0.2249755859375, 0.46734619140625, 0.709716796875, 0.95208740234375, 1.1944580078125, 1.43682861328125, 1.67919921875, 1.92156982421875, 2.1639404296875, 2.40631103515625, 2.648681640625, 2.89105224609375, 3.1334228515625, 3.37579345703125, 3.6181640625, 3.86053466796875, 4.1029052734375, 4.34527587890625, 4.587646484375, 4.83001708984375, 5.0723876953125, 5.31475830078125, 5.55712890625, 5.79949951171875, 6.0418701171875, 6.28424072265625, 6.526611328125, 6.76898193359375, 7.0113525390625, 7.25372314453125, 7.49609375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 10.0, 21.0, 28.0, 59.0, 92.0, 172.0, 506.0, 2389.0, 44921.0, 986539.0, 11893.0, 1265.0, 317.0, 131.0, 81.0, 45.0, 35.0, 12.0, 16.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0], "bins": [-19.4375, -19.0267333984375, -18.615966796875, -18.2052001953125, -17.79443359375, -17.3836669921875, -16.972900390625, -16.5621337890625, -16.1513671875, -15.7406005859375, -15.329833984375, -14.9190673828125, -14.50830078125, -14.0975341796875, -13.686767578125, -13.2760009765625, -12.865234375, -12.4544677734375, -12.043701171875, -11.6329345703125, -11.22216796875, -10.8114013671875, -10.400634765625, -9.9898681640625, -9.5791015625, -9.1683349609375, -8.757568359375, -8.3468017578125, -7.93603515625, -7.5252685546875, -7.114501953125, -6.7037353515625, -6.29296875, -5.8822021484375, -5.471435546875, -5.0606689453125, -4.64990234375, -4.2391357421875, -3.828369140625, -3.4176025390625, -3.0068359375, -2.5960693359375, -2.185302734375, -1.7745361328125, -1.36376953125, -0.9530029296875, -0.542236328125, -0.1314697265625, 0.279296875, 0.6900634765625, 1.100830078125, 1.5115966796875, 1.92236328125, 2.3331298828125, 2.743896484375, 3.1546630859375, 3.5654296875, 3.9761962890625, 4.386962890625, 4.7977294921875, 5.20849609375, 5.6192626953125, 6.030029296875, 6.4407958984375, 6.8515625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 9.0, 7.0, 19.0, 26.0, 40.0, 55.0, 99.0, 166.0, 162.0, 139.0, 106.0, 53.0, 37.0, 21.0, 17.0, 15.0, 10.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00030231475830078125, -0.00029425323009490967, -0.0002861917018890381, -0.0002781301736831665, -0.0002700686454772949, -0.00026200711727142334, -0.00025394558906555176, -0.0002458840608596802, -0.0002378225326538086, -0.000229761004447937, -0.00022169947624206543, -0.00021363794803619385, -0.00020557641983032227, -0.00019751489162445068, -0.0001894533634185791, -0.00018139183521270752, -0.00017333030700683594, -0.00016526877880096436, -0.00015720725059509277, -0.0001491457223892212, -0.0001410841941833496, -0.00013302266597747803, -0.00012496113777160645, -0.00011689960956573486, -0.00010883808135986328, -0.0001007765531539917, -9.271502494812012e-05, -8.465349674224854e-05, -7.659196853637695e-05, -6.853044033050537e-05, -6.046891212463379e-05, -5.240738391876221e-05, -4.4345855712890625e-05, -3.628432750701904e-05, -2.822279930114746e-05, -2.016127109527588e-05, -1.2099742889404297e-05, -4.038214683532715e-06, 4.023313522338867e-06, 1.208484172821045e-05, 2.014636993408203e-05, 2.8207898139953613e-05, 3.6269426345825195e-05, 4.433095455169678e-05, 5.239248275756836e-05, 6.045401096343994e-05, 6.851553916931152e-05, 7.65770673751831e-05, 8.463859558105469e-05, 9.270012378692627e-05, 0.00010076165199279785, 0.00010882318019866943, 0.00011688470840454102, 0.0001249462366104126, 0.00013300776481628418, 0.00014106929302215576, 0.00014913082122802734, 0.00015719234943389893, 0.0001652538776397705, 0.0001733154058456421, 0.00018137693405151367, 0.00018943846225738525, 0.00019749999046325684, 0.00020556151866912842, 0.000213623046875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 0.0, 3.0, 3.0, 5.0, 2.0, 6.0, 8.0, 11.0, 11.0, 33.0, 46.0, 100.0, 977.0, 1033359.0, 13544.0, 229.0, 76.0, 38.0, 23.0, 22.0, 18.0, 12.0, 10.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.90625, -31.959228515625, -31.01220703125, -30.065185546875, -29.1181640625, -28.171142578125, -27.22412109375, -26.277099609375, -25.330078125, -24.383056640625, -23.43603515625, -22.489013671875, -21.5419921875, -20.594970703125, -19.64794921875, -18.700927734375, -17.75390625, -16.806884765625, -15.85986328125, -14.912841796875, -13.9658203125, -13.018798828125, -12.07177734375, -11.124755859375, -10.177734375, -9.230712890625, -8.28369140625, -7.336669921875, -6.3896484375, -5.442626953125, -4.49560546875, -3.548583984375, -2.6015625, -1.654541015625, -0.70751953125, 0.239501953125, 1.1865234375, 2.133544921875, 3.08056640625, 4.027587890625, 4.974609375, 5.921630859375, 6.86865234375, 7.815673828125, 8.7626953125, 9.709716796875, 10.65673828125, 11.603759765625, 12.55078125, 13.497802734375, 14.44482421875, 15.391845703125, 16.3388671875, 17.285888671875, 18.23291015625, 19.179931640625, 20.126953125, 21.073974609375, 22.02099609375, 22.968017578125, 23.9150390625, 24.862060546875, 25.80908203125, 26.756103515625, 27.703125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 3.0, 3.0, 6.0, 6.0, 9.0, 12.0, 19.0, 32.0, 64.0, 88.0, 134.0, 213.0, 125.0, 82.0, 69.0, 31.0, 24.0, 20.0, 15.0, 13.0, 9.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.033203125, -1.9743194580078125, -1.915435791015625, -1.8565521240234375, -1.79766845703125, -1.7387847900390625, -1.679901123046875, -1.6210174560546875, -1.5621337890625, -1.5032501220703125, -1.444366455078125, -1.3854827880859375, -1.32659912109375, -1.2677154541015625, -1.208831787109375, -1.1499481201171875, -1.091064453125, -1.0321807861328125, -0.973297119140625, -0.9144134521484375, -0.85552978515625, -0.7966461181640625, -0.737762451171875, -0.6788787841796875, -0.6199951171875, -0.5611114501953125, -0.502227783203125, -0.4433441162109375, -0.38446044921875, -0.3255767822265625, -0.266693115234375, -0.2078094482421875, -0.14892578125, -0.0900421142578125, -0.031158447265625, 0.0277252197265625, 0.08660888671875, 0.1454925537109375, 0.204376220703125, 0.2632598876953125, 0.3221435546875, 0.3810272216796875, 0.439910888671875, 0.4987945556640625, 0.55767822265625, 0.6165618896484375, 0.675445556640625, 0.7343292236328125, 0.793212890625, 0.8520965576171875, 0.910980224609375, 0.9698638916015625, 1.02874755859375, 1.0876312255859375, 1.146514892578125, 1.2053985595703125, 1.2642822265625, 1.3231658935546875, 1.382049560546875, 1.4409332275390625, 1.49981689453125, 1.5587005615234375, 1.617584228515625, 1.6764678955078125, 1.7353515625]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 32.0, 333.0, 553.0, 86.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.84779930114746, -17.680919647216797, -16.514041900634766, -15.347162246704102, -14.180282592773438, -13.01340389251709, -11.846525192260742, -10.679645538330078, -9.51276683807373, -8.345888137817383, -7.179008483886719, -6.012129783630371, -4.845250606536865, -3.6783714294433594, -2.5114927291870117, -1.3446130752563477, -0.177734375, 0.9891446828842163, 2.1560237407684326, 3.3229026794433594, 4.489781856536865, 5.656661033630371, 6.823539733886719, 7.990419387817383, 9.15729808807373, 10.324176788330078, 11.491056442260742, 12.65793514251709, 13.824813842773438, 14.991693496704102, 16.158573150634766, 17.325450897216797, 18.492328643798828, 19.659208297729492, 20.826086044311523, 21.992965698242188, 23.15984535217285, 24.326725006103516, 25.493602752685547, 26.66048240661621, 27.827362060546875, 28.99424171447754, 30.16111946105957, 31.327999114990234, 32.494876861572266, 33.66175842285156, 34.828636169433594, 35.995513916015625, 37.162391662597656, 38.32926940917969, 39.496150970458984, 40.663028717041016, 41.82990646362305, 42.996788024902344, 44.163665771484375, 45.330543518066406, 46.4974250793457, 47.664302825927734, 48.83118438720703, 49.99806213378906, 51.164939880371094, 52.33182144165039, 53.49869918823242, 54.66558074951172, 55.83245849609375]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 9.0, 12.0, 10.0, 15.0, 12.0, 13.0, 13.0, 23.0, 31.0, 23.0, 25.0, 33.0, 34.0, 30.0, 36.0, 41.0, 31.0, 47.0, 44.0, 42.0, 38.0, 40.0, 43.0, 40.0, 38.0, 31.0, 26.0, 39.0, 34.0, 25.0, 20.0, 23.0, 14.0, 11.0, 5.0, 9.0, 9.0, 6.0, 3.0, 8.0, 1.0, 5.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.69399881362915, -5.507467746734619, -5.32093620300293, -5.134405136108398, -4.947874069213867, -4.761343002319336, -4.574811935424805, -4.388280391693115, -4.201749324798584, -4.015218257904053, -3.8286869525909424, -3.642155647277832, -3.455624580383301, -3.2690935134887695, -3.082562208175659, -2.896030902862549, -2.7094998359680176, -2.5229687690734863, -2.336437463760376, -2.1499061584472656, -1.9633750915527344, -1.7768439054489136, -1.5903127193450928, -1.403781533241272, -1.2172503471374512, -1.0307191610336304, -0.8441879749298096, -0.6576567888259888, -0.47112560272216797, -0.28459441661834717, -0.09806323051452637, 0.08846795558929443, 0.27499961853027344, 0.46153080463409424, 0.648061990737915, 0.8345931768417358, 1.0211243629455566, 1.2076555490493774, 1.3941867351531982, 1.580717921257019, 1.7672491073608398, 1.9537802934646606, 2.1403114795684814, 2.326842784881592, 2.513373851776123, 2.6999049186706543, 2.8864362239837646, 3.072967529296875, 3.2594985961914062, 3.4460296630859375, 3.632560968399048, 3.819092273712158, 4.0056233406066895, 4.192154407501221, 4.37868595123291, 4.565217018127441, 4.751748085021973, 4.938279151916504, 5.124810218811035, 5.311341762542725, 5.497872829437256, 5.684403896331787, 5.870935440063477, 6.057466506958008, 6.243997573852539]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 4.0, 6.0, 7.0, 10.0, 13.0, 42.0, 38.0, 51.0, 92.0, 120.0, 178.0, 272.0, 358.0, 555.0, 778.0, 1201.0, 1857.0, 2966.0, 4972.0, 8278.0, 15719.0, 36753.0, 121254.0, 610550.0, 2166609.0, 946591.0, 189013.0, 44108.0, 17684.0, 9246.0, 5403.0, 3317.0, 2022.0, 1364.0, 852.0, 558.0, 420.0, 300.0, 202.0, 155.0, 96.0, 78.0, 51.0, 44.0, 28.0, 26.0, 12.0, 7.0, 5.0, 6.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0], "bins": [-5.01953125, -4.86083984375, -4.7021484375, -4.54345703125, -4.384765625, -4.22607421875, -4.0673828125, -3.90869140625, -3.75, -3.59130859375, -3.4326171875, -3.27392578125, -3.115234375, -2.95654296875, -2.7978515625, -2.63916015625, -2.48046875, -2.32177734375, -2.1630859375, -2.00439453125, -1.845703125, -1.68701171875, -1.5283203125, -1.36962890625, -1.2109375, -1.05224609375, -0.8935546875, -0.73486328125, -0.576171875, -0.41748046875, -0.2587890625, -0.10009765625, 0.05859375, 0.21728515625, 0.3759765625, 0.53466796875, 0.693359375, 0.85205078125, 1.0107421875, 1.16943359375, 1.328125, 1.48681640625, 1.6455078125, 1.80419921875, 1.962890625, 2.12158203125, 2.2802734375, 2.43896484375, 2.59765625, 2.75634765625, 2.9150390625, 3.07373046875, 3.232421875, 3.39111328125, 3.5498046875, 3.70849609375, 3.8671875, 4.02587890625, 4.1845703125, 4.34326171875, 4.501953125, 4.66064453125, 4.8193359375, 4.97802734375, 5.13671875]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 12.0, 10.0, 7.0, 10.0, 9.0, 21.0, 22.0, 26.0, 22.0, 21.0, 38.0, 24.0, 29.0, 39.0, 33.0, 33.0, 50.0, 41.0, 44.0, 42.0, 46.0, 42.0, 36.0, 46.0, 36.0, 36.0, 27.0, 33.0, 27.0, 23.0, 23.0, 21.0, 12.0, 5.0, 13.0, 7.0, 8.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.34765625, -3.23150634765625, -3.1153564453125, -2.99920654296875, -2.883056640625, -2.76690673828125, -2.6507568359375, -2.53460693359375, -2.41845703125, -2.30230712890625, -2.1861572265625, -2.07000732421875, -1.953857421875, -1.83770751953125, -1.7215576171875, -1.60540771484375, -1.4892578125, -1.37310791015625, -1.2569580078125, -1.14080810546875, -1.024658203125, -0.90850830078125, -0.7923583984375, -0.67620849609375, -0.56005859375, -0.44390869140625, -0.3277587890625, -0.21160888671875, -0.095458984375, 0.02069091796875, 0.1368408203125, 0.25299072265625, 0.369140625, 0.48529052734375, 0.6014404296875, 0.71759033203125, 0.833740234375, 0.94989013671875, 1.0660400390625, 1.18218994140625, 1.29833984375, 1.41448974609375, 1.5306396484375, 1.64678955078125, 1.762939453125, 1.87908935546875, 1.9952392578125, 2.11138916015625, 2.2275390625, 2.34368896484375, 2.4598388671875, 2.57598876953125, 2.692138671875, 2.80828857421875, 2.9244384765625, 3.04058837890625, 3.15673828125, 3.27288818359375, 3.3890380859375, 3.50518798828125, 3.621337890625, 3.73748779296875, 3.8536376953125, 3.96978759765625, 4.0859375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 10.0, 5.0, 18.0, 31.0, 88.0, 279.0, 1215.0, 4182458.0, 9564.0, 382.0, 106.0, 37.0, 26.0, 14.0, 3.0, 8.0, 7.0, 3.0, 5.0, 8.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.0, -64.87109375, -61.7421875, -58.61328125, -55.484375, -52.35546875, -49.2265625, -46.09765625, -42.96875, -39.83984375, -36.7109375, -33.58203125, -30.453125, -27.32421875, -24.1953125, -21.06640625, -17.9375, -14.80859375, -11.6796875, -8.55078125, -5.421875, -2.29296875, 0.8359375, 3.96484375, 7.09375, 10.22265625, 13.3515625, 16.48046875, 19.609375, 22.73828125, 25.8671875, 28.99609375, 32.125, 35.25390625, 38.3828125, 41.51171875, 44.640625, 47.76953125, 50.8984375, 54.02734375, 57.15625, 60.28515625, 63.4140625, 66.54296875, 69.671875, 72.80078125, 75.9296875, 79.05859375, 82.1875, 85.31640625, 88.4453125, 91.57421875, 94.703125, 97.83203125, 100.9609375, 104.08984375, 107.21875, 110.34765625, 113.4765625, 116.60546875, 119.734375, 122.86328125, 125.9921875, 129.12109375, 132.25]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 6.0, 7.0, 7.0, 18.0, 18.0, 33.0, 103.0, 273.0, 677.0, 1252.0, 1016.0, 391.0, 124.0, 44.0, 32.0, 22.0, 7.0, 8.0, 6.0, 6.0, 5.0, 3.0, 5.0, 6.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.466796875, -2.358734130859375, -2.25067138671875, -2.142608642578125, -2.0345458984375, -1.926483154296875, -1.81842041015625, -1.710357666015625, -1.602294921875, -1.494232177734375, -1.38616943359375, -1.278106689453125, -1.1700439453125, -1.061981201171875, -0.95391845703125, -0.845855712890625, -0.73779296875, -0.629730224609375, -0.52166748046875, -0.413604736328125, -0.3055419921875, -0.197479248046875, -0.08941650390625, 0.018646240234375, 0.126708984375, 0.234771728515625, 0.34283447265625, 0.450897216796875, 0.5589599609375, 0.667022705078125, 0.77508544921875, 0.883148193359375, 0.9912109375, 1.099273681640625, 1.20733642578125, 1.315399169921875, 1.4234619140625, 1.531524658203125, 1.63958740234375, 1.747650146484375, 1.855712890625, 1.963775634765625, 2.07183837890625, 2.179901123046875, 2.2879638671875, 2.396026611328125, 2.50408935546875, 2.612152099609375, 2.72021484375, 2.828277587890625, 2.93634033203125, 3.044403076171875, 3.1524658203125, 3.260528564453125, 3.36859130859375, 3.476654052734375, 3.584716796875, 3.692779541015625, 3.80084228515625, 3.908905029296875, 4.0169677734375, 4.125030517578125, 4.23309326171875, 4.341156005859375, 4.44921875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 507.0, 467.0, 34.0, 2.0, 4.0], "bins": [-72.5263442993164, -71.31607055664062, -70.10579681396484, -68.89552307128906, -67.68525695800781, -66.47498321533203, -65.26470947265625, -64.05443572998047, -62.84416580200195, -61.63389205932617, -60.423622131347656, -59.213348388671875, -58.003074645996094, -56.79280471801758, -55.5825309753418, -54.37226104736328, -53.1619873046875, -51.95171356201172, -50.7414436340332, -49.53116989135742, -48.32089614868164, -47.110626220703125, -45.900352478027344, -44.69007873535156, -43.47980499267578, -42.26953125, -41.059261322021484, -39.8489875793457, -38.63871383666992, -37.428443908691406, -36.218170166015625, -35.007896423339844, -33.79762649536133, -32.58735275268555, -31.3770809173584, -30.16680908203125, -28.9565372467041, -27.746265411376953, -26.535991668701172, -25.325719833374023, -24.115446090698242, -22.905174255371094, -21.694900512695312, -20.484628677368164, -19.274356842041016, -18.064083099365234, -16.853811264038086, -15.643539428710938, -14.433265686035156, -13.222992897033691, -12.012721061706543, -10.802448272705078, -9.59217643737793, -8.381903648376465, -7.171630859375, -5.961359024047852, -4.751086711883545, -3.5408143997192383, -2.3305418491363525, -1.1202692985534668, 0.09000301361083984, 1.3002753257751465, 2.5105481147766113, 3.7208199501037598, 4.931092739105225]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 11.0, 10.0, 20.0, 17.0, 14.0, 17.0, 24.0, 30.0, 27.0, 31.0, 35.0, 34.0, 29.0, 50.0, 45.0, 48.0, 50.0, 51.0, 39.0, 50.0, 44.0, 38.0, 34.0, 29.0, 28.0, 28.0, 26.0, 23.0, 22.0, 23.0, 15.0, 13.0, 8.0, 5.0, 2.0, 8.0, 3.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.8833327293396, -4.73965311050415, -4.595973014831543, -4.452293395996094, -4.308613300323486, -4.164933681488037, -4.02125358581543, -3.8775739669799805, -3.733893871307373, -3.5902140140533447, -3.4465341567993164, -3.302854299545288, -3.1591744422912598, -3.0154945850372314, -2.871814727783203, -2.728135108947754, -2.5844552516937256, -2.4407753944396973, -2.297095537185669, -2.1534156799316406, -2.0097358226776123, -1.866055965423584, -1.7223762273788452, -1.578696370124817, -1.4350165128707886, -1.2913366556167603, -1.147656798362732, -1.0039770603179932, -0.8602971434593201, -0.7166172862052917, -0.5729374885559082, -0.4292576313018799, -0.28557777404785156, -0.14189793169498444, 0.0017819106578826904, 0.14546173810958862, 0.28914159536361694, 0.43282145261764526, 0.5765012502670288, 0.7201811075210571, 0.8638609647750854, 1.0075408220291138, 1.151220679283142, 1.2949004173278809, 1.4385802745819092, 1.5822601318359375, 1.7259399890899658, 1.8696198463439941, 2.0132997035980225, 2.156979560852051, 2.300659418106079, 2.4443392753601074, 2.5880191326141357, 2.731698989868164, 2.8753786087036133, 3.0190587043762207, 3.16273832321167, 3.3064181804656982, 3.4500980377197266, 3.593777894973755, 3.737457752227783, 3.8811376094818115, 4.02481746673584, 4.168497085571289, 4.3121771812438965]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 19.0, 19.0, 31.0, 57.0, 88.0, 145.0, 243.0, 417.0, 615.0, 1053.0, 1786.0, 3168.0, 5477.0, 10107.0, 19417.0, 38508.0, 79444.0, 171402.0, 320994.0, 206477.0, 94331.0, 45532.0, 22527.0, 11773.0, 6394.0, 3500.0, 2073.0, 1189.0, 670.0, 408.0, 261.0, 145.0, 97.0, 71.0, 31.0, 23.0, 20.0, 12.0, 12.0, 7.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.65234375, -4.50518798828125, -4.3580322265625, -4.21087646484375, -4.063720703125, -3.91656494140625, -3.7694091796875, -3.62225341796875, -3.47509765625, -3.32794189453125, -3.1807861328125, -3.03363037109375, -2.886474609375, -2.73931884765625, -2.5921630859375, -2.44500732421875, -2.2978515625, -2.15069580078125, -2.0035400390625, -1.85638427734375, -1.709228515625, -1.56207275390625, -1.4149169921875, -1.26776123046875, -1.12060546875, -0.97344970703125, -0.8262939453125, -0.67913818359375, -0.531982421875, -0.38482666015625, -0.2376708984375, -0.09051513671875, 0.056640625, 0.20379638671875, 0.3509521484375, 0.49810791015625, 0.645263671875, 0.79241943359375, 0.9395751953125, 1.08673095703125, 1.23388671875, 1.38104248046875, 1.5281982421875, 1.67535400390625, 1.822509765625, 1.96966552734375, 2.1168212890625, 2.26397705078125, 2.4111328125, 2.55828857421875, 2.7054443359375, 2.85260009765625, 2.999755859375, 3.14691162109375, 3.2940673828125, 3.44122314453125, 3.58837890625, 3.73553466796875, 3.8826904296875, 4.02984619140625, 4.177001953125, 4.32415771484375, 4.4713134765625, 4.61846923828125, 4.765625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 5.0, 6.0, 7.0, 15.0, 13.0, 20.0, 21.0, 24.0, 27.0, 29.0, 35.0, 32.0, 31.0, 36.0, 48.0, 37.0, 43.0, 52.0, 43.0, 42.0, 43.0, 42.0, 38.0, 37.0, 33.0, 36.0, 25.0, 25.0, 25.0, 23.0, 22.0, 22.0, 11.0, 10.0, 7.0, 8.0, 4.0, 8.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.21875, -3.124481201171875, -3.03021240234375, -2.935943603515625, -2.8416748046875, -2.747406005859375, -2.65313720703125, -2.558868408203125, -2.464599609375, -2.370330810546875, -2.27606201171875, -2.181793212890625, -2.0875244140625, -1.993255615234375, -1.89898681640625, -1.804718017578125, -1.71044921875, -1.616180419921875, -1.52191162109375, -1.427642822265625, -1.3333740234375, -1.239105224609375, -1.14483642578125, -1.050567626953125, -0.956298828125, -0.862030029296875, -0.76776123046875, -0.673492431640625, -0.5792236328125, -0.484954833984375, -0.39068603515625, -0.296417236328125, -0.2021484375, -0.107879638671875, -0.01361083984375, 0.080657958984375, 0.1749267578125, 0.269195556640625, 0.36346435546875, 0.457733154296875, 0.552001953125, 0.646270751953125, 0.74053955078125, 0.834808349609375, 0.9290771484375, 1.023345947265625, 1.11761474609375, 1.211883544921875, 1.30615234375, 1.400421142578125, 1.49468994140625, 1.588958740234375, 1.6832275390625, 1.777496337890625, 1.87176513671875, 1.966033935546875, 2.060302734375, 2.154571533203125, 2.24884033203125, 2.343109130859375, 2.4373779296875, 2.531646728515625, 2.62591552734375, 2.720184326171875, 2.814453125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 5.0, 9.0, 10.0, 16.0, 18.0, 29.0, 37.0, 56.0, 102.0, 130.0, 186.0, 294.0, 472.0, 779.0, 1280.0, 2072.0, 3265.0, 5380.0, 9186.0, 16323.0, 30501.0, 64404.0, 165903.0, 420864.0, 184443.0, 69432.0, 32385.0, 16938.0, 9613.0, 5463.0, 3370.0, 2075.0, 1274.0, 810.0, 499.0, 327.0, 192.0, 116.0, 97.0, 67.0, 41.0, 28.0, 28.0, 13.0, 9.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.14886474609375, -3.0457763671875, -2.94268798828125, -2.839599609375, -2.73651123046875, -2.6334228515625, -2.53033447265625, -2.42724609375, -2.32415771484375, -2.2210693359375, -2.11798095703125, -2.014892578125, -1.91180419921875, -1.8087158203125, -1.70562744140625, -1.6025390625, -1.49945068359375, -1.3963623046875, -1.29327392578125, -1.190185546875, -1.08709716796875, -0.9840087890625, -0.88092041015625, -0.77783203125, -0.67474365234375, -0.5716552734375, -0.46856689453125, -0.365478515625, -0.26239013671875, -0.1593017578125, -0.05621337890625, 0.046875, 0.14996337890625, 0.2530517578125, 0.35614013671875, 0.459228515625, 0.56231689453125, 0.6654052734375, 0.76849365234375, 0.87158203125, 0.97467041015625, 1.0777587890625, 1.18084716796875, 1.283935546875, 1.38702392578125, 1.4901123046875, 1.59320068359375, 1.6962890625, 1.79937744140625, 1.9024658203125, 2.00555419921875, 2.108642578125, 2.21173095703125, 2.3148193359375, 2.41790771484375, 2.52099609375, 2.62408447265625, 2.7271728515625, 2.83026123046875, 2.933349609375, 3.03643798828125, 3.1395263671875, 3.24261474609375, 3.345703125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 7.0, 6.0, 14.0, 17.0, 19.0, 17.0, 16.0, 28.0, 19.0, 28.0, 25.0, 37.0, 35.0, 36.0, 34.0, 34.0, 54.0, 51.0, 36.0, 54.0, 37.0, 35.0, 42.0, 42.0, 33.0, 30.0, 26.0, 24.0, 23.0, 25.0, 27.0, 15.0, 9.0, 10.0, 8.0, 8.0, 8.0, 9.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.169921875, -2.099090576171875, -2.02825927734375, -1.957427978515625, -1.8865966796875, -1.815765380859375, -1.74493408203125, -1.674102783203125, -1.603271484375, -1.532440185546875, -1.46160888671875, -1.390777587890625, -1.3199462890625, -1.249114990234375, -1.17828369140625, -1.107452392578125, -1.03662109375, -0.965789794921875, -0.89495849609375, -0.824127197265625, -0.7532958984375, -0.682464599609375, -0.61163330078125, -0.540802001953125, -0.469970703125, -0.399139404296875, -0.32830810546875, -0.257476806640625, -0.1866455078125, -0.115814208984375, -0.04498291015625, 0.025848388671875, 0.0966796875, 0.167510986328125, 0.23834228515625, 0.309173583984375, 0.3800048828125, 0.450836181640625, 0.52166748046875, 0.592498779296875, 0.663330078125, 0.734161376953125, 0.80499267578125, 0.875823974609375, 0.9466552734375, 1.017486572265625, 1.08831787109375, 1.159149169921875, 1.22998046875, 1.300811767578125, 1.37164306640625, 1.442474365234375, 1.5133056640625, 1.584136962890625, 1.65496826171875, 1.725799560546875, 1.796630859375, 1.867462158203125, 1.93829345703125, 2.009124755859375, 2.0799560546875, 2.150787353515625, 2.22161865234375, 2.292449951171875, 2.36328125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 7.0, 6.0, 17.0, 12.0, 17.0, 20.0, 29.0, 35.0, 47.0, 66.0, 91.0, 126.0, 180.0, 241.0, 358.0, 537.0, 885.0, 1481.0, 2566.0, 5321.0, 13507.0, 64099.0, 876804.0, 57581.0, 12912.0, 5039.0, 2540.0, 1433.0, 818.0, 563.0, 331.0, 235.0, 171.0, 124.0, 90.0, 43.0, 61.0, 31.0, 30.0, 29.0, 13.0, 15.0, 12.0, 11.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.6953125, -4.546142578125, -4.39697265625, -4.247802734375, -4.0986328125, -3.949462890625, -3.80029296875, -3.651123046875, -3.501953125, -3.352783203125, -3.20361328125, -3.054443359375, -2.9052734375, -2.756103515625, -2.60693359375, -2.457763671875, -2.30859375, -2.159423828125, -2.01025390625, -1.861083984375, -1.7119140625, -1.562744140625, -1.41357421875, -1.264404296875, -1.115234375, -0.966064453125, -0.81689453125, -0.667724609375, -0.5185546875, -0.369384765625, -0.22021484375, -0.071044921875, 0.078125, 0.227294921875, 0.37646484375, 0.525634765625, 0.6748046875, 0.823974609375, 0.97314453125, 1.122314453125, 1.271484375, 1.420654296875, 1.56982421875, 1.718994140625, 1.8681640625, 2.017333984375, 2.16650390625, 2.315673828125, 2.46484375, 2.614013671875, 2.76318359375, 2.912353515625, 3.0615234375, 3.210693359375, 3.35986328125, 3.509033203125, 3.658203125, 3.807373046875, 3.95654296875, 4.105712890625, 4.2548828125, 4.404052734375, 4.55322265625, 4.702392578125, 4.8515625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 10.0, 5.0, 6.0, 17.0, 22.0, 38.0, 47.0, 97.0, 243.0, 254.0, 115.0, 60.0, 36.0, 12.0, 13.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021505355834960938, -0.0002043396234512329, -0.00019362568855285645, -0.00018291175365447998, -0.00017219781875610352, -0.00016148388385772705, -0.00015076994895935059, -0.00014005601406097412, -0.00012934207916259766, -0.00011862814426422119, -0.00010791420936584473, -9.720027446746826e-05, -8.64863395690918e-05, -7.577240467071533e-05, -6.505846977233887e-05, -5.43445348739624e-05, -4.363059997558594e-05, -3.291666507720947e-05, -2.2202730178833008e-05, -1.1488795280456543e-05, -7.748603820800781e-07, 9.939074516296387e-06, 2.065300941467285e-05, 3.1366944313049316e-05, 4.208087921142578e-05, 5.2794814109802246e-05, 6.350874900817871e-05, 7.422268390655518e-05, 8.493661880493164e-05, 9.56505537033081e-05, 0.00010636448860168457, 0.00011707842350006104, 0.0001277923583984375, 0.00013850629329681396, 0.00014922022819519043, 0.0001599341630935669, 0.00017064809799194336, 0.00018136203289031982, 0.0001920759677886963, 0.00020278990268707275, 0.00021350383758544922, 0.00022421777248382568, 0.00023493170738220215, 0.0002456456422805786, 0.0002563595771789551, 0.00026707351207733154, 0.000277787446975708, 0.00028850138187408447, 0.00029921531677246094, 0.0003099292516708374, 0.00032064318656921387, 0.00033135712146759033, 0.0003420710563659668, 0.00035278499126434326, 0.0003634989261627197, 0.0003742128610610962, 0.00038492679595947266, 0.0003956407308578491, 0.0004063546657562256, 0.00041706860065460205, 0.0004277825355529785, 0.000438496470451355, 0.00044921040534973145, 0.0004599243402481079, 0.0004706382751464844]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 1.0, 5.0, 4.0, 11.0, 5.0, 16.0, 23.0, 65.0, 516.0, 1041879.0, 5787.0, 106.0, 33.0, 26.0, 15.0, 11.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-76.875, -74.66015625, -72.4453125, -70.23046875, -68.015625, -65.80078125, -63.5859375, -61.37109375, -59.15625, -56.94140625, -54.7265625, -52.51171875, -50.296875, -48.08203125, -45.8671875, -43.65234375, -41.4375, -39.22265625, -37.0078125, -34.79296875, -32.578125, -30.36328125, -28.1484375, -25.93359375, -23.71875, -21.50390625, -19.2890625, -17.07421875, -14.859375, -12.64453125, -10.4296875, -8.21484375, -6.0, -3.78515625, -1.5703125, 0.64453125, 2.859375, 5.07421875, 7.2890625, 9.50390625, 11.71875, 13.93359375, 16.1484375, 18.36328125, 20.578125, 22.79296875, 25.0078125, 27.22265625, 29.4375, 31.65234375, 33.8671875, 36.08203125, 38.296875, 40.51171875, 42.7265625, 44.94140625, 47.15625, 49.37109375, 51.5859375, 53.80078125, 56.015625, 58.23046875, 60.4453125, 62.66015625, 64.875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 5.0, 1.0, 4.0, 7.0, 4.0, 8.0, 12.0, 19.0, 44.0, 73.0, 486.0, 157.0, 57.0, 33.0, 23.0, 12.0, 12.0, 7.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.822265625, -1.769866943359375, -1.71746826171875, -1.665069580078125, -1.6126708984375, -1.560272216796875, -1.50787353515625, -1.455474853515625, -1.403076171875, -1.350677490234375, -1.29827880859375, -1.245880126953125, -1.1934814453125, -1.141082763671875, -1.08868408203125, -1.036285400390625, -0.98388671875, -0.931488037109375, -0.87908935546875, -0.826690673828125, -0.7742919921875, -0.721893310546875, -0.66949462890625, -0.617095947265625, -0.564697265625, -0.512298583984375, -0.45989990234375, -0.407501220703125, -0.3551025390625, -0.302703857421875, -0.25030517578125, -0.197906494140625, -0.1455078125, -0.093109130859375, -0.04071044921875, 0.011688232421875, 0.0640869140625, 0.116485595703125, 0.16888427734375, 0.221282958984375, 0.273681640625, 0.326080322265625, 0.37847900390625, 0.430877685546875, 0.4832763671875, 0.535675048828125, 0.58807373046875, 0.640472412109375, 0.69287109375, 0.745269775390625, 0.79766845703125, 0.850067138671875, 0.9024658203125, 0.954864501953125, 1.00726318359375, 1.059661865234375, 1.112060546875, 1.164459228515625, 1.21685791015625, 1.269256591796875, 1.3216552734375, 1.374053955078125, 1.42645263671875, 1.478851318359375, 1.53125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 834.0, 179.0, 8.0], "bins": [-144.1192169189453, -141.78550720214844, -139.45179748535156, -137.1180877685547, -134.7843780517578, -132.45066833496094, -130.11695861816406, -127.78324890136719, -125.44953918457031, -123.11582946777344, -120.78211975097656, -118.44841003417969, -116.11470031738281, -113.78099060058594, -111.44728088378906, -109.11357116699219, -106.77985382080078, -104.4461441040039, -102.11243438720703, -99.77872467041016, -97.44501495361328, -95.1113052368164, -92.77759552001953, -90.44387817382812, -88.11016845703125, -85.77645874023438, -83.4427490234375, -81.10903930664062, -78.77532958984375, -76.44161987304688, -74.10791015625, -71.77420043945312, -69.44049835205078, -67.1067886352539, -64.77307891845703, -62.439369201660156, -60.10565948486328, -57.771949768066406, -55.438236236572266, -53.10452651977539, -50.77081298828125, -48.437103271484375, -46.1033935546875, -43.769683837890625, -41.43597412109375, -39.102264404296875, -36.768550872802734, -34.43484115600586, -32.101131439208984, -29.76742172241211, -27.433712005615234, -25.100000381469727, -22.76629066467285, -20.432580947875977, -18.09886932373047, -15.765159606933594, -13.431450843811035, -11.097740173339844, -8.764030456542969, -6.4303202629089355, -4.096610069274902, -1.7629003524780273, 0.5708103179931641, 2.9045209884643555, 5.2382307052612305]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 7.0, 8.0, 15.0, 17.0, 31.0, 27.0, 28.0, 27.0, 29.0, 49.0, 38.0, 57.0, 45.0, 68.0, 50.0, 51.0, 48.0, 56.0, 58.0, 44.0, 40.0, 48.0, 36.0, 26.0, 13.0, 24.0, 18.0, 12.0, 9.0, 8.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.593400478363037, -4.472352981567383, -4.35130500793457, -4.230257511138916, -4.1092095375061035, -3.988162040710449, -3.867114305496216, -3.7460665702819824, -3.625019073486328, -3.5039713382720947, -3.3829236030578613, -3.261876106262207, -3.1408283710479736, -3.0197806358337402, -2.898732900619507, -2.7776851654052734, -2.65663743019104, -2.5355896949768066, -2.4145419597625732, -2.29349422454834, -2.1724467277526855, -2.051398992538452, -1.9303512573242188, -1.8093035221099854, -1.6882559061050415, -1.567208170890808, -1.4461605548858643, -1.3251128196716309, -1.2040650844573975, -1.0830174684524536, -0.9619697332382202, -0.8409220576286316, -0.7198741436004639, -0.5988264679908752, -0.47777876257896423, -0.3567310571670532, -0.2356833815574646, -0.11463570594787598, 0.006412029266357422, 0.12745970487594604, 0.24850738048553467, 0.3695550560951233, 0.4906027615070343, 0.6116504669189453, 0.7326981425285339, 0.8537458181381226, 0.974793553352356, 1.0958411693572998, 1.2168889045715332, 1.3379366397857666, 1.4589842557907104, 1.5800319910049438, 1.7010796070098877, 1.822127342224121, 1.9431750774383545, 2.064222812652588, 2.185270309448242, 2.3063180446624756, 2.427365779876709, 2.5484132766723633, 2.6694610118865967, 2.79050874710083, 2.9115564823150635, 3.032604217529297, 3.1536519527435303]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 4.0, 4.0, 7.0, 5.0, 7.0, 7.0, 8.0, 10.0, 12.0, 15.0, 13.0, 19.0, 17.0, 28.0, 51.0, 68.0, 118.0, 271.0, 842.0, 3045.0, 12820.0, 68136.0, 656179.0, 262922.0, 33952.0, 7192.0, 1779.0, 519.0, 202.0, 106.0, 42.0, 39.0, 16.0, 19.0, 16.0, 10.0, 12.0, 12.0, 12.0, 7.0, 3.0, 5.0, 1.0, 2.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7421875, -10.3414306640625, -9.940673828125, -9.5399169921875, -9.13916015625, -8.7384033203125, -8.337646484375, -7.9368896484375, -7.5361328125, -7.1353759765625, -6.734619140625, -6.3338623046875, -5.93310546875, -5.5323486328125, -5.131591796875, -4.7308349609375, -4.330078125, -3.9293212890625, -3.528564453125, -3.1278076171875, -2.72705078125, -2.3262939453125, -1.925537109375, -1.5247802734375, -1.1240234375, -0.7232666015625, -0.322509765625, 0.0782470703125, 0.47900390625, 0.8797607421875, 1.280517578125, 1.6812744140625, 2.08203125, 2.4827880859375, 2.883544921875, 3.2843017578125, 3.68505859375, 4.0858154296875, 4.486572265625, 4.8873291015625, 5.2880859375, 5.6888427734375, 6.089599609375, 6.4903564453125, 6.89111328125, 7.2918701171875, 7.692626953125, 8.0933837890625, 8.494140625, 8.8948974609375, 9.295654296875, 9.6964111328125, 10.09716796875, 10.4979248046875, 10.898681640625, 11.2994384765625, 11.7001953125, 12.1009521484375, 12.501708984375, 12.9024658203125, 13.30322265625, 13.7039794921875, 14.104736328125, 14.5054931640625, 14.90625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 12.0, 13.0, 31.0, 45.0, 64.0, 79.0, 92.0, 104.0, 104.0, 119.0, 114.0, 87.0, 49.0, 35.0, 33.0, 13.0, 9.0, 3.0, 3.0, 1.0, 2.0], "bins": [-8.375, -8.21197509765625, -8.0489501953125, -7.88592529296875, -7.722900390625, -7.55987548828125, -7.3968505859375, -7.23382568359375, -7.07080078125, -6.90777587890625, -6.7447509765625, -6.58172607421875, -6.418701171875, -6.25567626953125, -6.0926513671875, -5.92962646484375, -5.7666015625, -5.60357666015625, -5.4405517578125, -5.27752685546875, -5.114501953125, -4.95147705078125, -4.7884521484375, -4.62542724609375, -4.46240234375, -4.29937744140625, -4.1363525390625, -3.97332763671875, -3.810302734375, -3.64727783203125, -3.4842529296875, -3.32122802734375, -3.158203125, -2.99517822265625, -2.8321533203125, -2.66912841796875, -2.506103515625, -2.34307861328125, -2.1800537109375, -2.01702880859375, -1.85400390625, -1.69097900390625, -1.5279541015625, -1.36492919921875, -1.201904296875, -1.03887939453125, -0.8758544921875, -0.71282958984375, -0.5498046875, -0.38677978515625, -0.2237548828125, -0.06072998046875, 0.102294921875, 0.26531982421875, 0.4283447265625, 0.59136962890625, 0.75439453125, 0.91741943359375, 1.0804443359375, 1.24346923828125, 1.406494140625, 1.56951904296875, 1.7325439453125, 1.89556884765625, 2.05859375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 10.0, 2.0, 4.0, 12.0, 9.0, 11.0, 26.0, 18.0, 34.0, 32.0, 39.0, 44.0, 57.0, 57.0, 199.0, 11342.0, 1022123.0, 13960.0, 208.0, 49.0, 54.0, 47.0, 43.0, 38.0, 34.0, 22.0, 19.0, 12.0, 9.0, 13.0, 13.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-43.21875, -41.966796875, -40.71484375, -39.462890625, -38.2109375, -36.958984375, -35.70703125, -34.455078125, -33.203125, -31.951171875, -30.69921875, -29.447265625, -28.1953125, -26.943359375, -25.69140625, -24.439453125, -23.1875, -21.935546875, -20.68359375, -19.431640625, -18.1796875, -16.927734375, -15.67578125, -14.423828125, -13.171875, -11.919921875, -10.66796875, -9.416015625, -8.1640625, -6.912109375, -5.66015625, -4.408203125, -3.15625, -1.904296875, -0.65234375, 0.599609375, 1.8515625, 3.103515625, 4.35546875, 5.607421875, 6.859375, 8.111328125, 9.36328125, 10.615234375, 11.8671875, 13.119140625, 14.37109375, 15.623046875, 16.875, 18.126953125, 19.37890625, 20.630859375, 21.8828125, 23.134765625, 24.38671875, 25.638671875, 26.890625, 28.142578125, 29.39453125, 30.646484375, 31.8984375, 33.150390625, 34.40234375, 35.654296875, 36.90625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 6.0, 6.0, 15.0, 18.0, 21.0, 23.0, 26.0, 37.0, 39.0, 48.0, 52.0, 51.0, 52.0, 60.0, 49.0, 62.0, 48.0, 50.0, 51.0, 50.0, 36.0, 44.0, 32.0, 20.0, 25.0, 12.0, 14.0, 12.0, 7.0, 10.0, 2.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.359375, -3.259429931640625, -3.15948486328125, -3.059539794921875, -2.9595947265625, -2.859649658203125, -2.75970458984375, -2.659759521484375, -2.559814453125, -2.459869384765625, -2.35992431640625, -2.259979248046875, -2.1600341796875, -2.060089111328125, -1.96014404296875, -1.860198974609375, -1.76025390625, -1.660308837890625, -1.56036376953125, -1.460418701171875, -1.3604736328125, -1.260528564453125, -1.16058349609375, -1.060638427734375, -0.960693359375, -0.860748291015625, -0.76080322265625, -0.660858154296875, -0.5609130859375, -0.460968017578125, -0.36102294921875, -0.261077880859375, -0.1611328125, -0.061187744140625, 0.03875732421875, 0.138702392578125, 0.2386474609375, 0.338592529296875, 0.43853759765625, 0.538482666015625, 0.638427734375, 0.738372802734375, 0.83831787109375, 0.938262939453125, 1.0382080078125, 1.138153076171875, 1.23809814453125, 1.338043212890625, 1.43798828125, 1.537933349609375, 1.63787841796875, 1.737823486328125, 1.8377685546875, 1.937713623046875, 2.03765869140625, 2.137603759765625, 2.237548828125, 2.337493896484375, 2.43743896484375, 2.537384033203125, 2.6373291015625, 2.737274169921875, 2.83721923828125, 2.937164306640625, 3.037109375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 4.0, 8.0, 9.0, 15.0, 38.0, 66.0, 175.0, 509.0, 1583.0, 5914.0, 33873.0, 935139.0, 60018.0, 8207.0, 1992.0, 603.0, 216.0, 74.0, 39.0, 20.0, 11.0, 9.0, 6.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0771484375, -1.040771484375, -1.00439453125, -0.968017578125, -0.931640625, -0.895263671875, -0.85888671875, -0.822509765625, -0.7861328125, -0.749755859375, -0.71337890625, -0.677001953125, -0.640625, -0.604248046875, -0.56787109375, -0.531494140625, -0.4951171875, -0.458740234375, -0.42236328125, -0.385986328125, -0.349609375, -0.313232421875, -0.27685546875, -0.240478515625, -0.2041015625, -0.167724609375, -0.13134765625, -0.094970703125, -0.05859375, -0.022216796875, 0.01416015625, 0.050537109375, 0.0869140625, 0.123291015625, 0.15966796875, 0.196044921875, 0.232421875, 0.268798828125, 0.30517578125, 0.341552734375, 0.3779296875, 0.414306640625, 0.45068359375, 0.487060546875, 0.5234375, 0.559814453125, 0.59619140625, 0.632568359375, 0.6689453125, 0.705322265625, 0.74169921875, 0.778076171875, 0.814453125, 0.850830078125, 0.88720703125, 0.923583984375, 0.9599609375, 0.996337890625, 1.03271484375, 1.069091796875, 1.10546875, 1.141845703125, 1.17822265625, 1.214599609375, 1.2509765625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 10.0, 7.0, 6.0, 11.0, 11.0, 13.0, 21.0, 23.0, 35.0, 45.0, 74.0, 125.0, 153.0, 138.0, 86.0, 66.0, 39.0, 29.0, 17.0, 15.0, 10.0, 17.0, 10.0, 7.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.088878631591797e-05, -3.9599835872650146e-05, -3.8310885429382324e-05, -3.70219349861145e-05, -3.573298454284668e-05, -3.444403409957886e-05, -3.3155083656311035e-05, -3.186613321304321e-05, -3.057718276977539e-05, -2.928823232650757e-05, -2.7999281883239746e-05, -2.6710331439971924e-05, -2.54213809967041e-05, -2.413243055343628e-05, -2.2843480110168457e-05, -2.1554529666900635e-05, -2.0265579223632812e-05, -1.897662878036499e-05, -1.7687678337097168e-05, -1.6398727893829346e-05, -1.5109777450561523e-05, -1.3820827007293701e-05, -1.2531876564025879e-05, -1.1242926120758057e-05, -9.953975677490234e-06, -8.665025234222412e-06, -7.37607479095459e-06, -6.087124347686768e-06, -4.798173904418945e-06, -3.509223461151123e-06, -2.2202730178833008e-06, -9.313225746154785e-07, 3.5762786865234375e-07, 1.646578311920166e-06, 2.9355287551879883e-06, 4.2244791984558105e-06, 5.513429641723633e-06, 6.802380084991455e-06, 8.091330528259277e-06, 9.3802809715271e-06, 1.0669231414794922e-05, 1.1958181858062744e-05, 1.3247132301330566e-05, 1.4536082744598389e-05, 1.582503318786621e-05, 1.7113983631134033e-05, 1.8402934074401855e-05, 1.9691884517669678e-05, 2.09808349609375e-05, 2.2269785404205322e-05, 2.3558735847473145e-05, 2.4847686290740967e-05, 2.613663673400879e-05, 2.742558717727661e-05, 2.8714537620544434e-05, 3.0003488063812256e-05, 3.129243850708008e-05, 3.25813889503479e-05, 3.387033939361572e-05, 3.5159289836883545e-05, 3.644824028015137e-05, 3.773719072341919e-05, 3.902614116668701e-05, 4.0315091609954834e-05, 4.1604042053222656e-05]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 11.0, 25.0, 98.0, 587.0, 5785.0, 931371.0, 106656.0, 3468.0, 397.0, 75.0, 22.0, 9.0, 7.0, 4.0, 1.0, 6.0, 5.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.41796875, -2.3421630859375, -2.266357421875, -2.1905517578125, -2.11474609375, -2.0389404296875, -1.963134765625, -1.8873291015625, -1.8115234375, -1.7357177734375, -1.659912109375, -1.5841064453125, -1.50830078125, -1.4324951171875, -1.356689453125, -1.2808837890625, -1.205078125, -1.1292724609375, -1.053466796875, -0.9776611328125, -0.90185546875, -0.8260498046875, -0.750244140625, -0.6744384765625, -0.5986328125, -0.5228271484375, -0.447021484375, -0.3712158203125, -0.29541015625, -0.2196044921875, -0.143798828125, -0.0679931640625, 0.0078125, 0.0836181640625, 0.159423828125, 0.2352294921875, 0.31103515625, 0.3868408203125, 0.462646484375, 0.5384521484375, 0.6142578125, 0.6900634765625, 0.765869140625, 0.8416748046875, 0.91748046875, 0.9932861328125, 1.069091796875, 1.1448974609375, 1.220703125, 1.2965087890625, 1.372314453125, 1.4481201171875, 1.52392578125, 1.5997314453125, 1.675537109375, 1.7513427734375, 1.8271484375, 1.9029541015625, 1.978759765625, 2.0545654296875, 2.13037109375, 2.2061767578125, 2.281982421875, 2.3577880859375, 2.43359375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 7.0, 15.0, 13.0, 36.0, 72.0, 196.0, 356.0, 131.0, 49.0, 30.0, 14.0, 11.0, 9.0, 7.0, 2.0, 9.0, 7.0, 1.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2412109375, -0.2337512969970703, -0.22629165649414062, -0.21883201599121094, -0.21137237548828125, -0.20391273498535156, -0.19645309448242188, -0.1889934539794922, -0.1815338134765625, -0.1740741729736328, -0.16661453247070312, -0.15915489196777344, -0.15169525146484375, -0.14423561096191406, -0.13677597045898438, -0.1293163299560547, -0.121856689453125, -0.11439704895019531, -0.10693740844726562, -0.09947776794433594, -0.09201812744140625, -0.08455848693847656, -0.07709884643554688, -0.06963920593261719, -0.0621795654296875, -0.05471992492675781, -0.047260284423828125, -0.03980064392089844, -0.03234100341796875, -0.024881362915039062, -0.017421722412109375, -0.009962081909179688, -0.00250244140625, 0.0049571990966796875, 0.012416839599609375, 0.019876480102539062, 0.02733612060546875, 0.03479576110839844, 0.042255401611328125, 0.04971504211425781, 0.0571746826171875, 0.06463432312011719, 0.07209396362304688, 0.07955360412597656, 0.08701324462890625, 0.09447288513183594, 0.10193252563476562, 0.10939216613769531, 0.116851806640625, 0.12431144714355469, 0.13177108764648438, 0.13923072814941406, 0.14669036865234375, 0.15415000915527344, 0.16160964965820312, 0.1690692901611328, 0.1765289306640625, 0.1839885711669922, 0.19144821166992188, 0.19890785217285156, 0.20636749267578125, 0.21382713317871094, 0.22128677368164062, 0.2287464141845703, 0.2362060546875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 52.0, 965.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-114.47760009765625, -112.50828552246094, -110.53897094726562, -108.56966400146484, -106.60034942626953, -104.63103485107422, -102.6617202758789, -100.6924057006836, -98.72309875488281, -96.7537841796875, -94.78446960449219, -92.8151626586914, -90.8458480834961, -88.87653350830078, -86.90721893310547, -84.93790435791016, -82.96858978271484, -80.99927520751953, -79.02996063232422, -77.06065368652344, -75.09133911132812, -73.12202453613281, -71.1527099609375, -69.18339538574219, -67.21408081054688, -65.24476623535156, -63.275455474853516, -61.3061408996582, -59.336830139160156, -57.367515563964844, -55.39820098876953, -53.42888641357422, -51.4595832824707, -49.49026870727539, -47.520957946777344, -45.55164337158203, -43.58232879638672, -41.61301803588867, -39.64370346069336, -37.67439270019531, -35.705078125, -33.73576354980469, -31.76645278930664, -29.797138214111328, -27.82782554626465, -25.85851287841797, -23.889198303222656, -21.919885635375977, -19.950572967529297, -17.981260299682617, -16.011947631835938, -14.042633056640625, -12.073320388793945, -10.104007720947266, -8.13469409942627, -6.165380477905273, -4.196067810058594, -2.226754665374756, -0.25744152069091797, 1.71187162399292, 3.681184768676758, 5.6504974365234375, 7.619811058044434, 9.58912467956543, 11.55843734741211]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 4.0, 3.0, 6.0, 13.0, 12.0, 17.0, 20.0, 42.0, 29.0, 37.0, 47.0, 66.0, 63.0, 59.0, 74.0, 61.0, 79.0, 59.0, 63.0, 57.0, 49.0, 30.0, 32.0, 30.0, 16.0, 11.0, 12.0, 7.0, 5.0, 5.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.517223358154297, -4.395660877227783, -4.274098873138428, -4.152536392211914, -4.030974388122559, -3.909411907196045, -3.7878496646881104, -3.666287422180176, -3.544725179672241, -3.4231629371643066, -3.301600694656372, -3.1800384521484375, -3.058475971221924, -2.9369137287139893, -2.8153514862060547, -2.69378924369812, -2.5722270011901855, -2.450664758682251, -2.3291025161743164, -2.2075400352478027, -2.085977792739868, -1.9644155502319336, -1.842853307723999, -1.7212910652160645, -1.5997285842895508, -1.4781663417816162, -1.356603980064392, -1.2350417375564575, -1.113479495048523, -0.9919171929359436, -0.8703548908233643, -0.7487926483154297, -0.6272304058074951, -0.5056681036949158, -0.3841058611869812, -0.26254355907440186, -0.1409812867641449, -0.01941901445388794, 0.1021432876586914, 0.22370553016662598, 0.3452678322792053, 0.4668301045894623, 0.5883923768997192, 0.7099546790122986, 0.8315169811248779, 0.9530792236328125, 1.074641466140747, 1.1962037086486816, 1.3177660703659058, 1.4393283128738403, 1.5608906745910645, 1.682452917098999, 1.8040151596069336, 1.9255774021148682, 2.0471396446228027, 2.1687021255493164, 2.290264368057251, 2.4118266105651855, 2.53338885307312, 2.6549510955810547, 2.7765135765075684, 2.898075819015503, 3.0196380615234375, 3.141200304031372, 3.2627625465393066]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 3.0, 9.0, 7.0, 18.0, 27.0, 41.0, 74.0, 130.0, 205.0, 389.0, 765.0, 1767.0, 5573.0, 84155.0, 4026914.0, 64001.0, 7079.0, 1606.0, 728.0, 320.0, 205.0, 112.0, 68.0, 31.0, 23.0, 14.0, 8.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.94140625, -7.76287841796875, -7.5843505859375, -7.40582275390625, -7.227294921875, -7.04876708984375, -6.8702392578125, -6.69171142578125, -6.51318359375, -6.33465576171875, -6.1561279296875, -5.97760009765625, -5.799072265625, -5.62054443359375, -5.4420166015625, -5.26348876953125, -5.0849609375, -4.90643310546875, -4.7279052734375, -4.54937744140625, -4.370849609375, -4.19232177734375, -4.0137939453125, -3.83526611328125, -3.65673828125, -3.47821044921875, -3.2996826171875, -3.12115478515625, -2.942626953125, -2.76409912109375, -2.5855712890625, -2.40704345703125, -2.228515625, -2.04998779296875, -1.8714599609375, -1.69293212890625, -1.514404296875, -1.33587646484375, -1.1573486328125, -0.97882080078125, -0.80029296875, -0.62176513671875, -0.4432373046875, -0.26470947265625, -0.086181640625, 0.09234619140625, 0.2708740234375, 0.44940185546875, 0.6279296875, 0.80645751953125, 0.9849853515625, 1.16351318359375, 1.342041015625, 1.52056884765625, 1.6990966796875, 1.87762451171875, 2.05615234375, 2.23468017578125, 2.4132080078125, 2.59173583984375, 2.770263671875, 2.94879150390625, 3.1273193359375, 3.30584716796875, 3.484375]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 12.0, 19.0, 20.0, 36.0, 39.0, 48.0, 61.0, 75.0, 74.0, 67.0, 91.0, 78.0, 81.0, 73.0, 61.0, 42.0, 41.0, 22.0, 27.0, 7.0, 11.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.44921875, -2.3927154541015625, -2.336212158203125, -2.2797088623046875, -2.22320556640625, -2.1667022705078125, -2.110198974609375, -2.0536956787109375, -1.9971923828125, -1.9406890869140625, -1.884185791015625, -1.8276824951171875, -1.77117919921875, -1.7146759033203125, -1.658172607421875, -1.6016693115234375, -1.545166015625, -1.4886627197265625, -1.432159423828125, -1.3756561279296875, -1.31915283203125, -1.2626495361328125, -1.206146240234375, -1.1496429443359375, -1.0931396484375, -1.0366363525390625, -0.980133056640625, -0.9236297607421875, -0.86712646484375, -0.8106231689453125, -0.754119873046875, -0.6976165771484375, -0.64111328125, -0.5846099853515625, -0.528106689453125, -0.4716033935546875, -0.41510009765625, -0.3585968017578125, -0.302093505859375, -0.2455902099609375, -0.1890869140625, -0.1325836181640625, -0.076080322265625, -0.0195770263671875, 0.03692626953125, 0.0934295654296875, 0.149932861328125, 0.2064361572265625, 0.262939453125, 0.3194427490234375, 0.375946044921875, 0.4324493408203125, 0.48895263671875, 0.5454559326171875, 0.601959228515625, 0.6584625244140625, 0.7149658203125, 0.7714691162109375, 0.827972412109375, 0.8844757080078125, 0.94097900390625, 0.9974822998046875, 1.053985595703125, 1.1104888916015625, 1.1669921875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 3.0, 11.0, 11.0, 17.0, 53.0, 237.0, 1887.0, 4186975.0, 4580.0, 310.0, 64.0, 40.0, 17.0, 23.0, 10.0, 11.0, 9.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-40.8125, -39.876220703125, -38.93994140625, -38.003662109375, -37.0673828125, -36.131103515625, -35.19482421875, -34.258544921875, -33.322265625, -32.385986328125, -31.44970703125, -30.513427734375, -29.5771484375, -28.640869140625, -27.70458984375, -26.768310546875, -25.83203125, -24.895751953125, -23.95947265625, -23.023193359375, -22.0869140625, -21.150634765625, -20.21435546875, -19.278076171875, -18.341796875, -17.405517578125, -16.46923828125, -15.532958984375, -14.5966796875, -13.660400390625, -12.72412109375, -11.787841796875, -10.8515625, -9.915283203125, -8.97900390625, -8.042724609375, -7.1064453125, -6.170166015625, -5.23388671875, -4.297607421875, -3.361328125, -2.425048828125, -1.48876953125, -0.552490234375, 0.3837890625, 1.320068359375, 2.25634765625, 3.192626953125, 4.12890625, 5.065185546875, 6.00146484375, 6.937744140625, 7.8740234375, 8.810302734375, 9.74658203125, 10.682861328125, 11.619140625, 12.555419921875, 13.49169921875, 14.427978515625, 15.3642578125, 16.300537109375, 17.23681640625, 18.173095703125, 19.109375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 1.0, 4.0, 8.0, 5.0, 15.0, 14.0, 21.0, 46.0, 203.0, 662.0, 1436.0, 1019.0, 385.0, 95.0, 40.0, 28.0, 17.0, 11.0, 16.0, 12.0, 6.0, 5.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-1.2294921875, -1.200042724609375, -1.17059326171875, -1.141143798828125, -1.1116943359375, -1.082244873046875, -1.05279541015625, -1.023345947265625, -0.993896484375, -0.964447021484375, -0.93499755859375, -0.905548095703125, -0.8760986328125, -0.846649169921875, -0.81719970703125, -0.787750244140625, -0.75830078125, -0.728851318359375, -0.69940185546875, -0.669952392578125, -0.6405029296875, -0.611053466796875, -0.58160400390625, -0.552154541015625, -0.522705078125, -0.493255615234375, -0.46380615234375, -0.434356689453125, -0.4049072265625, -0.375457763671875, -0.34600830078125, -0.316558837890625, -0.287109375, -0.257659912109375, -0.22821044921875, -0.198760986328125, -0.1693115234375, -0.139862060546875, -0.11041259765625, -0.080963134765625, -0.051513671875, -0.022064208984375, 0.00738525390625, 0.036834716796875, 0.0662841796875, 0.095733642578125, 0.12518310546875, 0.154632568359375, 0.18408203125, 0.213531494140625, 0.24298095703125, 0.272430419921875, 0.3018798828125, 0.331329345703125, 0.36077880859375, 0.390228271484375, 0.419677734375, 0.449127197265625, 0.47857666015625, 0.508026123046875, 0.5374755859375, 0.566925048828125, 0.59637451171875, 0.625823974609375, 0.6552734375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 642.0, 379.0, 2.0], "bins": [-52.726383209228516, -51.87491989135742, -51.02345657348633, -50.171993255615234, -49.32052993774414, -48.46906661987305, -47.61760330200195, -46.76613998413086, -45.914676666259766, -45.06321334838867, -44.21175003051758, -43.360286712646484, -42.50882339477539, -41.6573600769043, -40.8058967590332, -39.95443344116211, -39.10297393798828, -38.25151062011719, -37.400047302246094, -36.548583984375, -35.697120666503906, -34.84565734863281, -33.99419403076172, -33.142730712890625, -32.29126739501953, -31.439804077148438, -30.588340759277344, -29.73687744140625, -28.885414123535156, -28.033950805664062, -27.18248748779297, -26.331024169921875, -25.47956085205078, -24.628097534179688, -23.776634216308594, -22.9251708984375, -22.073707580566406, -21.222244262695312, -20.37078094482422, -19.519317626953125, -18.66785430908203, -17.816390991210938, -16.964927673339844, -16.11346435546875, -15.262001037597656, -14.410537719726562, -13.559075355529785, -12.707612037658691, -11.856149673461914, -11.00468635559082, -10.153223037719727, -9.301759719848633, -8.450296401977539, -7.5988335609436035, -6.747370719909668, -5.895907402038574, -5.0444440841674805, -4.192980766296387, -3.341517686843872, -2.4900546073913574, -1.6385912895202637, -0.7871279716491699, 0.06433486938476562, 0.9157981872558594, 1.7672615051269531]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 8.0, 8.0, 12.0, 11.0, 23.0, 16.0, 29.0, 28.0, 25.0, 43.0, 55.0, 45.0, 54.0, 57.0, 52.0, 53.0, 62.0, 49.0, 58.0, 45.0, 47.0, 47.0, 38.0, 36.0, 22.0, 23.0, 15.0, 11.0, 11.0, 9.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5918127298355103, -1.5467690229415894, -1.501725196838379, -1.456681489944458, -1.411637783050537, -1.3665940761566162, -1.3215502500534058, -1.2765065431594849, -1.2314627170562744, -1.1864190101623535, -1.141375184059143, -1.0963314771652222, -1.0512877702713013, -1.0062439441680908, -0.9612002372741699, -0.916156530380249, -0.8711128234863281, -0.8260690569877625, -0.7810253500938416, -0.7359815835952759, -0.690937876701355, -0.6458941102027893, -0.6008503437042236, -0.5558066368103027, -0.5107628703117371, -0.4657191336154938, -0.4206753969192505, -0.3756316304206848, -0.33058789372444153, -0.28554415702819824, -0.24050039052963257, -0.19545665383338928, -0.15041303634643555, -0.10536929219961166, -0.06032554805278778, -0.0152817964553833, 0.029761940240859985, 0.07480567693710327, 0.11984944343566895, 0.16489318013191223, 0.20993691682815552, 0.2549806535243988, 0.3000243902206421, 0.34506815671920776, 0.39011189341545105, 0.43515563011169434, 0.48019939661026, 0.5252431631088257, 0.5702868700027466, 0.6153306365013123, 0.6603743433952332, 0.7054181098937988, 0.7504618167877197, 0.7955055832862854, 0.8405493497848511, 0.885593056678772, 0.9306368231773376, 0.9756805896759033, 1.0207242965698242, 1.0657680034637451, 1.1108118295669556, 1.1558555364608765, 1.200899362564087, 1.2459430694580078, 1.2909867763519287]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 9.0, 11.0, 10.0, 11.0, 18.0, 36.0, 41.0, 70.0, 127.0, 235.0, 498.0, 987.0, 2387.0, 5552.0, 13962.0, 39196.0, 140832.0, 581829.0, 186737.0, 47700.0, 16659.0, 6497.0, 2716.0, 1242.0, 564.0, 279.0, 137.0, 74.0, 41.0, 25.0, 16.0, 15.0, 8.0, 11.0, 8.0, 6.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.54296875, -2.46246337890625, -2.3819580078125, -2.30145263671875, -2.220947265625, -2.14044189453125, -2.0599365234375, -1.97943115234375, -1.89892578125, -1.81842041015625, -1.7379150390625, -1.65740966796875, -1.576904296875, -1.49639892578125, -1.4158935546875, -1.33538818359375, -1.2548828125, -1.17437744140625, -1.0938720703125, -1.01336669921875, -0.932861328125, -0.85235595703125, -0.7718505859375, -0.69134521484375, -0.61083984375, -0.53033447265625, -0.4498291015625, -0.36932373046875, -0.288818359375, -0.20831298828125, -0.1278076171875, -0.04730224609375, 0.033203125, 0.11370849609375, 0.1942138671875, 0.27471923828125, 0.355224609375, 0.43572998046875, 0.5162353515625, 0.59674072265625, 0.67724609375, 0.75775146484375, 0.8382568359375, 0.91876220703125, 0.999267578125, 1.07977294921875, 1.1602783203125, 1.24078369140625, 1.3212890625, 1.40179443359375, 1.4822998046875, 1.56280517578125, 1.643310546875, 1.72381591796875, 1.8043212890625, 1.88482666015625, 1.96533203125, 2.04583740234375, 2.1263427734375, 2.20684814453125, 2.287353515625, 2.36785888671875, 2.4483642578125, 2.52886962890625, 2.609375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 7.0, 5.0, 16.0, 10.0, 21.0, 31.0, 43.0, 43.0, 37.0, 42.0, 58.0, 53.0, 69.0, 64.0, 75.0, 68.0, 64.0, 41.0, 58.0, 45.0, 37.0, 31.0, 21.0, 16.0, 17.0, 5.0, 8.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.32421875, -1.2909164428710938, -1.2576141357421875, -1.2243118286132812, -1.191009521484375, -1.1577072143554688, -1.1244049072265625, -1.0911026000976562, -1.05780029296875, -1.0244979858398438, -0.9911956787109375, -0.9578933715820312, -0.924591064453125, -0.8912887573242188, -0.8579864501953125, -0.8246841430664062, -0.7913818359375, -0.7580795288085938, -0.7247772216796875, -0.6914749145507812, -0.658172607421875, -0.6248703002929688, -0.5915679931640625, -0.5582656860351562, -0.52496337890625, -0.49166107177734375, -0.4583587646484375, -0.42505645751953125, -0.391754150390625, -0.35845184326171875, -0.3251495361328125, -0.29184722900390625, -0.258544921875, -0.22524261474609375, -0.1919403076171875, -0.15863800048828125, -0.125335693359375, -0.09203338623046875, -0.0587310791015625, -0.02542877197265625, 0.00787353515625, 0.04117584228515625, 0.0744781494140625, 0.10778045654296875, 0.141082763671875, 0.17438507080078125, 0.2076873779296875, 0.24098968505859375, 0.2742919921875, 0.30759429931640625, 0.3408966064453125, 0.37419891357421875, 0.407501220703125, 0.44080352783203125, 0.4741058349609375, 0.5074081420898438, 0.54071044921875, 0.5740127563476562, 0.6073150634765625, 0.6406173706054688, 0.673919677734375, 0.7072219848632812, 0.7405242919921875, 0.7738265991210938, 0.80712890625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 5.0, 5.0, 9.0, 13.0, 23.0, 16.0, 28.0, 43.0, 57.0, 87.0, 132.0, 174.0, 233.0, 358.0, 501.0, 742.0, 1022.0, 1555.0, 2410.0, 3770.0, 5944.0, 10171.0, 18160.0, 35048.0, 82958.0, 360676.0, 361597.0, 82543.0, 35239.0, 17811.0, 10001.0, 5942.0, 3828.0, 2339.0, 1666.0, 1061.0, 726.0, 494.0, 343.0, 226.0, 174.0, 112.0, 73.0, 68.0, 54.0, 32.0, 27.0, 25.0, 10.0, 12.0, 6.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 3.0], "bins": [-1.2294921875, -1.191070556640625, -1.15264892578125, -1.114227294921875, -1.0758056640625, -1.037384033203125, -0.99896240234375, -0.960540771484375, -0.922119140625, -0.883697509765625, -0.84527587890625, -0.806854248046875, -0.7684326171875, -0.730010986328125, -0.69158935546875, -0.653167724609375, -0.61474609375, -0.576324462890625, -0.53790283203125, -0.499481201171875, -0.4610595703125, -0.422637939453125, -0.38421630859375, -0.345794677734375, -0.307373046875, -0.268951416015625, -0.23052978515625, -0.192108154296875, -0.1536865234375, -0.115264892578125, -0.07684326171875, -0.038421630859375, 0.0, 0.038421630859375, 0.07684326171875, 0.115264892578125, 0.1536865234375, 0.192108154296875, 0.23052978515625, 0.268951416015625, 0.307373046875, 0.345794677734375, 0.38421630859375, 0.422637939453125, 0.4610595703125, 0.499481201171875, 0.53790283203125, 0.576324462890625, 0.61474609375, 0.653167724609375, 0.69158935546875, 0.730010986328125, 0.7684326171875, 0.806854248046875, 0.84527587890625, 0.883697509765625, 0.922119140625, 0.960540771484375, 0.99896240234375, 1.037384033203125, 1.0758056640625, 1.114227294921875, 1.15264892578125, 1.191070556640625, 1.2294921875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 11.0, 11.0, 10.0, 10.0, 15.0, 25.0, 19.0, 25.0, 24.0, 35.0, 22.0, 31.0, 53.0, 39.0, 39.0, 40.0, 54.0, 42.0, 44.0, 44.0, 51.0, 35.0, 43.0, 32.0, 24.0, 24.0, 24.0, 30.0, 23.0, 23.0, 18.0, 6.0, 9.0, 6.0, 18.0, 7.0, 11.0, 2.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.53662109375, -0.519866943359375, -0.50311279296875, -0.486358642578125, -0.4696044921875, -0.452850341796875, -0.43609619140625, -0.419342041015625, -0.402587890625, -0.385833740234375, -0.36907958984375, -0.352325439453125, -0.3355712890625, -0.318817138671875, -0.30206298828125, -0.285308837890625, -0.2685546875, -0.251800537109375, -0.23504638671875, -0.218292236328125, -0.2015380859375, -0.184783935546875, -0.16802978515625, -0.151275634765625, -0.134521484375, -0.117767333984375, -0.10101318359375, -0.084259033203125, -0.0675048828125, -0.050750732421875, -0.03399658203125, -0.017242431640625, -0.00048828125, 0.016265869140625, 0.03302001953125, 0.049774169921875, 0.0665283203125, 0.083282470703125, 0.10003662109375, 0.116790771484375, 0.133544921875, 0.150299072265625, 0.16705322265625, 0.183807373046875, 0.2005615234375, 0.217315673828125, 0.23406982421875, 0.250823974609375, 0.267578125, 0.284332275390625, 0.30108642578125, 0.317840576171875, 0.3345947265625, 0.351348876953125, 0.36810302734375, 0.384857177734375, 0.401611328125, 0.418365478515625, 0.43511962890625, 0.451873779296875, 0.4686279296875, 0.485382080078125, 0.50213623046875, 0.518890380859375, 0.53564453125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 6.0, 13.0, 7.0, 12.0, 23.0, 16.0, 30.0, 51.0, 71.0, 84.0, 92.0, 160.0, 195.0, 312.0, 434.0, 673.0, 1001.0, 1742.0, 3180.0, 7749.0, 998978.0, 22752.0, 4708.0, 2321.0, 1365.0, 799.0, 497.0, 352.0, 278.0, 175.0, 114.0, 92.0, 60.0, 56.0, 46.0, 24.0, 22.0, 20.0, 12.0, 9.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.32421875, -1.28497314453125, -1.2457275390625, -1.20648193359375, -1.167236328125, -1.12799072265625, -1.0887451171875, -1.04949951171875, -1.01025390625, -0.97100830078125, -0.9317626953125, -0.89251708984375, -0.853271484375, -0.81402587890625, -0.7747802734375, -0.73553466796875, -0.6962890625, -0.65704345703125, -0.6177978515625, -0.57855224609375, -0.539306640625, -0.50006103515625, -0.4608154296875, -0.42156982421875, -0.38232421875, -0.34307861328125, -0.3038330078125, -0.26458740234375, -0.225341796875, -0.18609619140625, -0.1468505859375, -0.10760498046875, -0.068359375, -0.02911376953125, 0.0101318359375, 0.04937744140625, 0.088623046875, 0.12786865234375, 0.1671142578125, 0.20635986328125, 0.24560546875, 0.28485107421875, 0.3240966796875, 0.36334228515625, 0.402587890625, 0.44183349609375, 0.4810791015625, 0.52032470703125, 0.5595703125, 0.59881591796875, 0.6380615234375, 0.67730712890625, 0.716552734375, 0.75579833984375, 0.7950439453125, 0.83428955078125, 0.87353515625, 0.91278076171875, 0.9520263671875, 0.99127197265625, 1.030517578125, 1.06976318359375, 1.1090087890625, 1.14825439453125, 1.1875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 14.0, 68.0, 594.0, 269.0, 22.0, 6.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001232624053955078, -0.00011761859059333801, -0.00011197477579116821, -0.00010633096098899841, -0.00010068714618682861, -9.504333138465881e-05, -8.939951658248901e-05, -8.375570178031921e-05, -7.811188697814941e-05, -7.246807217597961e-05, -6.682425737380981e-05, -6.118044257164001e-05, -5.5536627769470215e-05, -4.9892812967300415e-05, -4.4248998165130615e-05, -3.8605183362960815e-05, -3.2961368560791016e-05, -2.7317553758621216e-05, -2.1673738956451416e-05, -1.6029924154281616e-05, -1.0386109352111816e-05, -4.742294549942017e-06, 9.015202522277832e-07, 6.545335054397583e-06, 1.2189149856567383e-05, 1.7832964658737183e-05, 2.3476779460906982e-05, 2.9120594263076782e-05, 3.476440906524658e-05, 4.040822386741638e-05, 4.605203866958618e-05, 5.169585347175598e-05, 5.733966827392578e-05, 6.298348307609558e-05, 6.862729787826538e-05, 7.427111268043518e-05, 7.991492748260498e-05, 8.555874228477478e-05, 9.120255708694458e-05, 9.684637188911438e-05, 0.00010249018669128418, 0.00010813400149345398, 0.00011377781629562378, 0.00011942163109779358, 0.00012506544589996338, 0.00013070926070213318, 0.00013635307550430298, 0.00014199689030647278, 0.00014764070510864258, 0.00015328451991081238, 0.00015892833471298218, 0.00016457214951515198, 0.00017021596431732178, 0.00017585977911949158, 0.00018150359392166138, 0.00018714740872383118, 0.00019279122352600098, 0.00019843503832817078, 0.00020407885313034058, 0.00020972266793251038, 0.00021536648273468018, 0.00022101029753684998, 0.00022665411233901978, 0.00023229792714118958, 0.00023794174194335938]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 10.0, 15.0, 17.0, 189.0, 1040232.0, 7993.0, 27.0, 18.0, 10.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.25, -14.799072265625, -14.34814453125, -13.897216796875, -13.4462890625, -12.995361328125, -12.54443359375, -12.093505859375, -11.642578125, -11.191650390625, -10.74072265625, -10.289794921875, -9.8388671875, -9.387939453125, -8.93701171875, -8.486083984375, -8.03515625, -7.584228515625, -7.13330078125, -6.682373046875, -6.2314453125, -5.780517578125, -5.32958984375, -4.878662109375, -4.427734375, -3.976806640625, -3.52587890625, -3.074951171875, -2.6240234375, -2.173095703125, -1.72216796875, -1.271240234375, -0.8203125, -0.369384765625, 0.08154296875, 0.532470703125, 0.9833984375, 1.434326171875, 1.88525390625, 2.336181640625, 2.787109375, 3.238037109375, 3.68896484375, 4.139892578125, 4.5908203125, 5.041748046875, 5.49267578125, 5.943603515625, 6.39453125, 6.845458984375, 7.29638671875, 7.747314453125, 8.1982421875, 8.649169921875, 9.10009765625, 9.551025390625, 10.001953125, 10.452880859375, 10.90380859375, 11.354736328125, 11.8056640625, 12.256591796875, 12.70751953125, 13.158447265625, 13.609375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 466.0, 498.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.352294921875, -0.34194183349609375, -0.3315887451171875, -0.32123565673828125, -0.310882568359375, -0.30052947998046875, -0.2901763916015625, -0.27982330322265625, -0.26947021484375, -0.25911712646484375, -0.2487640380859375, -0.23841094970703125, -0.228057861328125, -0.21770477294921875, -0.2073516845703125, -0.19699859619140625, -0.1866455078125, -0.17629241943359375, -0.1659393310546875, -0.15558624267578125, -0.145233154296875, -0.13488006591796875, -0.1245269775390625, -0.11417388916015625, -0.10382080078125, -0.09346771240234375, -0.0831146240234375, -0.07276153564453125, -0.062408447265625, -0.05205535888671875, -0.0417022705078125, -0.03134918212890625, -0.02099609375, -0.01064300537109375, -0.0002899169921875, 0.01006317138671875, 0.020416259765625, 0.03076934814453125, 0.0411224365234375, 0.05147552490234375, 0.06182861328125, 0.07218170166015625, 0.0825347900390625, 0.09288787841796875, 0.103240966796875, 0.11359405517578125, 0.1239471435546875, 0.13430023193359375, 0.1446533203125, 0.15500640869140625, 0.1653594970703125, 0.17571258544921875, 0.186065673828125, 0.19641876220703125, 0.2067718505859375, 0.21712493896484375, 0.22747802734375, 0.23783111572265625, 0.2481842041015625, 0.25853729248046875, 0.268890380859375, 0.27924346923828125, 0.2895965576171875, 0.29994964599609375, 0.310302734375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 926.0, 86.0, 4.0, 0.0, 1.0], "bins": [-33.86361312866211, -33.295162200927734, -32.726715087890625, -32.15826416015625, -31.589813232421875, -31.021364212036133, -30.452913284301758, -29.884464263916016, -29.31601333618164, -28.7475643157959, -28.179113388061523, -27.61066436767578, -27.042213439941406, -26.473764419555664, -25.90531349182129, -25.336864471435547, -24.768413543701172, -24.19996452331543, -23.631513595581055, -23.063064575195312, -22.494613647460938, -21.926164627075195, -21.35771369934082, -20.789264678955078, -20.220815658569336, -19.652366638183594, -19.08391571044922, -18.515466690063477, -17.9470157623291, -17.37856674194336, -16.810115814208984, -16.241666793823242, -15.67321491241455, -15.104764938354492, -14.536314964294434, -13.967864990234375, -13.399415016174316, -12.830965042114258, -12.262516021728516, -11.69406509399414, -11.125616073608398, -10.55716609954834, -9.988716125488281, -9.420266151428223, -8.851816177368164, -8.283366203308105, -7.714916706085205, -7.1464667320251465, -6.57801628112793, -6.009566307067871, -5.4411163330078125, -4.872666358947754, -4.304216384887695, -3.735766649246216, -3.1673169136047363, -2.5988669395446777, -2.030416965484619, -1.4619669914245605, -0.8935171365737915, -0.32506728172302246, 0.24338269233703613, 0.8118326663970947, 1.3802824020385742, 1.9487323760986328, 2.5171823501586914]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 9.0, 8.0, 11.0, 17.0, 14.0, 28.0, 19.0, 29.0, 36.0, 48.0, 53.0, 49.0, 56.0, 52.0, 56.0, 70.0, 67.0, 49.0, 50.0, 49.0, 45.0, 33.0, 34.0, 25.0, 28.0, 22.0, 12.0, 10.0, 3.0, 10.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.011085033416748, -0.9812911748886108, -0.9514973163604736, -0.9217035174369812, -0.891909658908844, -0.8621158003807068, -0.8323220014572144, -0.8025281429290771, -0.7727342844009399, -0.7429404258728027, -0.7131465673446655, -0.6833527684211731, -0.6535589098930359, -0.6237650513648987, -0.5939712524414062, -0.564177393913269, -0.5343835353851318, -0.5045896768569946, -0.4747958481311798, -0.445002019405365, -0.4152081608772278, -0.3854143023490906, -0.35562047362327576, -0.32582664489746094, -0.29603278636932373, -0.2662389278411865, -0.2364450991153717, -0.2066512554883957, -0.17685741186141968, -0.14706356823444366, -0.11726972460746765, -0.08747588098049164, -0.057682037353515625, -0.027888193726539612, 0.0019056499004364014, 0.031699493527412415, 0.06149333715438843, 0.09128718078136444, 0.12108102440834045, 0.15087486803531647, 0.18066871166229248, 0.2104625552892685, 0.2402563989162445, 0.2700502276420593, 0.29984408617019653, 0.32963794469833374, 0.35943177342414856, 0.3892256021499634, 0.4190194606781006, 0.4488133192062378, 0.4786071479320526, 0.5084009766578674, 0.5381948351860046, 0.5679886937141418, 0.5977824926376343, 0.6275763511657715, 0.6573702096939087, 0.6871640682220459, 0.7169579267501831, 0.7467517256736755, 0.7765455842018127, 0.80633944272995, 0.8361332416534424, 0.8659271001815796, 0.8957209587097168]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 5.0, 7.0, 6.0, 9.0, 4.0, 12.0, 10.0, 17.0, 15.0, 21.0, 25.0, 27.0, 30.0, 41.0, 63.0, 144.0, 424.0, 1744.0, 9985.0, 70983.0, 762520.0, 176866.0, 20925.0, 3395.0, 708.0, 222.0, 96.0, 53.0, 34.0, 21.0, 28.0, 22.0, 18.0, 15.0, 10.0, 14.0, 5.0, 12.0, 8.0, 5.0, 5.0, 1.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.537109375, -3.393890380859375, -3.25067138671875, -3.107452392578125, -2.9642333984375, -2.821014404296875, -2.67779541015625, -2.534576416015625, -2.391357421875, -2.248138427734375, -2.10491943359375, -1.961700439453125, -1.8184814453125, -1.675262451171875, -1.53204345703125, -1.388824462890625, -1.24560546875, -1.102386474609375, -0.95916748046875, -0.815948486328125, -0.6727294921875, -0.529510498046875, -0.38629150390625, -0.243072509765625, -0.099853515625, 0.043365478515625, 0.18658447265625, 0.329803466796875, 0.4730224609375, 0.616241455078125, 0.75946044921875, 0.902679443359375, 1.0458984375, 1.189117431640625, 1.33233642578125, 1.475555419921875, 1.6187744140625, 1.761993408203125, 1.90521240234375, 2.048431396484375, 2.191650390625, 2.334869384765625, 2.47808837890625, 2.621307373046875, 2.7645263671875, 2.907745361328125, 3.05096435546875, 3.194183349609375, 3.33740234375, 3.480621337890625, 3.62384033203125, 3.767059326171875, 3.9102783203125, 4.053497314453125, 4.19671630859375, 4.339935302734375, 4.483154296875, 4.626373291015625, 4.76959228515625, 4.912811279296875, 5.0560302734375, 5.199249267578125, 5.34246826171875, 5.485687255859375, 5.62890625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 9.0, 16.0, 28.0, 38.0, 60.0, 86.0, 99.0, 142.0, 137.0, 119.0, 91.0, 74.0, 51.0, 33.0, 15.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.97607421875, -0.9562263488769531, -0.9363784790039062, -0.9165306091308594, -0.8966827392578125, -0.8768348693847656, -0.8569869995117188, -0.8371391296386719, -0.817291259765625, -0.7974433898925781, -0.7775955200195312, -0.7577476501464844, -0.7378997802734375, -0.7180519104003906, -0.6982040405273438, -0.6783561706542969, -0.65850830078125, -0.6386604309082031, -0.6188125610351562, -0.5989646911621094, -0.5791168212890625, -0.5592689514160156, -0.5394210815429688, -0.5195732116699219, -0.499725341796875, -0.4798774719238281, -0.46002960205078125, -0.4401817321777344, -0.4203338623046875, -0.4004859924316406, -0.38063812255859375, -0.3607902526855469, -0.3409423828125, -0.3210945129394531, -0.30124664306640625, -0.2813987731933594, -0.2615509033203125, -0.24170303344726562, -0.22185516357421875, -0.20200729370117188, -0.182159423828125, -0.16231155395507812, -0.14246368408203125, -0.12261581420898438, -0.1027679443359375, -0.08292007446289062, -0.06307220458984375, -0.043224334716796875, -0.02337646484375, -0.003528594970703125, 0.01631927490234375, 0.036167144775390625, 0.0560150146484375, 0.07586288452148438, 0.09571075439453125, 0.11555862426757812, 0.135406494140625, 0.15525436401367188, 0.17510223388671875, 0.19495010375976562, 0.2147979736328125, 0.23464584350585938, 0.25449371337890625, 0.2743415832519531, 0.294189453125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 7.0, 13.0, 13.0, 15.0, 11.0, 24.0, 29.0, 25.0, 56.0, 93.0, 194.0, 458.0, 1443.0, 3923.0, 12094.0, 39511.0, 154122.0, 605245.0, 169090.0, 42666.0, 12780.0, 4252.0, 1414.0, 550.0, 222.0, 86.0, 42.0, 30.0, 20.0, 17.0, 23.0, 19.0, 10.0, 9.0, 11.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5869140625, -1.533172607421875, -1.47943115234375, -1.425689697265625, -1.3719482421875, -1.318206787109375, -1.26446533203125, -1.210723876953125, -1.156982421875, -1.103240966796875, -1.04949951171875, -0.995758056640625, -0.9420166015625, -0.888275146484375, -0.83453369140625, -0.780792236328125, -0.72705078125, -0.673309326171875, -0.61956787109375, -0.565826416015625, -0.5120849609375, -0.458343505859375, -0.40460205078125, -0.350860595703125, -0.297119140625, -0.243377685546875, -0.18963623046875, -0.135894775390625, -0.0821533203125, -0.028411865234375, 0.02532958984375, 0.079071044921875, 0.1328125, 0.186553955078125, 0.24029541015625, 0.294036865234375, 0.3477783203125, 0.401519775390625, 0.45526123046875, 0.509002685546875, 0.562744140625, 0.616485595703125, 0.67022705078125, 0.723968505859375, 0.7777099609375, 0.831451416015625, 0.88519287109375, 0.938934326171875, 0.99267578125, 1.046417236328125, 1.10015869140625, 1.153900146484375, 1.2076416015625, 1.261383056640625, 1.31512451171875, 1.368865966796875, 1.422607421875, 1.476348876953125, 1.53009033203125, 1.583831787109375, 1.6375732421875, 1.691314697265625, 1.74505615234375, 1.798797607421875, 1.8525390625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 1.0, 7.0, 8.0, 13.0, 15.0, 12.0, 14.0, 18.0, 24.0, 24.0, 23.0, 32.0, 40.0, 36.0, 37.0, 39.0, 36.0, 54.0, 42.0, 36.0, 36.0, 47.0, 41.0, 32.0, 39.0, 51.0, 41.0, 24.0, 30.0, 22.0, 17.0, 17.0, 23.0, 15.0, 7.0, 12.0, 11.0, 10.0, 5.0, 1.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2464599609375, -0.2381114959716797, -0.22976303100585938, -0.22141456604003906, -0.21306610107421875, -0.20471763610839844, -0.19636917114257812, -0.1880207061767578, -0.1796722412109375, -0.1713237762451172, -0.16297531127929688, -0.15462684631347656, -0.14627838134765625, -0.13792991638183594, -0.12958145141601562, -0.12123298645019531, -0.112884521484375, -0.10453605651855469, -0.09618759155273438, -0.08783912658691406, -0.07949066162109375, -0.07114219665527344, -0.06279373168945312, -0.05444526672363281, -0.0460968017578125, -0.03774833679199219, -0.029399871826171875, -0.021051406860351562, -0.01270294189453125, -0.0043544769287109375, 0.003993988037109375, 0.012342453002929688, 0.02069091796875, 0.029039382934570312, 0.037387847900390625, 0.04573631286621094, 0.05408477783203125, 0.06243324279785156, 0.07078170776367188, 0.07913017272949219, 0.0874786376953125, 0.09582710266113281, 0.10417556762695312, 0.11252403259277344, 0.12087249755859375, 0.12922096252441406, 0.13756942749023438, 0.1459178924560547, 0.154266357421875, 0.1626148223876953, 0.17096328735351562, 0.17931175231933594, 0.18766021728515625, 0.19600868225097656, 0.20435714721679688, 0.2127056121826172, 0.2210540771484375, 0.2294025421142578, 0.23775100708007812, 0.24609947204589844, 0.25444793701171875, 0.26279640197753906, 0.2711448669433594, 0.2794933319091797, 0.287841796875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 1.0, 4.0, 8.0, 11.0, 7.0, 14.0, 14.0, 27.0, 26.0, 51.0, 66.0, 104.0, 134.0, 204.0, 321.0, 498.0, 930.0, 1785.0, 3875.0, 10181.0, 38341.0, 491359.0, 445613.0, 37081.0, 9839.0, 3831.0, 1821.0, 930.0, 512.0, 314.0, 202.0, 127.0, 89.0, 55.0, 41.0, 36.0, 32.0, 18.0, 12.0, 12.0, 5.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.038787841796875, -0.0375361442565918, -0.036284446716308594, -0.03503274917602539, -0.03378105163574219, -0.032529354095458984, -0.03127765655517578, -0.030025959014892578, -0.028774261474609375, -0.027522563934326172, -0.02627086639404297, -0.025019168853759766, -0.023767471313476562, -0.02251577377319336, -0.021264076232910156, -0.020012378692626953, -0.01876068115234375, -0.017508983612060547, -0.016257286071777344, -0.01500558853149414, -0.013753890991210938, -0.012502193450927734, -0.011250495910644531, -0.009998798370361328, -0.008747100830078125, -0.007495403289794922, -0.006243705749511719, -0.004992008209228516, -0.0037403106689453125, -0.0024886131286621094, -0.0012369155883789062, 1.4781951904296875e-05, 0.0012664794921875, 0.002518177032470703, 0.0037698745727539062, 0.005021572113037109, 0.0062732696533203125, 0.007524967193603516, 0.008776664733886719, 0.010028362274169922, 0.011280059814453125, 0.012531757354736328, 0.013783454895019531, 0.015035152435302734, 0.016286849975585938, 0.01753854751586914, 0.018790245056152344, 0.020041942596435547, 0.02129364013671875, 0.022545337677001953, 0.023797035217285156, 0.02504873275756836, 0.026300430297851562, 0.027552127838134766, 0.02880382537841797, 0.030055522918701172, 0.031307220458984375, 0.03255891799926758, 0.03381061553955078, 0.035062313079833984, 0.03631401062011719, 0.03756570816040039, 0.038817405700683594, 0.0400691032409668, 0.04132080078125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 13.0, 21.0, 33.0, 47.0, 131.0, 260.0, 270.0, 105.0, 57.0, 24.0, 10.0, 9.0, 7.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4020671844482422e-05, -2.3387372493743896e-05, -2.275407314300537e-05, -2.2120773792266846e-05, -2.148747444152832e-05, -2.0854175090789795e-05, -2.022087574005127e-05, -1.9587576389312744e-05, -1.895427703857422e-05, -1.8320977687835693e-05, -1.7687678337097168e-05, -1.7054378986358643e-05, -1.6421079635620117e-05, -1.5787780284881592e-05, -1.5154480934143066e-05, -1.4521181583404541e-05, -1.3887882232666016e-05, -1.325458288192749e-05, -1.2621283531188965e-05, -1.198798418045044e-05, -1.1354684829711914e-05, -1.0721385478973389e-05, -1.0088086128234863e-05, -9.454786777496338e-06, -8.821487426757812e-06, -8.188188076019287e-06, -7.554888725280762e-06, -6.921589374542236e-06, -6.288290023803711e-06, -5.6549906730651855e-06, -5.02169132232666e-06, -4.388391971588135e-06, -3.7550926208496094e-06, -3.121793270111084e-06, -2.4884939193725586e-06, -1.8551945686340332e-06, -1.2218952178955078e-06, -5.885958671569824e-07, 4.470348358154297e-08, 6.780028343200684e-07, 1.3113021850585938e-06, 1.944601535797119e-06, 2.5779008865356445e-06, 3.21120023727417e-06, 3.844499588012695e-06, 4.477798938751221e-06, 5.111098289489746e-06, 5.7443976402282715e-06, 6.377696990966797e-06, 7.010996341705322e-06, 7.644295692443848e-06, 8.277595043182373e-06, 8.910894393920898e-06, 9.544193744659424e-06, 1.017749309539795e-05, 1.0810792446136475e-05, 1.1444091796875e-05, 1.2077391147613525e-05, 1.271069049835205e-05, 1.3343989849090576e-05, 1.3977289199829102e-05, 1.4610588550567627e-05, 1.5243887901306152e-05, 1.5877187252044678e-05, 1.6510486602783203e-05]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 4.0, 5.0, 3.0, 7.0, 16.0, 22.0, 33.0, 68.0, 113.0, 222.0, 396.0, 747.0, 1633.0, 4160.0, 16166.0, 120702.0, 796816.0, 87438.0, 13328.0, 3624.0, 1485.0, 702.0, 398.0, 205.0, 110.0, 66.0, 42.0, 19.0, 11.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033447265625, -0.032446861267089844, -0.03144645690917969, -0.03044605255126953, -0.029445648193359375, -0.02844524383544922, -0.027444839477539062, -0.026444435119628906, -0.02544403076171875, -0.024443626403808594, -0.023443222045898438, -0.02244281768798828, -0.021442413330078125, -0.02044200897216797, -0.019441604614257812, -0.018441200256347656, -0.0174407958984375, -0.016440391540527344, -0.015439987182617188, -0.014439582824707031, -0.013439178466796875, -0.012438774108886719, -0.011438369750976562, -0.010437965393066406, -0.00943756103515625, -0.008437156677246094, -0.0074367523193359375, -0.006436347961425781, -0.005435943603515625, -0.004435539245605469, -0.0034351348876953125, -0.0024347305297851562, -0.001434326171875, -0.00043392181396484375, 0.0005664825439453125, 0.0015668869018554688, 0.002567291259765625, 0.0035676956176757812, 0.0045680999755859375, 0.005568504333496094, 0.00656890869140625, 0.007569313049316406, 0.008569717407226562, 0.009570121765136719, 0.010570526123046875, 0.011570930480957031, 0.012571334838867188, 0.013571739196777344, 0.0145721435546875, 0.015572547912597656, 0.016572952270507812, 0.01757335662841797, 0.018573760986328125, 0.01957416534423828, 0.020574569702148438, 0.021574974060058594, 0.02257537841796875, 0.023575782775878906, 0.024576187133789062, 0.02557659149169922, 0.026576995849609375, 0.02757740020751953, 0.028577804565429688, 0.029578208923339844, 0.03057861328125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 4.0, 10.0, 13.0, 26.0, 37.0, 34.0, 52.0, 78.0, 92.0, 103.0, 137.0, 87.0, 88.0, 73.0, 47.0, 43.0, 25.0, 12.0, 5.0, 6.0, 10.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005672454833984375, -0.005479276180267334, -0.005286097526550293, -0.005092918872833252, -0.004899740219116211, -0.00470656156539917, -0.004513382911682129, -0.004320204257965088, -0.004127025604248047, -0.003933846950531006, -0.003740668296813965, -0.003547489643096924, -0.003354310989379883, -0.003161132335662842, -0.0029679536819458008, -0.0027747750282287598, -0.0025815963745117188, -0.0023884177207946777, -0.0021952390670776367, -0.0020020604133605957, -0.0018088817596435547, -0.0016157031059265137, -0.0014225244522094727, -0.0012293457984924316, -0.0010361671447753906, -0.0008429884910583496, -0.0006498098373413086, -0.0004566311836242676, -0.00026345252990722656, -7.027387619018555e-05, 0.00012290477752685547, 0.0003160834312438965, 0.0005092620849609375, 0.0007024407386779785, 0.0008956193923950195, 0.0010887980461120605, 0.0012819766998291016, 0.0014751553535461426, 0.0016683340072631836, 0.0018615126609802246, 0.0020546913146972656, 0.0022478699684143066, 0.0024410486221313477, 0.0026342272758483887, 0.0028274059295654297, 0.0030205845832824707, 0.0032137632369995117, 0.0034069418907165527, 0.0036001205444335938, 0.0037932991981506348, 0.003986477851867676, 0.004179656505584717, 0.004372835159301758, 0.004566013813018799, 0.00475919246673584, 0.004952371120452881, 0.005145549774169922, 0.005338728427886963, 0.005531907081604004, 0.005725085735321045, 0.005918264389038086, 0.006111443042755127, 0.006304621696472168, 0.006497800350189209, 0.00669097900390625]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 11.0, 27.0, 82.0, 291.0, 415.0, 111.0, 45.0, 21.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.668367862701416, -3.6005775928497314, -3.532787561416626, -3.4649972915649414, -3.397207260131836, -3.3294169902801514, -3.261626720428467, -3.1938366889953613, -3.1260464191436768, -3.058256149291992, -2.9904661178588867, -2.922675848007202, -2.8548858165740967, -2.787095546722412, -2.7193055152893066, -2.651515245437622, -2.5837249755859375, -2.515934705734253, -2.4481446743011475, -2.380354404449463, -2.3125643730163574, -2.244774103164673, -2.1769838333129883, -2.109193801879883, -2.0414037704467773, -1.9736136198043823, -1.9058234691619873, -1.8380331993103027, -1.7702430486679077, -1.7024528980255127, -1.6346627473831177, -1.5668725967407227, -1.499082326889038, -1.431292176246643, -1.363502025604248, -1.2957117557525635, -1.2279216051101685, -1.1601314544677734, -1.0923413038253784, -1.0245511531829834, -0.9567608833312988, -0.8889707326889038, -0.821180522441864, -0.753390371799469, -0.6856001615524292, -0.6178100109100342, -0.5500198602676392, -0.48222967982292175, -0.41443949937820435, -0.34664931893348694, -0.27885913848876953, -0.2110689878463745, -0.1432788074016571, -0.0754886269569397, -0.007698476314544678, 0.06009170413017273, 0.12788188457489014, 0.19567206501960754, 0.26346224546432495, 0.33125239610671997, 0.3990425765514374, 0.4668327569961548, 0.5346229076385498, 0.6024130582809448, 0.6702032685279846]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 11.0, 9.0, 17.0, 17.0, 20.0, 24.0, 39.0, 31.0, 51.0, 46.0, 45.0, 78.0, 54.0, 62.0, 40.0, 63.0, 51.0, 44.0, 59.0, 38.0, 31.0, 37.0, 30.0, 30.0, 21.0, 17.0, 17.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4048265516757965, -0.39003437757492065, -0.3752422332763672, -0.36045005917549133, -0.3456578850746155, -0.330865740776062, -0.31607356667518616, -0.3012813925743103, -0.28648924827575684, -0.271697074174881, -0.2569049298763275, -0.24211275577545166, -0.227320596575737, -0.21252843737602234, -0.19773626327514648, -0.18294410407543182, -0.16815194487571716, -0.1533597856760025, -0.13856762647628784, -0.12377545237541199, -0.10898329317569733, -0.09419113397598267, -0.07939896732568741, -0.06460680067539215, -0.04981464147567749, -0.03502247855067253, -0.020230315625667572, -0.005438152700662613, 0.009354010224342346, 0.024146169424057007, 0.038938336074352264, 0.05373050272464752, 0.06852269172668457, 0.08331485092639923, 0.09810701757669449, 0.11289918422698975, 0.1276913434267044, 0.14248350262641907, 0.15727567672729492, 0.17206783592700958, 0.18685999512672424, 0.2016521543264389, 0.21644431352615356, 0.23123648762702942, 0.24602864682674408, 0.26082080602645874, 0.2756129801273346, 0.29040515422821045, 0.3051972985267639, 0.31998947262763977, 0.33478161692619324, 0.3495737910270691, 0.36436593532562256, 0.3791581094264984, 0.39395028352737427, 0.40874242782592773, 0.4235346019268036, 0.43832677602767944, 0.4531189203262329, 0.46791109442710876, 0.4827032685279846, 0.4974954128265381, 0.5122875571250916, 0.5270797610282898, 0.5418719053268433]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 1.0, 6.0, 14.0, 5.0, 15.0, 22.0, 39.0, 50.0, 58.0, 82.0, 115.0, 173.0, 246.0, 308.0, 467.0, 701.0, 1024.0, 1502.0, 2343.0, 3908.0, 23436.0, 4098962.0, 48570.0, 4432.0, 2523.0, 1602.0, 1107.0, 751.0, 540.0, 391.0, 271.0, 177.0, 135.0, 116.0, 62.0, 39.0, 29.0, 22.0, 17.0, 7.0, 9.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1650390625, -1.1340179443359375, -1.102996826171875, -1.0719757080078125, -1.04095458984375, -1.0099334716796875, -0.978912353515625, -0.9478912353515625, -0.9168701171875, -0.8858489990234375, -0.854827880859375, -0.8238067626953125, -0.79278564453125, -0.7617645263671875, -0.730743408203125, -0.6997222900390625, -0.668701171875, -0.6376800537109375, -0.606658935546875, -0.5756378173828125, -0.54461669921875, -0.5135955810546875, -0.482574462890625, -0.4515533447265625, -0.4205322265625, -0.3895111083984375, -0.358489990234375, -0.3274688720703125, -0.29644775390625, -0.2654266357421875, -0.234405517578125, -0.2033843994140625, -0.17236328125, -0.1413421630859375, -0.110321044921875, -0.0792999267578125, -0.04827880859375, -0.0172576904296875, 0.013763427734375, 0.0447845458984375, 0.0758056640625, 0.1068267822265625, 0.137847900390625, 0.1688690185546875, 0.19989013671875, 0.2309112548828125, 0.261932373046875, 0.2929534912109375, 0.323974609375, 0.3549957275390625, 0.386016845703125, 0.4170379638671875, 0.44805908203125, 0.4790802001953125, 0.510101318359375, 0.5411224365234375, 0.5721435546875, 0.6031646728515625, 0.634185791015625, 0.6652069091796875, 0.69622802734375, 0.7272491455078125, 0.758270263671875, 0.7892913818359375, 0.8203125]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 9.0, 8.0, 8.0, 10.0, 5.0, 16.0, 18.0, 26.0, 31.0, 40.0, 42.0, 42.0, 47.0, 58.0, 64.0, 52.0, 53.0, 55.0, 55.0, 46.0, 44.0, 58.0, 36.0, 34.0, 28.0, 27.0, 20.0, 15.0, 20.0, 16.0, 8.0, 6.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.311767578125, -0.30367469787597656, -0.2955818176269531, -0.2874889373779297, -0.27939605712890625, -0.2713031768798828, -0.2632102966308594, -0.25511741638183594, -0.2470245361328125, -0.23893165588378906, -0.23083877563476562, -0.2227458953857422, -0.21465301513671875, -0.2065601348876953, -0.19846725463867188, -0.19037437438964844, -0.182281494140625, -0.17418861389160156, -0.16609573364257812, -0.1580028533935547, -0.14990997314453125, -0.1418170928955078, -0.13372421264648438, -0.12563133239746094, -0.1175384521484375, -0.10944557189941406, -0.10135269165039062, -0.09325981140136719, -0.08516693115234375, -0.07707405090332031, -0.06898117065429688, -0.06088829040527344, -0.05279541015625, -0.04470252990722656, -0.036609649658203125, -0.028516769409179688, -0.02042388916015625, -0.012331008911132812, -0.004238128662109375, 0.0038547515869140625, 0.0119476318359375, 0.020040512084960938, 0.028133392333984375, 0.03622627258300781, 0.04431915283203125, 0.05241203308105469, 0.060504913330078125, 0.06859779357910156, 0.076690673828125, 0.08478355407714844, 0.09287643432617188, 0.10096931457519531, 0.10906219482421875, 0.11715507507324219, 0.12524795532226562, 0.13334083557128906, 0.1414337158203125, 0.14952659606933594, 0.15761947631835938, 0.1657123565673828, 0.17380523681640625, 0.1818981170654297, 0.18999099731445312, 0.19808387756347656, 0.2061767578125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 3.0, 5.0, 9.0, 8.0, 16.0, 22.0, 36.0, 62.0, 105.0, 175.0, 277.0, 430.0, 885.0, 1636.0, 3736.0, 12004.0, 419534.0, 3728611.0, 17775.0, 4630.0, 1977.0, 986.0, 551.0, 292.0, 181.0, 125.0, 71.0, 45.0, 25.0, 23.0, 13.0, 8.0, 4.0, 8.0, 1.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89697265625, -0.8681411743164062, -0.8393096923828125, -0.8104782104492188, -0.781646728515625, -0.7528152465820312, -0.7239837646484375, -0.6951522827148438, -0.66632080078125, -0.6374893188476562, -0.6086578369140625, -0.5798263549804688, -0.550994873046875, -0.5221633911132812, -0.4933319091796875, -0.46450042724609375, -0.4356689453125, -0.40683746337890625, -0.3780059814453125, -0.34917449951171875, -0.320343017578125, -0.29151153564453125, -0.2626800537109375, -0.23384857177734375, -0.20501708984375, -0.17618560791015625, -0.1473541259765625, -0.11852264404296875, -0.089691162109375, -0.06085968017578125, -0.0320281982421875, -0.00319671630859375, 0.025634765625, 0.05446624755859375, 0.0832977294921875, 0.11212921142578125, 0.140960693359375, 0.16979217529296875, 0.1986236572265625, 0.22745513916015625, 0.25628662109375, 0.28511810302734375, 0.3139495849609375, 0.34278106689453125, 0.371612548828125, 0.40044403076171875, 0.4292755126953125, 0.45810699462890625, 0.4869384765625, 0.5157699584960938, 0.5446014404296875, 0.5734329223632812, 0.602264404296875, 0.6310958862304688, 0.6599273681640625, 0.6887588500976562, 0.71759033203125, 0.7464218139648438, 0.7752532958984375, 0.8040847778320312, 0.832916259765625, 0.8617477416992188, 0.8905792236328125, 0.9194107055664062, 0.9482421875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 13.0, 11.0, 21.0, 50.0, 210.0, 733.0, 2445.0, 394.0, 110.0, 32.0, 16.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1746826171875, -0.17011737823486328, -0.16555213928222656, -0.16098690032958984, -0.15642166137695312, -0.1518564224243164, -0.1472911834716797, -0.14272594451904297, -0.13816070556640625, -0.13359546661376953, -0.1290302276611328, -0.1244649887084961, -0.11989974975585938, -0.11533451080322266, -0.11076927185058594, -0.10620403289794922, -0.1016387939453125, -0.09707355499267578, -0.09250831604003906, -0.08794307708740234, -0.08337783813476562, -0.0788125991821289, -0.07424736022949219, -0.06968212127685547, -0.06511688232421875, -0.06055164337158203, -0.05598640441894531, -0.051421165466308594, -0.046855926513671875, -0.042290687561035156, -0.03772544860839844, -0.03316020965576172, -0.028594970703125, -0.02402973175048828, -0.019464492797851562, -0.014899253845214844, -0.010334014892578125, -0.005768775939941406, -0.0012035369873046875, 0.0033617019653320312, 0.00792694091796875, 0.012492179870605469, 0.017057418823242188, 0.021622657775878906, 0.026187896728515625, 0.030753135681152344, 0.03531837463378906, 0.03988361358642578, 0.0444488525390625, 0.04901409149169922, 0.05357933044433594, 0.058144569396972656, 0.06270980834960938, 0.0672750473022461, 0.07184028625488281, 0.07640552520751953, 0.08097076416015625, 0.08553600311279297, 0.09010124206542969, 0.0946664810180664, 0.09923171997070312, 0.10379695892333984, 0.10836219787597656, 0.11292743682861328, 0.11749267578125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 11.0, 11.0, 11.0, 27.0, 39.0, 81.0, 206.0, 328.0, 133.0, 78.0, 36.0, 19.0, 14.0, 9.0, 7.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0646729469299316, -1.0416688919067383, -1.018664836883545, -0.9956607818603516, -0.9726567268371582, -0.9496526122093201, -0.9266485571861267, -0.9036445021629333, -0.88064044713974, -0.8576363921165466, -0.8346323370933533, -0.8116282820701599, -0.7886241674423218, -0.7656201124191284, -0.7426160573959351, -0.7196120023727417, -0.6966079473495483, -0.673603892326355, -0.6505998373031616, -0.6275957822799683, -0.6045917272567749, -0.5815876126289368, -0.5585835576057434, -0.53557950258255, -0.5125754475593567, -0.48957139253616333, -0.46656733751296997, -0.4435632526874542, -0.42055919766426086, -0.3975551426410675, -0.37455105781555176, -0.3515470027923584, -0.32854294776916504, -0.3055388927459717, -0.2825348377227783, -0.2595307528972626, -0.2365266978740692, -0.21352264285087585, -0.1905185729265213, -0.16751450300216675, -0.1445104479789734, -0.12150638550519943, -0.09850232303142548, -0.07549826055765152, -0.052494198083877563, -0.029490135610103607, -0.006486073136329651, 0.016517996788024902, 0.03952205181121826, 0.06252611428499222, 0.08553017675876617, 0.10853423923254013, 0.1315383017063141, 0.15454235672950745, 0.177546426653862, 0.20055049657821655, 0.2235545516014099, 0.24655860662460327, 0.26956266164779663, 0.2925667464733124, 0.31557080149650574, 0.3385748565196991, 0.36157894134521484, 0.3845829963684082, 0.40758705139160156]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 2.0, 11.0, 5.0, 9.0, 12.0, 16.0, 21.0, 18.0, 8.0, 22.0, 23.0, 38.0, 37.0, 37.0, 34.0, 42.0, 43.0, 55.0, 46.0, 45.0, 34.0, 51.0, 44.0, 34.0, 27.0, 45.0, 34.0, 23.0, 31.0, 21.0, 30.0, 13.0, 12.0, 19.0, 11.0, 18.0, 7.0, 5.0, 1.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19936750829219818, -0.19320598244667053, -0.18704445660114288, -0.18088293075561523, -0.17472141981124878, -0.16855989396572113, -0.16239836812019348, -0.15623684227466583, -0.15007531642913818, -0.14391379058361053, -0.13775226473808289, -0.13159075379371643, -0.12542922794818878, -0.11926770210266113, -0.11310617625713348, -0.10694465041160583, -0.10078313201665878, -0.09462160617113113, -0.08846008777618408, -0.08229856193065643, -0.07613703608512878, -0.06997551023960114, -0.06381399184465408, -0.057652465999126434, -0.051490943878889084, -0.04532942175865173, -0.039167895913124084, -0.033006373792886734, -0.026844849810004234, -0.020683325827121735, -0.014521803706884384, -0.008360277861356735, -0.0021987557411193848, 0.003962767776101828, 0.01012429129332304, 0.016285814344882965, 0.022447338327765465, 0.028608862310647964, 0.034770384430885315, 0.040931910276412964, 0.047093432396650314, 0.053254954516887665, 0.059416480362415314, 0.06557799875736237, 0.07173952460289001, 0.07790105044841766, 0.08406257629394531, 0.09022410213947296, 0.09638562053442001, 0.10254714637994766, 0.10870866477489471, 0.11487019062042236, 0.12103171646595001, 0.12719324231147766, 0.13335475325584412, 0.13951629400253296, 0.14567780494689941, 0.15183933079242706, 0.1580008566379547, 0.16416236758232117, 0.17032389342784882, 0.17648541927337646, 0.1826469451189041, 0.18880847096443176, 0.1949699968099594]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 2.0, 3.0, 12.0, 14.0, 14.0, 20.0, 34.0, 54.0, 56.0, 80.0, 115.0, 158.0, 222.0, 278.0, 407.0, 490.0, 725.0, 1023.0, 1345.0, 2029.0, 2921.0, 4284.0, 6631.0, 10391.0, 17285.0, 30711.0, 60230.0, 139284.0, 371019.0, 216697.0, 82696.0, 40003.0, 21844.0, 12741.0, 8060.0, 5077.0, 3424.0, 2366.0, 1582.0, 1158.0, 837.0, 620.0, 449.0, 310.0, 203.0, 203.0, 131.0, 92.0, 69.0, 51.0, 38.0, 27.0, 16.0, 10.0, 13.0, 10.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.331298828125, -0.3208503723144531, -0.31040191650390625, -0.2999534606933594, -0.2895050048828125, -0.2790565490722656, -0.26860809326171875, -0.2581596374511719, -0.247711181640625, -0.23726272583007812, -0.22681427001953125, -0.21636581420898438, -0.2059173583984375, -0.19546890258789062, -0.18502044677734375, -0.17457199096679688, -0.16412353515625, -0.15367507934570312, -0.14322662353515625, -0.13277816772460938, -0.1223297119140625, -0.11188125610351562, -0.10143280029296875, -0.09098434448242188, -0.080535888671875, -0.07008743286132812, -0.05963897705078125, -0.049190521240234375, -0.0387420654296875, -0.028293609619140625, -0.01784515380859375, -0.007396697998046875, 0.0030517578125, 0.013500213623046875, 0.02394866943359375, 0.034397125244140625, 0.0448455810546875, 0.055294036865234375, 0.06574249267578125, 0.07619094848632812, 0.086639404296875, 0.09708786010742188, 0.10753631591796875, 0.11798477172851562, 0.1284332275390625, 0.13888168334960938, 0.14933013916015625, 0.15977859497070312, 0.17022705078125, 0.18067550659179688, 0.19112396240234375, 0.20157241821289062, 0.2120208740234375, 0.22246932983398438, 0.23291778564453125, 0.24336624145507812, 0.253814697265625, 0.2642631530761719, 0.27471160888671875, 0.2851600646972656, 0.2956085205078125, 0.3060569763183594, 0.31650543212890625, 0.3269538879394531, 0.33740234375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 5.0, 4.0, 6.0, 12.0, 7.0, 18.0, 16.0, 8.0, 20.0, 15.0, 24.0, 29.0, 34.0, 35.0, 33.0, 35.0, 48.0, 46.0, 37.0, 51.0, 47.0, 37.0, 30.0, 45.0, 35.0, 41.0, 27.0, 30.0, 29.0, 29.0, 26.0, 36.0, 13.0, 19.0, 8.0, 11.0, 15.0, 10.0, 3.0, 6.0, 2.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.162841796875, -0.1582183837890625, -0.153594970703125, -0.1489715576171875, -0.14434814453125, -0.1397247314453125, -0.135101318359375, -0.1304779052734375, -0.1258544921875, -0.1212310791015625, -0.116607666015625, -0.1119842529296875, -0.10736083984375, -0.1027374267578125, -0.098114013671875, -0.0934906005859375, -0.0888671875, -0.0842437744140625, -0.079620361328125, -0.0749969482421875, -0.07037353515625, -0.0657501220703125, -0.061126708984375, -0.0565032958984375, -0.0518798828125, -0.0472564697265625, -0.042633056640625, -0.0380096435546875, -0.03338623046875, -0.0287628173828125, -0.024139404296875, -0.0195159912109375, -0.014892578125, -0.0102691650390625, -0.005645751953125, -0.0010223388671875, 0.00360107421875, 0.0082244873046875, 0.012847900390625, 0.0174713134765625, 0.0220947265625, 0.0267181396484375, 0.031341552734375, 0.0359649658203125, 0.04058837890625, 0.0452117919921875, 0.049835205078125, 0.0544586181640625, 0.05908203125, 0.0637054443359375, 0.068328857421875, 0.0729522705078125, 0.07757568359375, 0.0821990966796875, 0.086822509765625, 0.0914459228515625, 0.0960693359375, 0.1006927490234375, 0.105316162109375, 0.1099395751953125, 0.11456298828125, 0.1191864013671875, 0.123809814453125, 0.1284332275390625, 0.133056640625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 9.0, 8.0, 14.0, 18.0, 15.0, 40.0, 38.0, 51.0, 89.0, 107.0, 161.0, 241.0, 329.0, 466.0, 685.0, 988.0, 1454.0, 2229.0, 3475.0, 5531.0, 9367.0, 16565.0, 32973.0, 80019.0, 398788.0, 348023.0, 75143.0, 31367.0, 16029.0, 8851.0, 5382.0, 3335.0, 2181.0, 1450.0, 978.0, 652.0, 427.0, 318.0, 231.0, 148.0, 108.0, 82.0, 49.0, 39.0, 43.0, 20.0, 13.0, 13.0, 6.0, 4.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.263427734375, -0.25543785095214844, -0.24744796752929688, -0.2394580841064453, -0.23146820068359375, -0.2234783172607422, -0.21548843383789062, -0.20749855041503906, -0.1995086669921875, -0.19151878356933594, -0.18352890014648438, -0.1755390167236328, -0.16754913330078125, -0.1595592498779297, -0.15156936645507812, -0.14357948303222656, -0.135589599609375, -0.12759971618652344, -0.11960983276367188, -0.11161994934082031, -0.10363006591796875, -0.09564018249511719, -0.08765029907226562, -0.07966041564941406, -0.0716705322265625, -0.06368064880371094, -0.055690765380859375, -0.04770088195800781, -0.03971099853515625, -0.03172111511230469, -0.023731231689453125, -0.015741348266601562, -0.00775146484375, 0.0002384185791015625, 0.008228302001953125, 0.016218185424804688, 0.02420806884765625, 0.03219795227050781, 0.040187835693359375, 0.04817771911621094, 0.0561676025390625, 0.06415748596191406, 0.07214736938476562, 0.08013725280761719, 0.08812713623046875, 0.09611701965332031, 0.10410690307617188, 0.11209678649902344, 0.120086669921875, 0.12807655334472656, 0.13606643676757812, 0.1440563201904297, 0.15204620361328125, 0.1600360870361328, 0.16802597045898438, 0.17601585388183594, 0.1840057373046875, 0.19199562072753906, 0.19998550415039062, 0.2079753875732422, 0.21596527099609375, 0.2239551544189453, 0.23194503784179688, 0.23993492126464844, 0.2479248046875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 0.0, 9.0, 6.0, 8.0, 10.0, 13.0, 18.0, 17.0, 21.0, 25.0, 17.0, 35.0, 25.0, 36.0, 47.0, 32.0, 54.0, 51.0, 44.0, 59.0, 41.0, 48.0, 39.0, 35.0, 38.0, 31.0, 30.0, 23.0, 34.0, 33.0, 26.0, 19.0, 13.0, 12.0, 8.0, 13.0, 6.0, 6.0, 4.0, 4.0, 2.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.1099853515625, -0.10681724548339844, -0.10364913940429688, -0.10048103332519531, -0.09731292724609375, -0.09414482116699219, -0.09097671508789062, -0.08780860900878906, -0.0846405029296875, -0.08147239685058594, -0.07830429077148438, -0.07513618469238281, -0.07196807861328125, -0.06879997253417969, -0.06563186645507812, -0.06246376037597656, -0.059295654296875, -0.05612754821777344, -0.052959442138671875, -0.04979133605957031, -0.04662322998046875, -0.04345512390136719, -0.040287017822265625, -0.03711891174316406, -0.0339508056640625, -0.030782699584960938, -0.027614593505859375, -0.024446487426757812, -0.02127838134765625, -0.018110275268554688, -0.014942169189453125, -0.011774063110351562, -0.00860595703125, -0.0054378509521484375, -0.002269744873046875, 0.0008983612060546875, 0.00406646728515625, 0.0072345733642578125, 0.010402679443359375, 0.013570785522460938, 0.0167388916015625, 0.019906997680664062, 0.023075103759765625, 0.026243209838867188, 0.02941131591796875, 0.03257942199707031, 0.035747528076171875, 0.03891563415527344, 0.042083740234375, 0.04525184631347656, 0.048419952392578125, 0.05158805847167969, 0.05475616455078125, 0.05792427062988281, 0.061092376708984375, 0.06426048278808594, 0.0674285888671875, 0.07059669494628906, 0.07376480102539062, 0.07693290710449219, 0.08010101318359375, 0.08326911926269531, 0.08643722534179688, 0.08960533142089844, 0.0927734375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 13.0, 16.0, 23.0, 34.0, 46.0, 48.0, 68.0, 84.0, 111.0, 113.0, 177.0, 232.0, 302.0, 371.0, 518.0, 717.0, 1035.0, 2067.0, 4786.0, 13149.0, 61134.0, 844059.0, 91107.0, 16282.0, 5496.0, 2355.0, 1191.0, 770.0, 492.0, 388.0, 307.0, 241.0, 193.0, 149.0, 120.0, 80.0, 65.0, 42.0, 40.0, 36.0, 16.0, 15.0, 12.0, 7.0, 9.0, 8.0, 10.0, 3.0, 5.0, 2.0, 1.0], "bins": [-0.0167388916015625, -0.016254901885986328, -0.015770912170410156, -0.015286922454833984, -0.014802932739257812, -0.01431894302368164, -0.013834953308105469, -0.013350963592529297, -0.012866973876953125, -0.012382984161376953, -0.011898994445800781, -0.01141500473022461, -0.010931015014648438, -0.010447025299072266, -0.009963035583496094, -0.009479045867919922, -0.00899505615234375, -0.008511066436767578, -0.008027076721191406, -0.007543087005615234, -0.0070590972900390625, -0.006575107574462891, -0.006091117858886719, -0.005607128143310547, -0.005123138427734375, -0.004639148712158203, -0.004155158996582031, -0.0036711692810058594, -0.0031871795654296875, -0.0027031898498535156, -0.0022192001342773438, -0.0017352104187011719, -0.001251220703125, -0.0007672309875488281, -0.00028324127197265625, 0.00020074844360351562, 0.0006847381591796875, 0.0011687278747558594, 0.0016527175903320312, 0.002136707305908203, 0.002620697021484375, 0.003104686737060547, 0.0035886764526367188, 0.004072666168212891, 0.0045566558837890625, 0.005040645599365234, 0.005524635314941406, 0.006008625030517578, 0.00649261474609375, 0.006976604461669922, 0.007460594177246094, 0.007944583892822266, 0.008428573608398438, 0.00891256332397461, 0.009396553039550781, 0.009880542755126953, 0.010364532470703125, 0.010848522186279297, 0.011332511901855469, 0.01181650161743164, 0.012300491333007812, 0.012784481048583984, 0.013268470764160156, 0.013752460479736328, 0.0142364501953125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 9.0, 13.0, 5.0, 16.0, 15.0, 11.0, 12.0, 25.0, 26.0, 30.0, 38.0, 64.0, 67.0, 107.0, 132.0, 74.0, 78.0, 62.0, 40.0, 32.0, 28.0, 25.0, 10.0, 16.0, 11.0, 10.0, 15.0, 6.0, 5.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.139278411865234e-06, -5.90737909078598e-06, -5.675479769706726e-06, -5.443580448627472e-06, -5.211681127548218e-06, -4.979781806468964e-06, -4.7478824853897095e-06, -4.515983164310455e-06, -4.284083843231201e-06, -4.052184522151947e-06, -3.820285201072693e-06, -3.5883858799934387e-06, -3.3564865589141846e-06, -3.1245872378349304e-06, -2.8926879167556763e-06, -2.660788595676422e-06, -2.428889274597168e-06, -2.196989953517914e-06, -1.9650906324386597e-06, -1.7331913113594055e-06, -1.5012919902801514e-06, -1.2693926692008972e-06, -1.037493348121643e-06, -8.055940270423889e-07, -5.736947059631348e-07, -3.417953848838806e-07, -1.0989606380462646e-07, 1.2200325727462769e-07, 3.5390257835388184e-07, 5.85801899433136e-07, 8.177012205123901e-07, 1.0496005415916443e-06, 1.2814998626708984e-06, 1.5133991837501526e-06, 1.7452985048294067e-06, 1.977197825908661e-06, 2.209097146987915e-06, 2.440996468067169e-06, 2.6728957891464233e-06, 2.9047951102256775e-06, 3.1366944313049316e-06, 3.368593752384186e-06, 3.60049307346344e-06, 3.832392394542694e-06, 4.064291715621948e-06, 4.296191036701202e-06, 4.5280903577804565e-06, 4.759989678859711e-06, 4.991888999938965e-06, 5.223788321018219e-06, 5.455687642097473e-06, 5.687586963176727e-06, 5.9194862842559814e-06, 6.151385605335236e-06, 6.38328492641449e-06, 6.615184247493744e-06, 6.847083568572998e-06, 7.078982889652252e-06, 7.310882210731506e-06, 7.5427815318107605e-06, 7.774680852890015e-06, 8.006580173969269e-06, 8.238479495048523e-06, 8.470378816127777e-06, 8.702278137207031e-06]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 3.0, 3.0, 10.0, 6.0, 10.0, 6.0, 11.0, 10.0, 19.0, 22.0, 68.0, 124.0, 274.0, 609.0, 1335.0, 2950.0, 10632.0, 450737.0, 565283.0, 10865.0, 3045.0, 1332.0, 596.0, 285.0, 145.0, 61.0, 18.0, 14.0, 13.0, 11.0, 8.0, 5.0, 10.0, 9.0, 7.0, 1.0, 4.0, 5.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0301513671875, -0.029209375381469727, -0.028267383575439453, -0.02732539176940918, -0.026383399963378906, -0.025441408157348633, -0.02449941635131836, -0.023557424545288086, -0.022615432739257812, -0.02167344093322754, -0.020731449127197266, -0.019789457321166992, -0.01884746551513672, -0.017905473709106445, -0.016963481903076172, -0.0160214900970459, -0.015079498291015625, -0.014137506484985352, -0.013195514678955078, -0.012253522872924805, -0.011311531066894531, -0.010369539260864258, -0.009427547454833984, -0.008485555648803711, -0.0075435638427734375, -0.006601572036743164, -0.005659580230712891, -0.004717588424682617, -0.0037755966186523438, -0.0028336048126220703, -0.0018916130065917969, -0.0009496212005615234, -7.62939453125e-06, 0.0009343624114990234, 0.0018763542175292969, 0.0028183460235595703, 0.0037603378295898438, 0.004702329635620117, 0.005644321441650391, 0.006586313247680664, 0.0075283050537109375, 0.008470296859741211, 0.009412288665771484, 0.010354280471801758, 0.011296272277832031, 0.012238264083862305, 0.013180255889892578, 0.014122247695922852, 0.015064239501953125, 0.0160062313079834, 0.016948223114013672, 0.017890214920043945, 0.01883220672607422, 0.019774198532104492, 0.020716190338134766, 0.02165818214416504, 0.022600173950195312, 0.023542165756225586, 0.02448415756225586, 0.025426149368286133, 0.026368141174316406, 0.02731013298034668, 0.028252124786376953, 0.029194116592407227, 0.0301361083984375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 10.0, 17.0, 28.0, 32.0, 54.0, 112.0, 236.0, 230.0, 120.0, 44.0, 38.0, 31.0, 23.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.004344940185546875, -0.004227340221405029, -0.004109740257263184, -0.003992140293121338, -0.003874540328979492, -0.0037569403648376465, -0.0036393404006958008, -0.003521740436553955, -0.0034041404724121094, -0.0032865405082702637, -0.003168940544128418, -0.0030513405799865723, -0.0029337406158447266, -0.002816140651702881, -0.002698540687561035, -0.0025809407234191895, -0.0024633407592773438, -0.002345740795135498, -0.0022281408309936523, -0.0021105408668518066, -0.001992940902709961, -0.0018753409385681152, -0.0017577409744262695, -0.0016401410102844238, -0.0015225410461425781, -0.0014049410820007324, -0.0012873411178588867, -0.001169741153717041, -0.0010521411895751953, -0.0009345412254333496, -0.0008169412612915039, -0.0006993412971496582, -0.0005817413330078125, -0.0004641413688659668, -0.0003465414047241211, -0.0002289414405822754, -0.00011134147644042969, 6.258487701416016e-06, 0.00012385845184326172, 0.00024145841598510742, 0.0003590583801269531, 0.00047665834426879883, 0.0005942583084106445, 0.0007118582725524902, 0.0008294582366943359, 0.0009470582008361816, 0.0010646581649780273, 0.001182258129119873, 0.0012998580932617188, 0.0014174580574035645, 0.0015350580215454102, 0.0016526579856872559, 0.0017702579498291016, 0.0018878579139709473, 0.002005457878112793, 0.0021230578422546387, 0.0022406578063964844, 0.00235825777053833, 0.0024758577346801758, 0.0025934576988220215, 0.002711057662963867, 0.002828657627105713, 0.0029462575912475586, 0.0030638575553894043, 0.00318145751953125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 2.0, 8.0, 7.0, 17.0, 21.0, 25.0, 39.0, 63.0, 127.0, 247.0, 199.0, 91.0, 57.0, 36.0, 22.0, 18.0, 8.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5308773517608643, -0.5178534984588623, -0.5048296451568604, -0.4918057918548584, -0.47878193855285645, -0.4657580852508545, -0.45273423194885254, -0.4397103786468506, -0.42668652534484863, -0.4136626720428467, -0.4006388187408447, -0.3876149654388428, -0.3745911121368408, -0.36156725883483887, -0.3485434055328369, -0.33551955223083496, -0.322495698928833, -0.30947184562683105, -0.2964479923248291, -0.28342413902282715, -0.2704002857208252, -0.25737643241882324, -0.2443525791168213, -0.23132872581481934, -0.21830487251281738, -0.20528101921081543, -0.19225716590881348, -0.17923331260681152, -0.16620945930480957, -0.15318560600280762, -0.14016175270080566, -0.1271378993988037, -0.11411401629447937, -0.10109016299247742, -0.08806630969047546, -0.07504245638847351, -0.06201860308647156, -0.048994749784469604, -0.03597089648246765, -0.022947043180465698, -0.009923189878463745, 0.003100663423538208, 0.01612451672554016, 0.029148370027542114, 0.04217222332954407, 0.05519607663154602, 0.06821992993354797, 0.08124378323554993, 0.09426763653755188, 0.10729148983955383, 0.12031534314155579, 0.13333919644355774, 0.1463630497455597, 0.15938690304756165, 0.1724107563495636, 0.18543460965156555, 0.1984584629535675, 0.21148231625556946, 0.2245061695575714, 0.23753002285957336, 0.2505538761615753, 0.26357772946357727, 0.2766015827655792, 0.2896254360675812, 0.30264928936958313]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 4.0, 4.0, 9.0, 4.0, 7.0, 9.0, 12.0, 16.0, 18.0, 16.0, 14.0, 20.0, 17.0, 35.0, 40.0, 39.0, 41.0, 43.0, 44.0, 48.0, 54.0, 44.0, 33.0, 48.0, 39.0, 36.0, 34.0, 38.0, 29.0, 37.0, 28.0, 30.0, 17.0, 20.0, 22.0, 10.0, 18.0, 9.0, 5.0, 2.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15435917675495148, -0.14960479736328125, -0.14485040307044983, -0.1400960236787796, -0.13534164428710938, -0.13058726489543915, -0.12583288550376892, -0.1210784912109375, -0.11632411181926727, -0.11156973242759705, -0.10681534558534622, -0.1020609587430954, -0.09730657935142517, -0.09255219995975494, -0.08779781311750412, -0.0830434262752533, -0.07828904688358307, -0.07353466749191284, -0.06878028064966202, -0.0640258938074112, -0.05927151441574097, -0.05451713129878044, -0.049762748181819916, -0.04500836506485939, -0.040253981947898865, -0.03549959883093834, -0.030745215713977814, -0.025990832597017288, -0.021236449480056763, -0.016482066363096237, -0.011727683246135712, -0.006973300129175186, -0.0022189170122146606, 0.002535466104745865, 0.00728984922170639, 0.012044232338666916, 0.01679861545562744, 0.021552998572587967, 0.026307381689548492, 0.031061764806509018, 0.03581614792346954, 0.04057053104043007, 0.045324914157390594, 0.05007929727435112, 0.054833680391311646, 0.05958806350827217, 0.0643424466252327, 0.06909683346748352, 0.07385121285915375, 0.07860559225082397, 0.0833599790930748, 0.08811436593532562, 0.09286874532699585, 0.09762312471866608, 0.1023775115609169, 0.10713189840316772, 0.11188627779483795, 0.11664065718650818, 0.121395044028759, 0.12614943087100983, 0.13090381026268005, 0.13565818965435028, 0.1404125690460205, 0.14516696333885193, 0.14992134273052216]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 7.0, 4.0, 11.0, 9.0, 24.0, 25.0, 28.0, 42.0, 63.0, 131.0, 246.0, 596.0, 1558.0, 4297.0, 13658.0, 47242.0, 207100.0, 602488.0, 124559.0, 31757.0, 9505.0, 3060.0, 1158.0, 440.0, 214.0, 105.0, 58.0, 40.0, 30.0, 19.0, 20.0, 11.0, 6.0, 7.0, 6.0, 6.0, 5.0, 2.0, 8.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53271484375, -0.5151596069335938, -0.4976043701171875, -0.48004913330078125, -0.462493896484375, -0.44493865966796875, -0.4273834228515625, -0.40982818603515625, -0.39227294921875, -0.37471771240234375, -0.3571624755859375, -0.33960723876953125, -0.322052001953125, -0.30449676513671875, -0.2869415283203125, -0.26938629150390625, -0.2518310546875, -0.23427581787109375, -0.2167205810546875, -0.19916534423828125, -0.181610107421875, -0.16405487060546875, -0.1464996337890625, -0.12894439697265625, -0.11138916015625, -0.09383392333984375, -0.0762786865234375, -0.05872344970703125, -0.041168212890625, -0.02361297607421875, -0.0060577392578125, 0.01149749755859375, 0.029052734375, 0.04660797119140625, 0.0641632080078125, 0.08171844482421875, 0.099273681640625, 0.11682891845703125, 0.1343841552734375, 0.15193939208984375, 0.16949462890625, 0.18704986572265625, 0.2046051025390625, 0.22216033935546875, 0.239715576171875, 0.25727081298828125, 0.2748260498046875, 0.29238128662109375, 0.3099365234375, 0.32749176025390625, 0.3450469970703125, 0.36260223388671875, 0.380157470703125, 0.39771270751953125, 0.4152679443359375, 0.43282318115234375, 0.45037841796875, 0.46793365478515625, 0.4854888916015625, 0.5030441284179688, 0.520599365234375, 0.5381546020507812, 0.5557098388671875, 0.5732650756835938, 0.5908203125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 14.0, 8.0, 14.0, 28.0, 40.0, 42.0, 63.0, 71.0, 70.0, 67.0, 94.0, 77.0, 69.0, 79.0, 58.0, 48.0, 53.0, 38.0, 25.0, 13.0, 14.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.14599609375, -0.1427478790283203, -0.13949966430664062, -0.13625144958496094, -0.13300323486328125, -0.12975502014160156, -0.12650680541992188, -0.12325859069824219, -0.1200103759765625, -0.11676216125488281, -0.11351394653320312, -0.11026573181152344, -0.10701751708984375, -0.10376930236816406, -0.10052108764648438, -0.09727287292480469, -0.094024658203125, -0.09077644348144531, -0.08752822875976562, -0.08428001403808594, -0.08103179931640625, -0.07778358459472656, -0.07453536987304688, -0.07128715515136719, -0.0680389404296875, -0.06479072570800781, -0.061542510986328125, -0.05829429626464844, -0.05504608154296875, -0.05179786682128906, -0.048549652099609375, -0.04530143737792969, -0.04205322265625, -0.03880500793457031, -0.035556793212890625, -0.03230857849121094, -0.02906036376953125, -0.025812149047851562, -0.022563934326171875, -0.019315719604492188, -0.0160675048828125, -0.012819290161132812, -0.009571075439453125, -0.0063228607177734375, -0.00307464599609375, 0.0001735687255859375, 0.003421783447265625, 0.0066699981689453125, 0.009918212890625, 0.013166427612304688, 0.016414642333984375, 0.019662857055664062, 0.02291107177734375, 0.026159286499023438, 0.029407501220703125, 0.03265571594238281, 0.0359039306640625, 0.03915214538574219, 0.042400360107421875, 0.04564857482910156, 0.04889678955078125, 0.05214500427246094, 0.055393218994140625, 0.05864143371582031, 0.0618896484375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 6.0, 2.0, 8.0, 16.0, 19.0, 22.0, 37.0, 58.0, 67.0, 114.0, 180.0, 272.0, 574.0, 945.0, 1793.0, 3394.0, 6849.0, 13985.0, 29026.0, 65009.0, 176614.0, 425838.0, 192821.0, 70114.0, 30781.0, 14853.0, 7229.0, 3608.0, 1845.0, 1004.0, 567.0, 331.0, 200.0, 138.0, 79.0, 57.0, 26.0, 29.0, 17.0, 9.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.213623046875, -0.2068500518798828, -0.20007705688476562, -0.19330406188964844, -0.18653106689453125, -0.17975807189941406, -0.17298507690429688, -0.1662120819091797, -0.1594390869140625, -0.1526660919189453, -0.14589309692382812, -0.13912010192871094, -0.13234710693359375, -0.12557411193847656, -0.11880111694335938, -0.11202812194824219, -0.105255126953125, -0.09848213195800781, -0.09170913696289062, -0.08493614196777344, -0.07816314697265625, -0.07139015197753906, -0.06461715698242188, -0.05784416198730469, -0.0510711669921875, -0.04429817199707031, -0.037525177001953125, -0.030752182006835938, -0.02397918701171875, -0.017206192016601562, -0.010433197021484375, -0.0036602020263671875, 0.00311279296875, 0.009885787963867188, 0.016658782958984375, 0.023431777954101562, 0.03020477294921875, 0.03697776794433594, 0.043750762939453125, 0.05052375793457031, 0.0572967529296875, 0.06406974792480469, 0.07084274291992188, 0.07761573791503906, 0.08438873291015625, 0.09116172790527344, 0.09793472290039062, 0.10470771789550781, 0.111480712890625, 0.11825370788574219, 0.12502670288085938, 0.13179969787597656, 0.13857269287109375, 0.14534568786621094, 0.15211868286132812, 0.1588916778564453, 0.1656646728515625, 0.1724376678466797, 0.17921066284179688, 0.18598365783691406, 0.19275665283203125, 0.19952964782714844, 0.20630264282226562, 0.2130756378173828, 0.2198486328125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 1.0, 4.0, 4.0, 10.0, 6.0, 9.0, 21.0, 20.0, 11.0, 16.0, 24.0, 18.0, 27.0, 23.0, 30.0, 36.0, 49.0, 39.0, 47.0, 50.0, 41.0, 49.0, 39.0, 48.0, 45.0, 47.0, 43.0, 41.0, 33.0, 24.0, 24.0, 26.0, 19.0, 18.0, 14.0, 18.0, 8.0, 5.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05322265625, -0.051558494567871094, -0.04989433288574219, -0.04823017120361328, -0.046566009521484375, -0.04490184783935547, -0.04323768615722656, -0.041573524475097656, -0.03990936279296875, -0.038245201110839844, -0.03658103942871094, -0.03491687774658203, -0.033252716064453125, -0.03158855438232422, -0.029924392700195312, -0.028260231018066406, -0.0265960693359375, -0.024931907653808594, -0.023267745971679688, -0.02160358428955078, -0.019939422607421875, -0.01827526092529297, -0.016611099243164062, -0.014946937561035156, -0.01328277587890625, -0.011618614196777344, -0.009954452514648438, -0.008290290832519531, -0.006626129150390625, -0.004961967468261719, -0.0032978057861328125, -0.0016336441040039062, 3.0517578125e-05, 0.0016946792602539062, 0.0033588409423828125, 0.005023002624511719, 0.006687164306640625, 0.008351325988769531, 0.010015487670898438, 0.011679649353027344, 0.01334381103515625, 0.015007972717285156, 0.016672134399414062, 0.01833629608154297, 0.020000457763671875, 0.02166461944580078, 0.023328781127929688, 0.024992942810058594, 0.0266571044921875, 0.028321266174316406, 0.029985427856445312, 0.03164958953857422, 0.033313751220703125, 0.03497791290283203, 0.03664207458496094, 0.038306236267089844, 0.03997039794921875, 0.041634559631347656, 0.04329872131347656, 0.04496288299560547, 0.046627044677734375, 0.04829120635986328, 0.04995536804199219, 0.051619529724121094, 0.05328369140625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 7.0, 2.0, 6.0, 12.0, 16.0, 14.0, 19.0, 49.0, 74.0, 88.0, 104.0, 169.0, 267.0, 422.0, 642.0, 1081.0, 1854.0, 3546.0, 7274.0, 17262.0, 49040.0, 220995.0, 592027.0, 100994.0, 29607.0, 11360.0, 5163.0, 2620.0, 1460.0, 796.0, 505.0, 341.0, 197.0, 140.0, 112.0, 84.0, 63.0, 34.0, 34.0, 20.0, 15.0, 11.0, 9.0, 3.0, 3.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0070343017578125, -0.0068228840827941895, -0.006611466407775879, -0.006400048732757568, -0.006188631057739258, -0.005977213382720947, -0.005765795707702637, -0.005554378032684326, -0.005342960357666016, -0.005131542682647705, -0.0049201250076293945, -0.004708707332611084, -0.0044972896575927734, -0.004285871982574463, -0.004074454307556152, -0.003863036632537842, -0.0036516189575195312, -0.0034402012825012207, -0.00322878360748291, -0.0030173659324645996, -0.002805948257446289, -0.0025945305824279785, -0.002383112907409668, -0.0021716952323913574, -0.001960277557373047, -0.0017488598823547363, -0.0015374422073364258, -0.0013260245323181152, -0.0011146068572998047, -0.0009031891822814941, -0.0006917715072631836, -0.00048035383224487305, -0.0002689361572265625, -5.751848220825195e-05, 0.0001538991928100586, 0.00036531686782836914, 0.0005767345428466797, 0.0007881522178649902, 0.0009995698928833008, 0.0012109875679016113, 0.0014224052429199219, 0.0016338229179382324, 0.001845240592956543, 0.0020566582679748535, 0.002268075942993164, 0.0024794936180114746, 0.002690911293029785, 0.0029023289680480957, 0.0031137466430664062, 0.003325164318084717, 0.0035365819931030273, 0.003747999668121338, 0.0039594173431396484, 0.004170835018157959, 0.0043822526931762695, 0.00459367036819458, 0.004805088043212891, 0.005016505718231201, 0.005227923393249512, 0.005439341068267822, 0.005650758743286133, 0.005862176418304443, 0.006073594093322754, 0.0062850117683410645, 0.006496429443359375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 7.0, 4.0, 4.0, 5.0, 8.0, 6.0, 11.0, 14.0, 5.0, 41.0, 29.0, 51.0, 54.0, 83.0, 113.0, 79.0, 130.0, 66.0, 82.0, 33.0, 54.0, 30.0, 13.0, 19.0, 18.0, 17.0, 8.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.185604095458984e-06, -5.03193587064743e-06, -4.8782676458358765e-06, -4.7245994210243225e-06, -4.5709311962127686e-06, -4.417262971401215e-06, -4.263594746589661e-06, -4.109926521778107e-06, -3.956258296966553e-06, -3.8025900721549988e-06, -3.648921847343445e-06, -3.495253622531891e-06, -3.341585397720337e-06, -3.187917172908783e-06, -3.034248948097229e-06, -2.880580723285675e-06, -2.726912498474121e-06, -2.573244273662567e-06, -2.419576048851013e-06, -2.2659078240394592e-06, -2.1122395992279053e-06, -1.9585713744163513e-06, -1.8049031496047974e-06, -1.6512349247932434e-06, -1.4975666999816895e-06, -1.3438984751701355e-06, -1.1902302503585815e-06, -1.0365620255470276e-06, -8.828938007354736e-07, -7.292255759239197e-07, -5.755573511123657e-07, -4.2188912630081177e-07, -2.682209014892578e-07, -1.1455267667770386e-07, 3.91155481338501e-08, 1.9278377294540405e-07, 3.46451997756958e-07, 5.00120222568512e-07, 6.537884473800659e-07, 8.074566721916199e-07, 9.611248970031738e-07, 1.1147931218147278e-06, 1.2684613466262817e-06, 1.4221295714378357e-06, 1.5757977962493896e-06, 1.7294660210609436e-06, 1.8831342458724976e-06, 2.0368024706840515e-06, 2.1904706954956055e-06, 2.3441389203071594e-06, 2.4978071451187134e-06, 2.6514753699302673e-06, 2.8051435947418213e-06, 2.9588118195533752e-06, 3.112480044364929e-06, 3.266148269176483e-06, 3.419816493988037e-06, 3.573484718799591e-06, 3.727152943611145e-06, 3.880821168422699e-06, 4.034489393234253e-06, 4.188157618045807e-06, 4.341825842857361e-06, 4.495494067668915e-06, 4.649162292480469e-06]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 5.0, 8.0, 9.0, 8.0, 17.0, 20.0, 31.0, 38.0, 74.0, 122.0, 175.0, 320.0, 565.0, 1070.0, 2044.0, 4066.0, 8490.0, 18137.0, 41901.0, 111663.0, 386858.0, 315349.0, 91170.0, 35697.0, 15660.0, 7516.0, 3510.0, 1852.0, 909.0, 517.0, 287.0, 169.0, 99.0, 66.0, 46.0, 32.0, 18.0, 14.0, 6.0, 4.0, 4.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0027256011962890625, -0.002637416124343872, -0.0025492310523986816, -0.002461045980453491, -0.0023728609085083008, -0.0022846758365631104, -0.00219649076461792, -0.0021083056926727295, -0.002020120620727539, -0.0019319355487823486, -0.0018437504768371582, -0.0017555654048919678, -0.0016673803329467773, -0.001579195261001587, -0.0014910101890563965, -0.001402825117111206, -0.0013146400451660156, -0.0012264549732208252, -0.0011382699012756348, -0.0010500848293304443, -0.0009618997573852539, -0.0008737146854400635, -0.000785529613494873, -0.0006973445415496826, -0.0006091594696044922, -0.0005209743976593018, -0.00043278932571411133, -0.0003446042537689209, -0.00025641918182373047, -0.00016823410987854004, -8.004903793334961e-05, 8.13603401184082e-06, 9.632110595703125e-05, 0.00018450617790222168, 0.0002726912498474121, 0.00036087632179260254, 0.00044906139373779297, 0.0005372464656829834, 0.0006254315376281738, 0.0007136166095733643, 0.0008018016815185547, 0.0008899867534637451, 0.0009781718254089355, 0.001066356897354126, 0.0011545419692993164, 0.0012427270412445068, 0.0013309121131896973, 0.0014190971851348877, 0.0015072822570800781, 0.0015954673290252686, 0.001683652400970459, 0.0017718374729156494, 0.0018600225448608398, 0.0019482076168060303, 0.0020363926887512207, 0.002124577760696411, 0.0022127628326416016, 0.002300947904586792, 0.0023891329765319824, 0.002477318048477173, 0.0025655031204223633, 0.0026536881923675537, 0.002741873264312744, 0.0028300583362579346, 0.002918243408203125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 2.0, 6.0, 8.0, 4.0, 13.0, 14.0, 7.0, 17.0, 15.0, 23.0, 33.0, 24.0, 36.0, 30.0, 32.0, 29.0, 42.0, 61.0, 53.0, 56.0, 52.0, 43.0, 55.0, 46.0, 42.0, 37.0, 32.0, 32.0, 28.0, 20.0, 11.0, 17.0, 13.0, 14.0, 13.0, 10.0, 6.0, 4.0, 2.0, 3.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005941390991210938, -0.0005748122930526733, -0.0005554854869842529, -0.0005361586809158325, -0.0005168318748474121, -0.0004975050687789917, -0.0004781782627105713, -0.0004588514566421509, -0.00043952465057373047, -0.00042019784450531006, -0.00040087103843688965, -0.00038154423236846924, -0.00036221742630004883, -0.0003428906202316284, -0.000323563814163208, -0.0003042370080947876, -0.0002849102020263672, -0.0002655833959579468, -0.00024625658988952637, -0.00022692978382110596, -0.00020760297775268555, -0.00018827617168426514, -0.00016894936561584473, -0.00014962255954742432, -0.0001302957534790039, -0.0001109689474105835, -9.164214134216309e-05, -7.231533527374268e-05, -5.2988529205322266e-05, -3.3661723136901855e-05, -1.4334917068481445e-05, 4.991888999938965e-06, 2.4318695068359375e-05, 4.3645501136779785e-05, 6.29723072052002e-05, 8.22991132736206e-05, 0.00010162591934204102, 0.00012095272541046143, 0.00014027953147888184, 0.00015960633754730225, 0.00017893314361572266, 0.00019825994968414307, 0.00021758675575256348, 0.0002369135618209839, 0.0002562403678894043, 0.0002755671739578247, 0.0002948939800262451, 0.00031422078609466553, 0.00033354759216308594, 0.00035287439823150635, 0.00037220120429992676, 0.00039152801036834717, 0.0004108548164367676, 0.000430181622505188, 0.0004495084285736084, 0.0004688352346420288, 0.0004881620407104492, 0.0005074888467788696, 0.00052681565284729, 0.0005461424589157104, 0.0005654692649841309, 0.0005847960710525513, 0.0006041228771209717, 0.0006234496831893921, 0.0006427764892578125]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 12.0, 19.0, 31.0, 78.0, 111.0, 231.0, 237.0, 112.0, 66.0, 39.0, 26.0, 13.0, 11.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.3569425642490387, -0.34980109333992004, -0.3426596224308014, -0.33551812171936035, -0.3283766508102417, -0.32123517990112305, -0.3140937089920044, -0.30695223808288574, -0.2998107671737671, -0.29266929626464844, -0.2855278253555298, -0.27838632464408875, -0.2712448537349701, -0.26410338282585144, -0.2569619119167328, -0.24982044100761414, -0.2426789402961731, -0.23553746938705444, -0.2283959835767746, -0.22125451266765594, -0.2141130268573761, -0.20697155594825745, -0.1998300850391388, -0.19268861413002014, -0.1855471283197403, -0.17840565741062164, -0.1712641716003418, -0.16412270069122314, -0.1569812297821045, -0.14983974397182465, -0.142698273062706, -0.13555678725242615, -0.1284153163433075, -0.12127383798360825, -0.114132359623909, -0.10699088871479034, -0.0998494103550911, -0.09270793199539185, -0.0855664610862732, -0.07842498272657394, -0.0712834969162941, -0.06414201855659485, -0.0570005439221859, -0.04985906928777695, -0.0427175909280777, -0.03557611256837845, -0.028434637933969498, -0.021293163299560547, -0.014151684939861298, -0.007010208442807198, 0.00013126805424690247, 0.0072727445513010025, 0.014414221048355103, 0.021555699408054352, 0.028697174042463303, 0.03583864867687225, 0.0429801270365715, 0.05012160539627075, 0.0572630800306797, 0.06440455466508865, 0.0715460330247879, 0.07868751138448715, 0.0858289897441864, 0.09297046065330505, 0.1001119390130043]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 7.0, 7.0, 8.0, 13.0, 10.0, 14.0, 21.0, 24.0, 42.0, 24.0, 23.0, 26.0, 41.0, 29.0, 37.0, 31.0, 51.0, 39.0, 42.0, 41.0, 50.0, 39.0, 32.0, 44.0, 38.0, 29.0, 43.0, 27.0, 27.0, 21.0, 22.0, 12.0, 19.0, 9.0, 15.0, 10.0, 9.0, 6.0, 4.0, 4.0, 5.0, 4.0, 0.0, 2.0, 2.0], "bins": [-0.08405295759439468, -0.08182258158922195, -0.07959219813346863, -0.0773618221282959, -0.07513144612312317, -0.07290106266736984, -0.07067068666219711, -0.06844030320644379, -0.06620992720127106, -0.06397955119609833, -0.061749167740345, -0.05951879173517227, -0.057288412004709244, -0.055058032274246216, -0.052827656269073486, -0.05059727653861046, -0.04836689680814743, -0.0461365170776844, -0.043906137347221375, -0.041675761342048645, -0.03944538161158562, -0.03721500188112259, -0.03498462587594986, -0.03275424614548683, -0.030523866415023804, -0.028293486684560776, -0.026063108816742897, -0.02383273094892502, -0.02160235121846199, -0.019371971487998962, -0.017141593620181084, -0.01491121482104063, -0.012680836021900177, -0.010450457222759724, -0.00822007842361927, -0.005989699624478817, -0.0037593208253383636, -0.0015289420261979103, 0.000701436772942543, 0.0029318155720829964, 0.00516219437122345, 0.007392573170363903, 0.009622951969504356, 0.01185333076864481, 0.014083709567785263, 0.01631408929824829, 0.01854446716606617, 0.02077484503388405, 0.023005224764347076, 0.025235604494810104, 0.027465982362627983, 0.029696360230445862, 0.03192673996090889, 0.03415711969137192, 0.03638749569654465, 0.038617875427007675, 0.0408482551574707, 0.04307863488793373, 0.04530901461839676, 0.04753939062356949, 0.049769770354032516, 0.052000150084495544, 0.054230526089668274, 0.0564609058201313, 0.05869128555059433]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 8.0, 15.0, 30.0, 49.0, 99.0, 174.0, 498.0, 1910.0, 4120346.0, 68773.0, 1662.0, 418.0, 146.0, 70.0, 53.0, 15.0, 13.0, 6.0, 2.0], "bins": [-0.99267578125, -0.9742469787597656, -0.9558181762695312, -0.9373893737792969, -0.9189605712890625, -0.9005317687988281, -0.8821029663085938, -0.8636741638183594, -0.845245361328125, -0.8268165588378906, -0.8083877563476562, -0.7899589538574219, -0.7715301513671875, -0.7531013488769531, -0.7346725463867188, -0.7162437438964844, -0.69781494140625, -0.6793861389160156, -0.6609573364257812, -0.6425285339355469, -0.6240997314453125, -0.6056709289550781, -0.5872421264648438, -0.5688133239746094, -0.550384521484375, -0.5319557189941406, -0.5135269165039062, -0.4950981140136719, -0.4766693115234375, -0.4582405090332031, -0.43981170654296875, -0.4213829040527344, -0.4029541015625, -0.3845252990722656, -0.36609649658203125, -0.3476676940917969, -0.3292388916015625, -0.3108100891113281, -0.29238128662109375, -0.2739524841308594, -0.255523681640625, -0.23709487915039062, -0.21866607666015625, -0.20023727416992188, -0.1818084716796875, -0.16337966918945312, -0.14495086669921875, -0.12652206420898438, -0.10809326171875, -0.08966445922851562, -0.07123565673828125, -0.052806854248046875, -0.0343780517578125, -0.015949249267578125, 0.00247955322265625, 0.020908355712890625, 0.039337158203125, 0.057765960693359375, 0.07619476318359375, 0.09462356567382812, 0.1130523681640625, 0.13148117065429688, 0.14990997314453125, 0.16833877563476562, 0.186767578125]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 8.0, 14.0, 30.0, 44.0, 64.0, 78.0, 100.0, 108.0, 119.0, 119.0, 94.0, 85.0, 48.0, 51.0, 21.0, 13.0, 12.0, 2.0, 2.0], "bins": [-0.2493896484375, -0.24471664428710938, -0.24004364013671875, -0.23537063598632812, -0.2306976318359375, -0.22602462768554688, -0.22135162353515625, -0.21667861938476562, -0.212005615234375, -0.20733261108398438, -0.20265960693359375, -0.19798660278320312, -0.1933135986328125, -0.18864059448242188, -0.18396759033203125, -0.17929458618164062, -0.17462158203125, -0.16994857788085938, -0.16527557373046875, -0.16060256958007812, -0.1559295654296875, -0.15125656127929688, -0.14658355712890625, -0.14191055297851562, -0.137237548828125, -0.13256454467773438, -0.12789154052734375, -0.12321853637695312, -0.1185455322265625, -0.11387252807617188, -0.10919952392578125, -0.10452651977539062, -0.099853515625, -0.09518051147460938, -0.09050750732421875, -0.08583450317382812, -0.0811614990234375, -0.07648849487304688, -0.07181549072265625, -0.06714248657226562, -0.062469482421875, -0.057796478271484375, -0.05312347412109375, -0.048450469970703125, -0.0437774658203125, -0.039104461669921875, -0.03443145751953125, -0.029758453369140625, -0.02508544921875, -0.020412445068359375, -0.01573944091796875, -0.011066436767578125, -0.0063934326171875, -0.001720428466796875, 0.00295257568359375, 0.007625579833984375, 0.012298583984375, 0.016971588134765625, 0.02164459228515625, 0.026317596435546875, 0.0309906005859375, 0.035663604736328125, 0.04033660888671875, 0.045009613037109375, 0.0496826171875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 13.0, 22.0, 68.0, 113.0, 239.0, 496.0, 940.0, 2083.0, 7689.0, 915265.0, 3254867.0, 8359.0, 2157.0, 959.0, 486.0, 234.0, 128.0, 71.0, 31.0, 19.0, 9.0, 5.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.272216796875, -0.2639732360839844, -0.25572967529296875, -0.24748611450195312, -0.2392425537109375, -0.23099899291992188, -0.22275543212890625, -0.21451187133789062, -0.206268310546875, -0.19802474975585938, -0.18978118896484375, -0.18153762817382812, -0.1732940673828125, -0.16505050659179688, -0.15680694580078125, -0.14856338500976562, -0.14031982421875, -0.13207626342773438, -0.12383270263671875, -0.11558914184570312, -0.1073455810546875, -0.09910202026367188, -0.09085845947265625, -0.08261489868164062, -0.074371337890625, -0.06612777709960938, -0.05788421630859375, -0.049640655517578125, -0.0413970947265625, -0.033153533935546875, -0.02490997314453125, -0.016666412353515625, -0.0084228515625, -0.000179290771484375, 0.00806427001953125, 0.016307830810546875, 0.0245513916015625, 0.032794952392578125, 0.04103851318359375, 0.049282073974609375, 0.057525634765625, 0.06576919555664062, 0.07401275634765625, 0.08225631713867188, 0.0904998779296875, 0.09874343872070312, 0.10698699951171875, 0.11523056030273438, 0.12347412109375, 0.13171768188476562, 0.13996124267578125, 0.14820480346679688, 0.1564483642578125, 0.16469192504882812, 0.17293548583984375, 0.18117904663085938, 0.189422607421875, 0.19766616821289062, 0.20590972900390625, 0.21415328979492188, 0.2223968505859375, 0.23064041137695312, 0.23888397216796875, 0.24712753295898438, 0.25537109375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 10.0, 23.0, 44.0, 110.0, 346.0, 2545.0, 663.0, 193.0, 66.0, 30.0, 14.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031585693359375, -0.030621051788330078, -0.029656410217285156, -0.028691768646240234, -0.027727127075195312, -0.02676248550415039, -0.02579784393310547, -0.024833202362060547, -0.023868560791015625, -0.022903919219970703, -0.02193927764892578, -0.02097463607788086, -0.020009994506835938, -0.019045352935791016, -0.018080711364746094, -0.017116069793701172, -0.01615142822265625, -0.015186786651611328, -0.014222145080566406, -0.013257503509521484, -0.012292861938476562, -0.01132822036743164, -0.010363578796386719, -0.009398937225341797, -0.008434295654296875, -0.007469654083251953, -0.006505012512207031, -0.005540370941162109, -0.0045757293701171875, -0.0036110877990722656, -0.0026464462280273438, -0.0016818046569824219, -0.0007171630859375, 0.0002474784851074219, 0.0012121200561523438, 0.0021767616271972656, 0.0031414031982421875, 0.004106044769287109, 0.005070686340332031, 0.006035327911376953, 0.006999969482421875, 0.007964611053466797, 0.008929252624511719, 0.00989389419555664, 0.010858535766601562, 0.011823177337646484, 0.012787818908691406, 0.013752460479736328, 0.01471710205078125, 0.015681743621826172, 0.016646385192871094, 0.017611026763916016, 0.018575668334960938, 0.01954030990600586, 0.02050495147705078, 0.021469593048095703, 0.022434234619140625, 0.023398876190185547, 0.02436351776123047, 0.02532815933227539, 0.026292800903320312, 0.027257442474365234, 0.028222084045410156, 0.029186725616455078, 0.0301513671875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 7.0, 13.0, 13.0, 21.0, 33.0, 66.0, 85.0, 170.0, 229.0, 143.0, 79.0, 44.0, 37.0, 22.0, 17.0, 14.0, 3.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2174672931432724, -0.21287468075752258, -0.20828205347061157, -0.20368944108486176, -0.19909681379795074, -0.19450420141220093, -0.18991157412528992, -0.1853189617395401, -0.18072634935379028, -0.17613373696804047, -0.17154110968112946, -0.16694849729537964, -0.16235587000846863, -0.1577632576227188, -0.1531706303358078, -0.14857801795005798, -0.14398539066314697, -0.13939277827739716, -0.13480015099048615, -0.13020753860473633, -0.12561491131782532, -0.1210222989320755, -0.11642967909574509, -0.11183705925941467, -0.10724443942308426, -0.10265181958675385, -0.09805919975042343, -0.09346657991409302, -0.0888739675283432, -0.08428134024143219, -0.07968872785568237, -0.07509610801935196, -0.07050348818302155, -0.06591086834669113, -0.06131824851036072, -0.0567256323993206, -0.05213301256299019, -0.047540392726659775, -0.04294777661561966, -0.038355156779289246, -0.03376253694295883, -0.029169917106628418, -0.024577299132943153, -0.01998468115925789, -0.015392061322927475, -0.010799441486597061, -0.006206823512911797, -0.001614205539226532, 0.002978414297103882, 0.007571033202111721, 0.01216365210711956, 0.016756270080804825, 0.02134888991713524, 0.025941509753465652, 0.030534127727150917, 0.03512674570083618, 0.039719365537166595, 0.04431198537349701, 0.04890460520982742, 0.05349722132086754, 0.05808984115719795, 0.06268246471881866, 0.06727507710456848, 0.0718676969408989, 0.07646031677722931]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 3.0, 12.0, 13.0, 9.0, 26.0, 24.0, 32.0, 31.0, 30.0, 25.0, 32.0, 36.0, 37.0, 34.0, 39.0, 44.0, 41.0, 47.0, 48.0, 46.0, 35.0, 30.0, 48.0, 45.0, 35.0, 30.0, 21.0, 27.0, 14.0, 14.0, 14.0, 20.0, 17.0, 5.0, 4.0, 4.0, 3.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.06569084525108337, -0.06392133980989456, -0.06215183436870575, -0.06038232892751694, -0.05861282721161842, -0.05684332177042961, -0.0550738163292408, -0.05330431088805199, -0.05153480917215347, -0.04976530373096466, -0.04799579828977585, -0.046226292848587036, -0.04445679113268852, -0.04268728569149971, -0.0409177802503109, -0.039148274809122086, -0.03737876936793327, -0.03560926392674446, -0.03383975848555565, -0.032070256769657135, -0.030300751328468323, -0.02853124588727951, -0.026761740446090698, -0.024992235004901886, -0.023222731426358223, -0.02145322598516941, -0.019683722406625748, -0.017914216965436935, -0.016144711524248123, -0.01437520794570446, -0.012605702504515648, -0.01083619799464941, -0.009066693484783173, -0.007297188974916935, -0.00552768399938941, -0.003758179023861885, -0.0019886745139956474, -0.0002191700041294098, 0.0015503354370594025, 0.00331983994692564, 0.005089344456791878, 0.006858848966658115, 0.008628353476524353, 0.010397858917713165, 0.012167363427579403, 0.01393686793744564, 0.015706373378634453, 0.017475876957178116, 0.019245382398366928, 0.02101488783955574, 0.022784391418099403, 0.024553896859288216, 0.02632340043783188, 0.02809290587902069, 0.029862411320209503, 0.031631916761398315, 0.03340142220258713, 0.03517092764377594, 0.03694043308496475, 0.038709938526153564, 0.04047944024205208, 0.04224894568324089, 0.0440184511244297, 0.045787956565618515, 0.04755745828151703]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 7.0, 2.0, 6.0, 5.0, 3.0, 9.0, 10.0, 24.0, 30.0, 50.0, 59.0, 58.0, 120.0, 168.0, 230.0, 376.0, 537.0, 828.0, 1299.0, 2246.0, 4082.0, 7935.0, 16517.0, 38743.0, 110255.0, 454063.0, 279938.0, 74904.0, 28668.0, 12721.0, 6178.0, 3290.0, 1836.0, 1165.0, 760.0, 445.0, 328.0, 201.0, 144.0, 105.0, 61.0, 48.0, 34.0, 19.0, 23.0, 11.0, 7.0, 7.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1317138671875, -0.12729835510253906, -0.12288284301757812, -0.11846733093261719, -0.11405181884765625, -0.10963630676269531, -0.10522079467773438, -0.10080528259277344, -0.0963897705078125, -0.09197425842285156, -0.08755874633789062, -0.08314323425292969, -0.07872772216796875, -0.07431221008300781, -0.06989669799804688, -0.06548118591308594, -0.061065673828125, -0.05665016174316406, -0.052234649658203125, -0.04781913757324219, -0.04340362548828125, -0.03898811340332031, -0.034572601318359375, -0.030157089233398438, -0.0257415771484375, -0.021326065063476562, -0.016910552978515625, -0.012495040893554688, -0.00807952880859375, -0.0036640167236328125, 0.000751495361328125, 0.0051670074462890625, 0.00958251953125, 0.013998031616210938, 0.018413543701171875, 0.022829055786132812, 0.02724456787109375, 0.03166007995605469, 0.036075592041015625, 0.04049110412597656, 0.0449066162109375, 0.04932212829589844, 0.053737640380859375, 0.05815315246582031, 0.06256866455078125, 0.06698417663574219, 0.07139968872070312, 0.07581520080566406, 0.080230712890625, 0.08464622497558594, 0.08906173706054688, 0.09347724914550781, 0.09789276123046875, 0.10230827331542969, 0.10672378540039062, 0.11113929748535156, 0.1155548095703125, 0.11997032165527344, 0.12438583374023438, 0.1288013458251953, 0.13321685791015625, 0.1376323699951172, 0.14204788208007812, 0.14646339416503906, 0.15087890625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 6.0, 8.0, 8.0, 23.0, 21.0, 20.0, 27.0, 19.0, 35.0, 41.0, 37.0, 33.0, 41.0, 38.0, 43.0, 44.0, 48.0, 53.0, 45.0, 46.0, 34.0, 36.0, 46.0, 36.0, 34.0, 31.0, 18.0, 19.0, 22.0, 13.0, 12.0, 15.0, 12.0, 2.0, 5.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05523681640625, -0.05364084243774414, -0.05204486846923828, -0.05044889450073242, -0.04885292053222656, -0.0472569465637207, -0.045660972595214844, -0.044064998626708984, -0.042469024658203125, -0.040873050689697266, -0.039277076721191406, -0.03768110275268555, -0.03608512878417969, -0.03448915481567383, -0.03289318084716797, -0.03129720687866211, -0.02970123291015625, -0.02810525894165039, -0.02650928497314453, -0.024913311004638672, -0.023317337036132812, -0.021721363067626953, -0.020125389099121094, -0.018529415130615234, -0.016933441162109375, -0.015337467193603516, -0.013741493225097656, -0.012145519256591797, -0.010549545288085938, -0.008953571319580078, -0.007357597351074219, -0.005761623382568359, -0.0041656494140625, -0.0025696754455566406, -0.0009737014770507812, 0.0006222724914550781, 0.0022182464599609375, 0.003814220428466797, 0.005410194396972656, 0.007006168365478516, 0.008602142333984375, 0.010198116302490234, 0.011794090270996094, 0.013390064239501953, 0.014986038208007812, 0.016582012176513672, 0.01817798614501953, 0.01977396011352539, 0.02136993408203125, 0.02296590805053711, 0.02456188201904297, 0.026157855987548828, 0.027753829956054688, 0.029349803924560547, 0.030945777893066406, 0.032541751861572266, 0.034137725830078125, 0.035733699798583984, 0.037329673767089844, 0.0389256477355957, 0.04052162170410156, 0.04211759567260742, 0.04371356964111328, 0.04530954360961914, 0.046905517578125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 5.0, 6.0, 6.0, 22.0, 20.0, 35.0, 58.0, 110.0, 137.0, 211.0, 350.0, 565.0, 938.0, 1461.0, 2582.0, 4435.0, 8500.0, 17332.0, 40651.0, 137274.0, 616827.0, 138755.0, 41304.0, 17231.0, 8511.0, 4604.0, 2589.0, 1516.0, 906.0, 585.0, 352.0, 248.0, 149.0, 91.0, 65.0, 38.0, 35.0, 14.0, 13.0, 12.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.10260009765625, -0.09962654113769531, -0.09665298461914062, -0.09367942810058594, -0.09070587158203125, -0.08773231506347656, -0.08475875854492188, -0.08178520202636719, -0.0788116455078125, -0.07583808898925781, -0.07286453247070312, -0.06989097595214844, -0.06691741943359375, -0.06394386291503906, -0.060970306396484375, -0.05799674987792969, -0.055023193359375, -0.05204963684082031, -0.049076080322265625, -0.04610252380371094, -0.04312896728515625, -0.04015541076660156, -0.037181854248046875, -0.03420829772949219, -0.0312347412109375, -0.028261184692382812, -0.025287628173828125, -0.022314071655273438, -0.01934051513671875, -0.016366958618164062, -0.013393402099609375, -0.010419845581054688, -0.0074462890625, -0.0044727325439453125, -0.001499176025390625, 0.0014743804931640625, 0.00444793701171875, 0.0074214935302734375, 0.010395050048828125, 0.013368606567382812, 0.0163421630859375, 0.019315719604492188, 0.022289276123046875, 0.025262832641601562, 0.02823638916015625, 0.031209945678710938, 0.034183502197265625, 0.03715705871582031, 0.040130615234375, 0.04310417175292969, 0.046077728271484375, 0.04905128479003906, 0.05202484130859375, 0.05499839782714844, 0.057971954345703125, 0.06094551086425781, 0.0639190673828125, 0.06689262390136719, 0.06986618041992188, 0.07283973693847656, 0.07581329345703125, 0.07878684997558594, 0.08176040649414062, 0.08473396301269531, 0.08770751953125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 2.0, 8.0, 10.0, 15.0, 14.0, 19.0, 20.0, 27.0, 33.0, 38.0, 55.0, 47.0, 35.0, 44.0, 46.0, 54.0, 49.0, 58.0, 48.0, 58.0, 44.0, 49.0, 37.0, 29.0, 28.0, 28.0, 21.0, 19.0, 16.0, 11.0, 12.0, 11.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04400634765625, -0.042861223220825195, -0.04171609878540039, -0.040570974349975586, -0.03942584991455078, -0.03828072547912598, -0.03713560104370117, -0.03599047660827637, -0.03484535217285156, -0.03370022773742676, -0.03255510330200195, -0.03140997886657715, -0.030264854431152344, -0.02911972999572754, -0.027974605560302734, -0.02682948112487793, -0.025684356689453125, -0.02453923225402832, -0.023394107818603516, -0.02224898338317871, -0.021103858947753906, -0.0199587345123291, -0.018813610076904297, -0.017668485641479492, -0.016523361206054688, -0.015378236770629883, -0.014233112335205078, -0.013087987899780273, -0.011942863464355469, -0.010797739028930664, -0.00965261459350586, -0.008507490158081055, -0.00736236572265625, -0.006217241287231445, -0.005072116851806641, -0.003926992416381836, -0.0027818679809570312, -0.0016367435455322266, -0.0004916191101074219, 0.0006535053253173828, 0.0017986297607421875, 0.002943754196166992, 0.004088878631591797, 0.0052340030670166016, 0.006379127502441406, 0.007524251937866211, 0.008669376373291016, 0.00981450080871582, 0.010959625244140625, 0.01210474967956543, 0.013249874114990234, 0.014394998550415039, 0.015540122985839844, 0.01668524742126465, 0.017830371856689453, 0.018975496292114258, 0.020120620727539062, 0.021265745162963867, 0.022410869598388672, 0.023555994033813477, 0.02470111846923828, 0.025846242904663086, 0.02699136734008789, 0.028136491775512695, 0.0292816162109375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 6.0, 8.0, 10.0, 9.0, 17.0, 19.0, 26.0, 37.0, 39.0, 88.0, 114.0, 129.0, 180.0, 238.0, 365.0, 541.0, 781.0, 1198.0, 1926.0, 3125.0, 5798.0, 13313.0, 42974.0, 833224.0, 105174.0, 20161.0, 8094.0, 4058.0, 2386.0, 1458.0, 938.0, 638.0, 404.0, 307.0, 206.0, 152.0, 87.0, 86.0, 47.0, 54.0, 31.0, 33.0, 18.0, 21.0, 13.0, 3.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.00641632080078125, -0.006226003170013428, -0.0060356855392456055, -0.005845367908477783, -0.005655050277709961, -0.005464732646942139, -0.005274415016174316, -0.005084097385406494, -0.004893779754638672, -0.00470346212387085, -0.004513144493103027, -0.004322826862335205, -0.004132509231567383, -0.0039421916007995605, -0.0037518739700317383, -0.003561556339263916, -0.0033712387084960938, -0.0031809210777282715, -0.0029906034469604492, -0.002800285816192627, -0.0026099681854248047, -0.0024196505546569824, -0.00222933292388916, -0.002039015293121338, -0.0018486976623535156, -0.0016583800315856934, -0.001468062400817871, -0.0012777447700500488, -0.0010874271392822266, -0.0008971095085144043, -0.000706791877746582, -0.0005164742469787598, -0.0003261566162109375, -0.00013583898544311523, 5.447864532470703e-05, 0.0002447962760925293, 0.00043511390686035156, 0.0006254315376281738, 0.0008157491683959961, 0.0010060667991638184, 0.0011963844299316406, 0.0013867020606994629, 0.0015770196914672852, 0.0017673373222351074, 0.0019576549530029297, 0.002147972583770752, 0.0023382902145385742, 0.0025286078453063965, 0.0027189254760742188, 0.002909243106842041, 0.0030995607376098633, 0.0032898783683776855, 0.003480195999145508, 0.00367051362991333, 0.0038608312606811523, 0.004051148891448975, 0.004241466522216797, 0.004431784152984619, 0.004622101783752441, 0.004812419414520264, 0.005002737045288086, 0.005193054676055908, 0.0053833723068237305, 0.005573689937591553, 0.005764007568359375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 3.0, 4.0, 3.0, 7.0, 10.0, 5.0, 15.0, 14.0, 16.0, 15.0, 30.0, 18.0, 27.0, 34.0, 30.0, 41.0, 30.0, 35.0, 45.0, 52.0, 55.0, 54.0, 48.0, 46.0, 39.0, 50.0, 42.0, 35.0, 32.0, 31.0, 19.0, 22.0, 20.0, 18.0, 12.0, 13.0, 7.0, 7.0, 6.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0067901611328125e-06, -4.827976226806641e-06, -4.649162292480469e-06, -4.470348358154297e-06, -4.291534423828125e-06, -4.112720489501953e-06, -3.933906555175781e-06, -3.7550926208496094e-06, -3.5762786865234375e-06, -3.3974647521972656e-06, -3.2186508178710938e-06, -3.039836883544922e-06, -2.86102294921875e-06, -2.682209014892578e-06, -2.5033950805664062e-06, -2.3245811462402344e-06, -2.1457672119140625e-06, -1.9669532775878906e-06, -1.7881393432617188e-06, -1.6093254089355469e-06, -1.430511474609375e-06, -1.2516975402832031e-06, -1.0728836059570312e-06, -8.940696716308594e-07, -7.152557373046875e-07, -5.364418029785156e-07, -3.5762786865234375e-07, -1.7881393432617188e-07, 0.0, 1.7881393432617188e-07, 3.5762786865234375e-07, 5.364418029785156e-07, 7.152557373046875e-07, 8.940696716308594e-07, 1.0728836059570312e-06, 1.2516975402832031e-06, 1.430511474609375e-06, 1.6093254089355469e-06, 1.7881393432617188e-06, 1.9669532775878906e-06, 2.1457672119140625e-06, 2.3245811462402344e-06, 2.5033950805664062e-06, 2.682209014892578e-06, 2.86102294921875e-06, 3.039836883544922e-06, 3.2186508178710938e-06, 3.3974647521972656e-06, 3.5762786865234375e-06, 3.7550926208496094e-06, 3.933906555175781e-06, 4.112720489501953e-06, 4.291534423828125e-06, 4.470348358154297e-06, 4.649162292480469e-06, 4.827976226806641e-06, 5.0067901611328125e-06, 5.185604095458984e-06, 5.364418029785156e-06, 5.543231964111328e-06, 5.7220458984375e-06, 5.900859832763672e-06, 6.079673767089844e-06, 6.258487701416016e-06, 6.4373016357421875e-06]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 4.0, 6.0, 5.0, 21.0, 26.0, 46.0, 102.0, 285.0, 862.0, 2893.0, 10287.0, 44123.0, 928652.0, 46300.0, 10524.0, 2989.0, 880.0, 291.0, 117.0, 40.0, 23.0, 15.0, 9.0, 5.0, 3.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01104736328125, -0.010696768760681152, -0.010346174240112305, -0.009995579719543457, -0.00964498519897461, -0.009294390678405762, -0.008943796157836914, -0.008593201637268066, -0.008242607116699219, -0.007892012596130371, -0.0075414180755615234, -0.007190823554992676, -0.006840229034423828, -0.0064896345138549805, -0.006139039993286133, -0.005788445472717285, -0.0054378509521484375, -0.00508725643157959, -0.004736661911010742, -0.0043860673904418945, -0.004035472869873047, -0.0036848783493041992, -0.0033342838287353516, -0.002983689308166504, -0.0026330947875976562, -0.0022825002670288086, -0.001931905746459961, -0.0015813112258911133, -0.0012307167053222656, -0.000880122184753418, -0.0005295276641845703, -0.00017893314361572266, 0.000171661376953125, 0.0005222558975219727, 0.0008728504180908203, 0.001223444938659668, 0.0015740394592285156, 0.0019246339797973633, 0.002275228500366211, 0.0026258230209350586, 0.0029764175415039062, 0.003327012062072754, 0.0036776065826416016, 0.004028201103210449, 0.004378795623779297, 0.0047293901443481445, 0.005079984664916992, 0.00543057918548584, 0.0057811737060546875, 0.006131768226623535, 0.006482362747192383, 0.0068329572677612305, 0.007183551788330078, 0.007534146308898926, 0.007884740829467773, 0.008235335350036621, 0.008585929870605469, 0.008936524391174316, 0.009287118911743164, 0.009637713432312012, 0.00998830795288086, 0.010338902473449707, 0.010689496994018555, 0.011040091514587402, 0.01139068603515625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 8.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 8.0, 4.0, 9.0, 17.0, 23.0, 36.0, 63.0, 110.0, 147.0, 172.0, 132.0, 87.0, 41.0, 30.0, 15.0, 12.0, 8.0, 13.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008254051208496094, -0.0007981434464454651, -0.0007708817720413208, -0.0007436200976371765, -0.0007163584232330322, -0.0006890967488288879, -0.0006618350744247437, -0.0006345734000205994, -0.0006073117256164551, -0.0005800500512123108, -0.0005527883768081665, -0.0005255267024040222, -0.0004982650279998779, -0.00047100335359573364, -0.00044374167919158936, -0.00041648000478744507, -0.0003892183303833008, -0.0003619566559791565, -0.0003346949815750122, -0.0003074333071708679, -0.00028017163276672363, -0.00025290995836257935, -0.00022564828395843506, -0.00019838660955429077, -0.00017112493515014648, -0.0001438632607460022, -0.00011660158634185791, -8.933991193771362e-05, -6.207823753356934e-05, -3.481656312942505e-05, -7.554888725280762e-06, 1.9706785678863525e-05, 4.696846008300781e-05, 7.42301344871521e-05, 0.00010149180889129639, 0.00012875348329544067, 0.00015601515769958496, 0.00018327683210372925, 0.00021053850650787354, 0.00023780018091201782, 0.0002650618553161621, 0.0002923235297203064, 0.0003195852041244507, 0.00034684687852859497, 0.00037410855293273926, 0.00040137022733688354, 0.00042863190174102783, 0.0004558935761451721, 0.0004831552505493164, 0.0005104169249534607, 0.000537678599357605, 0.0005649402737617493, 0.0005922019481658936, 0.0006194636225700378, 0.0006467252969741821, 0.0006739869713783264, 0.0007012486457824707, 0.000728510320186615, 0.0007557719945907593, 0.0007830336689949036, 0.0008102953433990479, 0.0008375570178031921, 0.0008648186922073364, 0.0008920803666114807, 0.000919342041015625]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 8.0, 5.0, 7.0, 5.0, 4.0, 8.0, 19.0, 11.0, 17.0, 38.0, 35.0, 57.0, 69.0, 90.0, 120.0, 148.0, 82.0, 65.0, 41.0, 35.0, 34.0, 16.0, 14.0, 11.0, 10.0, 13.0, 7.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.08864366263151169, -0.08647649735212326, -0.08430933207273483, -0.0821421667933464, -0.07997500151395798, -0.07780783623456955, -0.07564067095518112, -0.0734735056757927, -0.07130634039640427, -0.06913917511701584, -0.06697200983762741, -0.06480484455823898, -0.06263767927885056, -0.06047051399946213, -0.0583033487200737, -0.05613618344068527, -0.053969018161296844, -0.05180185288190842, -0.04963468760251999, -0.04746752232313156, -0.045300357043743134, -0.043133191764354706, -0.04096602648496628, -0.03879886120557785, -0.03663169592618942, -0.034464530646800995, -0.03229736536741257, -0.03013020008802414, -0.02796303480863571, -0.025795869529247284, -0.023628704249858856, -0.02146153897047043, -0.019294381141662598, -0.01712721586227417, -0.014960050582885742, -0.012792885303497314, -0.010625720024108887, -0.008458554744720459, -0.006291389465332031, -0.0041242241859436035, -0.0019570589065551758, 0.00021010637283325195, 0.0023772716522216797, 0.004544436931610107, 0.006711602210998535, 0.008878767490386963, 0.01104593276977539, 0.013213098049163818, 0.015380263328552246, 0.017547428607940674, 0.0197145938873291, 0.02188175916671753, 0.024048924446105957, 0.026216089725494385, 0.028383255004882812, 0.03055042028427124, 0.03271758556365967, 0.034884750843048096, 0.03705191612243652, 0.03921908140182495, 0.04138624668121338, 0.04355341196060181, 0.045720577239990234, 0.04788774251937866, 0.05005490779876709]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 6.0, 9.0, 13.0, 9.0, 21.0, 23.0, 30.0, 32.0, 33.0, 28.0, 28.0, 37.0, 38.0, 32.0, 39.0, 39.0, 45.0, 43.0, 50.0, 45.0, 39.0, 32.0, 44.0, 44.0, 36.0, 33.0, 27.0, 24.0, 16.0, 12.0, 19.0, 18.0, 18.0, 5.0, 4.0, 4.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0564374141395092, -0.05492740124464035, -0.0534173920750618, -0.051907382905483246, -0.050397370010614395, -0.048887357115745544, -0.04737734794616699, -0.04586733877658844, -0.04435732588171959, -0.04284731298685074, -0.041337303817272186, -0.039827294647693634, -0.03831728175282478, -0.03680726885795593, -0.03529725968837738, -0.03378725051879883, -0.03227723762392998, -0.030767226591706276, -0.029257215559482574, -0.027747204527258873, -0.02623719349503517, -0.02472718246281147, -0.02321717143058777, -0.021707160398364067, -0.020197149366140366, -0.018687138333916664, -0.017177127301692963, -0.01566711626946926, -0.01415710523724556, -0.012647094205021858, -0.011137083172798157, -0.009627072140574455, -0.008117064833641052, -0.006607053801417351, -0.005097042769193649, -0.003587031736969948, -0.0020770207047462463, -0.0005670096725225449, 0.0009430013597011566, 0.002453012391924858, 0.00396302342414856, 0.005473034456372261, 0.0069830454885959625, 0.008493056520819664, 0.010003067553043365, 0.011513078585267067, 0.013023089617490768, 0.01453310064971447, 0.01604311168193817, 0.017553122714161873, 0.019063133746385574, 0.020573144778609276, 0.022083155810832977, 0.02359316684305668, 0.02510317787528038, 0.02661318890750408, 0.028123199939727783, 0.029633210971951485, 0.031143222004175186, 0.03265323489904404, 0.03416324406862259, 0.03567325323820114, 0.03718326613306999, 0.03869327902793884, 0.040203288197517395]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 8.0, 14.0, 22.0, 38.0, 48.0, 75.0, 133.0, 225.0, 337.0, 514.0, 812.0, 1468.0, 2470.0, 4300.0, 8325.0, 15822.0, 31289.0, 65514.0, 154078.0, 376443.0, 217381.0, 86200.0, 40145.0, 19592.0, 10319.0, 5582.0, 2995.0, 1839.0, 975.0, 551.0, 370.0, 217.0, 144.0, 98.0, 55.0, 38.0, 38.0, 27.0, 17.0, 16.0, 7.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10076904296875, -0.09768486022949219, -0.09460067749023438, -0.09151649475097656, -0.08843231201171875, -0.08534812927246094, -0.08226394653320312, -0.07917976379394531, -0.0760955810546875, -0.07301139831542969, -0.06992721557617188, -0.06684303283691406, -0.06375885009765625, -0.06067466735839844, -0.057590484619140625, -0.05450630187988281, -0.051422119140625, -0.04833793640136719, -0.045253753662109375, -0.04216957092285156, -0.03908538818359375, -0.03600120544433594, -0.032917022705078125, -0.029832839965820312, -0.0267486572265625, -0.023664474487304688, -0.020580291748046875, -0.017496109008789062, -0.01441192626953125, -0.011327743530273438, -0.008243560791015625, -0.0051593780517578125, -0.0020751953125, 0.0010089874267578125, 0.004093170166015625, 0.0071773529052734375, 0.01026153564453125, 0.013345718383789062, 0.016429901123046875, 0.019514083862304688, 0.0225982666015625, 0.025682449340820312, 0.028766632080078125, 0.03185081481933594, 0.03493499755859375, 0.03801918029785156, 0.041103363037109375, 0.04418754577636719, 0.047271728515625, 0.05035591125488281, 0.053440093994140625, 0.05652427673339844, 0.05960845947265625, 0.06269264221191406, 0.06577682495117188, 0.06886100769042969, 0.0719451904296875, 0.07502937316894531, 0.07811355590820312, 0.08119773864746094, 0.08428192138671875, 0.08736610412597656, 0.09045028686523438, 0.09353446960449219, 0.09661865234375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 2.0, 10.0, 10.0, 21.0, 24.0, 19.0, 36.0, 23.0, 27.0, 35.0, 35.0, 39.0, 45.0, 41.0, 56.0, 43.0, 56.0, 49.0, 48.0, 54.0, 43.0, 46.0, 33.0, 27.0, 29.0, 32.0, 17.0, 17.0, 23.0, 11.0, 13.0, 5.0, 3.0, 10.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026885986328125, -0.02614307403564453, -0.025400161743164062, -0.024657249450683594, -0.023914337158203125, -0.023171424865722656, -0.022428512573242188, -0.02168560028076172, -0.02094268798828125, -0.02019977569580078, -0.019456863403320312, -0.018713951110839844, -0.017971038818359375, -0.017228126525878906, -0.016485214233398438, -0.01574230194091797, -0.0149993896484375, -0.014256477355957031, -0.013513565063476562, -0.012770652770996094, -0.012027740478515625, -0.011284828186035156, -0.010541915893554688, -0.009799003601074219, -0.00905609130859375, -0.008313179016113281, -0.0075702667236328125, -0.006827354431152344, -0.006084442138671875, -0.005341529846191406, -0.0045986175537109375, -0.0038557052612304688, -0.00311279296875, -0.0023698806762695312, -0.0016269683837890625, -0.0008840560913085938, -0.000141143798828125, 0.0006017684936523438, 0.0013446807861328125, 0.0020875930786132812, 0.00283050537109375, 0.0035734176635742188, 0.0043163299560546875, 0.005059242248535156, 0.005802154541015625, 0.006545066833496094, 0.0072879791259765625, 0.008030891418457031, 0.0087738037109375, 0.009516716003417969, 0.010259628295898438, 0.011002540588378906, 0.011745452880859375, 0.012488365173339844, 0.013231277465820312, 0.013974189758300781, 0.01471710205078125, 0.015460014343261719, 0.016202926635742188, 0.016945838928222656, 0.017688751220703125, 0.018431663513183594, 0.019174575805664062, 0.01991748809814453, 0.020660400390625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 7.0, 8.0, 3.0, 10.0, 11.0, 16.0, 20.0, 24.0, 35.0, 52.0, 102.0, 176.0, 259.0, 466.0, 782.0, 1238.0, 2149.0, 3833.0, 6396.0, 11222.0, 19631.0, 35265.0, 67842.0, 141467.0, 303788.0, 233259.0, 104304.0, 51730.0, 27707.0, 15384.0, 8819.0, 5049.0, 3082.0, 1705.0, 1063.0, 614.0, 377.0, 230.0, 150.0, 98.0, 58.0, 32.0, 29.0, 15.0, 15.0, 9.0, 3.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.058868408203125, -0.05707359313964844, -0.055278778076171875, -0.05348396301269531, -0.05168914794921875, -0.04989433288574219, -0.048099517822265625, -0.04630470275878906, -0.0445098876953125, -0.04271507263183594, -0.040920257568359375, -0.03912544250488281, -0.03733062744140625, -0.03553581237792969, -0.033740997314453125, -0.03194618225097656, -0.0301513671875, -0.028356552124023438, -0.026561737060546875, -0.024766921997070312, -0.02297210693359375, -0.021177291870117188, -0.019382476806640625, -0.017587661743164062, -0.0157928466796875, -0.013998031616210938, -0.012203216552734375, -0.010408401489257812, -0.00861358642578125, -0.0068187713623046875, -0.005023956298828125, -0.0032291412353515625, -0.001434326171875, 0.0003604888916015625, 0.002155303955078125, 0.0039501190185546875, 0.00574493408203125, 0.0075397491455078125, 0.009334564208984375, 0.011129379272460938, 0.0129241943359375, 0.014719009399414062, 0.016513824462890625, 0.018308639526367188, 0.02010345458984375, 0.021898269653320312, 0.023693084716796875, 0.025487899780273438, 0.02728271484375, 0.029077529907226562, 0.030872344970703125, 0.03266716003417969, 0.03446197509765625, 0.03625679016113281, 0.038051605224609375, 0.03984642028808594, 0.0416412353515625, 0.04343605041503906, 0.045230865478515625, 0.04702568054199219, 0.04882049560546875, 0.05061531066894531, 0.052410125732421875, 0.05420494079589844, 0.055999755859375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 9.0, 5.0, 6.0, 8.0, 12.0, 15.0, 14.0, 15.0, 13.0, 28.0, 23.0, 37.0, 30.0, 29.0, 33.0, 23.0, 32.0, 41.0, 29.0, 34.0, 41.0, 37.0, 36.0, 37.0, 49.0, 36.0, 25.0, 35.0, 23.0, 28.0, 34.0, 21.0, 19.0, 15.0, 19.0, 15.0, 17.0, 14.0, 12.0, 6.0, 10.0, 10.0, 1.0, 9.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.01474761962890625, -0.014261126518249512, -0.013774633407592773, -0.013288140296936035, -0.012801647186279297, -0.012315154075622559, -0.01182866096496582, -0.011342167854309082, -0.010855674743652344, -0.010369181632995605, -0.009882688522338867, -0.009396195411682129, -0.00890970230102539, -0.008423209190368652, -0.007936716079711914, -0.007450222969055176, -0.0069637298583984375, -0.006477236747741699, -0.005990743637084961, -0.005504250526428223, -0.005017757415771484, -0.004531264305114746, -0.004044771194458008, -0.0035582780838012695, -0.0030717849731445312, -0.002585291862487793, -0.0020987987518310547, -0.0016123056411743164, -0.0011258125305175781, -0.0006393194198608398, -0.00015282630920410156, 0.0003336668014526367, 0.000820159912109375, 0.0013066530227661133, 0.0017931461334228516, 0.00227963924407959, 0.002766132354736328, 0.0032526254653930664, 0.0037391185760498047, 0.004225611686706543, 0.004712104797363281, 0.0051985979080200195, 0.005685091018676758, 0.006171584129333496, 0.006658077239990234, 0.007144570350646973, 0.007631063461303711, 0.00811755657196045, 0.008604049682617188, 0.009090542793273926, 0.009577035903930664, 0.010063529014587402, 0.01055002212524414, 0.011036515235900879, 0.011523008346557617, 0.012009501457214355, 0.012495994567871094, 0.012982487678527832, 0.01346898078918457, 0.013955473899841309, 0.014441967010498047, 0.014928460121154785, 0.015414953231811523, 0.01590144634246826, 0.016387939453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 21.0, 24.0, 31.0, 33.0, 71.0, 74.0, 105.0, 147.0, 271.0, 372.0, 616.0, 935.0, 1646.0, 2936.0, 5245.0, 10487.0, 23345.0, 60586.0, 236216.0, 524962.0, 111311.0, 36476.0, 15455.0, 7458.0, 3944.0, 2248.0, 1346.0, 750.0, 493.0, 313.0, 214.0, 122.0, 77.0, 78.0, 39.0, 37.0, 15.0, 14.0, 8.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0020389556884765625, -0.0019737184047698975, -0.0019084811210632324, -0.0018432438373565674, -0.0017780065536499023, -0.0017127692699432373, -0.0016475319862365723, -0.0015822947025299072, -0.0015170574188232422, -0.0014518201351165771, -0.0013865828514099121, -0.001321345567703247, -0.001256108283996582, -0.001190871000289917, -0.001125633716583252, -0.001060396432876587, -0.0009951591491699219, -0.0009299218654632568, -0.0008646845817565918, -0.0007994472980499268, -0.0007342100143432617, -0.0006689727306365967, -0.0006037354469299316, -0.0005384981632232666, -0.00047326087951660156, -0.0004080235958099365, -0.0003427863121032715, -0.00027754902839660645, -0.0002123117446899414, -0.00014707446098327637, -8.183717727661133e-05, -1.659989356994629e-05, 4.863739013671875e-05, 0.00011387467384338379, 0.00017911195755004883, 0.00024434924125671387, 0.0003095865249633789, 0.00037482380867004395, 0.000440061092376709, 0.000505298376083374, 0.0005705356597900391, 0.0006357729434967041, 0.0007010102272033691, 0.0007662475109100342, 0.0008314847946166992, 0.0008967220783233643, 0.0009619593620300293, 0.0010271966457366943, 0.0010924339294433594, 0.0011576712131500244, 0.0012229084968566895, 0.0012881457805633545, 0.0013533830642700195, 0.0014186203479766846, 0.0014838576316833496, 0.0015490949153900146, 0.0016143321990966797, 0.0016795694828033447, 0.0017448067665100098, 0.0018100440502166748, 0.0018752813339233398, 0.0019405186176300049, 0.00200575590133667, 0.002070993185043335, 0.00213623046875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 6.0, 6.0, 12.0, 10.0, 28.0, 13.0, 41.0, 30.0, 75.0, 61.0, 103.0, 146.0, 115.0, 117.0, 61.0, 52.0, 21.0, 26.0, 20.0, 9.0, 11.0, 7.0, 4.0, 3.0, 3.0, 3.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.854534149169922e-06, -6.650574505329132e-06, -6.446614861488342e-06, -6.2426552176475525e-06, -6.038695573806763e-06, -5.834735929965973e-06, -5.630776286125183e-06, -5.426816642284393e-06, -5.2228569984436035e-06, -5.018897354602814e-06, -4.814937710762024e-06, -4.610978066921234e-06, -4.407018423080444e-06, -4.2030587792396545e-06, -3.999099135398865e-06, -3.795139491558075e-06, -3.591179847717285e-06, -3.3872202038764954e-06, -3.1832605600357056e-06, -2.9793009161949158e-06, -2.775341272354126e-06, -2.571381628513336e-06, -2.3674219846725464e-06, -2.1634623408317566e-06, -1.959502696990967e-06, -1.755543053150177e-06, -1.5515834093093872e-06, -1.3476237654685974e-06, -1.1436641216278076e-06, -9.397044777870178e-07, -7.35744833946228e-07, -5.317851901054382e-07, -3.2782554626464844e-07, -1.2386590242385864e-07, 8.009374141693115e-08, 2.8405338525772095e-07, 4.880130290985107e-07, 6.919726729393005e-07, 8.959323167800903e-07, 1.0998919606208801e-06, 1.30385160446167e-06, 1.5078112483024597e-06, 1.7117708921432495e-06, 1.9157305359840393e-06, 2.119690179824829e-06, 2.323649823665619e-06, 2.5276094675064087e-06, 2.7315691113471985e-06, 2.9355287551879883e-06, 3.139488399028778e-06, 3.343448042869568e-06, 3.5474076867103577e-06, 3.7513673305511475e-06, 3.955326974391937e-06, 4.159286618232727e-06, 4.363246262073517e-06, 4.567205905914307e-06, 4.7711655497550964e-06, 4.975125193595886e-06, 5.179084837436676e-06, 5.383044481277466e-06, 5.587004125118256e-06, 5.790963768959045e-06, 5.994923412799835e-06, 6.198883056640625e-06]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 7.0, 1.0, 5.0, 5.0, 11.0, 35.0, 38.0, 58.0, 94.0, 138.0, 212.0, 367.0, 586.0, 949.0, 1748.0, 2688.0, 4827.0, 8296.0, 14556.0, 26888.0, 52286.0, 109878.0, 258357.0, 302146.0, 133113.0, 60911.0, 31051.0, 16633.0, 9489.0, 5377.0, 3168.0, 1863.0, 1064.0, 641.0, 390.0, 258.0, 160.0, 97.0, 61.0, 40.0, 32.0, 13.0, 10.0, 5.0, 8.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008082389831542969, -0.0007845461368560791, -0.0007608532905578613, -0.0007371604442596436, -0.0007134675979614258, -0.000689774751663208, -0.0006660819053649902, -0.0006423890590667725, -0.0006186962127685547, -0.0005950033664703369, -0.0005713105201721191, -0.0005476176738739014, -0.0005239248275756836, -0.0005002319812774658, -0.00047653913497924805, -0.0004528462886810303, -0.0004291534423828125, -0.0004054605960845947, -0.00038176774978637695, -0.0003580749034881592, -0.0003343820571899414, -0.00031068921089172363, -0.00028699636459350586, -0.0002633035182952881, -0.0002396106719970703, -0.00021591782569885254, -0.00019222497940063477, -0.000168532133102417, -0.00014483928680419922, -0.00012114644050598145, -9.745359420776367e-05, -7.37607479095459e-05, -5.0067901611328125e-05, -2.637505531311035e-05, -2.682209014892578e-06, 2.1010637283325195e-05, 4.470348358154297e-05, 6.839632987976074e-05, 9.208917617797852e-05, 0.00011578202247619629, 0.00013947486877441406, 0.00016316771507263184, 0.0001868605613708496, 0.00021055340766906738, 0.00023424625396728516, 0.00025793910026550293, 0.0002816319465637207, 0.0003053247928619385, 0.00032901763916015625, 0.000352710485458374, 0.0003764033317565918, 0.00040009617805480957, 0.00042378902435302734, 0.0004474818706512451, 0.0004711747169494629, 0.0004948675632476807, 0.0005185604095458984, 0.0005422532558441162, 0.000565946102142334, 0.0005896389484405518, 0.0006133317947387695, 0.0006370246410369873, 0.0006607174873352051, 0.0006844103336334229, 0.0007081031799316406]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 5.0, 2.0, 11.0, 11.0, 12.0, 11.0, 17.0, 12.0, 17.0, 23.0, 25.0, 39.0, 30.0, 37.0, 41.0, 41.0, 48.0, 46.0, 53.0, 37.0, 43.0, 55.0, 49.0, 33.0, 48.0, 44.0, 40.0, 22.0, 18.0, 21.0, 29.0, 15.0, 18.0, 15.0, 6.0, 2.0, 4.0, 8.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019359588623046875, -0.0001864507794380188, -0.00017930567264556885, -0.0001721605658531189, -0.00016501545906066895, -0.000157870352268219, -0.00015072524547576904, -0.0001435801386833191, -0.00013643503189086914, -0.0001292899250984192, -0.00012214481830596924, -0.00011499971151351929, -0.00010785460472106934, -0.00010070949792861938, -9.356439113616943e-05, -8.641928434371948e-05, -7.927417755126953e-05, -7.212907075881958e-05, -6.498396396636963e-05, -5.783885717391968e-05, -5.0693750381469727e-05, -4.3548643589019775e-05, -3.6403536796569824e-05, -2.9258430004119873e-05, -2.2113323211669922e-05, -1.496821641921997e-05, -7.82310962677002e-06, -6.780028343200684e-07, 6.467103958129883e-06, 1.3612210750579834e-05, 2.0757317543029785e-05, 2.7902424335479736e-05, 3.504753112792969e-05, 4.219263792037964e-05, 4.933774471282959e-05, 5.648285150527954e-05, 6.362795829772949e-05, 7.077306509017944e-05, 7.79181718826294e-05, 8.506327867507935e-05, 9.22083854675293e-05, 9.935349225997925e-05, 0.0001064985990524292, 0.00011364370584487915, 0.0001207888126373291, 0.00012793391942977905, 0.000135079026222229, 0.00014222413301467896, 0.0001493692398071289, 0.00015651434659957886, 0.0001636594533920288, 0.00017080456018447876, 0.0001779496669769287, 0.00018509477376937866, 0.0001922398805618286, 0.00019938498735427856, 0.00020653009414672852, 0.00021367520093917847, 0.00022082030773162842, 0.00022796541452407837, 0.00023511052131652832, 0.00024225562810897827, 0.0002494007349014282, 0.0002565458416938782, 0.0002636909484863281]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 16.0, 16.0, 20.0, 34.0, 65.0, 85.0, 152.0, 207.0, 131.0, 90.0, 51.0, 42.0, 25.0, 11.0, 14.0, 9.0, 11.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07028557360172272, -0.06850417703390121, -0.06672278791666031, -0.0649413913488388, -0.0631600022315979, -0.0613786056637764, -0.059597212821245193, -0.05781581997871399, -0.05603442341089249, -0.05425303056836128, -0.05247163772583008, -0.050690241158008575, -0.04890884831547737, -0.04712745547294617, -0.04534606263041496, -0.04356466978788376, -0.041783276945352554, -0.04000188410282135, -0.038220491260290146, -0.03643909841775894, -0.03465770184993744, -0.032876309007406235, -0.03109491616487503, -0.029313523322343826, -0.027532128617167473, -0.02575073577463627, -0.023969341069459915, -0.02218794822692871, -0.020406555384397507, -0.018625160679221153, -0.01684376783668995, -0.01506237406283617, -0.013280976563692093, -0.011499582789838314, -0.009718189015984535, -0.007936796173453331, -0.006155402399599552, -0.004374008625745773, -0.002592615783214569, -0.0008112220093607903, 0.0009701717644929886, 0.0027515653055161238, 0.004532958846539259, 0.0063143521547317505, 0.00809574592858553, 0.009877139702439308, 0.011658532544970512, 0.013439926318824291, 0.01522132009267807, 0.017002712935209274, 0.018784107640385628, 0.020565500482916832, 0.022346895188093185, 0.02412828803062439, 0.025909680873155594, 0.027691073715686798, 0.02947246842086315, 0.031253863126039505, 0.03303525596857071, 0.03481664881110191, 0.03659804165363312, 0.03837943822145462, 0.040160827338695526, 0.04194222390651703, 0.04372361674904823]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 10.0, 12.0, 21.0, 17.0, 18.0, 15.0, 35.0, 37.0, 39.0, 42.0, 53.0, 50.0, 40.0, 53.0, 49.0, 61.0, 62.0, 56.0, 46.0, 44.0, 35.0, 39.0, 26.0, 41.0, 22.0, 17.0, 11.0, 11.0, 14.0, 2.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0366097018122673, -0.035617489367723465, -0.034625280648469925, -0.033633068203926086, -0.032640859484672546, -0.03164864704012871, -0.03065643645823002, -0.02966422587633133, -0.02867201343178749, -0.0276798028498888, -0.026687592267990112, -0.025695379823446274, -0.024703169241547585, -0.023710958659648895, -0.022718748077750206, -0.021726537495851517, -0.020734326913952827, -0.019742116332054138, -0.01874990575015545, -0.01775769516825676, -0.01676548272371292, -0.015773272141814232, -0.014781061559915543, -0.013788850978016853, -0.01279663946479559, -0.0118044288828969, -0.010812217369675636, -0.009820006787776947, -0.008827796205878258, -0.007835584692656994, -0.006843374110758305, -0.005851163063198328, -0.0048589520156383514, -0.003866740968078375, -0.002874530153349042, -0.001882319338619709, -0.0008901082910597324, 0.00010210275650024414, 0.0010943133383989334, 0.00208652438595891, 0.0030787354335188866, 0.004070946481078863, 0.00506315752863884, 0.006055368110537529, 0.007047579158097506, 0.008039790205657482, 0.009032000787556171, 0.010024212300777435, 0.011016422882676125, 0.012008633464574814, 0.013000844977796078, 0.013993055559694767, 0.014985267072916031, 0.01597747765481472, 0.01696968823671341, 0.0179618988186121, 0.018954109400510788, 0.019946319982409477, 0.020938530564308167, 0.021930743008852005, 0.022922953590750694, 0.023915164172649384, 0.024907374754548073, 0.025899585336446762, 0.0268917977809906]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 5.0, 11.0, 28.0, 43.0, 63.0, 114.0, 168.0, 281.0, 409.0, 634.0, 1058.0, 2735.0, 43880.0, 3973486.0, 161275.0, 6072.0, 1582.0, 909.0, 602.0, 399.0, 230.0, 131.0, 65.0, 39.0, 30.0, 14.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.0623779296875, -0.06098175048828125, -0.0595855712890625, -0.05818939208984375, -0.056793212890625, -0.05539703369140625, -0.0540008544921875, -0.05260467529296875, -0.05120849609375, -0.04981231689453125, -0.0484161376953125, -0.04701995849609375, -0.045623779296875, -0.04422760009765625, -0.0428314208984375, -0.04143524169921875, -0.0400390625, -0.03864288330078125, -0.0372467041015625, -0.03585052490234375, -0.034454345703125, -0.03305816650390625, -0.0316619873046875, -0.03026580810546875, -0.02886962890625, -0.02747344970703125, -0.0260772705078125, -0.02468109130859375, -0.023284912109375, -0.02188873291015625, -0.0204925537109375, -0.01909637451171875, -0.0177001953125, -0.01630401611328125, -0.0149078369140625, -0.01351165771484375, -0.012115478515625, -0.01071929931640625, -0.0093231201171875, -0.00792694091796875, -0.00653076171875, -0.00513458251953125, -0.0037384033203125, -0.00234222412109375, -0.000946044921875, 0.00045013427734375, 0.0018463134765625, 0.00324249267578125, 0.004638671875, 0.00603485107421875, 0.0074310302734375, 0.00882720947265625, 0.010223388671875, 0.01161956787109375, 0.0130157470703125, 0.01441192626953125, 0.01580810546875, 0.01720428466796875, 0.0186004638671875, 0.01999664306640625, 0.021392822265625, 0.02278900146484375, 0.0241851806640625, 0.02558135986328125, 0.0269775390625]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 15.0, 25.0, 18.0, 26.0, 37.0, 38.0, 72.0, 65.0, 84.0, 71.0, 80.0, 88.0, 78.0, 79.0, 55.0, 41.0, 38.0, 39.0, 19.0, 13.0, 10.0, 9.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.05633544921875, -0.05506753921508789, -0.05379962921142578, -0.05253171920776367, -0.05126380920410156, -0.04999589920043945, -0.048727989196777344, -0.047460079193115234, -0.046192169189453125, -0.044924259185791016, -0.043656349182128906, -0.0423884391784668, -0.04112052917480469, -0.03985261917114258, -0.03858470916748047, -0.03731679916381836, -0.03604888916015625, -0.03478097915649414, -0.03351306915283203, -0.03224515914916992, -0.030977249145507812, -0.029709339141845703, -0.028441429138183594, -0.027173519134521484, -0.025905609130859375, -0.024637699127197266, -0.023369789123535156, -0.022101879119873047, -0.020833969116210938, -0.019566059112548828, -0.01829814910888672, -0.01703023910522461, -0.0157623291015625, -0.01449441909790039, -0.013226509094238281, -0.011958599090576172, -0.010690689086914062, -0.009422779083251953, -0.008154869079589844, -0.006886959075927734, -0.005619049072265625, -0.004351139068603516, -0.0030832290649414062, -0.0018153190612792969, -0.0005474090576171875, 0.0007205009460449219, 0.0019884109497070312, 0.0032563209533691406, 0.00452423095703125, 0.005792140960693359, 0.007060050964355469, 0.008327960968017578, 0.009595870971679688, 0.010863780975341797, 0.012131690979003906, 0.013399600982666016, 0.014667510986328125, 0.015935420989990234, 0.017203330993652344, 0.018471240997314453, 0.019739151000976562, 0.021007061004638672, 0.02227497100830078, 0.02354288101196289, 0.024810791015625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 15.0, 15.0, 39.0, 75.0, 180.0, 417.0, 942.0, 2706.0, 13264.0, 4112883.0, 56864.0, 4501.0, 1397.0, 531.0, 246.0, 117.0, 59.0, 15.0, 10.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0924072265625, -0.08907032012939453, -0.08573341369628906, -0.0823965072631836, -0.07905960083007812, -0.07572269439697266, -0.07238578796386719, -0.06904888153076172, -0.06571197509765625, -0.06237506866455078, -0.05903816223144531, -0.055701255798339844, -0.052364349365234375, -0.049027442932128906, -0.04569053649902344, -0.04235363006591797, -0.0390167236328125, -0.03567981719970703, -0.03234291076660156, -0.029006004333496094, -0.025669097900390625, -0.022332191467285156, -0.018995285034179688, -0.01565837860107422, -0.01232147216796875, -0.008984565734863281, -0.0056476593017578125, -0.0023107528686523438, 0.001026153564453125, 0.004363059997558594, 0.0076999664306640625, 0.011036872863769531, 0.014373779296875, 0.01771068572998047, 0.021047592163085938, 0.024384498596191406, 0.027721405029296875, 0.031058311462402344, 0.03439521789550781, 0.03773212432861328, 0.04106903076171875, 0.04440593719482422, 0.04774284362792969, 0.051079750061035156, 0.054416656494140625, 0.057753562927246094, 0.06109046936035156, 0.06442737579345703, 0.0677642822265625, 0.07110118865966797, 0.07443809509277344, 0.0777750015258789, 0.08111190795898438, 0.08444881439208984, 0.08778572082519531, 0.09112262725830078, 0.09445953369140625, 0.09779644012451172, 0.10113334655761719, 0.10447025299072266, 0.10780715942382812, 0.1111440658569336, 0.11448097229003906, 0.11781787872314453, 0.12115478515625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 8.0, 22.0, 42.0, 142.0, 432.0, 2863.0, 374.0, 101.0, 39.0, 17.0, 5.0, 4.0, 2.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01282501220703125, -0.012462973594665527, -0.012100934982299805, -0.011738896369934082, -0.01137685775756836, -0.011014819145202637, -0.010652780532836914, -0.010290741920471191, -0.009928703308105469, -0.009566664695739746, -0.009204626083374023, -0.0088425874710083, -0.008480548858642578, -0.008118510246276855, -0.007756471633911133, -0.00739443302154541, -0.0070323944091796875, -0.006670355796813965, -0.006308317184448242, -0.0059462785720825195, -0.005584239959716797, -0.005222201347351074, -0.0048601627349853516, -0.004498124122619629, -0.004136085510253906, -0.0037740468978881836, -0.003412008285522461, -0.0030499696731567383, -0.0026879310607910156, -0.002325892448425293, -0.0019638538360595703, -0.0016018152236938477, -0.001239776611328125, -0.0008777379989624023, -0.0005156993865966797, -0.00015366077423095703, 0.00020837783813476562, 0.0005704164505004883, 0.0009324550628662109, 0.0012944936752319336, 0.0016565322875976562, 0.002018570899963379, 0.0023806095123291016, 0.0027426481246948242, 0.003104686737060547, 0.0034667253494262695, 0.003828763961791992, 0.004190802574157715, 0.0045528411865234375, 0.00491487979888916, 0.005276918411254883, 0.0056389570236206055, 0.006000995635986328, 0.006363034248352051, 0.0067250728607177734, 0.007087111473083496, 0.007449150085449219, 0.007811188697814941, 0.008173227310180664, 0.008535265922546387, 0.00889730453491211, 0.009259343147277832, 0.009621381759643555, 0.009983420372009277, 0.010345458984375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 7.0, 13.0, 6.0, 17.0, 17.0, 27.0, 42.0, 50.0, 63.0, 112.0, 159.0, 121.0, 82.0, 73.0, 54.0, 33.0, 31.0, 17.0, 12.0, 12.0, 9.0, 9.0, 2.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.037831734865903854, -0.036777280271053314, -0.03572282940149307, -0.03466837480664253, -0.03361392393708229, -0.03255946934223175, -0.03150501847267151, -0.03045056387782097, -0.02939610928297043, -0.028341656550765038, -0.027287203818559647, -0.026232749223709106, -0.025178296491503716, -0.024123843759298325, -0.023069391027092934, -0.022014938294887543, -0.020960485562682152, -0.01990603283047676, -0.01885158009827137, -0.01779712736606598, -0.01674267277121544, -0.015688220039010048, -0.014633767306804657, -0.013579314574599266, -0.0125248609110713, -0.01147040817886591, -0.010415954515337944, -0.009361501783132553, -0.008307049050927162, -0.007252595387399197, -0.006198142655193806, -0.0051436894573271275, -0.0040892381221055984, -0.00303478492423892, -0.0019803319592028856, -0.000925878994166851, 0.0001285742036998272, 0.0011830274015665054, 0.0022374801337718964, 0.0032919333316385746, 0.004346386529505253, 0.005400839727371931, 0.006455292925238609, 0.007509745657444, 0.008564198389649391, 0.009618652053177357, 0.010673104785382748, 0.011727558448910713, 0.012782011181116104, 0.013836463913321495, 0.01489091757684946, 0.015945371240377426, 0.016999823972582817, 0.018054276704788208, 0.0191087294369936, 0.02016318216919899, 0.02121763676404953, 0.02227208949625492, 0.023326542228460312, 0.024380996823310852, 0.025435449555516243, 0.026489902287721634, 0.027544355019927025, 0.028598807752132416, 0.029653260484337807]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 7.0, 3.0, 10.0, 7.0, 9.0, 12.0, 18.0, 9.0, 16.0, 24.0, 21.0, 33.0, 47.0, 25.0, 44.0, 41.0, 35.0, 43.0, 48.0, 47.0, 42.0, 46.0, 50.0, 44.0, 39.0, 40.0, 38.0, 25.0, 25.0, 32.0, 28.0, 23.0, 10.0, 18.0, 9.0, 9.0, 8.0, 5.0, 6.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021671462804079056, -0.020974181592464447, -0.020276900380849838, -0.01957961916923523, -0.01888233795762062, -0.018185056746006012, -0.017487775534391403, -0.016790492460131645, -0.016093211248517036, -0.015395930036902428, -0.014698648825287819, -0.01400136761367321, -0.013304085470736027, -0.012606804259121418, -0.01190952304750681, -0.011212240904569626, -0.010514960624277592, -0.009817679412662983, -0.009120398201048374, -0.00842311605811119, -0.007725834846496582, -0.007028553634881973, -0.0063312724232673645, -0.005633990745991468, -0.00493670953437686, -0.004239428322762251, -0.003542146645486355, -0.002844865433871746, -0.0021475839894264936, -0.0014503025449812412, -0.0007530213333666325, -5.573965609073639e-05, 0.0006415415555238724, 0.0013388229999691248, 0.002036104444414377, 0.002733385656028986, 0.0034306671004742384, 0.004127948544919491, 0.0048252297565341, 0.005522511433809996, 0.006219792645424604, 0.006917073857039213, 0.007614355534315109, 0.008311636745929718, 0.009008917957544327, 0.009706199169158936, 0.010403480380773544, 0.011100762523710728, 0.011798043735325336, 0.012495324946939945, 0.013192606158554554, 0.013889888301491737, 0.014587169513106346, 0.015284450724720955, 0.015981731936335564, 0.016679013147950172, 0.01737629435956478, 0.01807357557117939, 0.018770856782794, 0.019468137994408607, 0.020165419206023216, 0.020862702280282974, 0.021559983491897583, 0.022257264703512192, 0.0229545459151268]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 5.0, 12.0, 19.0, 27.0, 41.0, 59.0, 83.0, 91.0, 156.0, 258.0, 375.0, 550.0, 831.0, 1368.0, 2327.0, 4256.0, 8167.0, 16652.0, 37379.0, 97063.0, 329795.0, 364656.0, 106826.0, 40178.0, 17709.0, 8664.0, 4483.0, 2404.0, 1516.0, 866.0, 544.0, 390.0, 263.0, 175.0, 114.0, 74.0, 56.0, 33.0, 20.0, 19.0, 18.0, 11.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.046417236328125, -0.044968605041503906, -0.04351997375488281, -0.04207134246826172, -0.040622711181640625, -0.03917407989501953, -0.03772544860839844, -0.036276817321777344, -0.03482818603515625, -0.033379554748535156, -0.03193092346191406, -0.03048229217529297, -0.029033660888671875, -0.02758502960205078, -0.026136398315429688, -0.024687767028808594, -0.0232391357421875, -0.021790504455566406, -0.020341873168945312, -0.01889324188232422, -0.017444610595703125, -0.01599597930908203, -0.014547348022460938, -0.013098716735839844, -0.01165008544921875, -0.010201454162597656, -0.008752822875976562, -0.007304191589355469, -0.005855560302734375, -0.004406929016113281, -0.0029582977294921875, -0.0015096664428710938, -6.103515625e-05, 0.0013875961303710938, 0.0028362274169921875, 0.004284858703613281, 0.005733489990234375, 0.007182121276855469, 0.008630752563476562, 0.010079383850097656, 0.01152801513671875, 0.012976646423339844, 0.014425277709960938, 0.01587390899658203, 0.017322540283203125, 0.01877117156982422, 0.020219802856445312, 0.021668434143066406, 0.0231170654296875, 0.024565696716308594, 0.026014328002929688, 0.02746295928955078, 0.028911590576171875, 0.03036022186279297, 0.03180885314941406, 0.033257484436035156, 0.03470611572265625, 0.036154747009277344, 0.03760337829589844, 0.03905200958251953, 0.040500640869140625, 0.04194927215576172, 0.04339790344238281, 0.044846534729003906, 0.046295166015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 11.0, 12.0, 12.0, 11.0, 13.0, 20.0, 15.0, 24.0, 26.0, 35.0, 43.0, 31.0, 45.0, 48.0, 50.0, 53.0, 43.0, 51.0, 47.0, 50.0, 51.0, 53.0, 30.0, 43.0, 23.0, 27.0, 31.0, 26.0, 13.0, 15.0, 11.0, 12.0, 4.0, 9.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0210113525390625, -0.020307064056396484, -0.01960277557373047, -0.018898487091064453, -0.018194198608398438, -0.017489910125732422, -0.016785621643066406, -0.01608133316040039, -0.015377044677734375, -0.01467275619506836, -0.013968467712402344, -0.013264179229736328, -0.012559890747070312, -0.011855602264404297, -0.011151313781738281, -0.010447025299072266, -0.00974273681640625, -0.009038448333740234, -0.008334159851074219, -0.007629871368408203, -0.0069255828857421875, -0.006221294403076172, -0.005517005920410156, -0.004812717437744141, -0.004108428955078125, -0.0034041404724121094, -0.0026998519897460938, -0.001995563507080078, -0.0012912750244140625, -0.0005869865417480469, 0.00011730194091796875, 0.0008215904235839844, 0.00152587890625, 0.0022301673889160156, 0.0029344558715820312, 0.003638744354248047, 0.0043430328369140625, 0.005047321319580078, 0.005751609802246094, 0.006455898284912109, 0.007160186767578125, 0.00786447525024414, 0.008568763732910156, 0.009273052215576172, 0.009977340698242188, 0.010681629180908203, 0.011385917663574219, 0.012090206146240234, 0.01279449462890625, 0.013498783111572266, 0.014203071594238281, 0.014907360076904297, 0.015611648559570312, 0.016315937042236328, 0.017020225524902344, 0.01772451400756836, 0.018428802490234375, 0.01913309097290039, 0.019837379455566406, 0.020541667938232422, 0.021245956420898438, 0.021950244903564453, 0.02265453338623047, 0.023358821868896484, 0.0240631103515625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 10.0, 7.0, 15.0, 24.0, 30.0, 44.0, 69.0, 92.0, 152.0, 196.0, 280.0, 388.0, 590.0, 933.0, 1340.0, 2081.0, 3292.0, 5392.0, 9310.0, 17347.0, 36247.0, 96417.0, 528541.0, 228771.0, 58980.0, 25515.0, 12961.0, 7290.0, 4331.0, 2691.0, 1710.0, 1093.0, 768.0, 477.0, 358.0, 244.0, 159.0, 123.0, 75.0, 60.0, 47.0, 32.0, 18.0, 16.0, 14.0, 12.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.03668212890625, -0.035562992095947266, -0.03444385528564453, -0.0333247184753418, -0.03220558166503906, -0.031086444854736328, -0.029967308044433594, -0.02884817123413086, -0.027729034423828125, -0.02660989761352539, -0.025490760803222656, -0.024371623992919922, -0.023252487182617188, -0.022133350372314453, -0.02101421356201172, -0.019895076751708984, -0.01877593994140625, -0.017656803131103516, -0.01653766632080078, -0.015418529510498047, -0.014299392700195312, -0.013180255889892578, -0.012061119079589844, -0.01094198226928711, -0.009822845458984375, -0.00870370864868164, -0.007584571838378906, -0.006465435028076172, -0.0053462982177734375, -0.004227161407470703, -0.0031080245971679688, -0.0019888877868652344, -0.0008697509765625, 0.0002493858337402344, 0.0013685226440429688, 0.002487659454345703, 0.0036067962646484375, 0.004725933074951172, 0.005845069885253906, 0.006964206695556641, 0.008083343505859375, 0.00920248031616211, 0.010321617126464844, 0.011440753936767578, 0.012559890747070312, 0.013679027557373047, 0.014798164367675781, 0.015917301177978516, 0.01703643798828125, 0.018155574798583984, 0.01927471160888672, 0.020393848419189453, 0.021512985229492188, 0.022632122039794922, 0.023751258850097656, 0.02487039566040039, 0.025989532470703125, 0.02710866928100586, 0.028227806091308594, 0.029346942901611328, 0.030466079711914062, 0.0315852165222168, 0.03270435333251953, 0.033823490142822266, 0.034942626953125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 4.0, 2.0, 9.0, 11.0, 11.0, 11.0, 13.0, 15.0, 17.0, 21.0, 23.0, 29.0, 27.0, 33.0, 27.0, 46.0, 40.0, 49.0, 51.0, 40.0, 38.0, 43.0, 40.0, 59.0, 39.0, 36.0, 37.0, 31.0, 31.0, 19.0, 25.0, 22.0, 21.0, 16.0, 13.0, 15.0, 11.0, 9.0, 3.0, 5.0, 2.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01275634765625, -0.0123521089553833, -0.011947870254516602, -0.011543631553649902, -0.011139392852783203, -0.010735154151916504, -0.010330915451049805, -0.009926676750183105, -0.009522438049316406, -0.009118199348449707, -0.008713960647583008, -0.008309721946716309, -0.00790548324584961, -0.00750124454498291, -0.007097005844116211, -0.006692767143249512, -0.0062885284423828125, -0.005884289741516113, -0.005480051040649414, -0.005075812339782715, -0.004671573638916016, -0.004267334938049316, -0.003863096237182617, -0.003458857536315918, -0.0030546188354492188, -0.0026503801345825195, -0.0022461414337158203, -0.001841902732849121, -0.0014376640319824219, -0.0010334253311157227, -0.0006291866302490234, -0.00022494792938232422, 0.000179290771484375, 0.0005835294723510742, 0.0009877681732177734, 0.0013920068740844727, 0.0017962455749511719, 0.002200484275817871, 0.0026047229766845703, 0.0030089616775512695, 0.0034132003784179688, 0.003817439079284668, 0.004221677780151367, 0.004625916481018066, 0.005030155181884766, 0.005434393882751465, 0.005838632583618164, 0.006242871284484863, 0.0066471099853515625, 0.007051348686218262, 0.007455587387084961, 0.00785982608795166, 0.00826406478881836, 0.008668303489685059, 0.009072542190551758, 0.009476780891418457, 0.009881019592285156, 0.010285258293151855, 0.010689496994018555, 0.011093735694885254, 0.011497974395751953, 0.011902213096618652, 0.012306451797485352, 0.01271069049835205, 0.01311492919921875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 9.0, 11.0, 14.0, 15.0, 20.0, 34.0, 61.0, 66.0, 69.0, 87.0, 146.0, 235.0, 263.0, 336.0, 485.0, 702.0, 1088.0, 1759.0, 4996.0, 113425.0, 910558.0, 8138.0, 2104.0, 1235.0, 730.0, 525.0, 379.0, 270.0, 177.0, 132.0, 132.0, 97.0, 64.0, 50.0, 38.0, 30.0, 22.0, 16.0, 12.0, 3.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00510406494140625, -0.004954516887664795, -0.00480496883392334, -0.004655420780181885, -0.00450587272644043, -0.004356324672698975, -0.0042067766189575195, -0.0040572285652160645, -0.003907680511474609, -0.0037581324577331543, -0.0036085844039916992, -0.003459036350250244, -0.003309488296508789, -0.003159940242767334, -0.003010392189025879, -0.002860844135284424, -0.0027112960815429688, -0.0025617480278015137, -0.0024121999740600586, -0.0022626519203186035, -0.0021131038665771484, -0.0019635558128356934, -0.0018140077590942383, -0.0016644597053527832, -0.0015149116516113281, -0.001365363597869873, -0.001215815544128418, -0.0010662674903869629, -0.0009167194366455078, -0.0007671713829040527, -0.0006176233291625977, -0.0004680752754211426, -0.0003185272216796875, -0.00016897916793823242, -1.9431114196777344e-05, 0.00013011693954467773, 0.0002796649932861328, 0.0004292130470275879, 0.000578761100769043, 0.000728309154510498, 0.0008778572082519531, 0.0010274052619934082, 0.0011769533157348633, 0.0013265013694763184, 0.0014760494232177734, 0.0016255974769592285, 0.0017751455307006836, 0.0019246935844421387, 0.0020742416381835938, 0.002223789691925049, 0.002373337745666504, 0.002522885799407959, 0.002672433853149414, 0.002821981906890869, 0.0029715299606323242, 0.0031210780143737793, 0.0032706260681152344, 0.0034201741218566895, 0.0035697221755981445, 0.0037192702293395996, 0.0038688182830810547, 0.00401836633682251, 0.004167914390563965, 0.00431746244430542, 0.004467010498046875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 9.0, 3.0, 10.0, 4.0, 6.0, 12.0, 14.0, 14.0, 20.0, 9.0, 27.0, 21.0, 40.0, 24.0, 61.0, 37.0, 80.0, 78.0, 52.0, 88.0, 50.0, 74.0, 28.0, 46.0, 21.0, 25.0, 27.0, 22.0, 12.0, 15.0, 13.0, 14.0, 5.0, 6.0, 5.0, 10.0, 3.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-5.0067901611328125e-06, -4.8568472266197205e-06, -4.706904292106628e-06, -4.556961357593536e-06, -4.407018423080444e-06, -4.257075488567352e-06, -4.10713255405426e-06, -3.957189619541168e-06, -3.807246685028076e-06, -3.657303750514984e-06, -3.507360816001892e-06, -3.3574178814888e-06, -3.207474946975708e-06, -3.057532012462616e-06, -2.907589077949524e-06, -2.757646143436432e-06, -2.60770320892334e-06, -2.457760274410248e-06, -2.3078173398971558e-06, -2.1578744053840637e-06, -2.0079314708709717e-06, -1.8579885363578796e-06, -1.7080456018447876e-06, -1.5581026673316956e-06, -1.4081597328186035e-06, -1.2582167983055115e-06, -1.1082738637924194e-06, -9.583309292793274e-07, -8.083879947662354e-07, -6.584450602531433e-07, -5.085021257400513e-07, -3.5855919122695923e-07, -2.086162567138672e-07, -5.8673322200775146e-08, 9.12696123123169e-08, 2.4121254682540894e-07, 3.91155481338501e-07, 5.41098415851593e-07, 6.910413503646851e-07, 8.409842848777771e-07, 9.909272193908691e-07, 1.1408701539039612e-06, 1.2908130884170532e-06, 1.4407560229301453e-06, 1.5906989574432373e-06, 1.7406418919563293e-06, 1.8905848264694214e-06, 2.0405277609825134e-06, 2.1904706954956055e-06, 2.3404136300086975e-06, 2.4903565645217896e-06, 2.6402994990348816e-06, 2.7902424335479736e-06, 2.9401853680610657e-06, 3.0901283025741577e-06, 3.2400712370872498e-06, 3.390014171600342e-06, 3.539957106113434e-06, 3.689900040626526e-06, 3.839842975139618e-06, 3.98978590965271e-06, 4.139728844165802e-06, 4.289671778678894e-06, 4.439614713191986e-06, 4.589557647705078e-06]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 13.0, 8.0, 14.0, 29.0, 46.0, 79.0, 140.0, 190.0, 359.0, 628.0, 1231.0, 2455.0, 5173.0, 33788.0, 961958.0, 32194.0, 5090.0, 2375.0, 1207.0, 686.0, 347.0, 209.0, 113.0, 84.0, 41.0, 30.0, 21.0, 13.0, 12.0, 7.0, 4.0, 4.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0033435821533203125, -0.003217369318008423, -0.003091156482696533, -0.0029649436473846436, -0.002838730812072754, -0.0027125179767608643, -0.0025863051414489746, -0.002460092306137085, -0.0023338794708251953, -0.0022076666355133057, -0.002081453800201416, -0.0019552409648895264, -0.0018290281295776367, -0.001702815294265747, -0.0015766024589538574, -0.0014503896236419678, -0.0013241767883300781, -0.0011979639530181885, -0.0010717511177062988, -0.0009455382823944092, -0.0008193254470825195, -0.0006931126117706299, -0.0005668997764587402, -0.0004406869411468506, -0.00031447410583496094, -0.0001882612705230713, -6.204843521118164e-05, 6.416440010070801e-05, 0.00019037723541259766, 0.0003165900707244873, 0.00044280290603637695, 0.0005690157413482666, 0.0006952285766601562, 0.0008214414119720459, 0.0009476542472839355, 0.0010738670825958252, 0.0012000799179077148, 0.0013262927532196045, 0.0014525055885314941, 0.0015787184238433838, 0.0017049312591552734, 0.001831144094467163, 0.0019573569297790527, 0.0020835697650909424, 0.002209782600402832, 0.0023359954357147217, 0.0024622082710266113, 0.002588421106338501, 0.0027146339416503906, 0.0028408467769622803, 0.00296705961227417, 0.0030932724475860596, 0.0032194852828979492, 0.003345698118209839, 0.0034719109535217285, 0.003598123788833618, 0.003724336624145508, 0.0038505494594573975, 0.003976762294769287, 0.004102975130081177, 0.004229187965393066, 0.004355400800704956, 0.004481613636016846, 0.004607826471328735, 0.004734039306640625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 6.0, 9.0, 31.0, 97.0, 224.0, 265.0, 210.0, 80.0, 34.0, 12.0, 6.0, 9.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008463859558105469, -0.00082387775182724, -0.0008013695478439331, -0.0007788613438606262, -0.0007563531398773193, -0.0007338449358940125, -0.0007113367319107056, -0.0006888285279273987, -0.0006663203239440918, -0.0006438121199607849, -0.000621303915977478, -0.0005987957119941711, -0.0005762875080108643, -0.0005537793040275574, -0.0005312711000442505, -0.0005087628960609436, -0.0004862546920776367, -0.00046374648809432983, -0.00044123828411102295, -0.00041873008012771606, -0.0003962218761444092, -0.0003737136721611023, -0.0003512054681777954, -0.0003286972641944885, -0.00030618906021118164, -0.00028368085622787476, -0.00026117265224456787, -0.00023866444826126099, -0.0002161562442779541, -0.00019364804029464722, -0.00017113983631134033, -0.00014863163232803345, -0.00012612342834472656, -0.00010361522436141968, -8.110702037811279e-05, -5.859881639480591e-05, -3.6090612411499023e-05, -1.3582408428192139e-05, 8.925795555114746e-06, 3.143399953842163e-05, 5.3942203521728516e-05, 7.64504075050354e-05, 9.895861148834229e-05, 0.00012146681547164917, 0.00014397501945495605, 0.00016648322343826294, 0.00018899142742156982, 0.0002114996314048767, 0.0002340078353881836, 0.0002565160393714905, 0.00027902424335479736, 0.00030153244733810425, 0.00032404065132141113, 0.000346548855304718, 0.0003690570592880249, 0.0003915652632713318, 0.00041407346725463867, 0.00043658167123794556, 0.00045908987522125244, 0.0004815980792045593, 0.0005041062831878662, 0.0005266144871711731, 0.00054912269115448, 0.0005716308951377869, 0.0005941390991210938]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 9.0, 4.0, 4.0, 13.0, 9.0, 15.0, 19.0, 19.0, 32.0, 34.0, 46.0, 57.0, 74.0, 83.0, 119.0, 106.0, 81.0, 61.0, 39.0, 37.0, 22.0, 21.0, 18.0, 14.0, 10.0, 6.0, 9.0, 3.0, 6.0, 7.0, 6.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.026906441897153854, -0.02610730566084385, -0.025308167561888695, -0.02450903132557869, -0.023709893226623535, -0.02291075699031353, -0.022111618891358376, -0.02131248265504837, -0.020513344556093216, -0.01971420831978321, -0.018915070220828056, -0.01811593398451805, -0.017316795885562897, -0.01651765964925289, -0.015718521550297737, -0.014919385313987732, -0.014120248146355152, -0.013321110978722572, -0.012521973811089993, -0.011722836643457413, -0.010923699475824833, -0.010124562308192253, -0.009325426071882248, -0.008526287972927094, -0.007727151270955801, -0.006928014103323221, -0.006128876935690641, -0.005329740233719349, -0.004530603066086769, -0.0037314658984541893, -0.0029323287308216095, -0.0021331915631890297, -0.0013340543955564499, -0.000534917286131531, 0.0002642198232933879, 0.0010633568745106459, 0.0018624940421432257, 0.002661630976945162, 0.0034607681445777416, 0.004259905312210321, 0.005059042479842901, 0.005858179647475481, 0.006657316815108061, 0.007456453517079353, 0.008255590684711933, 0.009054727852344513, 0.009853865019977093, 0.010653002187609673, 0.011452139355242252, 0.012251276522874832, 0.013050413690507412, 0.013849550858139992, 0.014648688025772572, 0.015447825193405151, 0.016246961429715157, 0.01704609952867031, 0.017845235764980316, 0.01864437200129032, 0.019443510100245476, 0.02024264633655548, 0.021041784435510635, 0.02184092067182064, 0.022640058770775795, 0.0234391950070858, 0.024238333106040955]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 7.0, 11.0, 8.0, 12.0, 13.0, 17.0, 16.0, 19.0, 23.0, 35.0, 46.0, 28.0, 39.0, 39.0, 39.0, 41.0, 51.0, 50.0, 44.0, 42.0, 46.0, 46.0, 37.0, 46.0, 30.0, 32.0, 23.0, 27.0, 31.0, 23.0, 11.0, 15.0, 12.0, 8.0, 8.0, 4.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019806765019893646, -0.019168777391314507, -0.018530791625380516, -0.017892803996801376, -0.017254818230867386, -0.016616830602288246, -0.015978842973709106, -0.015340856276452541, -0.014702869579195976, -0.014064882881939411, -0.013426896184682846, -0.012788908556103706, -0.012150921858847141, -0.011512935161590576, -0.010874947533011436, -0.010236960835754871, -0.009598974138498306, -0.008960987441241741, -0.008323000743985176, -0.007685013115406036, -0.007047026418149471, -0.006409039720892906, -0.005771052557975054, -0.005133065395057201, -0.004495078697800636, -0.0038570917677134275, -0.003219104837626219, -0.00258111790753901, -0.0019431309774518013, -0.0013051440473645926, -0.0006671571172773838, -2.9169954359531403e-05, 0.0006088186055421829, 0.0012468055356293917, 0.0018847924657166004, 0.002522779395803809, 0.003160766325891018, 0.0037987532559782267, 0.004436740186065435, 0.005074727348983288, 0.005712714046239853, 0.006350700743496418, 0.00698868790641427, 0.007626675069332123, 0.008264661766588688, 0.008902648463845253, 0.009540636092424393, 0.010178622789680958, 0.010816609486937523, 0.011454596184194088, 0.012092582881450653, 0.012730570510029793, 0.013368557207286358, 0.014006543904542923, 0.014644531533122063, 0.015282518230378628, 0.015920504927635193, 0.016558492556214333, 0.017196478322148323, 0.017834465950727463, 0.018472451716661453, 0.019110439345240593, 0.019748426973819733, 0.020386412739753723, 0.021024400368332863]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 8.0, 15.0, 16.0, 38.0, 62.0, 74.0, 139.0, 216.0, 361.0, 577.0, 1066.0, 1702.0, 3186.0, 5672.0, 10637.0, 20282.0, 40310.0, 87093.0, 207830.0, 343443.0, 176241.0, 74846.0, 35443.0, 18055.0, 9556.0, 4923.0, 2850.0, 1554.0, 937.0, 557.0, 322.0, 197.0, 124.0, 73.0, 51.0, 26.0, 21.0, 14.0, 9.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.041290283203125, -0.039975643157958984, -0.03866100311279297, -0.03734636306762695, -0.03603172302246094, -0.03471708297729492, -0.033402442932128906, -0.03208780288696289, -0.030773162841796875, -0.02945852279663086, -0.028143882751464844, -0.026829242706298828, -0.025514602661132812, -0.024199962615966797, -0.02288532257080078, -0.021570682525634766, -0.02025604248046875, -0.018941402435302734, -0.01762676239013672, -0.016312122344970703, -0.014997482299804688, -0.013682842254638672, -0.012368202209472656, -0.01105356216430664, -0.009738922119140625, -0.00842428207397461, -0.007109642028808594, -0.005795001983642578, -0.0044803619384765625, -0.003165721893310547, -0.0018510818481445312, -0.0005364418029785156, 0.0007781982421875, 0.0020928382873535156, 0.0034074783325195312, 0.004722118377685547, 0.0060367584228515625, 0.007351398468017578, 0.008666038513183594, 0.00998067855834961, 0.011295318603515625, 0.01260995864868164, 0.013924598693847656, 0.015239238739013672, 0.016553878784179688, 0.017868518829345703, 0.01918315887451172, 0.020497798919677734, 0.02181243896484375, 0.023127079010009766, 0.02444171905517578, 0.025756359100341797, 0.027070999145507812, 0.028385639190673828, 0.029700279235839844, 0.03101491928100586, 0.032329559326171875, 0.03364419937133789, 0.034958839416503906, 0.03627347946166992, 0.03758811950683594, 0.03890275955200195, 0.04021739959716797, 0.041532039642333984, 0.0428466796875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 4.0, 6.0, 8.0, 7.0, 9.0, 21.0, 17.0, 22.0, 25.0, 29.0, 38.0, 54.0, 52.0, 53.0, 58.0, 49.0, 61.0, 54.0, 44.0, 57.0, 60.0, 62.0, 32.0, 34.0, 24.0, 23.0, 27.0, 16.0, 18.0, 8.0, 7.0, 6.0, 8.0, 5.0, 8.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0156707763671875, -0.015193343162536621, -0.014715909957885742, -0.014238476753234863, -0.013761043548583984, -0.013283610343933105, -0.012806177139282227, -0.012328743934631348, -0.011851310729980469, -0.01137387752532959, -0.010896444320678711, -0.010419011116027832, -0.009941577911376953, -0.009464144706726074, -0.008986711502075195, -0.008509278297424316, -0.008031845092773438, -0.007554411888122559, -0.00707697868347168, -0.006599545478820801, -0.006122112274169922, -0.005644679069519043, -0.005167245864868164, -0.004689812660217285, -0.004212379455566406, -0.0037349462509155273, -0.0032575130462646484, -0.0027800798416137695, -0.0023026466369628906, -0.0018252134323120117, -0.0013477802276611328, -0.0008703470230102539, -0.000392913818359375, 8.45193862915039e-05, 0.0005619525909423828, 0.0010393857955932617, 0.0015168190002441406, 0.0019942522048950195, 0.0024716854095458984, 0.0029491186141967773, 0.0034265518188476562, 0.003903985023498535, 0.004381418228149414, 0.004858851432800293, 0.005336284637451172, 0.005813717842102051, 0.00629115104675293, 0.006768584251403809, 0.0072460174560546875, 0.007723450660705566, 0.008200883865356445, 0.008678317070007324, 0.009155750274658203, 0.009633183479309082, 0.010110616683959961, 0.01058804988861084, 0.011065483093261719, 0.011542916297912598, 0.012020349502563477, 0.012497782707214355, 0.012975215911865234, 0.013452649116516113, 0.013930082321166992, 0.014407515525817871, 0.01488494873046875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 5.0, 10.0, 13.0, 10.0, 17.0, 39.0, 41.0, 82.0, 164.0, 236.0, 423.0, 802.0, 1552.0, 2875.0, 5555.0, 11352.0, 24295.0, 54956.0, 135661.0, 321214.0, 284805.0, 115657.0, 47089.0, 21380.0, 9883.0, 4971.0, 2500.0, 1349.0, 683.0, 377.0, 217.0, 125.0, 79.0, 40.0, 24.0, 20.0, 12.0, 13.0, 6.0, 4.0, 7.0, 4.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03570556640625, -0.034470558166503906, -0.03323554992675781, -0.03200054168701172, -0.030765533447265625, -0.02953052520751953, -0.028295516967773438, -0.027060508728027344, -0.02582550048828125, -0.024590492248535156, -0.023355484008789062, -0.02212047576904297, -0.020885467529296875, -0.01965045928955078, -0.018415451049804688, -0.017180442810058594, -0.0159454345703125, -0.014710426330566406, -0.013475418090820312, -0.012240409851074219, -0.011005401611328125, -0.009770393371582031, -0.008535385131835938, -0.007300376892089844, -0.00606536865234375, -0.004830360412597656, -0.0035953521728515625, -0.0023603439331054688, -0.001125335693359375, 0.00010967254638671875, 0.0013446807861328125, 0.0025796890258789062, 0.003814697265625, 0.005049705505371094, 0.0062847137451171875, 0.007519721984863281, 0.008754730224609375, 0.009989738464355469, 0.011224746704101562, 0.012459754943847656, 0.01369476318359375, 0.014929771423339844, 0.016164779663085938, 0.01739978790283203, 0.018634796142578125, 0.01986980438232422, 0.021104812622070312, 0.022339820861816406, 0.0235748291015625, 0.024809837341308594, 0.026044845581054688, 0.02727985382080078, 0.028514862060546875, 0.02974987030029297, 0.030984878540039062, 0.032219886779785156, 0.03345489501953125, 0.034689903259277344, 0.03592491149902344, 0.03715991973876953, 0.038394927978515625, 0.03962993621826172, 0.04086494445800781, 0.042099952697753906, 0.0433349609375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 3.0, 5.0, 9.0, 9.0, 10.0, 13.0, 14.0, 15.0, 26.0, 22.0, 28.0, 20.0, 29.0, 27.0, 49.0, 31.0, 53.0, 51.0, 43.0, 43.0, 40.0, 31.0, 45.0, 37.0, 34.0, 39.0, 35.0, 24.0, 36.0, 25.0, 26.0, 19.0, 21.0, 12.0, 8.0, 10.0, 10.0, 11.0, 7.0, 8.0, 6.0, 6.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00939178466796875, -0.009099006652832031, -0.008806228637695312, -0.008513450622558594, -0.008220672607421875, -0.007927894592285156, -0.0076351165771484375, -0.007342338562011719, -0.007049560546875, -0.006756782531738281, -0.0064640045166015625, -0.006171226501464844, -0.005878448486328125, -0.005585670471191406, -0.0052928924560546875, -0.005000114440917969, -0.00470733642578125, -0.004414558410644531, -0.0041217803955078125, -0.0038290023803710938, -0.003536224365234375, -0.0032434463500976562, -0.0029506683349609375, -0.0026578903198242188, -0.0023651123046875, -0.0020723342895507812, -0.0017795562744140625, -0.0014867782592773438, -0.001194000244140625, -0.0009012222290039062, -0.0006084442138671875, -0.00031566619873046875, -2.288818359375e-05, 0.00026988983154296875, 0.0005626678466796875, 0.0008554458618164062, 0.001148223876953125, 0.0014410018920898438, 0.0017337799072265625, 0.0020265579223632812, 0.0023193359375, 0.0026121139526367188, 0.0029048919677734375, 0.0031976699829101562, 0.003490447998046875, 0.0037832260131835938, 0.0040760040283203125, 0.004368782043457031, 0.00466156005859375, 0.004954338073730469, 0.0052471160888671875, 0.005539894104003906, 0.005832672119140625, 0.006125450134277344, 0.0064182281494140625, 0.006711006164550781, 0.0070037841796875, 0.007296562194824219, 0.0075893402099609375, 0.007882118225097656, 0.008174896240234375, 0.008467674255371094, 0.008760452270507812, 0.009053230285644531, 0.00934600830078125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 10.0, 7.0, 20.0, 17.0, 33.0, 51.0, 73.0, 93.0, 165.0, 250.0, 399.0, 720.0, 1197.0, 2164.0, 4251.0, 8563.0, 20211.0, 56551.0, 254215.0, 541683.0, 101657.0, 31317.0, 12538.0, 5627.0, 2834.0, 1600.0, 863.0, 526.0, 351.0, 202.0, 120.0, 73.0, 48.0, 39.0, 21.0, 17.0, 12.0, 14.0, 10.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0013980865478515625, -0.001359492540359497, -0.0013208985328674316, -0.0012823045253753662, -0.0012437105178833008, -0.0012051165103912354, -0.00116652250289917, -0.0011279284954071045, -0.001089334487915039, -0.0010507404804229736, -0.0010121464729309082, -0.0009735524654388428, -0.0009349584579467773, -0.0008963644504547119, -0.0008577704429626465, -0.0008191764354705811, -0.0007805824279785156, -0.0007419884204864502, -0.0007033944129943848, -0.0006648004055023193, -0.0006262063980102539, -0.0005876123905181885, -0.000549018383026123, -0.0005104243755340576, -0.0004718303680419922, -0.00043323636054992676, -0.00039464235305786133, -0.0003560483455657959, -0.00031745433807373047, -0.00027886033058166504, -0.0002402663230895996, -0.00020167231559753418, -0.00016307830810546875, -0.00012448430061340332, -8.589029312133789e-05, -4.729628562927246e-05, -8.702278137207031e-06, 2.98917293548584e-05, 6.848573684692383e-05, 0.00010707974433898926, 0.0001456737518310547, 0.00018426775932312012, 0.00022286176681518555, 0.000261455774307251, 0.0003000497817993164, 0.00033864378929138184, 0.00037723779678344727, 0.0004158318042755127, 0.0004544258117675781, 0.0004930198192596436, 0.000531613826751709, 0.0005702078342437744, 0.0006088018417358398, 0.0006473958492279053, 0.0006859898567199707, 0.0007245838642120361, 0.0007631778717041016, 0.000801771879196167, 0.0008403658866882324, 0.0008789598941802979, 0.0009175539016723633, 0.0009561479091644287, 0.0009947419166564941, 0.0010333359241485596, 0.001071929931640625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 7.0, 4.0, 10.0, 13.0, 17.0, 16.0, 20.0, 37.0, 65.0, 50.0, 51.0, 77.0, 70.0, 65.0, 118.0, 65.0, 65.0, 58.0, 50.0, 31.0, 33.0, 14.0, 15.0, 11.0, 7.0, 11.0, 9.0, 3.0, 5.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9206275939941406e-06, -2.791173756122589e-06, -2.6617199182510376e-06, -2.532266080379486e-06, -2.4028122425079346e-06, -2.273358404636383e-06, -2.1439045667648315e-06, -2.01445072889328e-06, -1.8849968910217285e-06, -1.755543053150177e-06, -1.6260892152786255e-06, -1.496635377407074e-06, -1.3671815395355225e-06, -1.237727701663971e-06, -1.1082738637924194e-06, -9.78820025920868e-07, -8.493661880493164e-07, -7.199123501777649e-07, -5.904585123062134e-07, -4.6100467443466187e-07, -3.3155083656311035e-07, -2.0209699869155884e-07, -7.264316082000732e-08, 5.681067705154419e-08, 1.862645149230957e-07, 3.157183527946472e-07, 4.4517219066619873e-07, 5.746260285377502e-07, 7.040798664093018e-07, 8.335337042808533e-07, 9.629875421524048e-07, 1.0924413800239563e-06, 1.2218952178955078e-06, 1.3513490557670593e-06, 1.4808028936386108e-06, 1.6102567315101624e-06, 1.7397105693817139e-06, 1.8691644072532654e-06, 1.998618245124817e-06, 2.1280720829963684e-06, 2.25752592086792e-06, 2.3869797587394714e-06, 2.516433596611023e-06, 2.6458874344825745e-06, 2.775341272354126e-06, 2.9047951102256775e-06, 3.034248948097229e-06, 3.1637027859687805e-06, 3.293156623840332e-06, 3.4226104617118835e-06, 3.552064299583435e-06, 3.6815181374549866e-06, 3.810971975326538e-06, 3.94042581319809e-06, 4.069879651069641e-06, 4.199333488941193e-06, 4.328787326812744e-06, 4.458241164684296e-06, 4.587695002555847e-06, 4.717148840427399e-06, 4.84660267829895e-06, 4.976056516170502e-06, 5.105510354042053e-06, 5.234964191913605e-06, 5.364418029785156e-06]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 13.0, 21.0, 32.0, 33.0, 65.0, 106.0, 164.0, 269.0, 438.0, 715.0, 1228.0, 2050.0, 3681.0, 6594.0, 12495.0, 24306.0, 48746.0, 109067.0, 255161.0, 313019.0, 143061.0, 62377.0, 30411.0, 15537.0, 8296.0, 4572.0, 2558.0, 1468.0, 818.0, 472.0, 313.0, 180.0, 119.0, 66.0, 40.0, 19.0, 14.0, 8.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004127025604248047, -0.0003985501825809479, -0.00038439780473709106, -0.00037024542689323425, -0.00035609304904937744, -0.00034194067120552063, -0.0003277882933616638, -0.000313635915517807, -0.0002994835376739502, -0.0002853311598300934, -0.00027117878198623657, -0.00025702640414237976, -0.00024287402629852295, -0.00022872164845466614, -0.00021456927061080933, -0.00020041689276695251, -0.0001862645149230957, -0.0001721121370792389, -0.00015795975923538208, -0.00014380738139152527, -0.00012965500354766846, -0.00011550262570381165, -0.00010135024785995483, -8.719787001609802e-05, -7.304549217224121e-05, -5.88931143283844e-05, -4.474073648452759e-05, -3.0588358640670776e-05, -1.6435980796813965e-05, -2.2836029529571533e-06, 1.1868774890899658e-05, 2.602115273475647e-05, 4.017353057861328e-05, 5.432590842247009e-05, 6.84782862663269e-05, 8.263066411018372e-05, 9.678304195404053e-05, 0.00011093541979789734, 0.00012508779764175415, 0.00013924017548561096, 0.00015339255332946777, 0.00016754493117332458, 0.0001816973090171814, 0.0001958496868610382, 0.00021000206470489502, 0.00022415444254875183, 0.00023830682039260864, 0.00025245919823646545, 0.00026661157608032227, 0.0002807639539241791, 0.0002949163317680359, 0.0003090687096118927, 0.0003232210874557495, 0.0003373734652996063, 0.00035152584314346313, 0.00036567822098731995, 0.00037983059883117676, 0.00039398297667503357, 0.0004081353545188904, 0.0004222877323627472, 0.000436440110206604, 0.0004505924880504608, 0.0004647448658943176, 0.00047889724373817444, 0.0004930496215820312]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 5.0, 8.0, 6.0, 14.0, 16.0, 19.0, 26.0, 19.0, 29.0, 28.0, 38.0, 25.0, 39.0, 35.0, 36.0, 50.0, 60.0, 48.0, 44.0, 50.0, 35.0, 45.0, 35.0, 38.0, 27.0, 28.0, 26.0, 21.0, 28.0, 22.0, 11.0, 15.0, 12.0, 4.0, 7.0, 14.0, 5.0, 4.0, 4.0, 2.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00010001659393310547, -9.634532034397125e-05, -9.267404675483704e-05, -8.900277316570282e-05, -8.53314995765686e-05, -8.166022598743439e-05, -7.798895239830017e-05, -7.431767880916595e-05, -7.064640522003174e-05, -6.697513163089752e-05, -6.33038580417633e-05, -5.963258445262909e-05, -5.596131086349487e-05, -5.229003727436066e-05, -4.861876368522644e-05, -4.4947490096092224e-05, -4.127621650695801e-05, -3.760494291782379e-05, -3.3933669328689575e-05, -3.026239573955536e-05, -2.6591122150421143e-05, -2.2919848561286926e-05, -1.924857497215271e-05, -1.5577301383018494e-05, -1.1906027793884277e-05, -8.234754204750061e-06, -4.563480615615845e-06, -8.922070264816284e-07, 2.779066562652588e-06, 6.450340151786804e-06, 1.012161374092102e-05, 1.3792887330055237e-05, 1.7464160919189453e-05, 2.113543450832367e-05, 2.4806708097457886e-05, 2.8477981686592102e-05, 3.214925527572632e-05, 3.5820528864860535e-05, 3.949180245399475e-05, 4.316307604312897e-05, 4.6834349632263184e-05, 5.05056232213974e-05, 5.4176896810531616e-05, 5.784817039966583e-05, 6.151944398880005e-05, 6.519071757793427e-05, 6.886199116706848e-05, 7.25332647562027e-05, 7.620453834533691e-05, 7.987581193447113e-05, 8.354708552360535e-05, 8.721835911273956e-05, 9.088963270187378e-05, 9.4560906291008e-05, 9.823217988014221e-05, 0.00010190345346927643, 0.00010557472705841064, 0.00010924600064754486, 0.00011291727423667908, 0.0001165885478258133, 0.00012025982141494751, 0.00012393109500408173, 0.00012760236859321594, 0.00013127364218235016, 0.00013494491577148438]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 8.0, 9.0, 11.0, 9.0, 14.0, 31.0, 46.0, 57.0, 74.0, 98.0, 151.0, 142.0, 96.0, 69.0, 42.0, 41.0, 27.0, 27.0, 9.0, 10.0, 4.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027323897927999496, -0.0264904722571373, -0.02565704472362995, -0.024823619052767754, -0.023990191519260406, -0.02315676584839821, -0.02232334017753601, -0.021489912644028664, -0.020656486973166466, -0.019823061302304268, -0.01898963376879692, -0.018156208097934723, -0.017322780564427376, -0.016489354893565178, -0.01565592736005783, -0.014822501689195633, -0.01398907508701086, -0.013155648484826088, -0.012322221882641315, -0.011488795280456543, -0.010655369609594345, -0.009821943007409573, -0.0089885164052248, -0.008155090734362602, -0.0073216636665165424, -0.00648823706433177, -0.005654810927808285, -0.004821384325623512, -0.00398795772343874, -0.0031545315869152546, -0.002321104984730482, -0.001487678848206997, -0.0006542522460222244, 0.00017917418153956532, 0.001012600609101355, 0.0018460270948708057, 0.0026794534642249346, 0.0035128798335790634, 0.004346306435763836, 0.005179732572287321, 0.006013159174472094, 0.006846585776656866, 0.007680011913180351, 0.008513438515365124, 0.009346865117549896, 0.010180290788412094, 0.011013718321919441, 0.011847143992781639, 0.012680570594966412, 0.013513997197151184, 0.014347423799335957, 0.015180850401520729, 0.016014276072382927, 0.016847703605890274, 0.017681129276752472, 0.01851455494761467, 0.019347982481122017, 0.020181408151984215, 0.021014835685491562, 0.02184826135635376, 0.022681688889861107, 0.023515114560723305, 0.024348542094230652, 0.02518196776509285, 0.026015393435955048]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 8.0, 5.0, 12.0, 3.0, 12.0, 16.0, 17.0, 20.0, 24.0, 24.0, 26.0, 25.0, 29.0, 34.0, 37.0, 25.0, 32.0, 36.0, 37.0, 42.0, 38.0, 34.0, 37.0, 32.0, 27.0, 35.0, 31.0, 25.0, 31.0, 25.0, 24.0, 34.0, 20.0, 14.0, 16.0, 12.0, 18.0, 12.0, 8.0, 14.0, 10.0, 14.0, 4.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.012067733332514763, -0.011668719351291656, -0.01126970537006855, -0.010870691388845444, -0.010471677407622337, -0.010072663426399231, -0.00967364851385355, -0.009274634532630444, -0.008875620551407337, -0.00847660657018423, -0.008077592588961124, -0.007678578142076731, -0.007279564160853624, -0.006880550179630518, -0.006481535732746124, -0.006082521751523018, -0.0056835077702999115, -0.005284493789076805, -0.004885479807853699, -0.004486465360969305, -0.004087451379746199, -0.0036884373985230923, -0.0032894231844693422, -0.002890408970415592, -0.002491394989192486, -0.0020923810079693794, -0.0016933667939156294, -0.0012943526962772012, -0.000895338598638773, -0.0004963246174156666, -9.731040336191654e-05, 0.0003017038106918335, 0.0007007177919149399, 0.001099731889553368, 0.0014987459871917963, 0.0018977600848302245, 0.0022967741824686527, 0.002695788163691759, 0.003094802377745509, 0.003493816591799259, 0.0038928305730223656, 0.004291844554245472, 0.004690858535468578, 0.005089872982352972, 0.005488886963576078, 0.005887900944799185, 0.0062869153916835785, 0.006685929372906685, 0.007084943354129791, 0.007483957335352898, 0.007882971316576004, 0.00828198529779911, 0.008680999279022217, 0.009080013260245323, 0.009479028172791004, 0.00987804215401411, 0.010277056135237217, 0.010676070116460323, 0.01107508409768343, 0.011474098078906536, 0.011873112991452217, 0.012272126972675323, 0.01267114095389843, 0.013070154935121536, 0.013469168916344643]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 9.0, 16.0, 17.0, 36.0, 41.0, 70.0, 90.0, 161.0, 204.0, 372.0, 573.0, 899.0, 1640.0, 2879.0, 9547.0, 194047.0, 3913559.0, 59404.0, 4745.0, 2296.0, 1338.0, 808.0, 520.0, 343.0, 210.0, 154.0, 95.0, 73.0, 41.0, 28.0, 19.0, 18.0, 11.0, 6.0, 6.0, 2.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0300750732421875, -0.029247522354125977, -0.028419971466064453, -0.02759242057800293, -0.026764869689941406, -0.025937318801879883, -0.02510976791381836, -0.024282217025756836, -0.023454666137695312, -0.02262711524963379, -0.021799564361572266, -0.020972013473510742, -0.02014446258544922, -0.019316911697387695, -0.018489360809326172, -0.01766180992126465, -0.016834259033203125, -0.0160067081451416, -0.015179157257080078, -0.014351606369018555, -0.013524055480957031, -0.012696504592895508, -0.011868953704833984, -0.011041402816772461, -0.010213851928710938, -0.009386301040649414, -0.00855875015258789, -0.007731199264526367, -0.006903648376464844, -0.00607609748840332, -0.005248546600341797, -0.0044209957122802734, -0.00359344482421875, -0.0027658939361572266, -0.0019383430480957031, -0.0011107921600341797, -0.00028324127197265625, 0.0005443096160888672, 0.0013718605041503906, 0.002199411392211914, 0.0030269622802734375, 0.003854513168334961, 0.004682064056396484, 0.005509614944458008, 0.006337165832519531, 0.007164716720581055, 0.007992267608642578, 0.008819818496704102, 0.009647369384765625, 0.010474920272827148, 0.011302471160888672, 0.012130022048950195, 0.012957572937011719, 0.013785123825073242, 0.014612674713134766, 0.015440225601196289, 0.016267776489257812, 0.017095327377319336, 0.01792287826538086, 0.018750429153442383, 0.019577980041503906, 0.02040553092956543, 0.021233081817626953, 0.022060632705688477, 0.02288818359375]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 7.0, 6.0, 4.0, 9.0, 8.0, 8.0, 15.0, 24.0, 19.0, 20.0, 21.0, 34.0, 19.0, 26.0, 32.0, 35.0, 39.0, 38.0, 30.0, 37.0, 37.0, 38.0, 43.0, 36.0, 33.0, 27.0, 34.0, 29.0, 34.0, 29.0, 27.0, 27.0, 28.0, 20.0, 17.0, 10.0, 20.0, 20.0, 12.0, 8.0, 9.0, 9.0, 5.0, 5.0, 7.0, 8.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01080322265625, -0.010444283485412598, -0.010085344314575195, -0.009726405143737793, -0.00936746597290039, -0.009008526802062988, -0.008649587631225586, -0.008290648460388184, -0.007931709289550781, -0.007572770118713379, -0.0072138309478759766, -0.006854891777038574, -0.006495952606201172, -0.0061370134353637695, -0.005778074264526367, -0.005419135093688965, -0.0050601959228515625, -0.00470125675201416, -0.004342317581176758, -0.0039833784103393555, -0.003624439239501953, -0.0032655000686645508, -0.0029065608978271484, -0.002547621726989746, -0.0021886825561523438, -0.0018297433853149414, -0.001470804214477539, -0.0011118650436401367, -0.0007529258728027344, -0.00039398670196533203, -3.504753112792969e-05, 0.00032389163970947266, 0.000682830810546875, 0.0010417699813842773, 0.0014007091522216797, 0.001759648323059082, 0.0021185874938964844, 0.0024775266647338867, 0.002836465835571289, 0.0031954050064086914, 0.0035543441772460938, 0.003913283348083496, 0.0042722225189208984, 0.004631161689758301, 0.004990100860595703, 0.0053490400314331055, 0.005707979202270508, 0.00606691837310791, 0.0064258575439453125, 0.006784796714782715, 0.007143735885620117, 0.0075026750564575195, 0.007861614227294922, 0.008220553398132324, 0.008579492568969727, 0.008938431739807129, 0.009297370910644531, 0.009656310081481934, 0.010015249252319336, 0.010374188423156738, 0.01073312759399414, 0.011092066764831543, 0.011451005935668945, 0.011809945106506348, 0.01216888427734375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 10.0, 16.0, 39.0, 69.0, 180.0, 419.0, 1137.0, 3352.0, 14577.0, 3926220.0, 235746.0, 8754.0, 2380.0, 779.0, 331.0, 140.0, 58.0, 29.0, 16.0, 6.0, 10.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04827880859375, -0.04633617401123047, -0.04439353942871094, -0.042450904846191406, -0.040508270263671875, -0.038565635681152344, -0.03662300109863281, -0.03468036651611328, -0.03273773193359375, -0.03079509735107422, -0.028852462768554688, -0.026909828186035156, -0.024967193603515625, -0.023024559020996094, -0.021081924438476562, -0.01913928985595703, -0.0171966552734375, -0.015254020690917969, -0.013311386108398438, -0.011368751525878906, -0.009426116943359375, -0.007483482360839844, -0.0055408477783203125, -0.0035982131958007812, -0.00165557861328125, 0.00028705596923828125, 0.0022296905517578125, 0.004172325134277344, 0.006114959716796875, 0.008057594299316406, 0.010000228881835938, 0.011942863464355469, 0.013885498046875, 0.01582813262939453, 0.017770767211914062, 0.019713401794433594, 0.021656036376953125, 0.023598670959472656, 0.025541305541992188, 0.02748394012451172, 0.02942657470703125, 0.03136920928955078, 0.03331184387207031, 0.035254478454589844, 0.037197113037109375, 0.039139747619628906, 0.04108238220214844, 0.04302501678466797, 0.0449676513671875, 0.04691028594970703, 0.04885292053222656, 0.050795555114746094, 0.052738189697265625, 0.054680824279785156, 0.05662345886230469, 0.05856609344482422, 0.06050872802734375, 0.06245136260986328, 0.06439399719238281, 0.06633663177490234, 0.06827926635742188, 0.0702219009399414, 0.07216453552246094, 0.07410717010498047, 0.0760498046875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 22.0, 37.0, 101.0, 331.0, 2570.0, 656.0, 198.0, 61.0, 33.0, 18.0, 4.0, 7.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0086669921875, -0.008437395095825195, -0.00820779800415039, -0.007978200912475586, -0.007748603820800781, -0.0075190067291259766, -0.007289409637451172, -0.007059812545776367, -0.0068302154541015625, -0.006600618362426758, -0.006371021270751953, -0.0061414241790771484, -0.005911827087402344, -0.005682229995727539, -0.005452632904052734, -0.00522303581237793, -0.004993438720703125, -0.00476384162902832, -0.004534244537353516, -0.004304647445678711, -0.004075050354003906, -0.0038454532623291016, -0.003615856170654297, -0.003386259078979492, -0.0031566619873046875, -0.002927064895629883, -0.002697467803955078, -0.0024678707122802734, -0.0022382736206054688, -0.002008676528930664, -0.0017790794372558594, -0.0015494823455810547, -0.00131988525390625, -0.0010902881622314453, -0.0008606910705566406, -0.0006310939788818359, -0.00040149688720703125, -0.00017189979553222656, 5.7697296142578125e-05, 0.0002872943878173828, 0.0005168914794921875, 0.0007464885711669922, 0.0009760856628417969, 0.0012056827545166016, 0.0014352798461914062, 0.001664876937866211, 0.0018944740295410156, 0.0021240711212158203, 0.002353668212890625, 0.0025832653045654297, 0.0028128623962402344, 0.003042459487915039, 0.0032720565795898438, 0.0035016536712646484, 0.003731250762939453, 0.003960847854614258, 0.0041904449462890625, 0.004420042037963867, 0.004649639129638672, 0.0048792362213134766, 0.005108833312988281, 0.005338430404663086, 0.005568027496337891, 0.005797624588012695, 0.0060272216796875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 4.0, 5.0, 1.0, 6.0, 5.0, 22.0, 16.0, 23.0, 34.0, 33.0, 45.0, 71.0, 86.0, 129.0, 118.0, 102.0, 72.0, 47.0, 45.0, 35.0, 20.0, 14.0, 17.0, 13.0, 7.0, 6.0, 10.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01969556137919426, -0.019117265939712524, -0.01853896863758564, -0.017960673198103905, -0.01738237589597702, -0.016804080456495285, -0.01622578501701355, -0.015647487714886665, -0.01506919227540493, -0.01449089590460062, -0.01391259953379631, -0.013334304094314575, -0.012756007723510265, -0.012177711352705956, -0.011599414981901646, -0.011021118611097336, -0.010442822240293026, -0.009864525869488716, -0.009286229498684406, -0.008707933127880096, -0.008129637688398361, -0.007551341317594051, -0.0069730449467897415, -0.006394749041646719, -0.005816452670842409, -0.005238156300038099, -0.004659860394895077, -0.004081564024090767, -0.0035032678861171007, -0.0029249717481434345, -0.0023466753773391247, -0.0017683794721961021, -0.0011900831013917923, -0.0006117869052104652, -3.349070902913809e-05, 0.0005448055453598499, 0.0011231016833335161, 0.0017013978213071823, 0.002279694192111492, 0.0028579900972545147, 0.0034362864680588245, 0.004014582838863134, 0.004592878744006157, 0.005171175114810467, 0.005749471485614777, 0.006327767390757799, 0.006906063761562109, 0.0074843596667051315, 0.008062656037509441, 0.008640952408313751, 0.009219248779118061, 0.009797545149922371, 0.010375840589404106, 0.010954136960208416, 0.011532433331012726, 0.012110728770494461, 0.012689026072621346, 0.013267322443425655, 0.013845618814229965, 0.0144239142537117, 0.01500221062451601, 0.01558050699532032, 0.016158804297447205, 0.01673709973692894, 0.017315395176410675]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 10.0, 4.0, 5.0, 7.0, 10.0, 12.0, 13.0, 16.0, 24.0, 21.0, 23.0, 27.0, 27.0, 36.0, 25.0, 39.0, 38.0, 35.0, 42.0, 30.0, 34.0, 41.0, 42.0, 32.0, 37.0, 24.0, 36.0, 22.0, 32.0, 28.0, 34.0, 22.0, 28.0, 25.0, 17.0, 18.0, 9.0, 7.0, 9.0, 12.0, 12.0, 12.0, 4.0, 9.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.010718977078795433, -0.010380616411566734, -0.010042255744338036, -0.009703894145786762, -0.009365533478558064, -0.009027172811329365, -0.008688812144100666, -0.008350450545549393, -0.008012089878320694, -0.007673729211091995, -0.007335368078202009, -0.0069970074109733105, -0.006658646278083324, -0.006320285610854626, -0.005981924943625927, -0.005643563810735941, -0.005305203143507242, -0.0049668424762785435, -0.0046284813433885574, -0.004290120676159859, -0.003951759543269873, -0.003613398876041174, -0.0032750379759818316, -0.002936677075922489, -0.0025983161758631468, -0.0022599552758038044, -0.001921594375744462, -0.0015832335921004415, -0.001244872692041099, -0.0009065117919817567, -0.0005681510083377361, -0.00022979010827839375, 0.00010857079178094864, 0.00044693166273646057, 0.0007852925336919725, 0.001123653375543654, 0.0014620142756029963, 0.0018003751756623387, 0.0021387359593063593, 0.0024770968593657017, 0.002815457759425044, 0.0031538186594843864, 0.003492179559543729, 0.003830540459603071, 0.00416890112683177, 0.004507262259721756, 0.004845622926950455, 0.0051839835941791534, 0.0055223447270691395, 0.005860705394297838, 0.006199066527187824, 0.006537427194416523, 0.006875788327306509, 0.007214148994535208, 0.007552510127425194, 0.007890870794653893, 0.008229231461882591, 0.00856759212911129, 0.008905952796339989, 0.009244314394891262, 0.00958267506211996, 0.00992103572934866, 0.010259396396577358, 0.010597757995128632, 0.01093611866235733]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 4.0, 3.0, 4.0, 8.0, 15.0, 15.0, 27.0, 37.0, 64.0, 88.0, 152.0, 194.0, 320.0, 472.0, 784.0, 1278.0, 1977.0, 3073.0, 4890.0, 7995.0, 13346.0, 22501.0, 40069.0, 73834.0, 151277.0, 308049.0, 204245.0, 94384.0, 49850.0, 27759.0, 16197.0, 9732.0, 5967.0, 3605.0, 2293.0, 1452.0, 943.0, 590.0, 345.0, 242.0, 161.0, 106.0, 43.0, 48.0, 38.0, 19.0, 14.0, 8.0, 10.0, 3.0, 8.0, 10.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.016845703125, -0.016314029693603516, -0.01578235626220703, -0.015250682830810547, -0.014719009399414062, -0.014187335968017578, -0.013655662536621094, -0.01312398910522461, -0.012592315673828125, -0.01206064224243164, -0.011528968811035156, -0.010997295379638672, -0.010465621948242188, -0.009933948516845703, -0.009402275085449219, -0.008870601654052734, -0.00833892822265625, -0.007807254791259766, -0.007275581359863281, -0.006743907928466797, -0.0062122344970703125, -0.005680561065673828, -0.005148887634277344, -0.004617214202880859, -0.004085540771484375, -0.0035538673400878906, -0.0030221939086914062, -0.002490520477294922, -0.0019588470458984375, -0.0014271736145019531, -0.0008955001831054688, -0.0003638267517089844, 0.0001678466796875, 0.0006995201110839844, 0.0012311935424804688, 0.0017628669738769531, 0.0022945404052734375, 0.002826213836669922, 0.0033578872680664062, 0.0038895606994628906, 0.004421234130859375, 0.004952907562255859, 0.005484580993652344, 0.006016254425048828, 0.0065479278564453125, 0.007079601287841797, 0.007611274719238281, 0.008142948150634766, 0.00867462158203125, 0.009206295013427734, 0.009737968444824219, 0.010269641876220703, 0.010801315307617188, 0.011332988739013672, 0.011864662170410156, 0.01239633560180664, 0.012928009033203125, 0.01345968246459961, 0.013991355895996094, 0.014523029327392578, 0.015054702758789062, 0.015586376190185547, 0.01611804962158203, 0.016649723052978516, 0.017181396484375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 5.0, 13.0, 14.0, 12.0, 17.0, 22.0, 21.0, 21.0, 20.0, 35.0, 34.0, 32.0, 44.0, 39.0, 34.0, 35.0, 31.0, 38.0, 45.0, 49.0, 34.0, 47.0, 42.0, 22.0, 27.0, 26.0, 29.0, 29.0, 33.0, 25.0, 18.0, 12.0, 15.0, 13.0, 10.0, 6.0, 12.0, 5.0, 8.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01018524169921875, -0.009852051734924316, -0.009518861770629883, -0.00918567180633545, -0.008852481842041016, -0.008519291877746582, -0.008186101913452148, -0.007852911949157715, -0.007519721984863281, -0.007186532020568848, -0.006853342056274414, -0.0065201520919799805, -0.006186962127685547, -0.005853772163391113, -0.00552058219909668, -0.005187392234802246, -0.0048542022705078125, -0.004521012306213379, -0.004187822341918945, -0.0038546323776245117, -0.003521442413330078, -0.0031882524490356445, -0.002855062484741211, -0.0025218725204467773, -0.0021886825561523438, -0.0018554925918579102, -0.0015223026275634766, -0.001189112663269043, -0.0008559226989746094, -0.0005227327346801758, -0.0001895427703857422, 0.0001436471939086914, 0.000476837158203125, 0.0008100271224975586, 0.0011432170867919922, 0.0014764070510864258, 0.0018095970153808594, 0.002142786979675293, 0.0024759769439697266, 0.00280916690826416, 0.0031423568725585938, 0.0034755468368530273, 0.003808736801147461, 0.0041419267654418945, 0.004475116729736328, 0.004808306694030762, 0.005141496658325195, 0.005474686622619629, 0.0058078765869140625, 0.006141066551208496, 0.00647425651550293, 0.006807446479797363, 0.007140636444091797, 0.0074738264083862305, 0.007807016372680664, 0.008140206336975098, 0.008473396301269531, 0.008806586265563965, 0.009139776229858398, 0.009472966194152832, 0.009806156158447266, 0.0101393461227417, 0.010472536087036133, 0.010805726051330566, 0.011138916015625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 4.0, 15.0, 10.0, 23.0, 31.0, 32.0, 66.0, 96.0, 130.0, 189.0, 281.0, 383.0, 588.0, 882.0, 1361.0, 2052.0, 3282.0, 5447.0, 9713.0, 18712.0, 40819.0, 123737.0, 540554.0, 193815.0, 54523.0, 22920.0, 11656.0, 6485.0, 3745.0, 2372.0, 1557.0, 952.0, 682.0, 481.0, 291.0, 213.0, 153.0, 91.0, 54.0, 54.0, 35.0, 25.0, 15.0, 8.0, 7.0, 7.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.018585205078125, -0.01799798011779785, -0.017410755157470703, -0.016823530197143555, -0.016236305236816406, -0.015649080276489258, -0.01506185531616211, -0.014474630355834961, -0.013887405395507812, -0.013300180435180664, -0.012712955474853516, -0.012125730514526367, -0.011538505554199219, -0.01095128059387207, -0.010364055633544922, -0.009776830673217773, -0.009189605712890625, -0.008602380752563477, -0.008015155792236328, -0.00742793083190918, -0.006840705871582031, -0.006253480911254883, -0.005666255950927734, -0.005079030990600586, -0.0044918060302734375, -0.003904581069946289, -0.0033173561096191406, -0.002730131149291992, -0.0021429061889648438, -0.0015556812286376953, -0.0009684562683105469, -0.00038123130798339844, 0.00020599365234375, 0.0007932186126708984, 0.0013804435729980469, 0.0019676685333251953, 0.0025548934936523438, 0.003142118453979492, 0.0037293434143066406, 0.004316568374633789, 0.0049037933349609375, 0.005491018295288086, 0.006078243255615234, 0.006665468215942383, 0.007252693176269531, 0.00783991813659668, 0.008427143096923828, 0.009014368057250977, 0.009601593017578125, 0.010188817977905273, 0.010776042938232422, 0.01136326789855957, 0.011950492858886719, 0.012537717819213867, 0.013124942779541016, 0.013712167739868164, 0.014299392700195312, 0.014886617660522461, 0.01547384262084961, 0.016061067581176758, 0.016648292541503906, 0.017235517501831055, 0.017822742462158203, 0.01840996742248535, 0.0189971923828125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 3.0, 7.0, 9.0, 5.0, 5.0, 5.0, 8.0, 9.0, 15.0, 20.0, 29.0, 20.0, 20.0, 32.0, 28.0, 38.0, 32.0, 36.0, 40.0, 37.0, 46.0, 39.0, 51.0, 33.0, 36.0, 51.0, 36.0, 30.0, 29.0, 28.0, 34.0, 30.0, 28.0, 18.0, 17.0, 14.0, 11.0, 13.0, 10.0, 8.0, 8.0, 10.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006988525390625, -0.006762206554412842, -0.006535887718200684, -0.006309568881988525, -0.006083250045776367, -0.005856931209564209, -0.005630612373352051, -0.005404293537139893, -0.005177974700927734, -0.004951655864715576, -0.004725337028503418, -0.00449901819229126, -0.0042726993560791016, -0.004046380519866943, -0.003820061683654785, -0.003593742847442627, -0.0033674240112304688, -0.0031411051750183105, -0.0029147863388061523, -0.002688467502593994, -0.002462148666381836, -0.0022358298301696777, -0.0020095109939575195, -0.0017831921577453613, -0.0015568733215332031, -0.001330554485321045, -0.0011042356491088867, -0.0008779168128967285, -0.0006515979766845703, -0.0004252791404724121, -0.0001989603042602539, 2.7358531951904297e-05, 0.0002536773681640625, 0.0004799962043762207, 0.0007063150405883789, 0.0009326338768005371, 0.0011589527130126953, 0.0013852715492248535, 0.0016115903854370117, 0.00183790922164917, 0.002064228057861328, 0.0022905468940734863, 0.0025168657302856445, 0.0027431845664978027, 0.002969503402709961, 0.003195822238922119, 0.0034221410751342773, 0.0036484599113464355, 0.0038747787475585938, 0.004101097583770752, 0.00432741641998291, 0.004553735256195068, 0.0047800540924072266, 0.005006372928619385, 0.005232691764831543, 0.005459010601043701, 0.005685329437255859, 0.005911648273468018, 0.006137967109680176, 0.006364285945892334, 0.006590604782104492, 0.00681692361831665, 0.007043242454528809, 0.007269561290740967, 0.007495880126953125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 8.0, 4.0, 2.0, 13.0, 22.0, 18.0, 29.0, 29.0, 59.0, 65.0, 100.0, 134.0, 182.0, 237.0, 341.0, 382.0, 567.0, 727.0, 1112.0, 1558.0, 2369.0, 3375.0, 5665.0, 9853.0, 17872.0, 39353.0, 129636.0, 732077.0, 50368.0, 21704.0, 11285.0, 6700.0, 3870.0, 2628.0, 1803.0, 1169.0, 877.0, 577.0, 473.0, 353.0, 276.0, 183.0, 133.0, 106.0, 63.0, 58.0, 51.0, 22.0, 29.0, 12.0, 14.0, 12.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.01129913330078125, -0.010947585105895996, -0.010596036911010742, -0.010244488716125488, -0.009892940521240234, -0.00954139232635498, -0.009189844131469727, -0.008838295936584473, -0.008486747741699219, -0.008135199546813965, -0.007783651351928711, -0.007432103157043457, -0.007080554962158203, -0.006729006767272949, -0.006377458572387695, -0.006025910377502441, -0.0056743621826171875, -0.005322813987731934, -0.00497126579284668, -0.004619717597961426, -0.004268169403076172, -0.003916621208190918, -0.003565073013305664, -0.00321352481842041, -0.0028619766235351562, -0.0025104284286499023, -0.0021588802337646484, -0.0018073320388793945, -0.0014557838439941406, -0.0011042356491088867, -0.0007526874542236328, -0.0004011392593383789, -4.9591064453125e-05, 0.0003019571304321289, 0.0006535053253173828, 0.0010050535202026367, 0.0013566017150878906, 0.0017081499099731445, 0.0020596981048583984, 0.0024112462997436523, 0.0027627944946289062, 0.00311434268951416, 0.003465890884399414, 0.003817439079284668, 0.004168987274169922, 0.004520535469055176, 0.00487208366394043, 0.005223631858825684, 0.0055751800537109375, 0.005926728248596191, 0.006278276443481445, 0.006629824638366699, 0.006981372833251953, 0.007332921028137207, 0.007684469223022461, 0.008036017417907715, 0.008387565612792969, 0.008739113807678223, 0.009090662002563477, 0.00944221019744873, 0.009793758392333984, 0.010145306587219238, 0.010496854782104492, 0.010848402976989746, 0.011199951171875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 8.0, 3.0, 10.0, 5.0, 4.0, 14.0, 12.0, 9.0, 26.0, 18.0, 40.0, 22.0, 33.0, 42.0, 34.0, 50.0, 35.0, 39.0, 62.0, 57.0, 63.0, 44.0, 37.0, 55.0, 37.0, 42.0, 28.0, 25.0, 36.0, 15.0, 15.0, 28.0, 11.0, 14.0, 5.0, 9.0, 6.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-4.887580871582031e-06, -4.745088517665863e-06, -4.602596163749695e-06, -4.460103809833527e-06, -4.317611455917358e-06, -4.17511910200119e-06, -4.032626748085022e-06, -3.890134394168854e-06, -3.7476420402526855e-06, -3.6051496863365173e-06, -3.462657332420349e-06, -3.320164978504181e-06, -3.1776726245880127e-06, -3.0351802706718445e-06, -2.8926879167556763e-06, -2.750195562839508e-06, -2.60770320892334e-06, -2.4652108550071716e-06, -2.3227185010910034e-06, -2.180226147174835e-06, -2.037733793258667e-06, -1.8952414393424988e-06, -1.7527490854263306e-06, -1.6102567315101624e-06, -1.4677643775939941e-06, -1.325272023677826e-06, -1.1827796697616577e-06, -1.0402873158454895e-06, -8.977949619293213e-07, -7.553026080131531e-07, -6.128102540969849e-07, -4.7031790018081665e-07, -3.2782554626464844e-07, -1.8533319234848022e-07, -4.284083843231201e-08, 9.96515154838562e-08, 2.421438694000244e-07, 3.8463622331619263e-07, 5.271285772323608e-07, 6.69620931148529e-07, 8.121132850646973e-07, 9.546056389808655e-07, 1.0970979928970337e-06, 1.239590346813202e-06, 1.3820827007293701e-06, 1.5245750546455383e-06, 1.6670674085617065e-06, 1.8095597624778748e-06, 1.952052116394043e-06, 2.094544470310211e-06, 2.2370368242263794e-06, 2.3795291781425476e-06, 2.522021532058716e-06, 2.664513885974884e-06, 2.8070062398910522e-06, 2.9494985938072205e-06, 3.0919909477233887e-06, 3.234483301639557e-06, 3.376975655555725e-06, 3.5194680094718933e-06, 3.6619603633880615e-06, 3.8044527173042297e-06, 3.946945071220398e-06, 4.089437425136566e-06, 4.231929779052734e-06]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 5.0, 3.0, 3.0, 4.0, 8.0, 10.0, 11.0, 9.0, 20.0, 25.0, 49.0, 132.0, 310.0, 783.0, 2200.0, 6775.0, 26572.0, 163811.0, 797734.0, 36828.0, 8858.0, 2739.0, 960.0, 365.0, 134.0, 69.0, 38.0, 25.0, 11.0, 9.0, 8.0, 7.0, 6.0, 7.0, 7.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0232086181640625, -0.022547483444213867, -0.021886348724365234, -0.0212252140045166, -0.02056407928466797, -0.019902944564819336, -0.019241809844970703, -0.01858067512512207, -0.017919540405273438, -0.017258405685424805, -0.016597270965576172, -0.01593613624572754, -0.015275001525878906, -0.014613866806030273, -0.01395273208618164, -0.013291597366333008, -0.012630462646484375, -0.011969327926635742, -0.01130819320678711, -0.010647058486938477, -0.009985923767089844, -0.009324789047241211, -0.008663654327392578, -0.008002519607543945, -0.0073413848876953125, -0.00668025016784668, -0.006019115447998047, -0.005357980728149414, -0.004696846008300781, -0.0040357112884521484, -0.0033745765686035156, -0.002713441848754883, -0.00205230712890625, -0.0013911724090576172, -0.0007300376892089844, -6.890296936035156e-05, 0.0005922317504882812, 0.001253366470336914, 0.0019145011901855469, 0.0025756359100341797, 0.0032367706298828125, 0.0038979053497314453, 0.004559040069580078, 0.005220174789428711, 0.005881309509277344, 0.0065424442291259766, 0.007203578948974609, 0.007864713668823242, 0.008525848388671875, 0.009186983108520508, 0.00984811782836914, 0.010509252548217773, 0.011170387268066406, 0.011831521987915039, 0.012492656707763672, 0.013153791427612305, 0.013814926147460938, 0.01447606086730957, 0.015137195587158203, 0.015798330307006836, 0.01645946502685547, 0.0171205997467041, 0.017781734466552734, 0.018442869186401367, 0.01910400390625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 5.0, 1.0, 7.0, 8.0, 9.0, 10.0, 12.0, 15.0, 16.0, 18.0, 15.0, 13.0, 22.0, 18.0, 24.0, 18.0, 212.0, 348.0, 29.0, 20.0, 15.0, 25.0, 17.0, 19.0, 11.0, 13.0, 4.0, 7.0, 10.0, 12.0, 7.0, 5.0, 3.0, 6.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0019054412841796875, -0.001842200756072998, -0.0017789602279663086, -0.0017157196998596191, -0.0016524791717529297, -0.0015892386436462402, -0.0015259981155395508, -0.0014627575874328613, -0.0013995170593261719, -0.0013362765312194824, -0.001273036003112793, -0.0012097954750061035, -0.001146554946899414, -0.0010833144187927246, -0.0010200738906860352, -0.0009568333625793457, -0.0008935928344726562, -0.0008303523063659668, -0.0007671117782592773, -0.0007038712501525879, -0.0006406307220458984, -0.000577390193939209, -0.0005141496658325195, -0.0004509091377258301, -0.0003876686096191406, -0.00032442808151245117, -0.0002611875534057617, -0.00019794702529907227, -0.0001347064971923828, -7.146596908569336e-05, -8.225440979003906e-06, 5.501508712768555e-05, 0.000118255615234375, 0.00018149614334106445, 0.0002447366714477539, 0.00030797719955444336, 0.0003712177276611328, 0.00043445825576782227, 0.0004976987838745117, 0.0005609393119812012, 0.0006241798400878906, 0.0006874203681945801, 0.0007506608963012695, 0.000813901424407959, 0.0008771419525146484, 0.0009403824806213379, 0.0010036230087280273, 0.0010668635368347168, 0.0011301040649414062, 0.0011933445930480957, 0.0012565851211547852, 0.0013198256492614746, 0.001383066177368164, 0.0014463067054748535, 0.001509547233581543, 0.0015727877616882324, 0.0016360282897949219, 0.0016992688179016113, 0.0017625093460083008, 0.0018257498741149902, 0.0018889904022216797, 0.0019522309303283691, 0.0020154714584350586, 0.002078711986541748, 0.0021419525146484375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 15.0, 15.0, 17.0, 20.0, 38.0, 38.0, 42.0, 56.0, 95.0, 107.0, 125.0, 110.0, 68.0, 47.0, 29.0, 45.0, 24.0, 18.0, 11.0, 16.0, 10.0, 9.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014996398240327835, -0.014482976868748665, -0.01396955456584692, -0.013456132262945175, -0.012942710891366005, -0.012429289519786835, -0.01191586721688509, -0.011402444913983345, -0.010889023542404175, -0.010375602170825005, -0.00986217986792326, -0.009348757565021515, -0.008835336193442345, -0.008321914821863174, -0.00780849251896143, -0.007295070681720972, -0.0067816488444805145, -0.006268227007240057, -0.0057548051699995995, -0.005241383332759142, -0.004727961495518684, -0.004214539658278227, -0.0037011178210377693, -0.0031876959837973118, -0.0026742741465568542, -0.0021608523093163967, -0.0016474304720759392, -0.0011340086348354816, -0.0006205867975950241, -0.00010716496035456657, 0.00040625687688589096, 0.0009196787141263485, 0.0014330986887216568, 0.0019465205259621143, 0.002459942363202572, 0.0029733642004430294, 0.003486786037683487, 0.0040002078749239445, 0.004513629712164402, 0.0050270515494048595, 0.005540473386645317, 0.006053895223885775, 0.006567317061126232, 0.00708073889836669, 0.007594160735607147, 0.008107582107186317, 0.008621004410088062, 0.009134426712989807, 0.009647848084568977, 0.010161269456148148, 0.010674691759049892, 0.011188114061951637, 0.011701535433530807, 0.012214956805109978, 0.012728379108011723, 0.013241801410913467, 0.013755222782492638, 0.014268644154071808, 0.014782066456973553, 0.015295488759875298, 0.015808910131454468, 0.016322331503033638, 0.016835752874612808, 0.017349176108837128, 0.017862597480416298]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 4.0, 6.0, 6.0, 9.0, 15.0, 14.0, 16.0, 14.0, 26.0, 25.0, 25.0, 23.0, 31.0, 35.0, 36.0, 28.0, 33.0, 35.0, 37.0, 35.0, 26.0, 41.0, 51.0, 40.0, 32.0, 34.0, 24.0, 22.0, 27.0, 29.0, 29.0, 36.0, 15.0, 18.0, 15.0, 18.0, 16.0, 10.0, 5.0, 12.0, 8.0, 8.0, 5.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.009295455180108547, -0.008996021933853626, -0.00869658775627613, -0.00839715451002121, -0.008097720332443714, -0.007798287086188793, -0.007498853374272585, -0.007199419662356377, -0.006899985950440168, -0.00660055223852396, -0.006301118526607752, -0.006001684814691544, -0.005702251568436623, -0.005402817390859127, -0.005103384144604206, -0.004803950432687998, -0.0045045167207717896, -0.004205083008855581, -0.003905649296939373, -0.0036062158178538084, -0.0033067821059376, -0.003007348394021392, -0.0027079149149358273, -0.002408481203019619, -0.0021090474911034107, -0.0018096137791872025, -0.001510180183686316, -0.0012107465881854296, -0.0009113128762692213, -0.000611879164353013, -0.0003124455688521266, -1.3011973351240158e-05, 0.0002864226698875427, 0.0005858563235960901, 0.0008852899773046374, 0.0011847235728055239, 0.0014841572847217321, 0.0017835909966379404, 0.002083024475723505, 0.0023824581876397133, 0.0026818918995559216, 0.00298132561147213, 0.003280759323388338, 0.0035801928024739027, 0.003879626514390111, 0.004179060459136963, 0.004478493705391884, 0.004777927417308092, 0.0050773611292243, 0.005376794841140509, 0.005676228553056717, 0.005975662264972925, 0.0062750959768891335, 0.006574529223144054, 0.006873962935060263, 0.007173396646976471, 0.007472830358892679, 0.0077722640708088875, 0.008071697317063808, 0.008371131494641304, 0.008670564740896225, 0.00896999891847372, 0.009269432164728642, 0.009568866342306137, 0.009868299588561058]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 3.0, 8.0, 10.0, 30.0, 30.0, 42.0, 68.0, 85.0, 123.0, 185.0, 256.0, 426.0, 662.0, 1055.0, 1555.0, 2640.0, 4292.0, 7230.0, 12477.0, 22223.0, 40209.0, 78328.0, 169005.0, 317135.0, 196975.0, 89331.0, 45196.0, 24302.0, 13867.0, 7920.0, 4798.0, 3004.0, 1857.0, 1167.0, 646.0, 472.0, 324.0, 214.0, 133.0, 86.0, 57.0, 47.0, 15.0, 27.0, 11.0, 13.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.02069091796875, -0.020035982131958008, -0.019381046295166016, -0.018726110458374023, -0.01807117462158203, -0.01741623878479004, -0.016761302947998047, -0.016106367111206055, -0.015451431274414062, -0.01479649543762207, -0.014141559600830078, -0.013486623764038086, -0.012831687927246094, -0.012176752090454102, -0.01152181625366211, -0.010866880416870117, -0.010211944580078125, -0.009557008743286133, -0.00890207290649414, -0.008247137069702148, -0.007592201232910156, -0.006937265396118164, -0.006282329559326172, -0.00562739372253418, -0.0049724578857421875, -0.004317522048950195, -0.003662586212158203, -0.003007650375366211, -0.0023527145385742188, -0.0016977787017822266, -0.0010428428649902344, -0.0003879070281982422, 0.00026702880859375, 0.0009219646453857422, 0.0015769004821777344, 0.0022318363189697266, 0.0028867721557617188, 0.003541707992553711, 0.004196643829345703, 0.004851579666137695, 0.0055065155029296875, 0.00616145133972168, 0.006816387176513672, 0.007471323013305664, 0.008126258850097656, 0.008781194686889648, 0.00943613052368164, 0.010091066360473633, 0.010746002197265625, 0.011400938034057617, 0.01205587387084961, 0.012710809707641602, 0.013365745544433594, 0.014020681381225586, 0.014675617218017578, 0.01533055305480957, 0.015985488891601562, 0.016640424728393555, 0.017295360565185547, 0.01795029640197754, 0.01860523223876953, 0.019260168075561523, 0.019915103912353516, 0.020570039749145508, 0.0212249755859375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 8.0, 7.0, 9.0, 10.0, 14.0, 15.0, 9.0, 21.0, 25.0, 25.0, 24.0, 34.0, 41.0, 33.0, 26.0, 38.0, 49.0, 46.0, 37.0, 40.0, 46.0, 46.0, 42.0, 36.0, 40.0, 27.0, 33.0, 26.0, 34.0, 24.0, 23.0, 14.0, 17.0, 17.0, 6.0, 8.0, 15.0, 6.0, 6.0, 4.0, 9.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0062255859375, -0.006029009819030762, -0.0058324337005615234, -0.005635857582092285, -0.005439281463623047, -0.005242705345153809, -0.00504612922668457, -0.004849553108215332, -0.004652976989746094, -0.0044564008712768555, -0.004259824752807617, -0.004063248634338379, -0.0038666725158691406, -0.0036700963973999023, -0.003473520278930664, -0.0032769441604614258, -0.0030803680419921875, -0.0028837919235229492, -0.002687215805053711, -0.0024906396865844727, -0.0022940635681152344, -0.002097487449645996, -0.0019009113311767578, -0.0017043352127075195, -0.0015077590942382812, -0.001311182975769043, -0.0011146068572998047, -0.0009180307388305664, -0.0007214546203613281, -0.0005248785018920898, -0.00032830238342285156, -0.00013172626495361328, 6.4849853515625e-05, 0.0002614259719848633, 0.00045800209045410156, 0.0006545782089233398, 0.0008511543273925781, 0.0010477304458618164, 0.0012443065643310547, 0.001440882682800293, 0.0016374588012695312, 0.0018340349197387695, 0.002030611038208008, 0.002227187156677246, 0.0024237632751464844, 0.0026203393936157227, 0.002816915512084961, 0.0030134916305541992, 0.0032100677490234375, 0.0034066438674926758, 0.003603219985961914, 0.0037997961044311523, 0.003996372222900391, 0.004192948341369629, 0.004389524459838867, 0.0045861005783081055, 0.004782676696777344, 0.004979252815246582, 0.00517582893371582, 0.005372405052185059, 0.005568981170654297, 0.005765557289123535, 0.0059621334075927734, 0.006158709526062012, 0.00635528564453125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 6.0, 3.0, 7.0, 2.0, 8.0, 7.0, 12.0, 11.0, 28.0, 37.0, 45.0, 52.0, 111.0, 202.0, 500.0, 1196.0, 3050.0, 8395.0, 27242.0, 98839.0, 400957.0, 376997.0, 92131.0, 25759.0, 8016.0, 2798.0, 1078.0, 481.0, 228.0, 107.0, 70.0, 36.0, 29.0, 27.0, 25.0, 20.0, 9.0, 8.0, 6.0, 3.0, 8.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.031768798828125, -0.030805349349975586, -0.029841899871826172, -0.028878450393676758, -0.027915000915527344, -0.02695155143737793, -0.025988101959228516, -0.0250246524810791, -0.024061203002929688, -0.023097753524780273, -0.02213430404663086, -0.021170854568481445, -0.02020740509033203, -0.019243955612182617, -0.018280506134033203, -0.01731705665588379, -0.016353607177734375, -0.015390157699584961, -0.014426708221435547, -0.013463258743286133, -0.012499809265136719, -0.011536359786987305, -0.01057291030883789, -0.009609460830688477, -0.008646011352539062, -0.0076825618743896484, -0.006719112396240234, -0.00575566291809082, -0.004792213439941406, -0.003828763961791992, -0.002865314483642578, -0.001901865005493164, -0.00093841552734375, 2.5033950805664062e-05, 0.0009884834289550781, 0.0019519329071044922, 0.0029153823852539062, 0.0038788318634033203, 0.004842281341552734, 0.0058057308197021484, 0.0067691802978515625, 0.0077326297760009766, 0.00869607925415039, 0.009659528732299805, 0.010622978210449219, 0.011586427688598633, 0.012549877166748047, 0.013513326644897461, 0.014476776123046875, 0.015440225601196289, 0.016403675079345703, 0.017367124557495117, 0.01833057403564453, 0.019294023513793945, 0.02025747299194336, 0.021220922470092773, 0.022184371948242188, 0.0231478214263916, 0.024111270904541016, 0.02507472038269043, 0.026038169860839844, 0.027001619338989258, 0.027965068817138672, 0.028928518295288086, 0.0298919677734375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 14.0, 13.0, 18.0, 12.0, 14.0, 23.0, 23.0, 20.0, 21.0, 25.0, 25.0, 40.0, 41.0, 36.0, 39.0, 54.0, 39.0, 45.0, 35.0, 37.0, 43.0, 31.0, 52.0, 44.0, 34.0, 23.0, 24.0, 25.0, 25.0, 31.0, 17.0, 12.0, 10.0, 9.0, 8.0, 6.0, 4.0, 7.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00478363037109375, -0.004623830318450928, -0.0044640302658081055, -0.004304230213165283, -0.004144430160522461, -0.003984630107879639, -0.0038248300552368164, -0.003665030002593994, -0.003505229949951172, -0.0033454298973083496, -0.0031856298446655273, -0.003025829792022705, -0.002866029739379883, -0.0027062296867370605, -0.0025464296340942383, -0.002386629581451416, -0.0022268295288085938, -0.0020670294761657715, -0.0019072294235229492, -0.001747429370880127, -0.0015876293182373047, -0.0014278292655944824, -0.0012680292129516602, -0.0011082291603088379, -0.0009484291076660156, -0.0007886290550231934, -0.0006288290023803711, -0.00046902894973754883, -0.00030922889709472656, -0.0001494288444519043, 1.0371208190917969e-05, 0.00017017126083374023, 0.0003299713134765625, 0.0004897713661193848, 0.000649571418762207, 0.0008093714714050293, 0.0009691715240478516, 0.0011289715766906738, 0.001288771629333496, 0.0014485716819763184, 0.0016083717346191406, 0.0017681717872619629, 0.0019279718399047852, 0.0020877718925476074, 0.0022475719451904297, 0.002407371997833252, 0.0025671720504760742, 0.0027269721031188965, 0.0028867721557617188, 0.003046572208404541, 0.0032063722610473633, 0.0033661723136901855, 0.003525972366333008, 0.00368577241897583, 0.0038455724716186523, 0.004005372524261475, 0.004165172576904297, 0.004324972629547119, 0.004484772682189941, 0.004644572734832764, 0.004804372787475586, 0.004964172840118408, 0.0051239728927612305, 0.005283772945404053, 0.005443572998046875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 5.0, 7.0, 6.0, 16.0, 12.0, 13.0, 30.0, 30.0, 48.0, 85.0, 116.0, 160.0, 264.0, 379.0, 660.0, 1157.0, 1999.0, 4205.0, 9742.0, 27338.0, 117127.0, 680416.0, 151355.0, 32160.0, 11071.0, 4765.0, 2302.0, 1174.0, 650.0, 418.0, 270.0, 160.0, 128.0, 84.0, 59.0, 40.0, 24.0, 19.0, 17.0, 14.0, 9.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005273818969726562, -0.0005095452070236206, -0.000491708517074585, -0.0004738718271255493, -0.00045603513717651367, -0.00043819844722747803, -0.0004203617572784424, -0.00040252506732940674, -0.0003846883773803711, -0.00036685168743133545, -0.0003490149974822998, -0.00033117830753326416, -0.0003133416175842285, -0.00029550492763519287, -0.0002776682376861572, -0.0002598315477371216, -0.00024199485778808594, -0.0002241581678390503, -0.00020632147789001465, -0.000188484787940979, -0.00017064809799194336, -0.00015281140804290771, -0.00013497471809387207, -0.00011713802814483643, -9.930133819580078e-05, -8.146464824676514e-05, -6.362795829772949e-05, -4.579126834869385e-05, -2.7954578399658203e-05, -1.0117888450622559e-05, 7.718801498413086e-06, 2.555549144744873e-05, 4.3392181396484375e-05, 6.122887134552002e-05, 7.906556129455566e-05, 9.690225124359131e-05, 0.00011473894119262695, 0.0001325756311416626, 0.00015041232109069824, 0.0001682490110397339, 0.00018608570098876953, 0.00020392239093780518, 0.00022175908088684082, 0.00023959577083587646, 0.0002574324607849121, 0.00027526915073394775, 0.0002931058406829834, 0.00031094253063201904, 0.0003287792205810547, 0.00034661591053009033, 0.000364452600479126, 0.0003822892904281616, 0.00040012598037719727, 0.0004179626703262329, 0.00043579936027526855, 0.0004536360502243042, 0.00047147274017333984, 0.0004893094301223755, 0.0005071461200714111, 0.0005249828100204468, 0.0005428194999694824, 0.0005606561899185181, 0.0005784928798675537, 0.0005963295698165894, 0.000614166259765625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 2.0, 6.0, 10.0, 8.0, 11.0, 10.0, 21.0, 30.0, 44.0, 55.0, 72.0, 93.0, 125.0, 153.0, 82.0, 76.0, 60.0, 40.0, 14.0, 33.0, 16.0, 9.0, 4.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4373016357421875e-06, -6.248243153095245e-06, -6.059184670448303e-06, -5.870126187801361e-06, -5.681067705154419e-06, -5.492009222507477e-06, -5.302950739860535e-06, -5.1138922572135925e-06, -4.92483377456665e-06, -4.735775291919708e-06, -4.546716809272766e-06, -4.357658326625824e-06, -4.168599843978882e-06, -3.97954136133194e-06, -3.7904828786849976e-06, -3.6014243960380554e-06, -3.4123659133911133e-06, -3.223307430744171e-06, -3.034248948097229e-06, -2.845190465450287e-06, -2.6561319828033447e-06, -2.4670735001564026e-06, -2.2780150175094604e-06, -2.0889565348625183e-06, -1.8998980522155762e-06, -1.710839569568634e-06, -1.521781086921692e-06, -1.3327226042747498e-06, -1.1436641216278076e-06, -9.546056389808655e-07, -7.655471563339233e-07, -5.764886736869812e-07, -3.8743019104003906e-07, -1.9837170839309692e-07, -9.313225746154785e-09, 1.7974525690078735e-07, 3.688037395477295e-07, 5.578622221946716e-07, 7.469207048416138e-07, 9.359791874885559e-07, 1.125037670135498e-06, 1.3140961527824402e-06, 1.5031546354293823e-06, 1.6922131180763245e-06, 1.8812716007232666e-06, 2.0703300833702087e-06, 2.259388566017151e-06, 2.448447048664093e-06, 2.637505531311035e-06, 2.8265640139579773e-06, 3.0156224966049194e-06, 3.2046809792518616e-06, 3.3937394618988037e-06, 3.582797944545746e-06, 3.771856427192688e-06, 3.96091490983963e-06, 4.149973392486572e-06, 4.339031875133514e-06, 4.5280903577804565e-06, 4.717148840427399e-06, 4.906207323074341e-06, 5.095265805721283e-06, 5.284324288368225e-06, 5.473382771015167e-06, 5.662441253662109e-06]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 3.0, 8.0, 18.0, 19.0, 31.0, 61.0, 64.0, 93.0, 180.0, 291.0, 543.0, 1133.0, 2291.0, 5673.0, 15668.0, 52330.0, 241837.0, 549828.0, 127961.0, 32498.0, 10443.0, 4014.0, 1651.0, 818.0, 453.0, 233.0, 136.0, 104.0, 59.0, 38.0, 25.0, 9.0, 15.0, 9.0, 6.0, 3.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00025153160095214844, -0.0002429485321044922, -0.00023436546325683594, -0.0002257823944091797, -0.00021719932556152344, -0.0002086162567138672, -0.00020003318786621094, -0.0001914501190185547, -0.00018286705017089844, -0.0001742839813232422, -0.00016570091247558594, -0.0001571178436279297, -0.00014853477478027344, -0.0001399517059326172, -0.00013136863708496094, -0.0001227855682373047, -0.00011420249938964844, -0.00010561943054199219, -9.703636169433594e-05, -8.845329284667969e-05, -7.987022399902344e-05, -7.128715515136719e-05, -6.270408630371094e-05, -5.412101745605469e-05, -4.553794860839844e-05, -3.695487976074219e-05, -2.8371810913085938e-05, -1.9788742065429688e-05, -1.1205673217773438e-05, -2.6226043701171875e-06, 5.9604644775390625e-06, 1.4543533325195312e-05, 2.3126602172851562e-05, 3.170967102050781e-05, 4.029273986816406e-05, 4.887580871582031e-05, 5.745887756347656e-05, 6.604194641113281e-05, 7.462501525878906e-05, 8.320808410644531e-05, 9.179115295410156e-05, 0.00010037422180175781, 0.00010895729064941406, 0.00011754035949707031, 0.00012612342834472656, 0.0001347064971923828, 0.00014328956604003906, 0.0001518726348876953, 0.00016045570373535156, 0.0001690387725830078, 0.00017762184143066406, 0.0001862049102783203, 0.00019478797912597656, 0.0002033710479736328, 0.00021195411682128906, 0.0002205371856689453, 0.00022912025451660156, 0.0002377033233642578, 0.00024628639221191406, 0.0002548694610595703, 0.00026345252990722656, 0.0002720355987548828, 0.00028061866760253906, 0.0002892017364501953, 0.00029778480529785156]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 5.0, 5.0, 4.0, 10.0, 22.0, 30.0, 22.0, 29.0, 28.0, 62.0, 58.0, 58.0, 78.0, 86.0, 75.0, 80.0, 67.0, 68.0, 35.0, 40.0, 38.0, 32.0, 19.0, 13.0, 10.0, 11.0, 2.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41942024230957e-05, -6.213411688804626e-05, -6.0074031352996826e-05, -5.801394581794739e-05, -5.595386028289795e-05, -5.389377474784851e-05, -5.183368921279907e-05, -4.9773603677749634e-05, -4.7713518142700195e-05, -4.565343260765076e-05, -4.359334707260132e-05, -4.153326153755188e-05, -3.947317600250244e-05, -3.7413090467453e-05, -3.5353004932403564e-05, -3.3292919397354126e-05, -3.123283386230469e-05, -2.917274832725525e-05, -2.711266279220581e-05, -2.5052577257156372e-05, -2.2992491722106934e-05, -2.0932406187057495e-05, -1.8872320652008057e-05, -1.6812235116958618e-05, -1.475214958190918e-05, -1.2692064046859741e-05, -1.0631978511810303e-05, -8.571892976760864e-06, -6.511807441711426e-06, -4.451721906661987e-06, -2.391636371612549e-06, -3.3155083656311035e-07, 1.7285346984863281e-06, 3.7886202335357666e-06, 5.848705768585205e-06, 7.908791303634644e-06, 9.968876838684082e-06, 1.202896237373352e-05, 1.4089047908782959e-05, 1.6149133443832397e-05, 1.8209218978881836e-05, 2.0269304513931274e-05, 2.2329390048980713e-05, 2.438947558403015e-05, 2.644956111907959e-05, 2.850964665412903e-05, 3.056973218917847e-05, 3.2629817724227905e-05, 3.4689903259277344e-05, 3.674998879432678e-05, 3.881007432937622e-05, 4.087015986442566e-05, 4.29302453994751e-05, 4.4990330934524536e-05, 4.7050416469573975e-05, 4.911050200462341e-05, 5.117058753967285e-05, 5.323067307472229e-05, 5.529075860977173e-05, 5.735084414482117e-05, 5.9410929679870605e-05, 6.147101521492004e-05, 6.353110074996948e-05, 6.559118628501892e-05, 6.765127182006836e-05]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 8.0, 7.0, 19.0, 41.0, 75.0, 142.0, 275.0, 216.0, 108.0, 55.0, 26.0, 26.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03518841415643692, -0.03428130969405174, -0.033374201506376266, -0.03246709704399109, -0.03155998885631561, -0.030652884393930435, -0.02974577806890011, -0.02883867174386978, -0.027931567281484604, -0.027024460956454277, -0.02611735463142395, -0.025210250169038773, -0.024303143844008446, -0.02339603751897812, -0.022488931193947792, -0.021581824868917465, -0.02067471854388714, -0.01976761221885681, -0.018860505893826485, -0.017953399568796158, -0.01704629510641098, -0.016139188781380653, -0.015232082456350327, -0.01432497613132, -0.013417870737612247, -0.01251076441258192, -0.011603659018874168, -0.010696552693843842, -0.009789446368813515, -0.008882340975105762, -0.007975234650075436, -0.007068128790706396, -0.006161022931337357, -0.005253917071968317, -0.0043468112125992775, -0.0034397048875689507, -0.002532599028199911, -0.0016254931688308716, -0.0007183868438005447, 0.0001887190155684948, 0.0010958248749375343, 0.002002930734306574, 0.002910036826506257, 0.0038171429187059402, 0.00472424877807498, 0.005631354637444019, 0.006538460962474346, 0.007445566821843386, 0.008352672681212425, 0.009259779006242752, 0.010166884399950504, 0.011073990724980831, 0.011981096118688583, 0.01288820244371891, 0.013795308768749237, 0.014702415093779564, 0.015609520487487316, 0.01651662588119507, 0.017423732206225395, 0.018330838531255722, 0.01923794485628605, 0.020145051181316376, 0.021052155643701553, 0.02195926196873188, 0.022866368293762207]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 5.0, 13.0, 8.0, 10.0, 14.0, 13.0, 17.0, 18.0, 24.0, 21.0, 27.0, 43.0, 27.0, 34.0, 31.0, 33.0, 48.0, 41.0, 43.0, 33.0, 42.0, 43.0, 51.0, 39.0, 35.0, 36.0, 22.0, 34.0, 24.0, 20.0, 23.0, 19.0, 17.0, 19.0, 14.0, 10.0, 8.0, 7.0, 13.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.007837858982384205, -0.007600145880132914, -0.00736243324354291, -0.007124720141291618, -0.006887007504701614, -0.006649294402450323, -0.006411581300199032, -0.006173868663609028, -0.005936156027019024, -0.005698442924767733, -0.005460730288177729, -0.005223017185926437, -0.004985304549336433, -0.004747591447085142, -0.004509878344833851, -0.004272165708243847, -0.004034452605992556, -0.003796739736571908, -0.0035590268671512604, -0.003321313764899969, -0.003083601128309965, -0.002845888026058674, -0.0026081751566380262, -0.0023704622872173786, -0.002132749417796731, -0.0018950365483760834, -0.0016573236789554358, -0.0014196106931194663, -0.0011818978236988187, -0.0009441849542781711, -0.0007064719684422016, -0.000468759099021554, -0.00023104576393961906, 6.6671345848590136e-06, 0.0002443800331093371, 0.0004820929607376456, 0.0007198058301582932, 0.0009575186995789409, 0.0011952316854149103, 0.001432944554835558, 0.0016706574242562056, 0.0019083702936768532, 0.002146083163097501, 0.0023837960325181484, 0.0026215091347694397, 0.0028592217713594437, 0.003096934873610735, 0.0033346477430313826, 0.00357236061245203, 0.003810073481872678, 0.004047786351293325, 0.004285499453544617, 0.004523212090134621, 0.004760925192385912, 0.004998638294637203, 0.005236350931227207, 0.005474063567817211, 0.005711776670068502, 0.005949489306658506, 0.006187202408909798, 0.006424915045499802, 0.006662628147751093, 0.006900341250002384, 0.007138053886592388, 0.007375766988843679]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0, 10.0, 20.0, 17.0, 30.0, 29.0, 46.0, 45.0, 57.0, 67.0, 88.0, 130.0, 191.0, 277.0, 410.0, 648.0, 1261.0, 2411.0, 11174.0, 4115390.0, 54746.0, 3309.0, 1533.0, 756.0, 508.0, 279.0, 166.0, 163.0, 113.0, 74.0, 52.0, 68.0, 26.0, 32.0, 29.0, 24.0, 17.0, 18.0, 11.0, 11.0, 5.0, 7.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.021820068359375, -0.021108388900756836, -0.020396709442138672, -0.019685029983520508, -0.018973350524902344, -0.01826167106628418, -0.017549991607666016, -0.01683831214904785, -0.016126632690429688, -0.015414953231811523, -0.01470327377319336, -0.013991594314575195, -0.013279914855957031, -0.012568235397338867, -0.011856555938720703, -0.011144876480102539, -0.010433197021484375, -0.009721517562866211, -0.009009838104248047, -0.008298158645629883, -0.007586479187011719, -0.006874799728393555, -0.006163120269775391, -0.0054514408111572266, -0.0047397613525390625, -0.0040280818939208984, -0.0033164024353027344, -0.0026047229766845703, -0.0018930435180664062, -0.0011813640594482422, -0.0004696846008300781, 0.00024199485778808594, 0.00095367431640625, 0.001665353775024414, 0.002377033233642578, 0.003088712692260742, 0.0038003921508789062, 0.00451207160949707, 0.005223751068115234, 0.0059354305267333984, 0.0066471099853515625, 0.0073587894439697266, 0.00807046890258789, 0.008782148361206055, 0.009493827819824219, 0.010205507278442383, 0.010917186737060547, 0.011628866195678711, 0.012340545654296875, 0.013052225112915039, 0.013763904571533203, 0.014475584030151367, 0.015187263488769531, 0.015898942947387695, 0.01661062240600586, 0.017322301864624023, 0.018033981323242188, 0.01874566078186035, 0.019457340240478516, 0.02016901969909668, 0.020880699157714844, 0.021592378616333008, 0.022304058074951172, 0.023015737533569336, 0.0237274169921875]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 5.0, 3.0, 9.0, 7.0, 8.0, 12.0, 12.0, 15.0, 14.0, 19.0, 21.0, 27.0, 29.0, 32.0, 37.0, 27.0, 41.0, 38.0, 41.0, 19.0, 39.0, 39.0, 53.0, 41.0, 47.0, 44.0, 37.0, 29.0, 33.0, 33.0, 21.0, 20.0, 18.0, 21.0, 19.0, 19.0, 11.0, 14.0, 8.0, 6.0, 9.0, 7.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005184173583984375, -0.005014300346374512, -0.0048444271087646484, -0.004674553871154785, -0.004504680633544922, -0.004334807395935059, -0.004164934158325195, -0.003995060920715332, -0.0038251876831054688, -0.0036553144454956055, -0.003485441207885742, -0.003315567970275879, -0.0031456947326660156, -0.0029758214950561523, -0.002805948257446289, -0.0026360750198364258, -0.0024662017822265625, -0.0022963285446166992, -0.002126455307006836, -0.0019565820693969727, -0.0017867088317871094, -0.001616835594177246, -0.0014469623565673828, -0.0012770891189575195, -0.0011072158813476562, -0.000937342643737793, -0.0007674694061279297, -0.0005975961685180664, -0.0004277229309082031, -0.00025784969329833984, -8.797645568847656e-05, 8.189678192138672e-05, 0.00025177001953125, 0.0004216432571411133, 0.0005915164947509766, 0.0007613897323608398, 0.0009312629699707031, 0.0011011362075805664, 0.0012710094451904297, 0.001440882682800293, 0.0016107559204101562, 0.0017806291580200195, 0.0019505023956298828, 0.002120375633239746, 0.0022902488708496094, 0.0024601221084594727, 0.002629995346069336, 0.0027998685836791992, 0.0029697418212890625, 0.0031396150588989258, 0.003309488296508789, 0.0034793615341186523, 0.0036492347717285156, 0.003819108009338379, 0.003988981246948242, 0.0041588544845581055, 0.004328727722167969, 0.004498600959777832, 0.004668474197387695, 0.004838347434997559, 0.005008220672607422, 0.005178093910217285, 0.0053479671478271484, 0.005517840385437012, 0.005687713623046875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 6.0, 9.0, 10.0, 14.0, 22.0, 31.0, 48.0, 63.0, 128.0, 302.0, 638.0, 1580.0, 4175.0, 25254.0, 4129624.0, 25310.0, 4279.0, 1539.0, 627.0, 266.0, 141.0, 69.0, 50.0, 26.0, 24.0, 15.0, 6.0, 6.0, 10.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0239715576171875, -0.02303147315979004, -0.022091388702392578, -0.021151304244995117, -0.020211219787597656, -0.019271135330200195, -0.018331050872802734, -0.017390966415405273, -0.016450881958007812, -0.015510797500610352, -0.01457071304321289, -0.01363062858581543, -0.012690544128417969, -0.011750459671020508, -0.010810375213623047, -0.009870290756225586, -0.008930206298828125, -0.007990121841430664, -0.007050037384033203, -0.006109952926635742, -0.005169868469238281, -0.00422978401184082, -0.0032896995544433594, -0.0023496150970458984, -0.0014095306396484375, -0.00046944618225097656, 0.0004706382751464844, 0.0014107227325439453, 0.0023508071899414062, 0.003290891647338867, 0.004230976104736328, 0.005171060562133789, 0.00611114501953125, 0.007051229476928711, 0.007991313934326172, 0.008931398391723633, 0.009871482849121094, 0.010811567306518555, 0.011751651763916016, 0.012691736221313477, 0.013631820678710938, 0.014571905136108398, 0.01551198959350586, 0.01645207405090332, 0.01739215850830078, 0.018332242965698242, 0.019272327423095703, 0.020212411880493164, 0.021152496337890625, 0.022092580795288086, 0.023032665252685547, 0.023972749710083008, 0.02491283416748047, 0.02585291862487793, 0.02679300308227539, 0.02773308753967285, 0.028673171997070312, 0.029613256454467773, 0.030553340911865234, 0.031493425369262695, 0.032433509826660156, 0.03337359428405762, 0.03431367874145508, 0.03525376319885254, 0.03619384765625]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 19.0, 66.0, 217.0, 3103.0, 492.0, 106.0, 28.0, 8.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.005985260009765625, -0.005848288536071777, -0.00571131706237793, -0.005574345588684082, -0.005437374114990234, -0.005300402641296387, -0.005163431167602539, -0.005026459693908691, -0.004889488220214844, -0.004752516746520996, -0.0046155452728271484, -0.004478573799133301, -0.004341602325439453, -0.0042046308517456055, -0.004067659378051758, -0.00393068790435791, -0.0037937164306640625, -0.003656744956970215, -0.003519773483276367, -0.0033828020095825195, -0.003245830535888672, -0.0031088590621948242, -0.0029718875885009766, -0.002834916114807129, -0.0026979446411132812, -0.0025609731674194336, -0.002424001693725586, -0.0022870302200317383, -0.0021500587463378906, -0.002013087272644043, -0.0018761157989501953, -0.0017391443252563477, -0.0016021728515625, -0.0014652013778686523, -0.0013282299041748047, -0.001191258430480957, -0.0010542869567871094, -0.0009173154830932617, -0.0007803440093994141, -0.0006433725357055664, -0.0005064010620117188, -0.0003694295883178711, -0.00023245811462402344, -9.548664093017578e-05, 4.1484832763671875e-05, 0.00017845630645751953, 0.0003154277801513672, 0.00045239925384521484, 0.0005893707275390625, 0.0007263422012329102, 0.0008633136749267578, 0.0010002851486206055, 0.0011372566223144531, 0.0012742280960083008, 0.0014111995697021484, 0.001548171043395996, 0.0016851425170898438, 0.0018221139907836914, 0.001959085464477539, 0.0020960569381713867, 0.0022330284118652344, 0.002369999885559082, 0.0025069713592529297, 0.0026439428329467773, 0.002780914306640625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 8.0, 9.0, 8.0, 15.0, 17.0, 32.0, 33.0, 56.0, 56.0, 76.0, 109.0, 150.0, 98.0, 88.0, 68.0, 33.0, 36.0, 31.0, 29.0, 10.0, 9.0, 7.0, 6.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007801873609423637, -0.007496330887079239, -0.007190787699073553, -0.006885244976729155, -0.006579701788723469, -0.00627415906637907, -0.005968616344034672, -0.005663073621690273, -0.0053575304336845875, -0.005051987711340189, -0.004746444523334503, -0.004440901800990105, -0.004135359078645706, -0.0038298158906400204, -0.003524273168295622, -0.0032187302131205797, -0.0029131872579455376, -0.0026076443027704954, -0.0023021013475954533, -0.0019965586252510548, -0.0016910156700760126, -0.0013854727149009705, -0.0010799298761412501, -0.0007743870373815298, -0.00046884408220648766, -0.00016330118523910642, 0.00014224171172827482, 0.00044778460869565606, 0.0007533275056630373, 0.0010588704608380795, 0.0013644132995977998, 0.00166995613835752, 0.0019754981622099876, 0.00228104111738503, 0.002586584072560072, 0.0028921267949044704, 0.0031976697500795126, 0.0035032127052545547, 0.0038087554275989532, 0.004114298149943352, 0.0044198413379490376, 0.004725384060293436, 0.005030927248299122, 0.00533646997064352, 0.005642012692987919, 0.005947555880993605, 0.006253098603338003, 0.006558641791343689, 0.0068641845136880875, 0.007169727236032486, 0.007475270424038172, 0.00778081314638257, 0.008086356334388256, 0.008391899056732655, 0.008697441779077053, 0.009002984501421452, 0.009308528155088425, 0.009614070877432823, 0.009919613599777222, 0.010225157253444195, 0.010530699975788593, 0.010836242698132992, 0.01114178542047739, 0.011447328142821789, 0.011752870865166187]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 6.0, 7.0, 5.0, 8.0, 15.0, 16.0, 14.0, 11.0, 22.0, 19.0, 23.0, 28.0, 42.0, 29.0, 22.0, 38.0, 37.0, 39.0, 58.0, 34.0, 41.0, 49.0, 41.0, 34.0, 45.0, 31.0, 36.0, 29.0, 37.0, 19.0, 22.0, 18.0, 23.0, 15.0, 20.0, 17.0, 15.0, 9.0, 5.0, 7.0, 2.0, 7.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004970081150531769, -0.004801404196768999, -0.004632727243006229, -0.00446405028924346, -0.00429537333548069, -0.004126696847379208, -0.003958019893616438, -0.003789342939853668, -0.0036206659860908985, -0.003451989032328129, -0.003283312078565359, -0.003114635357633233, -0.0029459584038704634, -0.0027772814501076937, -0.0026086047291755676, -0.002439927775412798, -0.0022712508216500282, -0.0021025738678872585, -0.0019338970305398107, -0.0017652201931923628, -0.001596543239429593, -0.0014278662856668234, -0.0012591894483193755, -0.0010905126109719276, -0.0009218356572091579, -0.0007531587616540492, -0.0005844818660989404, -0.0004158049705438316, -0.0002471280749887228, -7.845117943361402e-05, 9.022571612149477e-05, 0.00025890255346894264, 0.00042757950723171234, 0.0005962564027868211, 0.0007649332983419299, 0.0009336101938970387, 0.0011022870894521475, 0.0012709640432149172, 0.001439640880562365, 0.001608317717909813, 0.0017769946716725826, 0.0019456716254353523, 0.002114348579198122, 0.002283025300130248, 0.0024517022538930178, 0.0026203792076557875, 0.0027890559285879135, 0.002957732882350683, 0.003126409836113453, 0.0032950867898762226, 0.0034637637436389923, 0.0036324404645711184, 0.003801117418333888, 0.003969794139266014, 0.004138471093028784, 0.0043071480467915535, 0.004475825000554323, 0.004644501954317093, 0.004813178908079863, 0.004981855861842632, 0.005150532349944115, 0.005319209303706884, 0.005487886257469654, 0.005656563211232424, 0.0058252401649951935]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 7.0, 8.0, 15.0, 15.0, 32.0, 38.0, 64.0, 76.0, 99.0, 152.0, 210.0, 325.0, 429.0, 675.0, 1066.0, 1491.0, 2353.0, 3649.0, 6050.0, 9636.0, 15728.0, 26367.0, 45323.0, 79768.0, 149758.0, 261661.0, 197590.0, 103999.0, 57379.0, 32721.0, 19543.0, 11846.0, 7349.0, 4593.0, 2853.0, 1895.0, 1203.0, 786.0, 514.0, 352.0, 278.0, 224.0, 127.0, 99.0, 64.0, 42.0, 40.0, 25.0, 17.0, 12.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00498199462890625, -0.004829704761505127, -0.004677414894104004, -0.004525125026702881, -0.004372835159301758, -0.004220545291900635, -0.004068255424499512, -0.003915965557098389, -0.0037636756896972656, -0.0036113858222961426, -0.0034590959548950195, -0.0033068060874938965, -0.0031545162200927734, -0.0030022263526916504, -0.0028499364852905273, -0.0026976466178894043, -0.0025453567504882812, -0.002393066883087158, -0.002240777015686035, -0.002088487148284912, -0.001936197280883789, -0.001783907413482666, -0.001631617546081543, -0.00147932767868042, -0.0013270378112792969, -0.0011747479438781738, -0.0010224580764770508, -0.0008701682090759277, -0.0007178783416748047, -0.0005655884742736816, -0.0004132986068725586, -0.00026100873947143555, -0.0001087188720703125, 4.357099533081055e-05, 0.0001958608627319336, 0.00034815073013305664, 0.0005004405975341797, 0.0006527304649353027, 0.0008050203323364258, 0.0009573101997375488, 0.0011096000671386719, 0.001261889934539795, 0.001414179801940918, 0.001566469669342041, 0.001718759536743164, 0.0018710494041442871, 0.00202333927154541, 0.002175629138946533, 0.0023279190063476562, 0.0024802088737487793, 0.0026324987411499023, 0.0027847886085510254, 0.0029370784759521484, 0.0030893683433532715, 0.0032416582107543945, 0.0033939480781555176, 0.0035462379455566406, 0.0036985278129577637, 0.0038508176803588867, 0.00400310754776001, 0.004155397415161133, 0.004307687282562256, 0.004459977149963379, 0.004612267017364502, 0.004764556884765625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 3.0, 10.0, 9.0, 14.0, 7.0, 13.0, 12.0, 16.0, 23.0, 19.0, 26.0, 34.0, 24.0, 24.0, 27.0, 25.0, 43.0, 45.0, 41.0, 42.0, 42.0, 39.0, 45.0, 46.0, 37.0, 30.0, 32.0, 26.0, 33.0, 32.0, 15.0, 22.0, 24.0, 23.0, 14.0, 10.0, 9.0, 12.0, 12.0, 6.0, 4.0, 8.0, 6.0, 4.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.005092620849609375, -0.0049367547035217285, -0.004780888557434082, -0.0046250224113464355, -0.004469156265258789, -0.004313290119171143, -0.004157423973083496, -0.00400155782699585, -0.003845691680908203, -0.0036898255348205566, -0.00353395938873291, -0.0033780932426452637, -0.003222227096557617, -0.0030663609504699707, -0.0029104948043823242, -0.0027546286582946777, -0.0025987625122070312, -0.0024428963661193848, -0.0022870302200317383, -0.002131164073944092, -0.0019752979278564453, -0.0018194317817687988, -0.0016635656356811523, -0.0015076994895935059, -0.0013518333435058594, -0.0011959671974182129, -0.0010401010513305664, -0.0008842349052429199, -0.0007283687591552734, -0.000572502613067627, -0.00041663646697998047, -0.000260770320892334, -0.0001049041748046875, 5.0961971282958984e-05, 0.00020682811737060547, 0.00036269426345825195, 0.0005185604095458984, 0.0006744265556335449, 0.0008302927017211914, 0.0009861588478088379, 0.0011420249938964844, 0.0012978911399841309, 0.0014537572860717773, 0.0016096234321594238, 0.0017654895782470703, 0.0019213557243347168, 0.0020772218704223633, 0.0022330880165100098, 0.0023889541625976562, 0.0025448203086853027, 0.0027006864547729492, 0.0028565526008605957, 0.003012418746948242, 0.0031682848930358887, 0.003324151039123535, 0.0034800171852111816, 0.003635883331298828, 0.0037917494773864746, 0.003947615623474121, 0.004103481769561768, 0.004259347915649414, 0.0044152140617370605, 0.004571080207824707, 0.0047269463539123535, 0.0048828125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 7.0, 12.0, 15.0, 20.0, 25.0, 33.0, 32.0, 60.0, 78.0, 131.0, 188.0, 277.0, 433.0, 702.0, 1099.0, 2007.0, 3611.0, 7412.0, 16702.0, 43762.0, 148910.0, 566415.0, 172783.0, 48395.0, 18379.0, 7842.0, 3808.0, 2149.0, 1199.0, 703.0, 425.0, 299.0, 196.0, 119.0, 83.0, 71.0, 49.0, 33.0, 26.0, 18.0, 11.0, 8.0, 11.0, 3.0, 5.0, 9.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007190704345703125, -0.006947338581085205, -0.006703972816467285, -0.006460607051849365, -0.006217241287231445, -0.005973875522613525, -0.0057305097579956055, -0.0054871439933776855, -0.005243778228759766, -0.005000412464141846, -0.004757046699523926, -0.004513680934906006, -0.004270315170288086, -0.004026949405670166, -0.003783583641052246, -0.003540217876434326, -0.0032968521118164062, -0.0030534863471984863, -0.0028101205825805664, -0.0025667548179626465, -0.0023233890533447266, -0.0020800232887268066, -0.0018366575241088867, -0.0015932917594909668, -0.0013499259948730469, -0.001106560230255127, -0.000863194465637207, -0.0006198287010192871, -0.0003764629364013672, -0.00013309717178344727, 0.00011026859283447266, 0.0003536343574523926, 0.0005970001220703125, 0.0008403658866882324, 0.0010837316513061523, 0.0013270974159240723, 0.0015704631805419922, 0.0018138289451599121, 0.002057194709777832, 0.002300560474395752, 0.002543926239013672, 0.002787292003631592, 0.0030306577682495117, 0.0032740235328674316, 0.0035173892974853516, 0.0037607550621032715, 0.004004120826721191, 0.004247486591339111, 0.004490852355957031, 0.004734218120574951, 0.004977583885192871, 0.005220949649810791, 0.005464315414428711, 0.005707681179046631, 0.005951046943664551, 0.006194412708282471, 0.006437778472900391, 0.0066811442375183105, 0.0069245100021362305, 0.00716787576675415, 0.00741124153137207, 0.00765460729598999, 0.00789797306060791, 0.00814133882522583, 0.00838470458984375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 2.0, 2.0, 12.0, 9.0, 11.0, 10.0, 14.0, 17.0, 15.0, 23.0, 29.0, 27.0, 24.0, 33.0, 35.0, 34.0, 31.0, 45.0, 44.0, 36.0, 36.0, 36.0, 37.0, 45.0, 33.0, 31.0, 29.0, 19.0, 26.0, 39.0, 25.0, 23.0, 18.0, 28.0, 26.0, 14.0, 21.0, 10.0, 9.0, 9.0, 7.0, 6.0, 6.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00274658203125, -0.002648383378982544, -0.002550184726715088, -0.002451986074447632, -0.0023537874221801758, -0.0022555887699127197, -0.0021573901176452637, -0.0020591914653778076, -0.0019609928131103516, -0.0018627941608428955, -0.0017645955085754395, -0.0016663968563079834, -0.0015681982040405273, -0.0014699995517730713, -0.0013718008995056152, -0.0012736022472381592, -0.0011754035949707031, -0.001077204942703247, -0.000979006290435791, -0.000880807638168335, -0.0007826089859008789, -0.0006844103336334229, -0.0005862116813659668, -0.00048801302909851074, -0.0003898143768310547, -0.00029161572456359863, -0.00019341707229614258, -9.521842002868652e-05, 2.9802322387695312e-06, 0.00010117888450622559, 0.00019937753677368164, 0.0002975761890411377, 0.00039577484130859375, 0.0004939734935760498, 0.0005921721458435059, 0.0006903707981109619, 0.000788569450378418, 0.000886768102645874, 0.00098496675491333, 0.0010831654071807861, 0.0011813640594482422, 0.0012795627117156982, 0.0013777613639831543, 0.0014759600162506104, 0.0015741586685180664, 0.0016723573207855225, 0.0017705559730529785, 0.0018687546253204346, 0.0019669532775878906, 0.0020651519298553467, 0.0021633505821228027, 0.002261549234390259, 0.002359747886657715, 0.002457946538925171, 0.002556145191192627, 0.002654343843460083, 0.002752542495727539, 0.002850741147994995, 0.002948939800262451, 0.0030471384525299072, 0.0031453371047973633, 0.0032435357570648193, 0.0033417344093322754, 0.0034399330615997314, 0.0035381317138671875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 4.0, 14.0, 13.0, 14.0, 16.0, 36.0, 35.0, 74.0, 84.0, 107.0, 170.0, 243.0, 363.0, 597.0, 900.0, 1445.0, 2245.0, 3807.0, 6923.0, 14332.0, 37246.0, 180955.0, 689387.0, 65974.0, 21379.0, 9549.0, 4824.0, 2841.0, 1781.0, 1085.0, 715.0, 430.0, 302.0, 190.0, 139.0, 99.0, 49.0, 62.0, 38.0, 31.0, 12.0, 11.0, 8.0, 9.0, 9.0, 4.0, 0.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016832351684570312, -0.0016275495290756226, -0.0015718638896942139, -0.0015161782503128052, -0.0014604926109313965, -0.0014048069715499878, -0.001349121332168579, -0.0012934356927871704, -0.0012377500534057617, -0.001182064414024353, -0.0011263787746429443, -0.0010706931352615356, -0.001015007495880127, -0.0009593218564987183, -0.0009036362171173096, -0.0008479505777359009, -0.0007922649383544922, -0.0007365792989730835, -0.0006808936595916748, -0.0006252080202102661, -0.0005695223808288574, -0.0005138367414474487, -0.00045815110206604004, -0.00040246546268463135, -0.00034677982330322266, -0.00029109418392181396, -0.00023540854454040527, -0.00017972290515899658, -0.0001240372657775879, -6.83516263961792e-05, -1.2665987014770508e-05, 4.3019652366638184e-05, 9.870529174804688e-05, 0.00015439093112945557, 0.00021007657051086426, 0.00026576220989227295, 0.00032144784927368164, 0.00037713348865509033, 0.000432819128036499, 0.0004885047674179077, 0.0005441904067993164, 0.0005998760461807251, 0.0006555616855621338, 0.0007112473249435425, 0.0007669329643249512, 0.0008226186037063599, 0.0008783042430877686, 0.0009339898824691772, 0.000989675521850586, 0.0010453611612319946, 0.0011010468006134033, 0.001156732439994812, 0.0012124180793762207, 0.0012681037187576294, 0.001323789358139038, 0.0013794749975204468, 0.0014351606369018555, 0.0014908462762832642, 0.0015465319156646729, 0.0016022175550460815, 0.0016579031944274902, 0.001713588833808899, 0.0017692744731903076, 0.0018249601125717163, 0.001880645751953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 8.0, 11.0, 11.0, 4.0, 13.0, 5.0, 13.0, 18.0, 34.0, 34.0, 59.0, 76.0, 109.0, 74.0, 83.0, 123.0, 60.0, 80.0, 36.0, 41.0, 24.0, 22.0, 11.0, 10.0, 6.0, 7.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.589557647705078e-06, -4.4424086809158325e-06, -4.295259714126587e-06, -4.148110747337341e-06, -4.000961780548096e-06, -3.85381281375885e-06, -3.7066638469696045e-06, -3.559514880180359e-06, -3.4123659133911133e-06, -3.2652169466018677e-06, -3.118067979812622e-06, -2.9709190130233765e-06, -2.823770046234131e-06, -2.6766210794448853e-06, -2.5294721126556396e-06, -2.382323145866394e-06, -2.2351741790771484e-06, -2.088025212287903e-06, -1.9408762454986572e-06, -1.7937272787094116e-06, -1.646578311920166e-06, -1.4994293451309204e-06, -1.3522803783416748e-06, -1.2051314115524292e-06, -1.0579824447631836e-06, -9.10833477973938e-07, -7.636845111846924e-07, -6.165355443954468e-07, -4.6938657760620117e-07, -3.2223761081695557e-07, -1.7508864402770996e-07, -2.7939677238464355e-08, 1.1920928955078125e-07, 2.6635825634002686e-07, 4.1350722312927246e-07, 5.606561899185181e-07, 7.078051567077637e-07, 8.549541234970093e-07, 1.0021030902862549e-06, 1.1492520570755005e-06, 1.296401023864746e-06, 1.4435499906539917e-06, 1.5906989574432373e-06, 1.737847924232483e-06, 1.8849968910217285e-06, 2.032145857810974e-06, 2.1792948246002197e-06, 2.3264437913894653e-06, 2.473592758178711e-06, 2.6207417249679565e-06, 2.767890691757202e-06, 2.9150396585464478e-06, 3.0621886253356934e-06, 3.209337592124939e-06, 3.3564865589141846e-06, 3.50363552570343e-06, 3.6507844924926758e-06, 3.7979334592819214e-06, 3.945082426071167e-06, 4.092231392860413e-06, 4.239380359649658e-06, 4.386529326438904e-06, 4.533678293228149e-06, 4.680827260017395e-06, 4.827976226806641e-06]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 6.0, 18.0, 17.0, 18.0, 33.0, 49.0, 95.0, 161.0, 268.0, 529.0, 1019.0, 2125.0, 5039.0, 14361.0, 54342.0, 664750.0, 250915.0, 36543.0, 10637.0, 4038.0, 1756.0, 791.0, 420.0, 240.0, 143.0, 78.0, 64.0, 31.0, 19.0, 8.0, 13.0, 11.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002681732177734375, -0.0025819242000579834, -0.002482116222381592, -0.0023823082447052, -0.0022825002670288086, -0.002182692289352417, -0.0020828843116760254, -0.001983076333999634, -0.0018832683563232422, -0.0017834603786468506, -0.001683652400970459, -0.0015838444232940674, -0.0014840364456176758, -0.0013842284679412842, -0.0012844204902648926, -0.001184612512588501, -0.0010848045349121094, -0.0009849965572357178, -0.0008851885795593262, -0.0007853806018829346, -0.000685572624206543, -0.0005857646465301514, -0.00048595666885375977, -0.00038614869117736816, -0.00028634071350097656, -0.00018653273582458496, -8.672475814819336e-05, 1.3083219528198242e-05, 0.00011289119720458984, 0.00021269917488098145, 0.00031250715255737305, 0.00041231513023376465, 0.0005121231079101562, 0.0006119310855865479, 0.0007117390632629395, 0.0008115470409393311, 0.0009113550186157227, 0.0010111629962921143, 0.0011109709739685059, 0.0012107789516448975, 0.001310586929321289, 0.0014103949069976807, 0.0015102028846740723, 0.0016100108623504639, 0.0017098188400268555, 0.001809626817703247, 0.0019094347953796387, 0.0020092427730560303, 0.002109050750732422, 0.0022088587284088135, 0.002308666706085205, 0.0024084746837615967, 0.0025082826614379883, 0.00260809063911438, 0.0027078986167907715, 0.002807706594467163, 0.0029075145721435547, 0.0030073225498199463, 0.003107130527496338, 0.0032069385051727295, 0.003306746482849121, 0.0034065544605255127, 0.0035063624382019043, 0.003606170415878296, 0.0037059783935546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 1.0, 9.0, 7.0, 11.0, 13.0, 16.0, 16.0, 28.0, 41.0, 49.0, 55.0, 75.0, 176.0, 143.0, 81.0, 68.0, 51.0, 39.0, 24.0, 11.0, 23.0, 14.0, 10.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0006079673767089844, -0.0005915127694606781, -0.0005750581622123718, -0.0005586035549640656, -0.0005421489477157593, -0.000525694340467453, -0.0005092397332191467, -0.0004927851259708405, -0.0004763305187225342, -0.0004598759114742279, -0.00044342130422592163, -0.00042696669697761536, -0.0004105120897293091, -0.0003940574824810028, -0.00037760287523269653, -0.00036114826798439026, -0.000344693660736084, -0.0003282390534877777, -0.00031178444623947144, -0.00029532983899116516, -0.0002788752317428589, -0.0002624206244945526, -0.00024596601724624634, -0.00022951140999794006, -0.0002130568027496338, -0.00019660219550132751, -0.00018014758825302124, -0.00016369298100471497, -0.0001472383737564087, -0.00013078376650810242, -0.00011432915925979614, -9.787455201148987e-05, -8.14199447631836e-05, -6.496533751487732e-05, -4.8510730266571045e-05, -3.205612301826477e-05, -1.5601515769958496e-05, 8.530914783477783e-07, 1.7307698726654053e-05, 3.376230597496033e-05, 5.02169132232666e-05, 6.667152047157288e-05, 8.312612771987915e-05, 9.958073496818542e-05, 0.0001160353422164917, 0.00013248994946479797, 0.00014894455671310425, 0.00016539916396141052, 0.0001818537712097168, 0.00019830837845802307, 0.00021476298570632935, 0.00023121759295463562, 0.0002476722002029419, 0.00026412680745124817, 0.00028058141469955444, 0.0002970360219478607, 0.000313490629196167, 0.00032994523644447327, 0.00034639984369277954, 0.0003628544509410858, 0.0003793090581893921, 0.00039576366543769836, 0.00041221827268600464, 0.0004286728799343109, 0.0004451274871826172]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 4.0, 6.0, 11.0, 10.0, 12.0, 17.0, 29.0, 32.0, 53.0, 55.0, 100.0, 136.0, 125.0, 106.0, 72.0, 50.0, 39.0, 33.0, 26.0, 20.0, 19.0, 12.0, 12.0, 5.0, 1.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007131132762879133, -0.006848030723631382, -0.006564928684383631, -0.0062818266451358795, -0.005998724605888128, -0.005715622566640377, -0.0054325200617313385, -0.005149418488144875, -0.004866315983235836, -0.004583213943988085, -0.0043001119047403336, -0.004017009865492582, -0.003733907826244831, -0.00345080578699708, -0.003167703514918685, -0.0028846014756709337, -0.002601499669253826, -0.002318397630006075, -0.0020352955907583237, -0.0017521934350952506, -0.0014690913958474994, -0.0011859893565997481, -0.0009028872009366751, -0.0006197851616889238, -0.0003366831224411726, -5.358105408959091e-05, 0.00022952101426199079, 0.0005126231117174029, 0.0007957251509651542, 0.0010788271902129054, 0.0013619293458759785, 0.0016450313851237297, 0.0019281338900327682, 0.0022112359292805195, 0.0024943379685282707, 0.002777440007776022, 0.003060542047023773, 0.0033436440862715244, 0.0036267463583499193, 0.003909848630428314, 0.004192950204014778, 0.004476052243262529, 0.004759154282510281, 0.005042256321758032, 0.005325358361005783, 0.005608460400253534, 0.0058915624395012856, 0.006174664944410324, 0.006457766983658075, 0.006740869022905827, 0.007023971062153578, 0.007307073101401329, 0.00759017514064908, 0.007873277179896832, 0.00815637968480587, 0.008439481258392334, 0.008722583763301373, 0.009005686268210411, 0.009288787841796875, 0.009571890346705914, 0.009854991920292377, 0.010138094425201416, 0.01042119599878788, 0.010704298503696918, 0.010987400077283382]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 9.0, 7.0, 16.0, 8.0, 14.0, 21.0, 13.0, 20.0, 27.0, 21.0, 44.0, 30.0, 31.0, 31.0, 34.0, 39.0, 55.0, 43.0, 47.0, 47.0, 35.0, 40.0, 41.0, 32.0, 34.0, 35.0, 31.0, 21.0, 30.0, 20.0, 16.0, 13.0, 27.0, 11.0, 12.0, 8.0, 5.0, 10.0, 1.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004860639572143555, -0.004696132615208626, -0.004531625658273697, -0.004367118701338768, -0.004202612210065126, -0.0040381052531301975, -0.0038735982961952686, -0.0037090913392603397, -0.0035445846151560545, -0.0033800776582211256, -0.0032155709341168404, -0.0030510639771819115, -0.0028865570202469826, -0.0027220502961426973, -0.0025575433392077684, -0.002393036615103483, -0.0022285296581685543, -0.0020640227012336254, -0.0018995159771293402, -0.0017350090201944113, -0.0015705021796748042, -0.0014059953391551971, -0.0012414883822202682, -0.0010769815417006612, -0.0009124747011810541, -0.000747967860661447, -0.0005834609619341791, -0.0004189540632069111, -0.000254447222687304, -8.994038216769695e-05, 7.456657476723194e-05, 0.000239073415286839, 0.0004035807214677334, 0.0005680875619873405, 0.0007325944607146084, 0.0008971013594418764, 0.0010616081999614835, 0.0012261150404810905, 0.0013906219974160194, 0.0015551288379356265, 0.0017196356784552336, 0.0018841425189748406, 0.0020486493594944477, 0.0022131563164293766, 0.0023776632733643055, 0.0025421699974685907, 0.0027066769544035196, 0.002871183678507805, 0.0030356906354427338, 0.0032001975923776627, 0.003364704316481948, 0.003529211273416877, 0.003693717997521162, 0.003858224954456091, 0.00402273191139102, 0.004187238868325949, 0.00435174535959959, 0.004516252316534519, 0.004680759273469448, 0.004845266230404377, 0.005009772721678019, 0.0051742796786129475, 0.005338786635547876, 0.005503293592482805, 0.005667800549417734]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 10.0, 6.0, 9.0, 10.0, 22.0, 31.0, 31.0, 55.0, 86.0, 93.0, 118.0, 163.0, 233.0, 304.0, 456.0, 640.0, 960.0, 1267.0, 1852.0, 2788.0, 4187.0, 6152.0, 9594.0, 14391.0, 23232.0, 37265.0, 63448.0, 114789.0, 212790.0, 234110.0, 132134.0, 71677.0, 41996.0, 25947.0, 16001.0, 10439.0, 6749.0, 4542.0, 2990.0, 2033.0, 1414.0, 1019.0, 714.0, 523.0, 363.0, 266.0, 196.0, 115.0, 101.0, 62.0, 57.0, 49.0, 27.0, 18.0, 11.0, 11.0, 8.0, 8.0, 3.0, 2.0, 1.0, 5.0], "bins": [-0.0080108642578125, -0.0077533721923828125, -0.007495880126953125, -0.0072383880615234375, -0.00698089599609375, -0.0067234039306640625, -0.006465911865234375, -0.0062084197998046875, -0.005950927734375, -0.0056934356689453125, -0.005435943603515625, -0.0051784515380859375, -0.00492095947265625, -0.0046634674072265625, -0.004405975341796875, -0.0041484832763671875, -0.0038909912109375, -0.0036334991455078125, -0.003376007080078125, -0.0031185150146484375, -0.00286102294921875, -0.0026035308837890625, -0.002346038818359375, -0.0020885467529296875, -0.0018310546875, -0.0015735626220703125, -0.001316070556640625, -0.0010585784912109375, -0.00080108642578125, -0.0005435943603515625, -0.000286102294921875, -2.86102294921875e-05, 0.0002288818359375, 0.0004863739013671875, 0.000743865966796875, 0.0010013580322265625, 0.00125885009765625, 0.0015163421630859375, 0.001773834228515625, 0.0020313262939453125, 0.002288818359375, 0.0025463104248046875, 0.002803802490234375, 0.0030612945556640625, 0.00331878662109375, 0.0035762786865234375, 0.003833770751953125, 0.0040912628173828125, 0.0043487548828125, 0.0046062469482421875, 0.004863739013671875, 0.0051212310791015625, 0.00537872314453125, 0.0056362152099609375, 0.005893707275390625, 0.0061511993408203125, 0.00640869140625, 0.0066661834716796875, 0.006923675537109375, 0.0071811676025390625, 0.00743865966796875, 0.0076961517333984375, 0.007953643798828125, 0.008211135864257812, 0.0084686279296875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 10.0, 15.0, 12.0, 14.0, 12.0, 10.0, 11.0, 21.0, 17.0, 30.0, 20.0, 25.0, 29.0, 27.0, 27.0, 44.0, 25.0, 52.0, 43.0, 40.0, 35.0, 38.0, 49.0, 43.0, 36.0, 31.0, 27.0, 29.0, 26.0, 21.0, 21.0, 22.0, 18.0, 20.0, 16.0, 13.0, 11.0, 12.0, 10.0, 6.0, 5.0, 3.0, 2.0, 6.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.002716064453125, -0.002625793218612671, -0.002535521984100342, -0.0024452507495880127, -0.0023549795150756836, -0.0022647082805633545, -0.0021744370460510254, -0.0020841658115386963, -0.001993894577026367, -0.001903623342514038, -0.001813352108001709, -0.0017230808734893799, -0.0016328096389770508, -0.0015425384044647217, -0.0014522671699523926, -0.0013619959354400635, -0.0012717247009277344, -0.0011814534664154053, -0.0010911822319030762, -0.001000910997390747, -0.000910639762878418, -0.0008203685283660889, -0.0007300972938537598, -0.0006398260593414307, -0.0005495548248291016, -0.00045928359031677246, -0.00036901235580444336, -0.00027874112129211426, -0.00018846988677978516, -9.819865226745605e-05, -7.927417755126953e-06, 8.234381675720215e-05, 0.00017261505126953125, 0.00026288628578186035, 0.00035315752029418945, 0.00044342875480651855, 0.0005336999893188477, 0.0006239712238311768, 0.0007142424583435059, 0.000804513692855835, 0.0008947849273681641, 0.0009850561618804932, 0.0010753273963928223, 0.0011655986309051514, 0.0012558698654174805, 0.0013461410999298096, 0.0014364123344421387, 0.0015266835689544678, 0.0016169548034667969, 0.001707226037979126, 0.001797497272491455, 0.0018877685070037842, 0.0019780397415161133, 0.0020683109760284424, 0.0021585822105407715, 0.0022488534450531006, 0.0023391246795654297, 0.002429395914077759, 0.002519667148590088, 0.002609938383102417, 0.002700209617614746, 0.002790480852127075, 0.0028807520866394043, 0.0029710233211517334, 0.0030612945556640625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 10.0, 23.0, 30.0, 53.0, 90.0, 127.0, 196.0, 344.0, 523.0, 887.0, 1615.0, 3058.0, 5573.0, 10900.0, 22699.0, 49335.0, 117231.0, 285080.0, 312201.0, 132123.0, 55585.0, 25134.0, 12099.0, 6130.0, 3246.0, 1753.0, 990.0, 596.0, 345.0, 205.0, 135.0, 76.0, 58.0, 31.0, 17.0, 11.0, 8.0, 8.0, 5.0, 7.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.01116180419921875, -0.010843515396118164, -0.010525226593017578, -0.010206937789916992, -0.009888648986816406, -0.00957036018371582, -0.009252071380615234, -0.008933782577514648, -0.008615493774414062, -0.008297204971313477, -0.00797891616821289, -0.007660627365112305, -0.007342338562011719, -0.007024049758911133, -0.006705760955810547, -0.006387472152709961, -0.006069183349609375, -0.005750894546508789, -0.005432605743408203, -0.005114316940307617, -0.004796028137207031, -0.004477739334106445, -0.004159450531005859, -0.0038411617279052734, -0.0035228729248046875, -0.0032045841217041016, -0.0028862953186035156, -0.0025680065155029297, -0.0022497177124023438, -0.0019314289093017578, -0.0016131401062011719, -0.001294851303100586, -0.0009765625, -0.0006582736968994141, -0.0003399848937988281, -2.1696090698242188e-05, 0.00029659271240234375, 0.0006148815155029297, 0.0009331703186035156, 0.0012514591217041016, 0.0015697479248046875, 0.0018880367279052734, 0.0022063255310058594, 0.0025246143341064453, 0.0028429031372070312, 0.003161191940307617, 0.003479480743408203, 0.003797769546508789, 0.004116058349609375, 0.004434347152709961, 0.004752635955810547, 0.005070924758911133, 0.005389213562011719, 0.005707502365112305, 0.006025791168212891, 0.0063440799713134766, 0.0066623687744140625, 0.0069806575775146484, 0.007298946380615234, 0.00761723518371582, 0.007935523986816406, 0.008253812789916992, 0.008572101593017578, 0.008890390396118164, 0.00920867919921875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 9.0, 6.0, 5.0, 12.0, 20.0, 11.0, 13.0, 20.0, 22.0, 23.0, 36.0, 31.0, 29.0, 26.0, 49.0, 50.0, 29.0, 38.0, 42.0, 41.0, 38.0, 43.0, 37.0, 41.0, 39.0, 35.0, 33.0, 34.0, 28.0, 26.0, 23.0, 15.0, 19.0, 17.0, 10.0, 8.0, 13.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.002475738525390625, -0.0023965835571289062, -0.0023174285888671875, -0.0022382736206054688, -0.00215911865234375, -0.0020799636840820312, -0.0020008087158203125, -0.0019216537475585938, -0.001842498779296875, -0.0017633438110351562, -0.0016841888427734375, -0.0016050338745117188, -0.00152587890625, -0.0014467239379882812, -0.0013675689697265625, -0.0012884140014648438, -0.001209259033203125, -0.0011301040649414062, -0.0010509490966796875, -0.0009717941284179688, -0.00089263916015625, -0.0008134841918945312, -0.0007343292236328125, -0.0006551742553710938, -0.000576019287109375, -0.0004968643188476562, -0.0004177093505859375, -0.00033855438232421875, -0.0002593994140625, -0.00018024444580078125, -0.0001010894775390625, -2.193450927734375e-05, 5.7220458984375e-05, 0.00013637542724609375, 0.0002155303955078125, 0.00029468536376953125, 0.00037384033203125, 0.00045299530029296875, 0.0005321502685546875, 0.0006113052368164062, 0.000690460205078125, 0.0007696151733398438, 0.0008487701416015625, 0.0009279251098632812, 0.001007080078125, 0.0010862350463867188, 0.0011653900146484375, 0.0012445449829101562, 0.001323699951171875, 0.0014028549194335938, 0.0014820098876953125, 0.0015611648559570312, 0.00164031982421875, 0.0017194747924804688, 0.0017986297607421875, 0.0018777847290039062, 0.001956939697265625, 0.0020360946655273438, 0.0021152496337890625, 0.0021944046020507812, 0.0022735595703125, 0.0023527145385742188, 0.0024318695068359375, 0.0025110244750976562, 0.002590179443359375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 8.0, 10.0, 14.0, 14.0, 30.0, 27.0, 32.0, 51.0, 66.0, 130.0, 190.0, 325.0, 502.0, 883.0, 1471.0, 2767.0, 5765.0, 14346.0, 48134.0, 390583.0, 499805.0, 54546.0, 15867.0, 6251.0, 2928.0, 1466.0, 825.0, 531.0, 306.0, 226.0, 155.0, 106.0, 55.0, 39.0, 27.0, 22.0, 15.0, 10.0, 8.0, 8.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00031495094299316406, -0.00030446797609329224, -0.0002939850091934204, -0.0002835020422935486, -0.00027301907539367676, -0.00026253610849380493, -0.0002520531415939331, -0.00024157017469406128, -0.00023108720779418945, -0.00022060424089431763, -0.0002101212739944458, -0.00019963830709457397, -0.00018915534019470215, -0.00017867237329483032, -0.0001681894063949585, -0.00015770643949508667, -0.00014722347259521484, -0.00013674050569534302, -0.0001262575387954712, -0.00011577457189559937, -0.00010529160499572754, -9.480863809585571e-05, -8.432567119598389e-05, -7.384270429611206e-05, -6.335973739624023e-05, -5.287677049636841e-05, -4.239380359649658e-05, -3.1910836696624756e-05, -2.142786979675293e-05, -1.0944902896881104e-05, -4.6193599700927734e-07, 1.0021030902862549e-05, 2.0503997802734375e-05, 3.09869647026062e-05, 4.146993160247803e-05, 5.1952898502349854e-05, 6.243586540222168e-05, 7.29188323020935e-05, 8.340179920196533e-05, 9.388476610183716e-05, 0.00010436773300170898, 0.00011485069990158081, 0.00012533366680145264, 0.00013581663370132446, 0.0001462996006011963, 0.00015678256750106812, 0.00016726553440093994, 0.00017774850130081177, 0.0001882314682006836, 0.00019871443510055542, 0.00020919740200042725, 0.00021968036890029907, 0.0002301633358001709, 0.00024064630270004272, 0.00025112926959991455, 0.0002616122364997864, 0.0002720952033996582, 0.00028257817029953003, 0.00029306113719940186, 0.0003035441040992737, 0.0003140270709991455, 0.00032451003789901733, 0.00033499300479888916, 0.000345475971698761, 0.0003559589385986328]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 12.0, 9.0, 16.0, 28.0, 55.0, 122.0, 194.0, 280.0, 128.0, 48.0, 35.0, 27.0, 10.0, 15.0, 6.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.569789886474609e-06, -7.255002856254578e-06, -6.940215826034546e-06, -6.625428795814514e-06, -6.310641765594482e-06, -5.995854735374451e-06, -5.681067705154419e-06, -5.366280674934387e-06, -5.0514936447143555e-06, -4.736706614494324e-06, -4.421919584274292e-06, -4.10713255405426e-06, -3.7923455238342285e-06, -3.4775584936141968e-06, -3.162771463394165e-06, -2.8479844331741333e-06, -2.5331974029541016e-06, -2.21841037273407e-06, -1.903623342514038e-06, -1.5888363122940063e-06, -1.2740492820739746e-06, -9.592622518539429e-07, -6.444752216339111e-07, -3.296881914138794e-07, -1.4901161193847656e-08, 2.998858690261841e-07, 6.146728992462158e-07, 9.294599294662476e-07, 1.2442469596862793e-06, 1.559033989906311e-06, 1.8738210201263428e-06, 2.1886080503463745e-06, 2.5033950805664062e-06, 2.818182110786438e-06, 3.1329691410064697e-06, 3.4477561712265015e-06, 3.762543201446533e-06, 4.077330231666565e-06, 4.392117261886597e-06, 4.706904292106628e-06, 5.02169132232666e-06, 5.336478352546692e-06, 5.651265382766724e-06, 5.966052412986755e-06, 6.280839443206787e-06, 6.595626473426819e-06, 6.910413503646851e-06, 7.225200533866882e-06, 7.539987564086914e-06, 7.854774594306946e-06, 8.169561624526978e-06, 8.48434865474701e-06, 8.799135684967041e-06, 9.113922715187073e-06, 9.428709745407104e-06, 9.743496775627136e-06, 1.0058283805847168e-05, 1.03730708360672e-05, 1.0687857866287231e-05, 1.1002644896507263e-05, 1.1317431926727295e-05, 1.1632218956947327e-05, 1.1947005987167358e-05, 1.226179301738739e-05, 1.2576580047607422e-05]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 4.0, 10.0, 9.0, 19.0, 23.0, 42.0, 57.0, 76.0, 116.0, 173.0, 281.0, 478.0, 743.0, 1191.0, 1942.0, 3330.0, 5445.0, 9959.0, 18123.0, 37267.0, 81574.0, 223567.0, 379363.0, 158737.0, 61672.0, 29352.0, 15001.0, 8153.0, 4607.0, 2880.0, 1635.0, 992.0, 583.0, 415.0, 267.0, 159.0, 87.0, 76.0, 42.0, 25.0, 24.0, 17.0, 15.0, 7.0, 9.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-9.834766387939453e-05, -9.53972339630127e-05, -9.244680404663086e-05, -8.949637413024902e-05, -8.654594421386719e-05, -8.359551429748535e-05, -8.064508438110352e-05, -7.769465446472168e-05, -7.474422454833984e-05, -7.179379463195801e-05, -6.884336471557617e-05, -6.589293479919434e-05, -6.29425048828125e-05, -5.9992074966430664e-05, -5.704164505004883e-05, -5.409121513366699e-05, -5.1140785217285156e-05, -4.819035530090332e-05, -4.5239925384521484e-05, -4.228949546813965e-05, -3.933906555175781e-05, -3.6388635635375977e-05, -3.343820571899414e-05, -3.0487775802612305e-05, -2.753734588623047e-05, -2.4586915969848633e-05, -2.1636486053466797e-05, -1.868605613708496e-05, -1.5735626220703125e-05, -1.2785196304321289e-05, -9.834766387939453e-06, -6.884336471557617e-06, -3.933906555175781e-06, -9.834766387939453e-07, 1.9669532775878906e-06, 4.9173831939697266e-06, 7.867813110351562e-06, 1.0818243026733398e-05, 1.3768672943115234e-05, 1.671910285949707e-05, 1.9669532775878906e-05, 2.2619962692260742e-05, 2.5570392608642578e-05, 2.8520822525024414e-05, 3.147125244140625e-05, 3.4421682357788086e-05, 3.737211227416992e-05, 4.032254219055176e-05, 4.3272972106933594e-05, 4.622340202331543e-05, 4.9173831939697266e-05, 5.21242618560791e-05, 5.507469177246094e-05, 5.8025121688842773e-05, 6.097555160522461e-05, 6.392598152160645e-05, 6.687641143798828e-05, 6.982684135437012e-05, 7.277727127075195e-05, 7.572770118713379e-05, 7.867813110351562e-05, 8.162856101989746e-05, 8.45789909362793e-05, 8.752942085266113e-05, 9.047985076904297e-05]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 6.0, 1.0, 12.0, 4.0, 5.0, 9.0, 15.0, 8.0, 18.0, 17.0, 6.0, 25.0, 28.0, 33.0, 32.0, 44.0, 40.0, 40.0, 53.0, 66.0, 69.0, 52.0, 43.0, 44.0, 37.0, 39.0, 36.0, 35.0, 29.0, 27.0, 29.0, 18.0, 12.0, 15.0, 12.0, 9.0, 8.0, 7.0, 6.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6524066925048828e-05, -2.5666318833827972e-05, -2.4808570742607117e-05, -2.395082265138626e-05, -2.3093074560165405e-05, -2.223532646894455e-05, -2.1377578377723694e-05, -2.0519830286502838e-05, -1.9662082195281982e-05, -1.8804334104061127e-05, -1.794658601284027e-05, -1.7088837921619415e-05, -1.623108983039856e-05, -1.5373341739177704e-05, -1.4515593647956848e-05, -1.3657845556735992e-05, -1.2800097465515137e-05, -1.1942349374294281e-05, -1.1084601283073425e-05, -1.022685319185257e-05, -9.369105100631714e-06, -8.511357009410858e-06, -7.653608918190002e-06, -6.795860826969147e-06, -5.938112735748291e-06, -5.080364644527435e-06, -4.22261655330658e-06, -3.364868462085724e-06, -2.507120370864868e-06, -1.6493722796440125e-06, -7.916241884231567e-07, 6.612390279769897e-08, 9.238719940185547e-07, 1.7816200852394104e-06, 2.639368176460266e-06, 3.497116267681122e-06, 4.3548643589019775e-06, 5.212612450122833e-06, 6.070360541343689e-06, 6.928108632564545e-06, 7.7858567237854e-06, 8.643604815006256e-06, 9.501352906227112e-06, 1.0359100997447968e-05, 1.1216849088668823e-05, 1.2074597179889679e-05, 1.2932345271110535e-05, 1.379009336233139e-05, 1.4647841453552246e-05, 1.5505589544773102e-05, 1.6363337635993958e-05, 1.7221085727214813e-05, 1.807883381843567e-05, 1.8936581909656525e-05, 1.979433000087738e-05, 2.0652078092098236e-05, 2.1509826183319092e-05, 2.2367574274539948e-05, 2.3225322365760803e-05, 2.408307045698166e-05, 2.4940818548202515e-05, 2.579856663942337e-05, 2.6656314730644226e-05, 2.7514062821865082e-05, 2.8371810913085938e-05]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 11.0, 20.0, 23.0, 61.0, 100.0, 147.0, 187.0, 175.0, 95.0, 54.0, 35.0, 28.0, 26.0, 11.0, 10.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01027395948767662, -0.009960658848285675, -0.009647357277572155, -0.00933405663818121, -0.00902075506746769, -0.008707454428076744, -0.008394152857363224, -0.008080852217972279, -0.007767551112920046, -0.007454250007867813, -0.00714094890281558, -0.006827647797763348, -0.006514347158372402, -0.006201045587658882, -0.005887744948267937, -0.005574443843215704, -0.005261142738163471, -0.0049478416331112385, -0.004634540528059006, -0.004321239423006773, -0.00400793831795454, -0.003694637445732951, -0.003381336573511362, -0.0030680354684591293, -0.0027547343634068966, -0.002441433258354664, -0.002128132153302431, -0.001814831281080842, -0.0015015301760286093, -0.0011882290709763765, -0.0008749280823394656, -0.0005616270937025547, -0.00024832505732774734, 6.497598951682448e-05, 0.0003782770363613963, 0.0006915780832059681, 0.00100487913005054, 0.0013181802351027727, 0.0016314812237396836, 0.0019447822123765945, 0.0022580833174288273, 0.00257138442248106, 0.0028846855275332928, 0.003197986399754882, 0.0035112875048071146, 0.0038245886098593473, 0.004137889482080936, 0.004451190587133169, 0.004764491692185402, 0.005077792797237635, 0.005391093902289867, 0.0057043950073421, 0.006017696112394333, 0.006330996751785278, 0.006644297856837511, 0.006957598961889744, 0.0072709000669419765, 0.007584201171994209, 0.007897501811385155, 0.008210803382098675, 0.00852410402148962, 0.00883740559220314, 0.009150706231594086, 0.009464006870985031, 0.009777308441698551]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 5.0, 11.0, 8.0, 12.0, 12.0, 7.0, 15.0, 9.0, 15.0, 17.0, 19.0, 24.0, 25.0, 33.0, 33.0, 24.0, 46.0, 28.0, 41.0, 35.0, 44.0, 41.0, 35.0, 46.0, 46.0, 35.0, 23.0, 37.0, 34.0, 25.0, 28.0, 32.0, 29.0, 13.0, 23.0, 13.0, 11.0, 18.0, 6.0, 8.0, 7.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031095927115529776, -0.003004947677254677, -0.002900302642956376, -0.0027956576086580753, -0.0026910125743597746, -0.002586367540061474, -0.0024817222729325294, -0.0023770774714648724, -0.002272432204335928, -0.0021677871700376272, -0.0020631421357393265, -0.0019584971014410257, -0.001853852067142725, -0.0017492070328444242, -0.0016445618821308017, -0.001539916847832501, -0.001435271929949522, -0.0013306268956512213, -0.0012259818613529205, -0.0011213368270546198, -0.001016691792756319, -0.0009120467002503574, -0.0008074016077443957, -0.000702756573446095, -0.0005981115391477942, -0.0004934665048494935, -0.0003888214414473623, -0.0002841763780452311, -0.00017953134374693036, -7.488630944862962e-05, 2.975878305733204e-05, 0.00013440381735563278, 0.00023904885165393353, 0.00034369388595223427, 0.00044833894935436547, 0.0005529840127564967, 0.0006576290470547974, 0.0007622740813530982, 0.0008669191738590598, 0.0009715642081573606, 0.0010762092424556613, 0.001180854276753962, 0.0012854993110522628, 0.0013901444617658854, 0.001494789496064186, 0.0015994345303624868, 0.0017040795646607876, 0.0018087245989590883, 0.001913369633257389, 0.00201801466755569, 0.0021226597018539906, 0.0022273047361522913, 0.002331949770450592, 0.002436594804748893, 0.0025412398390471935, 0.002645885106176138, 0.002750529907643795, 0.0028551749419420958, 0.0029598199762403965, 0.0030644650105386972, 0.003169110044836998, 0.0032737550791352987, 0.0033784001134335995, 0.003483045380562544, 0.0035876904148608446]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 9.0, 3.0, 6.0, 11.0, 13.0, 15.0, 20.0, 19.0, 24.0, 53.0, 44.0, 61.0, 82.0, 89.0, 136.0, 158.0, 203.0, 305.0, 451.0, 688.0, 1199.0, 2401.0, 4906.0, 21084.0, 3799288.0, 343364.0, 10762.0, 3895.0, 1890.0, 1014.0, 605.0, 384.0, 245.0, 187.0, 142.0, 112.0, 95.0, 76.0, 58.0, 51.0, 41.0, 24.0, 21.0, 21.0, 6.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00853729248046875, -0.008260488510131836, -0.007983684539794922, -0.007706880569458008, -0.007430076599121094, -0.00715327262878418, -0.006876468658447266, -0.0065996646881103516, -0.0063228607177734375, -0.0060460567474365234, -0.005769252777099609, -0.005492448806762695, -0.005215644836425781, -0.004938840866088867, -0.004662036895751953, -0.004385232925415039, -0.004108428955078125, -0.003831624984741211, -0.003554821014404297, -0.003278017044067383, -0.0030012130737304688, -0.0027244091033935547, -0.0024476051330566406, -0.0021708011627197266, -0.0018939971923828125, -0.0016171932220458984, -0.0013403892517089844, -0.0010635852813720703, -0.0007867813110351562, -0.0005099773406982422, -0.00023317337036132812, 4.363059997558594e-05, 0.0003204345703125, 0.0005972385406494141, 0.0008740425109863281, 0.0011508464813232422, 0.0014276504516601562, 0.0017044544219970703, 0.0019812583923339844, 0.0022580623626708984, 0.0025348663330078125, 0.0028116703033447266, 0.0030884742736816406, 0.0033652782440185547, 0.0036420822143554688, 0.003918886184692383, 0.004195690155029297, 0.004472494125366211, 0.004749298095703125, 0.005026102066040039, 0.005302906036376953, 0.005579710006713867, 0.005856513977050781, 0.006133317947387695, 0.006410121917724609, 0.0066869258880615234, 0.0069637298583984375, 0.0072405338287353516, 0.007517337799072266, 0.00779414176940918, 0.008070945739746094, 0.008347749710083008, 0.008624553680419922, 0.008901357650756836, 0.00917816162109375]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 2.0, 10.0, 4.0, 9.0, 9.0, 10.0, 7.0, 14.0, 22.0, 25.0, 17.0, 24.0, 22.0, 31.0, 27.0, 25.0, 42.0, 43.0, 23.0, 44.0, 46.0, 36.0, 47.0, 41.0, 43.0, 37.0, 37.0, 29.0, 26.0, 34.0, 34.0, 28.0, 24.0, 28.0, 14.0, 17.0, 12.0, 12.0, 10.0, 7.0, 2.0, 4.0, 8.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025997161865234375, -0.0025152266025543213, -0.002430737018585205, -0.002346247434616089, -0.0022617578506469727, -0.0021772682666778564, -0.0020927786827087402, -0.002008289098739624, -0.0019237995147705078, -0.0018393099308013916, -0.0017548203468322754, -0.0016703307628631592, -0.001585841178894043, -0.0015013515949249268, -0.0014168620109558105, -0.0013323724269866943, -0.0012478828430175781, -0.001163393259048462, -0.0010789036750793457, -0.0009944140911102295, -0.0009099245071411133, -0.0008254349231719971, -0.0007409453392028809, -0.0006564557552337646, -0.0005719661712646484, -0.0004874765872955322, -0.000402987003326416, -0.0003184974193572998, -0.0002340078353881836, -0.00014951825141906738, -6.502866744995117e-05, 1.946091651916504e-05, 0.00010395050048828125, 0.00018844008445739746, 0.00027292966842651367, 0.0003574192523956299, 0.0004419088363647461, 0.0005263984203338623, 0.0006108880043029785, 0.0006953775882720947, 0.0007798671722412109, 0.0008643567562103271, 0.0009488463401794434, 0.0010333359241485596, 0.0011178255081176758, 0.001202315092086792, 0.0012868046760559082, 0.0013712942600250244, 0.0014557838439941406, 0.0015402734279632568, 0.001624763011932373, 0.0017092525959014893, 0.0017937421798706055, 0.0018782317638397217, 0.001962721347808838, 0.002047210931777954, 0.0021317005157470703, 0.0022161900997161865, 0.0023006796836853027, 0.002385169267654419, 0.002469658851623535, 0.0025541484355926514, 0.0026386380195617676, 0.002723127603530884, 0.0028076171875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 7.0, 13.0, 16.0, 32.0, 40.0, 73.0, 131.0, 162.0, 300.0, 487.0, 805.0, 1598.0, 3150.0, 7626.0, 30578.0, 3784825.0, 335136.0, 17960.0, 5643.0, 2585.0, 1315.0, 727.0, 418.0, 243.0, 146.0, 90.0, 58.0, 37.0, 23.0, 15.0, 11.0, 5.0, 6.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01126861572265625, -0.010914802551269531, -0.010560989379882812, -0.010207176208496094, -0.009853363037109375, -0.009499549865722656, -0.009145736694335938, -0.008791923522949219, -0.0084381103515625, -0.008084297180175781, -0.0077304840087890625, -0.007376670837402344, -0.007022857666015625, -0.006669044494628906, -0.0063152313232421875, -0.005961418151855469, -0.00560760498046875, -0.005253791809082031, -0.0048999786376953125, -0.004546165466308594, -0.004192352294921875, -0.0038385391235351562, -0.0034847259521484375, -0.0031309127807617188, -0.002777099609375, -0.0024232864379882812, -0.0020694732666015625, -0.0017156600952148438, -0.001361846923828125, -0.0010080337524414062, -0.0006542205810546875, -0.00030040740966796875, 5.340576171875e-05, 0.00040721893310546875, 0.0007610321044921875, 0.0011148452758789062, 0.001468658447265625, 0.0018224716186523438, 0.0021762847900390625, 0.0025300979614257812, 0.0028839111328125, 0.0032377243041992188, 0.0035915374755859375, 0.003945350646972656, 0.004299163818359375, 0.004652976989746094, 0.0050067901611328125, 0.005360603332519531, 0.00571441650390625, 0.006068229675292969, 0.0064220428466796875, 0.006775856018066406, 0.007129669189453125, 0.007483482360839844, 0.007837295532226562, 0.008191108703613281, 0.008544921875, 0.008898735046386719, 0.009252548217773438, 0.009606361389160156, 0.009960174560546875, 0.010313987731933594, 0.010667800903320312, 0.011021614074707031, 0.01137542724609375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 6.0, 4.0, 5.0, 13.0, 13.0, 23.0, 70.0, 144.0, 436.0, 2637.0, 436.0, 148.0, 51.0, 24.0, 20.0, 6.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0018749237060546875, -0.001817256212234497, -0.0017595887184143066, -0.0017019212245941162, -0.0016442537307739258, -0.0015865862369537354, -0.001528918743133545, -0.0014712512493133545, -0.001413583755493164, -0.0013559162616729736, -0.0012982487678527832, -0.0012405812740325928, -0.0011829137802124023, -0.001125246286392212, -0.0010675787925720215, -0.001009911298751831, -0.0009522438049316406, -0.0008945763111114502, -0.0008369088172912598, -0.0007792413234710693, -0.0007215738296508789, -0.0006639063358306885, -0.000606238842010498, -0.0005485713481903076, -0.0004909038543701172, -0.00043323636054992676, -0.00037556886672973633, -0.0003179013729095459, -0.00026023387908935547, -0.00020256638526916504, -0.0001448988914489746, -8.723139762878418e-05, -2.956390380859375e-05, 2.810359001159668e-05, 8.577108383178711e-05, 0.00014343857765197754, 0.00020110607147216797, 0.0002587735652923584, 0.00031644105911254883, 0.00037410855293273926, 0.0004317760467529297, 0.0004894435405731201, 0.0005471110343933105, 0.000604778528213501, 0.0006624460220336914, 0.0007201135158538818, 0.0007777810096740723, 0.0008354485034942627, 0.0008931159973144531, 0.0009507834911346436, 0.001008450984954834, 0.0010661184787750244, 0.0011237859725952148, 0.0011814534664154053, 0.0012391209602355957, 0.0012967884540557861, 0.0013544559478759766, 0.001412123441696167, 0.0014697909355163574, 0.0015274584293365479, 0.0015851259231567383, 0.0016427934169769287, 0.0017004609107971191, 0.0017581284046173096, 0.0018157958984375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 10.0, 6.0, 9.0, 13.0, 30.0, 48.0, 63.0, 87.0, 139.0, 143.0, 141.0, 104.0, 54.0, 46.0, 30.0, 21.0, 13.0, 11.0, 10.0, 8.0, 5.0, 3.0, 4.0, 0.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034235245548188686, -0.003231944516301155, -0.003040364710614085, -0.0028487846720963717, -0.0026572048664093018, -0.002465624827891588, -0.0022740447893738747, -0.002082464750856161, -0.0018908849451690912, -0.0016993050230666995, -0.0015077251009643078, -0.0013161450624465942, -0.0011245651403442025, -0.0009329852182418108, -0.0007414051797240973, -0.0005498252576217055, -0.0003582453355193138, -0.00016666538431309164, 2.491456689313054e-05, 0.00021649454720318317, 0.0004080744693055749, 0.0005996543914079666, 0.0007912344299256802, 0.0009828143520280719, 0.0011743942741304636, 0.0013659741962328553, 0.001557554118335247, 0.0017491341568529606, 0.0019407140789553523, 0.002132294001057744, 0.0023238740395754576, 0.0025154538452625275, 0.0027070334181189537, 0.0028986134566366673, 0.003090193262323737, 0.0032817733008414507, 0.0034733531065285206, 0.003664933145046234, 0.0038565131835639477, 0.004048093222081661, 0.0042396727949380875, 0.004431252833455801, 0.0046228328719735146, 0.004814412444829941, 0.005005992483347654, 0.005197572521865368, 0.0053891525603830814, 0.005580732598900795, 0.0057723126374185085, 0.005963892675936222, 0.006155472714453936, 0.006347052752971649, 0.006538632325828075, 0.006730212364345789, 0.0069217924028635025, 0.007113372441381216, 0.00730495247989893, 0.007496532518416643, 0.007688112556934357, 0.007879692129790783, 0.008071272633969784, 0.00826285220682621, 0.008454432711005211, 0.008646012283861637, 0.008837591856718063]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 5.0, 7.0, 13.0, 7.0, 10.0, 11.0, 15.0, 17.0, 19.0, 17.0, 27.0, 30.0, 37.0, 35.0, 32.0, 29.0, 35.0, 38.0, 44.0, 37.0, 43.0, 35.0, 49.0, 37.0, 31.0, 31.0, 31.0, 34.0, 24.0, 35.0, 22.0, 26.0, 22.0, 18.0, 23.0, 10.0, 15.0, 7.0, 5.0, 6.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0024768502917140722, -0.0023955528158694506, -0.002314255340024829, -0.0022329576313495636, -0.002151660155504942, -0.0020703626796603203, -0.0019890652038156986, -0.001907767727971077, -0.0018264701357111335, -0.0017451726598665118, -0.0016638750676065683, -0.0015825775917619467, -0.001501280115917325, -0.0014199825236573815, -0.0013386850478127599, -0.0012573874555528164, -0.0011760899797081947, -0.001094792503863573, -0.0010134949116036296, -0.0009321974357590079, -0.0008508999017067254, -0.0007696023676544428, -0.0006883048918098211, -0.0006070073577575386, -0.000525709823705256, -0.0004444122896529734, -0.0003631147847045213, -0.0002818172797560692, -0.0002005197457037866, -0.00011922221165150404, -3.7924706703051925e-05, 4.337279824540019e-05, 0.0001246700994670391, 0.00020596761896740645, 0.0002872651384677738, 0.0003685626434162259, 0.0004498601774685085, 0.000531157711520791, 0.0006124551873654127, 0.0006937527214176953, 0.0007750502554699779, 0.0008563477895222604, 0.000937645323574543, 0.0010189427994191647, 0.0011002402752637863, 0.0011815378675237298, 0.0012628353433683515, 0.001344132935628295, 0.0014254304114729166, 0.0015067278873175383, 0.0015880254795774817, 0.0016693229554221034, 0.0017506205476820469, 0.0018319180235266685, 0.0019132154993712902, 0.001994512975215912, 0.0020758104510605335, 0.002157107926905155, 0.002238405402749777, 0.002319703111425042, 0.002401000587269664, 0.0024822980631142855, 0.002563595538958907, 0.002644893014803529, 0.002726190723478794]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 4.0, 11.0, 18.0, 19.0, 30.0, 37.0, 45.0, 96.0, 131.0, 222.0, 374.0, 623.0, 1046.0, 1760.0, 3275.0, 5644.0, 10270.0, 18891.0, 35790.0, 69389.0, 137524.0, 266480.0, 242969.0, 122031.0, 61876.0, 31792.0, 17015.0, 9238.0, 5042.0, 2871.0, 1638.0, 957.0, 540.0, 338.0, 207.0, 115.0, 79.0, 60.0, 36.0, 27.0, 19.0, 8.0, 8.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0026836395263671875, -0.002596825361251831, -0.0025100111961364746, -0.002423197031021118, -0.0023363828659057617, -0.0022495687007904053, -0.002162754535675049, -0.0020759403705596924, -0.001989126205444336, -0.0019023120403289795, -0.001815497875213623, -0.0017286837100982666, -0.0016418695449829102, -0.0015550553798675537, -0.0014682412147521973, -0.0013814270496368408, -0.0012946128845214844, -0.001207798719406128, -0.0011209845542907715, -0.001034170389175415, -0.0009473562240600586, -0.0008605420589447021, -0.0007737278938293457, -0.0006869137287139893, -0.0006000995635986328, -0.0005132853984832764, -0.0004264712333679199, -0.0003396570682525635, -0.00025284290313720703, -0.00016602873802185059, -7.921457290649414e-05, 7.599592208862305e-06, 9.441375732421875e-05, 0.0001812279224395752, 0.00026804208755493164, 0.0003548562526702881, 0.00044167041778564453, 0.000528484582901001, 0.0006152987480163574, 0.0007021129131317139, 0.0007889270782470703, 0.0008757412433624268, 0.0009625554084777832, 0.0010493695735931396, 0.001136183738708496, 0.0012229979038238525, 0.001309812068939209, 0.0013966262340545654, 0.0014834403991699219, 0.0015702545642852783, 0.0016570687294006348, 0.0017438828945159912, 0.0018306970596313477, 0.001917511224746704, 0.0020043253898620605, 0.002091139554977417, 0.0021779537200927734, 0.00226476788520813, 0.0023515820503234863, 0.0024383962154388428, 0.0025252103805541992, 0.0026120245456695557, 0.002698838710784912, 0.0027856528759002686, 0.002872467041015625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 11.0, 5.0, 5.0, 8.0, 10.0, 10.0, 11.0, 13.0, 16.0, 16.0, 26.0, 27.0, 42.0, 34.0, 29.0, 37.0, 32.0, 37.0, 46.0, 35.0, 43.0, 39.0, 51.0, 40.0, 40.0, 37.0, 37.0, 22.0, 28.0, 28.0, 31.0, 24.0, 21.0, 16.0, 17.0, 15.0, 17.0, 9.0, 10.0, 7.0, 2.0, 2.0, 5.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0026836395263671875, -0.0025943517684936523, -0.002505064010620117, -0.002415776252746582, -0.002326488494873047, -0.0022372007369995117, -0.0021479129791259766, -0.0020586252212524414, -0.0019693374633789062, -0.001880049705505371, -0.001790761947631836, -0.0017014741897583008, -0.0016121864318847656, -0.0015228986740112305, -0.0014336109161376953, -0.0013443231582641602, -0.001255035400390625, -0.0011657476425170898, -0.0010764598846435547, -0.0009871721267700195, -0.0008978843688964844, -0.0008085966110229492, -0.0007193088531494141, -0.0006300210952758789, -0.0005407333374023438, -0.0004514455795288086, -0.00036215782165527344, -0.0002728700637817383, -0.00018358230590820312, -9.429454803466797e-05, -5.0067901611328125e-06, 8.428096771240234e-05, 0.0001735687255859375, 0.00026285648345947266, 0.0003521442413330078, 0.00044143199920654297, 0.0005307197570800781, 0.0006200075149536133, 0.0007092952728271484, 0.0007985830307006836, 0.0008878707885742188, 0.000977158546447754, 0.001066446304321289, 0.0011557340621948242, 0.0012450218200683594, 0.0013343095779418945, 0.0014235973358154297, 0.0015128850936889648, 0.0016021728515625, 0.0016914606094360352, 0.0017807483673095703, 0.0018700361251831055, 0.0019593238830566406, 0.0020486116409301758, 0.002137899398803711, 0.002227187156677246, 0.0023164749145507812, 0.0024057626724243164, 0.0024950504302978516, 0.0025843381881713867, 0.002673625946044922, 0.002762913703918457, 0.002852201461791992, 0.0029414892196655273, 0.0030307769775390625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 12.0, 4.0, 9.0, 17.0, 21.0, 27.0, 40.0, 55.0, 90.0, 138.0, 223.0, 352.0, 565.0, 1122.0, 1784.0, 3511.0, 6607.0, 12706.0, 27564.0, 64318.0, 189488.0, 478891.0, 156071.0, 55730.0, 24359.0, 11720.0, 5777.0, 3176.0, 1705.0, 939.0, 562.0, 366.0, 201.0, 141.0, 71.0, 60.0, 36.0, 27.0, 17.0, 14.0, 9.0, 5.0, 3.0, 8.0, 5.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.003108978271484375, -0.0030067861080169678, -0.0029045939445495605, -0.0028024017810821533, -0.002700209617614746, -0.002598017454147339, -0.0024958252906799316, -0.0023936331272125244, -0.002291440963745117, -0.00218924880027771, -0.0020870566368103027, -0.0019848644733428955, -0.0018826723098754883, -0.001780480146408081, -0.0016782879829406738, -0.0015760958194732666, -0.0014739036560058594, -0.0013717114925384521, -0.001269519329071045, -0.0011673271656036377, -0.0010651350021362305, -0.0009629428386688232, -0.000860750675201416, -0.0007585585117340088, -0.0006563663482666016, -0.0005541741847991943, -0.0004519820213317871, -0.0003497898578643799, -0.00024759769439697266, -0.00014540553092956543, -4.32133674621582e-05, 5.8978796005249023e-05, 0.00016117095947265625, 0.0002633631229400635, 0.0003655552864074707, 0.00046774744987487793, 0.0005699396133422852, 0.0006721317768096924, 0.0007743239402770996, 0.0008765161037445068, 0.000978708267211914, 0.0010809004306793213, 0.0011830925941467285, 0.0012852847576141357, 0.001387476921081543, 0.0014896690845489502, 0.0015918612480163574, 0.0016940534114837646, 0.0017962455749511719, 0.001898437738418579, 0.0020006299018859863, 0.0021028220653533936, 0.0022050142288208008, 0.002307206392288208, 0.0024093985557556152, 0.0025115907192230225, 0.0026137828826904297, 0.002715975046157837, 0.002818167209625244, 0.0029203593730926514, 0.0030225515365600586, 0.003124743700027466, 0.003226935863494873, 0.0033291280269622803, 0.0034313201904296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 7.0, 8.0, 7.0, 7.0, 7.0, 4.0, 12.0, 15.0, 17.0, 18.0, 28.0, 24.0, 27.0, 23.0, 37.0, 31.0, 35.0, 40.0, 41.0, 39.0, 46.0, 43.0, 46.0, 40.0, 27.0, 32.0, 39.0, 39.0, 29.0, 41.0, 28.0, 24.0, 26.0, 24.0, 17.0, 16.0, 7.0, 7.0, 7.0, 12.0, 7.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.001926422119140625, -0.0018689483404159546, -0.0018114745616912842, -0.0017540007829666138, -0.0016965270042419434, -0.001639053225517273, -0.0015815794467926025, -0.0015241056680679321, -0.0014666318893432617, -0.0014091581106185913, -0.001351684331893921, -0.0012942105531692505, -0.00123673677444458, -0.0011792629957199097, -0.0011217892169952393, -0.0010643154382705688, -0.0010068416595458984, -0.000949367880821228, -0.0008918941020965576, -0.0008344203233718872, -0.0007769465446472168, -0.0007194727659225464, -0.000661998987197876, -0.0006045252084732056, -0.0005470514297485352, -0.0004895776510238647, -0.00043210387229919434, -0.0003746300935745239, -0.0003171563148498535, -0.0002596825361251831, -0.0002022087574005127, -0.00014473497867584229, -8.726119995117188e-05, -2.9787421226501465e-05, 2.7686357498168945e-05, 8.516013622283936e-05, 0.00014263391494750977, 0.00020010769367218018, 0.0002575814723968506, 0.000315055251121521, 0.0003725290298461914, 0.0004300028085708618, 0.0004874765872955322, 0.0005449503660202026, 0.000602424144744873, 0.0006598979234695435, 0.0007173717021942139, 0.0007748454809188843, 0.0008323192596435547, 0.0008897930383682251, 0.0009472668170928955, 0.001004740595817566, 0.0010622143745422363, 0.0011196881532669067, 0.0011771619319915771, 0.0012346357107162476, 0.001292109489440918, 0.0013495832681655884, 0.0014070570468902588, 0.0014645308256149292, 0.0015220046043395996, 0.00157947838306427, 0.0016369521617889404, 0.0016944259405136108, 0.0017518997192382812]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 1.0, 5.0, 4.0, 6.0, 13.0, 10.0, 25.0, 21.0, 23.0, 50.0, 59.0, 77.0, 105.0, 176.0, 302.0, 446.0, 720.0, 1298.0, 2647.0, 5591.0, 15203.0, 63237.0, 789290.0, 131764.0, 22654.0, 7571.0, 3267.0, 1579.0, 932.0, 514.0, 308.0, 197.0, 135.0, 92.0, 71.0, 39.0, 27.0, 32.0, 22.0, 15.0, 5.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0009245872497558594, -0.0008962824940681458, -0.0008679777383804321, -0.0008396729826927185, -0.0008113682270050049, -0.0007830634713172913, -0.0007547587156295776, -0.000726453959941864, -0.0006981492042541504, -0.0006698444485664368, -0.0006415396928787231, -0.0006132349371910095, -0.0005849301815032959, -0.0005566254258155823, -0.0005283206701278687, -0.000500015914440155, -0.0004717111587524414, -0.0004434064030647278, -0.00041510164737701416, -0.00038679689168930054, -0.0003584921360015869, -0.0003301873803138733, -0.00030188262462615967, -0.00027357786893844604, -0.0002452731132507324, -0.0002169683575630188, -0.00018866360187530518, -0.00016035884618759155, -0.00013205409049987793, -0.0001037493348121643, -7.544457912445068e-05, -4.713982343673706e-05, -1.8835067749023438e-05, 9.469687938690186e-06, 3.777444362640381e-05, 6.607919931411743e-05, 9.438395500183105e-05, 0.00012268871068954468, 0.0001509934663772583, 0.00017929822206497192, 0.00020760297775268555, 0.00023590773344039917, 0.0002642124891281128, 0.0002925172448158264, 0.00032082200050354004, 0.00034912675619125366, 0.0003774315118789673, 0.0004057362675666809, 0.00043404102325439453, 0.00046234577894210815, 0.0004906505346298218, 0.0005189552903175354, 0.000547260046005249, 0.0005755648016929626, 0.0006038695573806763, 0.0006321743130683899, 0.0006604790687561035, 0.0006887838244438171, 0.0007170885801315308, 0.0007453933358192444, 0.000773698091506958, 0.0008020028471946716, 0.0008303076028823853, 0.0008586123585700989, 0.0008869171142578125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 2.0, 3.0, 8.0, 10.0, 6.0, 14.0, 6.0, 19.0, 16.0, 17.0, 44.0, 30.0, 61.0, 32.0, 102.0, 43.0, 38.0, 104.0, 50.0, 90.0, 38.0, 77.0, 24.0, 37.0, 19.0, 16.0, 22.0, 7.0, 22.0, 6.0, 15.0, 2.0, 5.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.7418136596679688e-06, -2.6561319828033447e-06, -2.5704503059387207e-06, -2.4847686290740967e-06, -2.3990869522094727e-06, -2.3134052753448486e-06, -2.2277235984802246e-06, -2.1420419216156006e-06, -2.0563602447509766e-06, -1.9706785678863525e-06, -1.8849968910217285e-06, -1.7993152141571045e-06, -1.7136335372924805e-06, -1.6279518604278564e-06, -1.5422701835632324e-06, -1.4565885066986084e-06, -1.3709068298339844e-06, -1.2852251529693604e-06, -1.1995434761047363e-06, -1.1138617992401123e-06, -1.0281801223754883e-06, -9.424984455108643e-07, -8.568167686462402e-07, -7.711350917816162e-07, -6.854534149169922e-07, -5.997717380523682e-07, -5.140900611877441e-07, -4.284083843231201e-07, -3.427267074584961e-07, -2.5704503059387207e-07, -1.7136335372924805e-07, -8.568167686462402e-08, 0.0, 8.568167686462402e-08, 1.7136335372924805e-07, 2.5704503059387207e-07, 3.427267074584961e-07, 4.284083843231201e-07, 5.140900611877441e-07, 5.997717380523682e-07, 6.854534149169922e-07, 7.711350917816162e-07, 8.568167686462402e-07, 9.424984455108643e-07, 1.0281801223754883e-06, 1.1138617992401123e-06, 1.1995434761047363e-06, 1.2852251529693604e-06, 1.3709068298339844e-06, 1.4565885066986084e-06, 1.5422701835632324e-06, 1.6279518604278564e-06, 1.7136335372924805e-06, 1.7993152141571045e-06, 1.8849968910217285e-06, 1.9706785678863525e-06, 2.0563602447509766e-06, 2.1420419216156006e-06, 2.2277235984802246e-06, 2.3134052753448486e-06, 2.3990869522094727e-06, 2.4847686290740967e-06, 2.5704503059387207e-06, 2.6561319828033447e-06, 2.7418136596679688e-06]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 12.0, 25.0, 32.0, 57.0, 92.0, 162.0, 288.0, 585.0, 1258.0, 3311.0, 10575.0, 49178.0, 723882.0, 221433.0, 26692.0, 6791.0, 2213.0, 908.0, 460.0, 230.0, 133.0, 94.0, 47.0, 25.0, 20.0, 15.0, 7.0, 4.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001201629638671875, -0.0011650174856185913, -0.0011284053325653076, -0.001091793179512024, -0.0010551810264587402, -0.0010185688734054565, -0.0009819567203521729, -0.0009453445672988892, -0.0009087324142456055, -0.0008721202611923218, -0.0008355081081390381, -0.0007988959550857544, -0.0007622838020324707, -0.000725671648979187, -0.0006890594959259033, -0.0006524473428726196, -0.0006158351898193359, -0.0005792230367660522, -0.0005426108837127686, -0.0005059987306594849, -0.00046938657760620117, -0.0004327744245529175, -0.0003961622714996338, -0.0003595501184463501, -0.0003229379653930664, -0.0002863258123397827, -0.000249713659286499, -0.00021310150623321533, -0.00017648935317993164, -0.00013987720012664795, -0.00010326504707336426, -6.665289402008057e-05, -3.0040740966796875e-05, 6.571412086486816e-06, 4.318356513977051e-05, 7.97957181930542e-05, 0.00011640787124633789, 0.00015302002429962158, 0.00018963217735290527, 0.00022624433040618896, 0.00026285648345947266, 0.00029946863651275635, 0.00033608078956604004, 0.00037269294261932373, 0.0004093050956726074, 0.0004459172487258911, 0.0004825294017791748, 0.0005191415548324585, 0.0005557537078857422, 0.0005923658609390259, 0.0006289780139923096, 0.0006655901670455933, 0.000702202320098877, 0.0007388144731521606, 0.0007754266262054443, 0.000812038779258728, 0.0008486509323120117, 0.0008852630853652954, 0.0009218752384185791, 0.0009584873914718628, 0.0009950995445251465, 0.0010317116975784302, 0.0010683238506317139, 0.0011049360036849976, 0.0011415481567382812]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 5.0, 15.0, 15.0, 20.0, 24.0, 37.0, 41.0, 62.0, 79.0, 148.0, 163.0, 100.0, 62.0, 57.0, 44.0, 33.0, 18.0, 21.0, 7.0, 10.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001722574234008789, -0.00016672909259796143, -0.00016120076179504395, -0.00015567243099212646, -0.00015014410018920898, -0.0001446157693862915, -0.00013908743858337402, -0.00013355910778045654, -0.00012803077697753906, -0.00012250244617462158, -0.0001169741153717041, -0.00011144578456878662, -0.00010591745376586914, -0.00010038912296295166, -9.486079216003418e-05, -8.93324613571167e-05, -8.380413055419922e-05, -7.827579975128174e-05, -7.274746894836426e-05, -6.721913814544678e-05, -6.16908073425293e-05, -5.6162476539611816e-05, -5.0634145736694336e-05, -4.5105814933776855e-05, -3.9577484130859375e-05, -3.4049153327941895e-05, -2.8520822525024414e-05, -2.2992491722106934e-05, -1.7464160919189453e-05, -1.1935830116271973e-05, -6.407499313354492e-06, -8.791685104370117e-07, 4.649162292480469e-06, 1.017749309539795e-05, 1.570582389831543e-05, 2.123415470123291e-05, 2.676248550415039e-05, 3.229081630706787e-05, 3.781914710998535e-05, 4.334747791290283e-05, 4.887580871582031e-05, 5.440413951873779e-05, 5.9932470321655273e-05, 6.546080112457275e-05, 7.098913192749023e-05, 7.651746273040771e-05, 8.20457935333252e-05, 8.757412433624268e-05, 9.310245513916016e-05, 9.863078594207764e-05, 0.00010415911674499512, 0.0001096874475479126, 0.00011521577835083008, 0.00012074410915374756, 0.00012627243995666504, 0.00013180077075958252, 0.0001373291015625, 0.00014285743236541748, 0.00014838576316833496, 0.00015391409397125244, 0.00015944242477416992, 0.0001649707555770874, 0.00017049908638000488, 0.00017602741718292236, 0.00018155574798583984]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 9.0, 13.0, 15.0, 24.0, 46.0, 71.0, 103.0, 122.0, 141.0, 143.0, 96.0, 53.0, 38.0, 28.0, 22.0, 18.0, 24.0, 5.0, 6.0, 3.0, 6.0, 2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036290129646658897, -0.00344454194419086, -0.00326007092371583, -0.0030755999032408, -0.00289112888276577, -0.00270665786229074, -0.00252218684181571, -0.00233771582134068, -0.00215324480086565, -0.0019687737803906202, -0.0017843027599155903, -0.0015998317394405603, -0.0014153607189655304, -0.0012308896984905005, -0.0010464186780154705, -0.0008619476575404406, -0.0006774766370654106, -0.0004930056165903807, -0.0003085345961153507, -0.00012406357564032078, 6.040744483470917e-05, 0.0002448784653097391, 0.00042934948578476906, 0.000613820506259799, 0.000798291526734829, 0.000982762547209859, 0.0011672335676848888, 0.0013517045881599188, 0.0015361756086349487, 0.0017206466291099787, 0.0019051176495850086, 0.0020895886700600386, 0.0022740596905350685, 0.0024585307110100985, 0.0026430017314851284, 0.0028274727519601583, 0.0030119437724351883, 0.0031964147929102182, 0.003380885813385248, 0.003565356833860278, 0.003749827854335308, 0.003934298641979694, 0.004118769895285368, 0.0043032411485910416, 0.004487711936235428, 0.004672182723879814, 0.004856653977185488, 0.005041125230491161, 0.005225596018135548, 0.005410066805779934, 0.0055945380590856075, 0.005779009312391281, 0.005963480100035667, 0.006147950887680054, 0.006332422140985727, 0.006516893394291401, 0.006701364181935787, 0.0068858349695801735, 0.007070306222885847, 0.007254777476191521, 0.007439248263835907, 0.007623719051480293, 0.007808190304785967, 0.00799266155809164, 0.008177132345736027]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 6.0, 5.0, 7.0, 7.0, 11.0, 11.0, 10.0, 10.0, 18.0, 16.0, 18.0, 22.0, 30.0, 28.0, 44.0, 34.0, 33.0, 29.0, 35.0, 41.0, 38.0, 45.0, 41.0, 43.0, 39.0, 35.0, 31.0, 30.0, 36.0, 26.0, 33.0, 27.0, 21.0, 25.0, 18.0, 22.0, 14.0, 17.0, 7.0, 7.0, 5.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002453440800309181, -0.0023714271374046803, -0.0022894134745001793, -0.0022073998115956783, -0.0021253861486911774, -0.0020433724857866764, -0.0019613588228821754, -0.0018793451599776745, -0.0017973314970731735, -0.0017153178341686726, -0.0016333041712641716, -0.0015512905083596706, -0.0014692768454551697, -0.0013872631825506687, -0.0013052495196461678, -0.0012232358567416668, -0.0011412221938371658, -0.0010592085309326649, -0.000977194868028164, -0.000895181205123663, -0.000813167542219162, -0.000731153879314661, -0.0006491402164101601, -0.0005671265535056591, -0.00048511289060115814, -0.0004030992276966572, -0.0003210855647921562, -0.00023907190188765526, -0.0001570582389831543, -7.504457607865334e-05, 6.969086825847626e-06, 8.898274973034859e-05, 0.0001709961798042059, 0.00025300984270870686, 0.0003350235056132078, 0.0004170371685177088, 0.0004990508314222097, 0.0005810644943267107, 0.0006630781572312117, 0.0007450918201357126, 0.0008271054830402136, 0.0009091191459447145, 0.0009911328088492155, 0.0010731464717537165, 0.0011551601346582174, 0.0012371737975627184, 0.0013191874604672194, 0.0014012011233717203, 0.0014832147862762213, 0.0015652284491807222, 0.0016472421120852232, 0.0017292557749897242, 0.0018112694378942251, 0.001893283100798726, 0.001975296763703227, 0.002057310426607728, 0.002139324089512229, 0.00222133775241673, 0.002303351415321231, 0.002385365078225732, 0.002467378741130233, 0.0025493924040347338, 0.0026314060669392347, 0.0027134197298437357, 0.0027954333927482367]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 9.0, 6.0, 9.0, 10.0, 9.0, 20.0, 16.0, 36.0, 65.0, 140.0, 321.0, 549.0, 1089.0, 2291.0, 5037.0, 11187.0, 26692.0, 71459.0, 220170.0, 435323.0, 174797.0, 58859.0, 22611.0, 9603.0, 4260.0, 1935.0, 951.0, 489.0, 285.0, 110.0, 64.0, 33.0, 27.0, 19.0, 20.0, 13.0, 9.0, 5.0, 4.0, 9.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00873565673828125, -0.008428096771240234, -0.008120536804199219, -0.007812976837158203, -0.0075054168701171875, -0.007197856903076172, -0.006890296936035156, -0.006582736968994141, -0.006275177001953125, -0.005967617034912109, -0.005660057067871094, -0.005352497100830078, -0.0050449371337890625, -0.004737377166748047, -0.004429817199707031, -0.004122257232666016, -0.003814697265625, -0.0035071372985839844, -0.0031995773315429688, -0.002892017364501953, -0.0025844573974609375, -0.002276897430419922, -0.0019693374633789062, -0.0016617774963378906, -0.001354217529296875, -0.0010466575622558594, -0.0007390975952148438, -0.0004315376281738281, -0.0001239776611328125, 0.00018358230590820312, 0.0004911422729492188, 0.0007987022399902344, 0.00110626220703125, 0.0014138221740722656, 0.0017213821411132812, 0.002028942108154297, 0.0023365020751953125, 0.002644062042236328, 0.0029516220092773438, 0.0032591819763183594, 0.003566741943359375, 0.0038743019104003906, 0.004181861877441406, 0.004489421844482422, 0.0047969818115234375, 0.005104541778564453, 0.005412101745605469, 0.005719661712646484, 0.0060272216796875, 0.006334781646728516, 0.006642341613769531, 0.006949901580810547, 0.0072574615478515625, 0.007565021514892578, 0.007872581481933594, 0.00818014144897461, 0.008487701416015625, 0.00879526138305664, 0.009102821350097656, 0.009410381317138672, 0.009717941284179688, 0.010025501251220703, 0.010333061218261719, 0.010640621185302734, 0.01094818115234375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 3.0, 4.0, 8.0, 6.0, 13.0, 16.0, 15.0, 24.0, 40.0, 39.0, 44.0, 53.0, 66.0, 47.0, 63.0, 61.0, 64.0, 71.0, 60.0, 47.0, 44.0, 51.0, 38.0, 33.0, 28.0, 23.0, 12.0, 12.0, 6.0, 5.0, 8.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001613616943359375, -0.0015282034873962402, -0.0014427900314331055, -0.0013573765754699707, -0.001271963119506836, -0.0011865496635437012, -0.0011011362075805664, -0.0010157227516174316, -0.0009303092956542969, -0.0008448958396911621, -0.0007594823837280273, -0.0006740689277648926, -0.0005886554718017578, -0.000503242015838623, -0.0004178285598754883, -0.0003324151039123535, -0.00024700164794921875, -0.00016158819198608398, -7.617473602294922e-05, 9.238719940185547e-06, 9.465217590332031e-05, 0.00018006563186645508, 0.00026547908782958984, 0.0003508925437927246, 0.0004363059997558594, 0.0005217194557189941, 0.0006071329116821289, 0.0006925463676452637, 0.0007779598236083984, 0.0008633732795715332, 0.000948786735534668, 0.0010342001914978027, 0.0011196136474609375, 0.0012050271034240723, 0.001290440559387207, 0.0013758540153503418, 0.0014612674713134766, 0.0015466809272766113, 0.001632094383239746, 0.0017175078392028809, 0.0018029212951660156, 0.0018883347511291504, 0.001973748207092285, 0.00205916166305542, 0.0021445751190185547, 0.0022299885749816895, 0.0023154020309448242, 0.002400815486907959, 0.0024862289428710938, 0.0025716423988342285, 0.0026570558547973633, 0.002742469310760498, 0.002827882766723633, 0.0029132962226867676, 0.0029987096786499023, 0.003084123134613037, 0.003169536590576172, 0.0032549500465393066, 0.0033403635025024414, 0.003425776958465576, 0.003511190414428711, 0.0035966038703918457, 0.0036820173263549805, 0.0037674307823181152, 0.00385284423828125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 6.0, 6.0, 12.0, 14.0, 20.0, 38.0, 47.0, 55.0, 80.0, 151.0, 258.0, 399.0, 655.0, 1167.0, 2067.0, 3729.0, 6993.0, 13990.0, 28917.0, 65814.0, 168190.0, 376473.0, 223592.0, 83990.0, 36130.0, 17004.0, 8559.0, 4524.0, 2305.0, 1307.0, 775.0, 465.0, 262.0, 187.0, 124.0, 62.0, 56.0, 33.0, 21.0, 15.0, 19.0, 8.0, 13.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.006359100341796875, -0.006151556968688965, -0.005944013595581055, -0.0057364702224731445, -0.005528926849365234, -0.005321383476257324, -0.005113840103149414, -0.004906296730041504, -0.004698753356933594, -0.004491209983825684, -0.0042836666107177734, -0.004076123237609863, -0.003868579864501953, -0.003661036491394043, -0.003453493118286133, -0.0032459497451782227, -0.0030384063720703125, -0.0028308629989624023, -0.002623319625854492, -0.002415776252746582, -0.002208232879638672, -0.0020006895065307617, -0.0017931461334228516, -0.0015856027603149414, -0.0013780593872070312, -0.001170516014099121, -0.0009629726409912109, -0.0007554292678833008, -0.0005478858947753906, -0.00034034252166748047, -0.0001327991485595703, 7.474422454833984e-05, 0.00028228759765625, 0.0004898309707641602, 0.0006973743438720703, 0.0009049177169799805, 0.0011124610900878906, 0.0013200044631958008, 0.001527547836303711, 0.001735091209411621, 0.0019426345825195312, 0.0021501779556274414, 0.0023577213287353516, 0.0025652647018432617, 0.002772808074951172, 0.002980351448059082, 0.003187894821166992, 0.0033954381942749023, 0.0036029815673828125, 0.0038105249404907227, 0.004018068313598633, 0.004225611686706543, 0.004433155059814453, 0.004640698432922363, 0.0048482418060302734, 0.005055785179138184, 0.005263328552246094, 0.005470871925354004, 0.005678415298461914, 0.005885958671569824, 0.006093502044677734, 0.0063010454177856445, 0.006508588790893555, 0.006716132164001465, 0.006923675537109375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 8.0, 3.0, 9.0, 11.0, 16.0, 18.0, 23.0, 19.0, 16.0, 21.0, 31.0, 34.0, 32.0, 38.0, 41.0, 38.0, 58.0, 46.0, 52.0, 61.0, 39.0, 41.0, 43.0, 42.0, 31.0, 26.0, 42.0, 30.0, 15.0, 24.0, 17.0, 13.0, 10.0, 6.0, 8.0, 11.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0018072128295898438, -0.0017547160387039185, -0.0017022192478179932, -0.0016497224569320679, -0.0015972256660461426, -0.0015447288751602173, -0.001492232084274292, -0.0014397352933883667, -0.0013872385025024414, -0.0013347417116165161, -0.0012822449207305908, -0.0012297481298446655, -0.0011772513389587402, -0.001124754548072815, -0.0010722577571868896, -0.0010197609663009644, -0.0009672641754150391, -0.0009147673845291138, -0.0008622705936431885, -0.0008097738027572632, -0.0007572770118713379, -0.0007047802209854126, -0.0006522834300994873, -0.000599786639213562, -0.0005472898483276367, -0.0004947930574417114, -0.00044229626655578613, -0.00038979947566986084, -0.00033730268478393555, -0.00028480589389801025, -0.00023230910301208496, -0.00017981231212615967, -0.00012731552124023438, -7.481873035430908e-05, -2.232193946838379e-05, 3.0174851417541504e-05, 8.26716423034668e-05, 0.0001351684331893921, 0.00018766522407531738, 0.00024016201496124268, 0.00029265880584716797, 0.00034515559673309326, 0.00039765238761901855, 0.00045014917850494385, 0.0005026459693908691, 0.0005551427602767944, 0.0006076395511627197, 0.000660136342048645, 0.0007126331329345703, 0.0007651299238204956, 0.0008176267147064209, 0.0008701235055923462, 0.0009226202964782715, 0.0009751170873641968, 0.001027613878250122, 0.0010801106691360474, 0.0011326074600219727, 0.001185104250907898, 0.0012376010417938232, 0.0012900978326797485, 0.0013425946235656738, 0.0013950914144515991, 0.0014475882053375244, 0.0015000849962234497, 0.001552581787109375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 4.0, 5.0, 1.0, 13.0, 10.0, 13.0, 35.0, 29.0, 44.0, 62.0, 85.0, 148.0, 181.0, 254.0, 461.0, 737.0, 1130.0, 1946.0, 3751.0, 7433.0, 17789.0, 52427.0, 263223.0, 561479.0, 89259.0, 26427.0, 10478.0, 4820.0, 2486.0, 1359.0, 865.0, 543.0, 364.0, 225.0, 142.0, 105.0, 51.0, 40.0, 42.0, 26.0, 21.0, 13.0, 7.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021588802337646484, -0.00020873919129371643, -0.00020159035921096802, -0.0001944415271282196, -0.0001872926950454712, -0.00018014386296272278, -0.00017299503087997437, -0.00016584619879722595, -0.00015869736671447754, -0.00015154853463172913, -0.0001443997025489807, -0.0001372508704662323, -0.0001301020383834839, -0.00012295320630073547, -0.00011580437421798706, -0.00010865554213523865, -0.00010150671005249023, -9.435787796974182e-05, -8.720904588699341e-05, -8.0060213804245e-05, -7.291138172149658e-05, -6.576254963874817e-05, -5.8613717555999756e-05, -5.146488547325134e-05, -4.431605339050293e-05, -3.7167221307754517e-05, -3.0018389225006104e-05, -2.286955714225769e-05, -1.5720725059509277e-05, -8.571892976760864e-06, -1.4230608940124512e-06, 5.725771188735962e-06, 1.2874603271484375e-05, 2.0023435354232788e-05, 2.71722674369812e-05, 3.4321099519729614e-05, 4.146993160247803e-05, 4.861876368522644e-05, 5.5767595767974854e-05, 6.291642785072327e-05, 7.006525993347168e-05, 7.721409201622009e-05, 8.43629240989685e-05, 9.151175618171692e-05, 9.866058826446533e-05, 0.00010580942034721375, 0.00011295825242996216, 0.00012010708451271057, 0.00012725591659545898, 0.0001344047486782074, 0.0001415535807609558, 0.00014870241284370422, 0.00015585124492645264, 0.00016300007700920105, 0.00017014890909194946, 0.00017729774117469788, 0.0001844465732574463, 0.0001915954053401947, 0.00019874423742294312, 0.00020589306950569153, 0.00021304190158843994, 0.00022019073367118835, 0.00022733956575393677, 0.00023448839783668518, 0.0002416372299194336]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 6.0, 14.0, 25.0, 22.0, 58.0, 43.0, 100.0, 134.0, 221.0, 161.0, 49.0, 62.0, 24.0, 23.0, 15.0, 8.0, 9.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.344650268554688e-06, -8.132308721542358e-06, -7.91996717453003e-06, -7.7076256275177e-06, -7.495284080505371e-06, -7.282942533493042e-06, -7.070600986480713e-06, -6.858259439468384e-06, -6.645917892456055e-06, -6.433576345443726e-06, -6.2212347984313965e-06, -6.008893251419067e-06, -5.796551704406738e-06, -5.584210157394409e-06, -5.37186861038208e-06, -5.159527063369751e-06, -4.947185516357422e-06, -4.734843969345093e-06, -4.522502422332764e-06, -4.3101608753204346e-06, -4.0978193283081055e-06, -3.885477781295776e-06, -3.6731362342834473e-06, -3.460794687271118e-06, -3.248453140258789e-06, -3.03611159324646e-06, -2.823770046234131e-06, -2.6114284992218018e-06, -2.3990869522094727e-06, -2.1867454051971436e-06, -1.9744038581848145e-06, -1.7620623111724854e-06, -1.5497207641601562e-06, -1.3373792171478271e-06, -1.125037670135498e-06, -9.126961231231689e-07, -7.003545761108398e-07, -4.880130290985107e-07, -2.7567148208618164e-07, -6.332993507385254e-08, 1.4901161193847656e-07, 3.6135315895080566e-07, 5.736947059631348e-07, 7.860362529754639e-07, 9.98377799987793e-07, 1.210719347000122e-06, 1.4230608940124512e-06, 1.6354024410247803e-06, 1.8477439880371094e-06, 2.0600855350494385e-06, 2.2724270820617676e-06, 2.4847686290740967e-06, 2.6971101760864258e-06, 2.909451723098755e-06, 3.121793270111084e-06, 3.334134817123413e-06, 3.546476364135742e-06, 3.7588179111480713e-06, 3.9711594581604e-06, 4.1835010051727295e-06, 4.395842552185059e-06, 4.608184099197388e-06, 4.820525646209717e-06, 5.032867193222046e-06, 5.245208740234375e-06]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 6.0, 10.0, 11.0, 14.0, 22.0, 37.0, 49.0, 91.0, 113.0, 220.0, 341.0, 547.0, 973.0, 1764.0, 3123.0, 5743.0, 10306.0, 20908.0, 42272.0, 101109.0, 296915.0, 351151.0, 117055.0, 47343.0, 22581.0, 11874.0, 6073.0, 3322.0, 1888.0, 1124.0, 601.0, 361.0, 201.0, 126.0, 88.0, 44.0, 34.0, 36.0, 16.0, 12.0, 15.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0], "bins": [-8.07642936706543e-05, -7.824599742889404e-05, -7.572770118713379e-05, -7.320940494537354e-05, -7.069110870361328e-05, -6.817281246185303e-05, -6.565451622009277e-05, -6.313621997833252e-05, -6.0617923736572266e-05, -5.809962749481201e-05, -5.558133125305176e-05, -5.3063035011291504e-05, -5.054473876953125e-05, -4.8026442527770996e-05, -4.550814628601074e-05, -4.298985004425049e-05, -4.0471553802490234e-05, -3.795325756072998e-05, -3.5434961318969727e-05, -3.291666507720947e-05, -3.039836883544922e-05, -2.7880072593688965e-05, -2.536177635192871e-05, -2.2843480110168457e-05, -2.0325183868408203e-05, -1.780688762664795e-05, -1.5288591384887695e-05, -1.2770295143127441e-05, -1.0251998901367188e-05, -7.733702659606934e-06, -5.21540641784668e-06, -2.6971101760864258e-06, -1.7881393432617188e-07, 2.339482307434082e-06, 4.857778549194336e-06, 7.37607479095459e-06, 9.894371032714844e-06, 1.2412667274475098e-05, 1.4930963516235352e-05, 1.7449259757995605e-05, 1.996755599975586e-05, 2.2485852241516113e-05, 2.5004148483276367e-05, 2.752244472503662e-05, 3.0040740966796875e-05, 3.255903720855713e-05, 3.507733345031738e-05, 3.759562969207764e-05, 4.011392593383789e-05, 4.2632222175598145e-05, 4.51505184173584e-05, 4.766881465911865e-05, 5.0187110900878906e-05, 5.270540714263916e-05, 5.5223703384399414e-05, 5.774199962615967e-05, 6.026029586791992e-05, 6.277859210968018e-05, 6.529688835144043e-05, 6.781518459320068e-05, 7.033348083496094e-05, 7.285177707672119e-05, 7.537007331848145e-05, 7.78883695602417e-05, 8.040666580200195e-05]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 4.0, 7.0, 6.0, 5.0, 13.0, 9.0, 13.0, 15.0, 14.0, 15.0, 26.0, 24.0, 24.0, 31.0, 28.0, 37.0, 47.0, 36.0, 54.0, 41.0, 56.0, 44.0, 46.0, 50.0, 51.0, 43.0, 34.0, 33.0, 28.0, 31.0, 20.0, 16.0, 13.0, 12.0, 16.0, 10.0, 14.0, 9.0, 5.0, 6.0, 6.0, 0.0, 3.0, 7.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.990795135498047e-05, -1.9281171262264252e-05, -1.8654391169548035e-05, -1.8027611076831818e-05, -1.74008309841156e-05, -1.6774050891399384e-05, -1.6147270798683167e-05, -1.552049070596695e-05, -1.4893710613250732e-05, -1.4266930520534515e-05, -1.3640150427818298e-05, -1.3013370335102081e-05, -1.2386590242385864e-05, -1.1759810149669647e-05, -1.113303005695343e-05, -1.0506249964237213e-05, -9.879469871520996e-06, -9.252689778804779e-06, -8.625909686088562e-06, -7.999129593372345e-06, -7.372349500656128e-06, -6.745569407939911e-06, -6.118789315223694e-06, -5.492009222507477e-06, -4.86522912979126e-06, -4.238449037075043e-06, -3.6116689443588257e-06, -2.9848888516426086e-06, -2.3581087589263916e-06, -1.7313286662101746e-06, -1.1045485734939575e-06, -4.777684807777405e-07, 1.4901161193847656e-07, 7.757917046546936e-07, 1.4025717973709106e-06, 2.0293518900871277e-06, 2.6561319828033447e-06, 3.2829120755195618e-06, 3.909692168235779e-06, 4.536472260951996e-06, 5.163252353668213e-06, 5.79003244638443e-06, 6.416812539100647e-06, 7.043592631816864e-06, 7.670372724533081e-06, 8.297152817249298e-06, 8.923932909965515e-06, 9.550713002681732e-06, 1.017749309539795e-05, 1.0804273188114166e-05, 1.1431053280830383e-05, 1.20578333735466e-05, 1.2684613466262817e-05, 1.3311393558979034e-05, 1.3938173651695251e-05, 1.4564953744411469e-05, 1.5191733837127686e-05, 1.5818513929843903e-05, 1.644529402256012e-05, 1.7072074115276337e-05, 1.7698854207992554e-05, 1.832563430070877e-05, 1.8952414393424988e-05, 1.9579194486141205e-05, 2.0205974578857422e-05]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 2.0, 4.0, 8.0, 11.0, 11.0, 14.0, 34.0, 23.0, 38.0, 91.0, 98.0, 152.0, 133.0, 116.0, 76.0, 34.0, 39.0, 23.0, 29.0, 17.0, 12.0, 4.0, 7.0, 3.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030823678243905306, -0.002960355021059513, -0.002838341984897852, -0.0027163291815668344, -0.002594316378235817, -0.002472303342074156, -0.0023502905387431383, -0.002228277735412121, -0.0021062646992504597, -0.001984251895919442, -0.0018622389761731029, -0.0017402260564267635, -0.001618213253095746, -0.0014962003333494067, -0.0013741874136030674, -0.00125217461027205, -0.0011301618069410324, -0.001008148887194693, -0.0008861360838636756, -0.0007641231641173363, -0.0006421103025786579, -0.0005200974410399795, -0.00039808452129364014, -0.00027607165975496173, -0.00015405879821628332, -3.2045922125689685e-05, 8.996695396490395e-05, 0.00021197984460741282, 0.0003339927061460912, 0.00045600556768476963, 0.000578018487431109, 0.0007000313489697874, 0.0008220439776778221, 0.0009440568392165005, 0.001066069700755179, 0.0011880826205015182, 0.0013100954238325357, 0.001432108343578875, 0.0015541212633252144, 0.0016761340666562319, 0.0017981469864025712, 0.0019201599061489105, 0.002042172709479928, 0.0021641855128109455, 0.0022861985489726067, 0.002408211352303624, 0.0025302241556346416, 0.002652237191796303, 0.0027742499951273203, 0.002896262798458338, 0.003018275834619999, 0.0031402886379510164, 0.003262301441282034, 0.003384314477443695, 0.0035063272807747126, 0.00362834008410573, 0.003750353120267391, 0.0038723659235984087, 0.003994378726929426, 0.004116391763091087, 0.0042384047992527485, 0.004360417369753122, 0.0044824304059147835, 0.004604443442076445, 0.0047264560125768185]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 6.0, 6.0, 7.0, 9.0, 10.0, 7.0, 11.0, 18.0, 14.0, 22.0, 28.0, 25.0, 26.0, 31.0, 32.0, 36.0, 57.0, 34.0, 50.0, 49.0, 51.0, 46.0, 60.0, 43.0, 45.0, 36.0, 30.0, 31.0, 26.0, 34.0, 26.0, 20.0, 15.0, 8.0, 12.0, 13.0, 6.0, 4.0, 4.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020382783841341734, -0.0019651069305837154, -0.0018919353606179357, -0.0018187637906521559, -0.001745592337101698, -0.00167242088355124, -0.0015992493135854602, -0.0015260777436196804, -0.0014529062900692225, -0.0013797348365187645, -0.0013065632665529847, -0.001233391696587205, -0.001160220243036747, -0.001087048789486289, -0.0010138772195205092, -0.0009407057077623904, -0.0008675341960042715, -0.0007943626842461526, -0.0007211911724880338, -0.0006480196607299149, -0.000574848148971796, -0.0005016766372136772, -0.0004285051254555583, -0.00035533361369743943, -0.00028216210193932056, -0.0002089905901812017, -0.00013581907842308283, -6.264756666496396e-05, 1.0523945093154907e-05, 8.369545685127378e-05, 0.00015686696860939264, 0.0002300384803675115, 0.00030321022495627403, 0.0003763817367143929, 0.00044955324847251177, 0.0005227247602306306, 0.0005958962719887495, 0.0006690677837468684, 0.0007422392955049872, 0.0008154108072631061, 0.000888582319021225, 0.0009617538307793438, 0.0010349253425374627, 0.0011080969125032425, 0.0011812683660537004, 0.0012544398196041584, 0.0013276113895699382, 0.001400782959535718, 0.001473954413086176, 0.0015471258666366339, 0.0016202974366024137, 0.0016934690065681934, 0.0017666404601186514, 0.0018398119136691093, 0.0019129834836348891, 0.001986155053600669, 0.002059326507151127, 0.002132497960701585, 0.0022056694142520428, 0.0022788411006331444, 0.0023520125541836023, 0.0024251840077340603, 0.002498355694115162, 0.00257152714766562, 0.002644698601216078]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 8.0, 8.0, 5.0, 8.0, 7.0, 15.0, 18.0, 15.0, 30.0, 35.0, 52.0, 70.0, 113.0, 150.0, 180.0, 291.0, 456.0, 686.0, 1077.0, 1889.0, 3928.0, 11079.0, 529272.0, 3618928.0, 15313.0, 4766.0, 2347.0, 1254.0, 769.0, 474.0, 302.0, 183.0, 161.0, 90.0, 81.0, 55.0, 40.0, 34.0, 20.0, 22.0, 11.0, 7.0, 9.0, 3.0, 6.0, 4.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00720977783203125, -0.0069702863693237305, -0.006730794906616211, -0.006491303443908691, -0.006251811981201172, -0.006012320518493652, -0.005772829055786133, -0.005533337593078613, -0.005293846130371094, -0.005054354667663574, -0.004814863204956055, -0.004575371742248535, -0.004335880279541016, -0.004096388816833496, -0.0038568973541259766, -0.003617405891418457, -0.0033779144287109375, -0.003138422966003418, -0.0028989315032958984, -0.002659440040588379, -0.0024199485778808594, -0.00218045711517334, -0.0019409656524658203, -0.0017014741897583008, -0.0014619827270507812, -0.0012224912643432617, -0.0009829998016357422, -0.0007435083389282227, -0.0005040168762207031, -0.0002645254135131836, -2.5033950805664062e-05, 0.00021445751190185547, 0.000453948974609375, 0.0006934404373168945, 0.0009329319000244141, 0.0011724233627319336, 0.0014119148254394531, 0.0016514062881469727, 0.0018908977508544922, 0.0021303892135620117, 0.0023698806762695312, 0.0026093721389770508, 0.0028488636016845703, 0.00308835506439209, 0.0033278465270996094, 0.003567337989807129, 0.0038068294525146484, 0.004046320915222168, 0.0042858123779296875, 0.004525303840637207, 0.0047647953033447266, 0.005004286766052246, 0.005243778228759766, 0.005483269691467285, 0.005722761154174805, 0.005962252616882324, 0.006201744079589844, 0.006441235542297363, 0.006680727005004883, 0.006920218467712402, 0.007159709930419922, 0.007399201393127441, 0.007638692855834961, 0.00787818431854248, 0.00811767578125]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 5.0, 8.0, 14.0, 12.0, 11.0, 23.0, 12.0, 25.0, 17.0, 32.0, 27.0, 39.0, 44.0, 47.0, 36.0, 47.0, 57.0, 56.0, 51.0, 48.0, 44.0, 56.0, 38.0, 38.0, 28.0, 23.0, 26.0, 24.0, 23.0, 15.0, 18.0, 7.0, 9.0, 5.0, 3.0, 7.0, 6.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001430511474609375, -0.0013759136199951172, -0.0013213157653808594, -0.0012667179107666016, -0.0012121200561523438, -0.001157522201538086, -0.0011029243469238281, -0.0010483264923095703, -0.0009937286376953125, -0.0009391307830810547, -0.0008845329284667969, -0.0008299350738525391, -0.0007753372192382812, -0.0007207393646240234, -0.0006661415100097656, -0.0006115436553955078, -0.00055694580078125, -0.0005023479461669922, -0.0004477500915527344, -0.00039315223693847656, -0.00033855438232421875, -0.00028395652770996094, -0.00022935867309570312, -0.0001747608184814453, -0.0001201629638671875, -6.556510925292969e-05, -1.0967254638671875e-05, 4.363059997558594e-05, 9.822845458984375e-05, 0.00015282630920410156, 0.00020742416381835938, 0.0002620220184326172, 0.000316619873046875, 0.0003712177276611328, 0.0004258155822753906, 0.00048041343688964844, 0.0005350112915039062, 0.0005896091461181641, 0.0006442070007324219, 0.0006988048553466797, 0.0007534027099609375, 0.0008080005645751953, 0.0008625984191894531, 0.0009171962738037109, 0.0009717941284179688, 0.0010263919830322266, 0.0010809898376464844, 0.0011355876922607422, 0.001190185546875, 0.0012447834014892578, 0.0012993812561035156, 0.0013539791107177734, 0.0014085769653320312, 0.001463174819946289, 0.0015177726745605469, 0.0015723705291748047, 0.0016269683837890625, 0.0016815662384033203, 0.0017361640930175781, 0.001790761947631836, 0.0018453598022460938, 0.0018999576568603516, 0.0019545555114746094, 0.002009153366088867, 0.002063751220703125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 8.0, 3.0, 12.0, 17.0, 26.0, 37.0, 66.0, 110.0, 202.0, 494.0, 1149.0, 3442.0, 13965.0, 375466.0, 3771201.0, 20979.0, 4453.0, 1463.0, 617.0, 244.0, 146.0, 74.0, 42.0, 30.0, 14.0, 13.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0094146728515625, -0.009067416191101074, -0.008720159530639648, -0.008372902870178223, -0.008025646209716797, -0.007678389549255371, -0.007331132888793945, -0.0069838762283325195, -0.006636619567871094, -0.006289362907409668, -0.005942106246948242, -0.005594849586486816, -0.005247592926025391, -0.004900336265563965, -0.004553079605102539, -0.004205822944641113, -0.0038585662841796875, -0.0035113096237182617, -0.003164052963256836, -0.00281679630279541, -0.0024695396423339844, -0.0021222829818725586, -0.0017750263214111328, -0.001427769660949707, -0.0010805130004882812, -0.0007332563400268555, -0.0003859996795654297, -3.8743019104003906e-05, 0.0003085136413574219, 0.0006557703018188477, 0.0010030269622802734, 0.0013502836227416992, 0.001697540283203125, 0.0020447969436645508, 0.0023920536041259766, 0.0027393102645874023, 0.003086566925048828, 0.003433823585510254, 0.0037810802459716797, 0.0041283369064331055, 0.004475593566894531, 0.004822850227355957, 0.005170106887817383, 0.005517363548278809, 0.005864620208740234, 0.00621187686920166, 0.006559133529663086, 0.006906390190124512, 0.0072536468505859375, 0.007600903511047363, 0.007948160171508789, 0.008295416831970215, 0.00864267349243164, 0.008989930152893066, 0.009337186813354492, 0.009684443473815918, 0.010031700134277344, 0.01037895679473877, 0.010726213455200195, 0.011073470115661621, 0.011420726776123047, 0.011767983436584473, 0.012115240097045898, 0.012462496757507324, 0.01280975341796875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 2.0, 1.0, 4.0, 10.0, 6.0, 10.0, 13.0, 15.0, 22.0, 53.0, 174.0, 699.0, 2441.0, 416.0, 104.0, 37.0, 19.0, 16.0, 12.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001739501953125, -0.0016929209232330322, -0.0016463398933410645, -0.0015997588634490967, -0.001553177833557129, -0.0015065968036651611, -0.0014600157737731934, -0.0014134347438812256, -0.0013668537139892578, -0.00132027268409729, -0.0012736916542053223, -0.0012271106243133545, -0.0011805295944213867, -0.001133948564529419, -0.0010873675346374512, -0.0010407865047454834, -0.0009942054748535156, -0.0009476244449615479, -0.0009010434150695801, -0.0008544623851776123, -0.0008078813552856445, -0.0007613003253936768, -0.000714719295501709, -0.0006681382656097412, -0.0006215572357177734, -0.0005749762058258057, -0.0005283951759338379, -0.0004818141460418701, -0.00043523311614990234, -0.00038865208625793457, -0.0003420710563659668, -0.000295490026473999, -0.00024890899658203125, -0.00020232796669006348, -0.0001557469367980957, -0.00010916590690612793, -6.258487701416016e-05, -1.6003847122192383e-05, 3.057718276977539e-05, 7.715821266174316e-05, 0.00012373924255371094, 0.0001703202724456787, 0.00021690130233764648, 0.00026348233222961426, 0.00031006336212158203, 0.0003566443920135498, 0.0004032254219055176, 0.00044980645179748535, 0.0004963874816894531, 0.0005429685115814209, 0.0005895495414733887, 0.0006361305713653564, 0.0006827116012573242, 0.000729292631149292, 0.0007758736610412598, 0.0008224546909332275, 0.0008690357208251953, 0.0009156167507171631, 0.0009621977806091309, 0.0010087788105010986, 0.0010553598403930664, 0.0011019408702850342, 0.001148521900177002, 0.0011951029300689697, 0.0012416839599609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 8.0, 11.0, 13.0, 20.0, 31.0, 28.0, 78.0, 119.0, 177.0, 184.0, 115.0, 70.0, 44.0, 20.0, 26.0, 16.0, 14.0, 7.0, 4.0, 4.0, 3.0, 3.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023600009735673666, -0.0022484068758785725, -0.0021368125453591347, -0.0020252184476703405, -0.0019136242335662246, -0.0018020300194621086, -0.0016904359217733145, -0.0015788417076691985, -0.0014672474935650826, -0.0013556532794609666, -0.0012440590653568506, -0.0011324649676680565, -0.0010208707535639405, -0.0009092765394598246, -0.0007976823835633695, -0.0006860882276669145, -0.0005744940135627985, -0.000462899828562513, -0.0003513056435622275, -0.00023971145856194198, -0.00012811727356165648, -1.6523059457540512e-05, 9.507109643891454e-05, 0.0002066652523353696, 0.00031825946643948555, 0.00042985365143977106, 0.0005414478364400566, 0.0006530419923365116, 0.0007646362064406276, 0.0008762304205447435, 0.0009878245182335377, 0.0010994187323376536, 0.001211012713611126, 0.001322606927715242, 0.0014342011418193579, 0.001545795239508152, 0.001657389453612268, 0.001768983667716384, 0.001880577765405178, 0.001992172095924616, 0.00210376619361341, 0.002215360291302204, 0.002326954621821642, 0.002438548719510436, 0.00255014281719923, 0.002661737147718668, 0.002773331245407462, 0.0028849253430962563, 0.002996519673615694, 0.003108113771304488, 0.003219708101823926, 0.00333130219951272, 0.003442896530032158, 0.003554490627720952, 0.003666084725409746, 0.003777679055929184, 0.003889273153617978, 0.004000867251306772, 0.00411246158182621, 0.004224055912345648, 0.004335649777203798, 0.004447244107723236, 0.004558838438242674, 0.004670432303100824, 0.004782026633620262]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 4.0, 5.0, 6.0, 11.0, 11.0, 18.0, 14.0, 12.0, 12.0, 11.0, 16.0, 22.0, 29.0, 32.0, 35.0, 43.0, 45.0, 49.0, 41.0, 51.0, 37.0, 38.0, 42.0, 52.0, 36.0, 40.0, 41.0, 33.0, 35.0, 23.0, 31.0, 17.0, 24.0, 15.0, 15.0, 7.0, 9.0, 8.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014712107367813587, -0.0014199421275407076, -0.0013686735183000565, -0.0013174050254747272, -0.001266136416234076, -0.001214867806993425, -0.0011635993141680956, -0.0011123307049274445, -0.0010610620956867933, -0.0010097934864461422, -0.000958524935413152, -0.0009072563843801618, -0.0008559877751395106, -0.0008047191658988595, -0.0007534506148658693, -0.0007021820638328791, -0.0006509134545922279, -0.0005996448453515768, -0.0005483762943185866, -0.0004971077432855964, -0.00044583913404494524, -0.00039457055390812457, -0.0003433019737713039, -0.0002920333936344832, -0.00024076481349766254, -0.00018949623336084187, -0.0001382276532240212, -8.695907308720052e-05, -3.569049295037985e-05, 1.5578087186440825e-05, 6.68466673232615e-05, 0.00011811524746008217, 0.00016938382759690285, 0.00022065240773372352, 0.0002719209878705442, 0.00032318956800736487, 0.00037445814814418554, 0.0004257267282810062, 0.0004769953084178269, 0.0005282638594508171, 0.0005795324686914682, 0.0006308010779321194, 0.0006820696289651096, 0.0007333381799980998, 0.0007846067892387509, 0.0008358753984794021, 0.0008871439495123923, 0.0009384125005453825, 0.0009896811097860336, 0.0010409497190266848, 0.001092218328267336, 0.0011434868210926652, 0.0011947554303333163, 0.0012460240395739675, 0.0012972925323992968, 0.0013485611416399479, 0.001399829750880599, 0.0014510983601212502, 0.0015023669693619013, 0.0015536354621872306, 0.0016049040714278817, 0.0016561726806685328, 0.0017074411734938622, 0.0017587097827345133, 0.0018099783919751644]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 11.0, 16.0, 26.0, 21.0, 52.0, 68.0, 96.0, 170.0, 219.0, 333.0, 477.0, 786.0, 1252.0, 1896.0, 2801.0, 4507.0, 6879.0, 10640.0, 16569.0, 25410.0, 39733.0, 62995.0, 101442.0, 163759.0, 210139.0, 148112.0, 91273.0, 57005.0, 36461.0, 23120.0, 14894.0, 9534.0, 6226.0, 4035.0, 2736.0, 1724.0, 1052.0, 740.0, 442.0, 311.0, 185.0, 118.0, 91.0, 59.0, 53.0, 26.0, 17.0, 9.0, 12.0, 7.0, 5.0, 2.0, 4.0, 0.0, 2.0, 2.0], "bins": [-0.0010280609130859375, -0.000996321439743042, -0.0009645819664001465, -0.000932842493057251, -0.0009011030197143555, -0.00086936354637146, -0.0008376240730285645, -0.0008058845996856689, -0.0007741451263427734, -0.0007424056529998779, -0.0007106661796569824, -0.0006789267063140869, -0.0006471872329711914, -0.0006154477596282959, -0.0005837082862854004, -0.0005519688129425049, -0.0005202293395996094, -0.0004884898662567139, -0.00045675039291381836, -0.00042501091957092285, -0.00039327144622802734, -0.00036153197288513184, -0.00032979249954223633, -0.0002980530261993408, -0.0002663135528564453, -0.0002345740795135498, -0.0002028346061706543, -0.0001710951328277588, -0.00013935565948486328, -0.00010761618614196777, -7.587671279907227e-05, -4.413723945617676e-05, -1.239776611328125e-05, 1.9341707229614258e-05, 5.1081180572509766e-05, 8.282065391540527e-05, 0.00011456012725830078, 0.0001462996006011963, 0.0001780390739440918, 0.0002097785472869873, 0.0002415180206298828, 0.0002732574939727783, 0.00030499696731567383, 0.00033673644065856934, 0.00036847591400146484, 0.00040021538734436035, 0.00043195486068725586, 0.00046369433403015137, 0.0004954338073730469, 0.0005271732807159424, 0.0005589127540588379, 0.0005906522274017334, 0.0006223917007446289, 0.0006541311740875244, 0.0006858706474304199, 0.0007176101207733154, 0.0007493495941162109, 0.0007810890674591064, 0.000812828540802002, 0.0008445680141448975, 0.000876307487487793, 0.0009080469608306885, 0.000939786434173584, 0.0009715259075164795, 0.001003265380859375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 9.0, 9.0, 4.0, 10.0, 10.0, 8.0, 18.0, 9.0, 16.0, 18.0, 17.0, 22.0, 24.0, 31.0, 33.0, 47.0, 49.0, 49.0, 36.0, 40.0, 57.0, 40.0, 39.0, 40.0, 37.0, 40.0, 34.0, 37.0, 28.0, 21.0, 24.0, 20.0, 21.0, 17.0, 14.0, 14.0, 12.0, 11.0, 9.0, 2.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0015707015991210938, -0.00151766836643219, -0.0014646351337432861, -0.0014116019010543823, -0.0013585686683654785, -0.0013055354356765747, -0.001252502202987671, -0.001199468970298767, -0.0011464357376098633, -0.0010934025049209595, -0.0010403692722320557, -0.0009873360395431519, -0.000934302806854248, -0.0008812695741653442, -0.0008282363414764404, -0.0007752031087875366, -0.0007221698760986328, -0.000669136643409729, -0.0006161034107208252, -0.0005630701780319214, -0.0005100369453430176, -0.00045700371265411377, -0.00040397047996520996, -0.00035093724727630615, -0.00029790401458740234, -0.00024487078189849854, -0.00019183754920959473, -0.00013880431652069092, -8.577108383178711e-05, -3.27378511428833e-05, 2.0295381546020508e-05, 7.332861423492432e-05, 0.00012636184692382812, 0.00017939507961273193, 0.00023242831230163574, 0.00028546154499053955, 0.00033849477767944336, 0.00039152801036834717, 0.000444561243057251, 0.0004975944757461548, 0.0005506277084350586, 0.0006036609411239624, 0.0006566941738128662, 0.00070972740650177, 0.0007627606391906738, 0.0008157938718795776, 0.0008688271045684814, 0.0009218603372573853, 0.0009748935699462891, 0.0010279268026351929, 0.0010809600353240967, 0.0011339932680130005, 0.0011870265007019043, 0.001240059733390808, 0.001293092966079712, 0.0013461261987686157, 0.0013991594314575195, 0.0014521926641464233, 0.0015052258968353271, 0.001558259129524231, 0.0016112923622131348, 0.0016643255949020386, 0.0017173588275909424, 0.0017703920602798462, 0.00182342529296875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 9.0, 11.0, 15.0, 25.0, 40.0, 55.0, 87.0, 121.0, 188.0, 336.0, 512.0, 860.0, 1247.0, 2078.0, 3385.0, 5631.0, 9826.0, 17007.0, 31247.0, 60936.0, 136709.0, 369569.0, 223418.0, 88506.0, 42469.0, 22634.0, 12809.0, 7531.0, 4380.0, 2586.0, 1595.0, 1009.0, 593.0, 400.0, 283.0, 167.0, 112.0, 64.0, 39.0, 17.0, 14.0, 15.0, 10.0, 2.0, 0.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014295578002929688, -0.0013871937990188599, -0.001344829797744751, -0.001302465796470642, -0.0012601017951965332, -0.0012177377939224243, -0.0011753737926483154, -0.0011330097913742065, -0.0010906457901000977, -0.0010482817888259888, -0.0010059177875518799, -0.000963553786277771, -0.0009211897850036621, -0.0008788257837295532, -0.0008364617824554443, -0.0007940977811813354, -0.0007517337799072266, -0.0007093697786331177, -0.0006670057773590088, -0.0006246417760848999, -0.000582277774810791, -0.0005399137735366821, -0.0004975497722625732, -0.00045518577098846436, -0.00041282176971435547, -0.0003704577684402466, -0.0003280937671661377, -0.0002857297658920288, -0.00024336576461791992, -0.00020100176334381104, -0.00015863776206970215, -0.00011627376079559326, -7.390975952148438e-05, -3.154575824737549e-05, 1.0818243026733398e-05, 5.3182244300842285e-05, 9.554624557495117e-05, 0.00013791024684906006, 0.00018027424812316895, 0.00022263824939727783, 0.0002650022506713867, 0.0003073662519454956, 0.0003497302532196045, 0.0003920942544937134, 0.00043445825576782227, 0.00047682225704193115, 0.00051918625831604, 0.0005615502595901489, 0.0006039142608642578, 0.0006462782621383667, 0.0006886422634124756, 0.0007310062646865845, 0.0007733702659606934, 0.0008157342672348022, 0.0008580982685089111, 0.00090046226978302, 0.0009428262710571289, 0.0009851902723312378, 0.0010275542736053467, 0.0010699182748794556, 0.0011122822761535645, 0.0011546462774276733, 0.0011970102787017822, 0.0012393742799758911, 0.00128173828125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 6.0, 3.0, 7.0, 10.0, 5.0, 8.0, 13.0, 16.0, 12.0, 19.0, 16.0, 27.0, 24.0, 32.0, 25.0, 25.0, 44.0, 40.0, 43.0, 40.0, 31.0, 39.0, 43.0, 39.0, 37.0, 37.0, 37.0, 38.0, 47.0, 22.0, 38.0, 31.0, 28.0, 25.0, 21.0, 11.0, 18.0, 12.0, 6.0, 6.0, 4.0, 7.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001068115234375, -0.0010350793600082397, -0.0010020434856414795, -0.0009690076112747192, -0.000935971736907959, -0.0009029358625411987, -0.0008698999881744385, -0.0008368641138076782, -0.000803828239440918, -0.0007707923650741577, -0.0007377564907073975, -0.0007047206163406372, -0.000671684741973877, -0.0006386488676071167, -0.0006056129932403564, -0.0005725771188735962, -0.0005395412445068359, -0.0005065053701400757, -0.00047346949577331543, -0.0004404336214065552, -0.0004073977470397949, -0.00037436187267303467, -0.0003413259983062744, -0.00030829012393951416, -0.0002752542495727539, -0.00024221837520599365, -0.0002091825008392334, -0.00017614662647247314, -0.0001431107521057129, -0.00011007487773895264, -7.703900337219238e-05, -4.400312900543213e-05, -1.0967254638671875e-05, 2.206861972808838e-05, 5.510449409484863e-05, 8.814036846160889e-05, 0.00012117624282836914, 0.0001542121171951294, 0.00018724799156188965, 0.0002202838659286499, 0.00025331974029541016, 0.0002863556146621704, 0.00031939148902893066, 0.0003524273633956909, 0.00038546323776245117, 0.0004184991121292114, 0.0004515349864959717, 0.00048457086086273193, 0.0005176067352294922, 0.0005506426095962524, 0.0005836784839630127, 0.000616714358329773, 0.0006497502326965332, 0.0006827861070632935, 0.0007158219814300537, 0.000748857855796814, 0.0007818937301635742, 0.0008149296045303345, 0.0008479654788970947, 0.000881001353263855, 0.0009140372276306152, 0.0009470731019973755, 0.0009801089763641357, 0.001013144850730896, 0.0010461807250976562]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 6.0, 13.0, 25.0, 27.0, 62.0, 60.0, 100.0, 160.0, 264.0, 426.0, 601.0, 1049.0, 1700.0, 3097.0, 5736.0, 11784.0, 26894.0, 82297.0, 580136.0, 244800.0, 50661.0, 19113.0, 8741.0, 4420.0, 2549.0, 1407.0, 841.0, 578.0, 332.0, 214.0, 145.0, 100.0, 64.0, 53.0, 26.0, 24.0, 18.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002593994140625, -0.0002517271786928177, -0.00024405494332313538, -0.00023638270795345306, -0.00022871047258377075, -0.00022103823721408844, -0.00021336600184440613, -0.00020569376647472382, -0.0001980215311050415, -0.0001903492957353592, -0.00018267706036567688, -0.00017500482499599457, -0.00016733258962631226, -0.00015966035425662994, -0.00015198811888694763, -0.00014431588351726532, -0.000136643648147583, -0.0001289714127779007, -0.00012129917740821838, -0.00011362694203853607, -0.00010595470666885376, -9.828247129917145e-05, -9.061023592948914e-05, -8.293800055980682e-05, -7.526576519012451e-05, -6.75935298204422e-05, -5.992129445075989e-05, -5.2249059081077576e-05, -4.4576823711395264e-05, -3.690458834171295e-05, -2.923235297203064e-05, -2.1560117602348328e-05, -1.3887882232666016e-05, -6.215646862983704e-06, 1.4565885066986084e-06, 9.12882387638092e-06, 1.6801059246063232e-05, 2.4473294615745544e-05, 3.2145529985427856e-05, 3.981776535511017e-05, 4.749000072479248e-05, 5.516223609447479e-05, 6.28344714641571e-05, 7.050670683383942e-05, 7.817894220352173e-05, 8.585117757320404e-05, 9.352341294288635e-05, 0.00010119564831256866, 0.00010886788368225098, 0.00011654011905193329, 0.0001242123544216156, 0.0001318845897912979, 0.00013955682516098022, 0.00014722906053066254, 0.00015490129590034485, 0.00016257353127002716, 0.00017024576663970947, 0.00017791800200939178, 0.0001855902373790741, 0.0001932624727487564, 0.00020093470811843872, 0.00020860694348812103, 0.00021627917885780334, 0.00022395141422748566, 0.00023162364959716797]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 7.0, 7.0, 12.0, 10.0, 12.0, 27.0, 28.0, 23.0, 54.0, 68.0, 53.0, 90.0, 109.0, 70.0, 99.0, 49.0, 61.0, 49.0, 23.0, 35.0, 26.0, 12.0, 14.0, 16.0, 5.0, 7.0, 7.0, 2.0, 2.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.589557647705078e-06, -4.431232810020447e-06, -4.2729079723358154e-06, -4.114583134651184e-06, -3.956258296966553e-06, -3.7979334592819214e-06, -3.63960862159729e-06, -3.4812837839126587e-06, -3.3229589462280273e-06, -3.164634108543396e-06, -3.0063092708587646e-06, -2.8479844331741333e-06, -2.689659595489502e-06, -2.5313347578048706e-06, -2.3730099201202393e-06, -2.214685082435608e-06, -2.0563602447509766e-06, -1.8980354070663452e-06, -1.7397105693817139e-06, -1.5813857316970825e-06, -1.4230608940124512e-06, -1.2647360563278198e-06, -1.1064112186431885e-06, -9.480863809585571e-07, -7.897615432739258e-07, -6.314367055892944e-07, -4.731118679046631e-07, -3.1478703022003174e-07, -1.564621925354004e-07, 1.862645149230957e-09, 1.601874828338623e-07, 3.1851232051849365e-07, 4.76837158203125e-07, 6.351619958877563e-07, 7.934868335723877e-07, 9.51811671257019e-07, 1.1101365089416504e-06, 1.2684613466262817e-06, 1.426786184310913e-06, 1.5851110219955444e-06, 1.7434358596801758e-06, 1.9017606973648071e-06, 2.0600855350494385e-06, 2.21841037273407e-06, 2.376735210418701e-06, 2.5350600481033325e-06, 2.693384885787964e-06, 2.8517097234725952e-06, 3.0100345611572266e-06, 3.168359398841858e-06, 3.3266842365264893e-06, 3.4850090742111206e-06, 3.643333911895752e-06, 3.8016587495803833e-06, 3.959983587265015e-06, 4.118308424949646e-06, 4.276633262634277e-06, 4.434958100318909e-06, 4.59328293800354e-06, 4.751607775688171e-06, 4.909932613372803e-06, 5.068257451057434e-06, 5.2265822887420654e-06, 5.384907126426697e-06, 5.543231964111328e-06]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 5.0, 10.0, 6.0, 5.0, 9.0, 14.0, 10.0, 30.0, 28.0, 72.0, 120.0, 226.0, 542.0, 1155.0, 2938.0, 8249.0, 27785.0, 145954.0, 714645.0, 111732.0, 23307.0, 7138.0, 2504.0, 1051.0, 488.0, 202.0, 105.0, 64.0, 46.0, 24.0, 22.0, 14.0, 14.0, 12.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0004010200500488281, -0.00038970261812210083, -0.00037838518619537354, -0.00036706775426864624, -0.00035575032234191895, -0.00034443289041519165, -0.00033311545848846436, -0.00032179802656173706, -0.00031048059463500977, -0.00029916316270828247, -0.0002878457307815552, -0.0002765282988548279, -0.0002652108669281006, -0.0002538934350013733, -0.000242576003074646, -0.0002312585711479187, -0.0002199411392211914, -0.0002086237072944641, -0.00019730627536773682, -0.00018598884344100952, -0.00017467141151428223, -0.00016335397958755493, -0.00015203654766082764, -0.00014071911573410034, -0.00012940168380737305, -0.00011808425188064575, -0.00010676681995391846, -9.544938802719116e-05, -8.413195610046387e-05, -7.281452417373657e-05, -6.149709224700928e-05, -5.017966032028198e-05, -3.886222839355469e-05, -2.7544796466827393e-05, -1.6227364540100098e-05, -4.909932613372803e-06, 6.407499313354492e-06, 1.7724931240081787e-05, 2.9042363166809082e-05, 4.035979509353638e-05, 5.167722702026367e-05, 6.299465894699097e-05, 7.431209087371826e-05, 8.562952280044556e-05, 9.694695472717285e-05, 0.00010826438665390015, 0.00011958181858062744, 0.00013089925050735474, 0.00014221668243408203, 0.00015353411436080933, 0.00016485154628753662, 0.00017616897821426392, 0.0001874864101409912, 0.0001988038420677185, 0.0002101212739944458, 0.0002214387059211731, 0.0002327561378479004, 0.00024407356977462769, 0.000255391001701355, 0.0002667084336280823, 0.00027802586555480957, 0.00028934329748153687, 0.00030066072940826416, 0.00031197816133499146, 0.00032329559326171875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 6.0, 8.0, 4.0, 6.0, 10.0, 11.0, 14.0, 20.0, 26.0, 18.0, 23.0, 18.0, 54.0, 45.0, 70.0, 69.0, 89.0, 67.0, 70.0, 62.0, 58.0, 49.0, 26.0, 27.0, 32.0, 16.0, 15.0, 13.0, 8.0, 8.0, 10.0, 5.0, 10.0, 7.0, 2.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.731250762939453e-05, -3.60291451215744e-05, -3.474578261375427e-05, -3.346242010593414e-05, -3.2179057598114014e-05, -3.0895695090293884e-05, -2.9612332582473755e-05, -2.8328970074653625e-05, -2.7045607566833496e-05, -2.5762245059013367e-05, -2.4478882551193237e-05, -2.3195520043373108e-05, -2.191215753555298e-05, -2.062879502773285e-05, -1.934543251991272e-05, -1.806207001209259e-05, -1.677870750427246e-05, -1.549534499645233e-05, -1.4211982488632202e-05, -1.2928619980812073e-05, -1.1645257472991943e-05, -1.0361894965171814e-05, -9.078532457351685e-06, -7.795169949531555e-06, -6.511807441711426e-06, -5.228444933891296e-06, -3.945082426071167e-06, -2.6617199182510376e-06, -1.3783574104309082e-06, -9.499490261077881e-08, 1.1883676052093506e-06, 2.47173011302948e-06, 3.7550926208496094e-06, 5.038455128669739e-06, 6.321817636489868e-06, 7.6051801443099976e-06, 8.888542652130127e-06, 1.0171905159950256e-05, 1.1455267667770386e-05, 1.2738630175590515e-05, 1.4021992683410645e-05, 1.5305355191230774e-05, 1.6588717699050903e-05, 1.7872080206871033e-05, 1.9155442714691162e-05, 2.043880522251129e-05, 2.172216773033142e-05, 2.300553023815155e-05, 2.428889274597168e-05, 2.557225525379181e-05, 2.685561776161194e-05, 2.8138980269432068e-05, 2.9422342777252197e-05, 3.070570528507233e-05, 3.1989067792892456e-05, 3.3272430300712585e-05, 3.4555792808532715e-05, 3.5839155316352844e-05, 3.7122517824172974e-05, 3.84058803319931e-05, 3.968924283981323e-05, 4.097260534763336e-05, 4.225596785545349e-05, 4.353933036327362e-05, 4.482269287109375e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 11.0, 14.0, 17.0, 13.0, 28.0, 44.0, 54.0, 103.0, 160.0, 146.0, 125.0, 88.0, 51.0, 34.0, 23.0, 20.0, 18.0, 13.0, 9.0, 3.0, 2.0, 5.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023277150467038155, -0.002228298457339406, -0.0021288818679749966, -0.002029465278610587, -0.0019300486892461777, -0.0018306320998817682, -0.0017312155105173588, -0.0016317989211529493, -0.0015323823317885399, -0.0014329657424241304, -0.001333549153059721, -0.0012341325636953115, -0.001134715974330902, -0.0010352993849664927, -0.0009358827373944223, -0.0008364661480300128, -0.0007370495004579425, -0.000637632911093533, -0.0005382163217291236, -0.0004387997032608837, -0.00033938311389647424, -0.00023996649542823434, -0.0001405499060638249, -4.1133316699415445e-05, 5.8283272664994e-05, 0.00015769986202940345, 0.0002571164513938129, 0.0003565330698620528, 0.00045594965922646224, 0.0005553662776947021, 0.0006547828670591116, 0.000754199456423521, 0.0008536160457879305, 0.0009530326351523399, 0.0010524492245167494, 0.0011518658138811588, 0.0012512824032455683, 0.0013506989926099777, 0.0014501155819743872, 0.0015495321713387966, 0.001648948760703206, 0.0017483653500676155, 0.001847781939432025, 0.0019471985287964344, 0.002046615118160844, 0.0021460317075252533, 0.0022454482968896627, 0.002344864886254072, 0.0024442817084491253, 0.0025436982978135347, 0.002643114887177944, 0.0027425314765423536, 0.002841948065906763, 0.0029413646552711725, 0.003040781244635582, 0.0031401978339999914, 0.003239614423364401, 0.0033390310127288103, 0.0034384476020932198, 0.003537864191457629, 0.0036372807808220387, 0.003736697370186448, 0.0038361139595508575, 0.003935530781745911, 0.0040349471382796764]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 3.0, 6.0, 7.0, 6.0, 10.0, 15.0, 21.0, 11.0, 9.0, 16.0, 12.0, 24.0, 24.0, 28.0, 34.0, 47.0, 40.0, 51.0, 41.0, 47.0, 43.0, 36.0, 49.0, 47.0, 37.0, 38.0, 46.0, 33.0, 34.0, 28.0, 28.0, 23.0, 21.0, 12.0, 20.0, 6.0, 11.0, 8.0, 6.0, 3.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0015165491495281458, -0.0014640658628195524, -0.0014115826925262809, -0.0013590994058176875, -0.001306616235524416, -0.0012541329488158226, -0.001201649778522551, -0.0011491664918139577, -0.0010966833215206861, -0.0010442000348120928, -0.0009917168645188212, -0.0009392336360178888, -0.0008867504075169563, -0.000834267120808363, -0.0007817839505150914, -0.000729300663806498, -0.0006768174353055656, -0.0006243342068046331, -0.0005718509783037007, -0.0005193677498027682, -0.0004668845213018358, -0.00041440126369707286, -0.0003619180351961404, -0.00030943480669520795, -0.0002569515781942755, -0.00020446834969334304, -0.0001519851211924106, -9.95018781395629e-05, -4.701864963863045e-05, 5.464593414217234e-06, 5.794782191514969e-05, 0.00011043105041608214, 0.0001629142789170146, 0.00021539750741794705, 0.0002678807359188795, 0.00032036396441981196, 0.0003728471929207444, 0.00042533045052550733, 0.0004778136790264398, 0.0005302969366312027, 0.0005827801069244742, 0.0006352633354254067, 0.0006877465639263391, 0.0007402297924272716, 0.0007927130209282041, 0.0008451963076367974, 0.000897679477930069, 0.0009501627646386623, 0.0010026460513472557, 0.001055129338055849, 0.0011076125083491206, 0.001160095795057714, 0.0012125789653509855, 0.001265062252059579, 0.0013175454223528504, 0.0013700287090614438, 0.0014225118793547153, 0.0014749951660633087, 0.0015274783363565803, 0.0015799616230651736, 0.0016324447933584452, 0.0016849280800670385, 0.00173741125036031, 0.0017898945370689034, 0.001842377707362175]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 14.0, 18.0, 24.0, 40.0, 65.0, 94.0, 123.0, 174.0, 342.0, 487.0, 811.0, 1312.0, 1983.0, 3428.0, 5658.0, 9812.0, 17638.0, 34034.0, 70653.0, 160546.0, 308454.0, 229992.0, 101511.0, 46594.0, 23726.0, 12860.0, 7194.0, 4148.0, 2586.0, 1574.0, 988.0, 558.0, 426.0, 243.0, 147.0, 110.0, 56.0, 44.0, 31.0, 21.0, 7.0, 12.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0040283203125, -0.003908872604370117, -0.0037894248962402344, -0.0036699771881103516, -0.0035505294799804688, -0.003431081771850586, -0.003311634063720703, -0.0031921863555908203, -0.0030727386474609375, -0.0029532909393310547, -0.002833843231201172, -0.002714395523071289, -0.0025949478149414062, -0.0024755001068115234, -0.0023560523986816406, -0.002236604690551758, -0.002117156982421875, -0.001997709274291992, -0.0018782615661621094, -0.0017588138580322266, -0.0016393661499023438, -0.001519918441772461, -0.0014004707336425781, -0.0012810230255126953, -0.0011615753173828125, -0.0010421276092529297, -0.0009226799011230469, -0.0008032321929931641, -0.0006837844848632812, -0.0005643367767333984, -0.0004448890686035156, -0.0003254413604736328, -0.00020599365234375, -8.654594421386719e-05, 3.2901763916015625e-05, 0.00015234947204589844, 0.00027179718017578125, 0.00039124488830566406, 0.0005106925964355469, 0.0006301403045654297, 0.0007495880126953125, 0.0008690357208251953, 0.0009884834289550781, 0.001107931137084961, 0.0012273788452148438, 0.0013468265533447266, 0.0014662742614746094, 0.0015857219696044922, 0.001705169677734375, 0.0018246173858642578, 0.0019440650939941406, 0.0020635128021240234, 0.0021829605102539062, 0.002302408218383789, 0.002421855926513672, 0.0025413036346435547, 0.0026607513427734375, 0.0027801990509033203, 0.002899646759033203, 0.003019094467163086, 0.0031385421752929688, 0.0032579898834228516, 0.0033774375915527344, 0.003496885299682617, 0.0036163330078125]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 2.0, 9.0, 9.0, 12.0, 8.0, 12.0, 15.0, 15.0, 15.0, 24.0, 12.0, 31.0, 46.0, 55.0, 47.0, 51.0, 54.0, 45.0, 53.0, 48.0, 48.0, 45.0, 44.0, 45.0, 50.0, 37.0, 31.0, 29.0, 20.0, 16.0, 17.0, 9.0, 6.0, 15.0, 5.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0013132095336914062, -0.001274213194847107, -0.0012352168560028076, -0.0011962205171585083, -0.001157224178314209, -0.0011182278394699097, -0.0010792315006256104, -0.001040235161781311, -0.0010012388229370117, -0.0009622424840927124, -0.0009232461452484131, -0.0008842498064041138, -0.0008452534675598145, -0.0008062571287155151, -0.0007672607898712158, -0.0007282644510269165, -0.0006892681121826172, -0.0006502717733383179, -0.0006112754344940186, -0.0005722790956497192, -0.0005332827568054199, -0.0004942864179611206, -0.0004552900791168213, -0.00041629374027252197, -0.00037729740142822266, -0.00033830106258392334, -0.000299304723739624, -0.0002603083848953247, -0.0002213120460510254, -0.00018231570720672607, -0.00014331936836242676, -0.00010432302951812744, -6.532669067382812e-05, -2.633035182952881e-05, 1.2665987014770508e-05, 5.1662325859069824e-05, 9.065866470336914e-05, 0.00012965500354766846, 0.00016865134239196777, 0.0002076476812362671, 0.0002466440200805664, 0.0002856403589248657, 0.00032463669776916504, 0.00036363303661346436, 0.00040262937545776367, 0.000441625714302063, 0.0004806220531463623, 0.0005196183919906616, 0.0005586147308349609, 0.0005976110696792603, 0.0006366074085235596, 0.0006756037473678589, 0.0007146000862121582, 0.0007535964250564575, 0.0007925927639007568, 0.0008315891027450562, 0.0008705854415893555, 0.0009095817804336548, 0.0009485781192779541, 0.0009875744581222534, 0.0010265707969665527, 0.001065567135810852, 0.0011045634746551514, 0.0011435598134994507, 0.00118255615234375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 8.0, 9.0, 9.0, 13.0, 24.0, 28.0, 47.0, 64.0, 119.0, 152.0, 271.0, 446.0, 808.0, 1421.0, 2638.0, 5153.0, 10549.0, 22582.0, 51670.0, 142805.0, 418081.0, 249162.0, 80254.0, 32302.0, 14720.0, 7214.0, 3567.0, 1884.0, 1031.0, 575.0, 337.0, 215.0, 116.0, 86.0, 59.0, 47.0, 25.0, 23.0, 10.0, 11.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0037212371826171875, -0.0035870373249053955, -0.0034528374671936035, -0.0033186376094818115, -0.0031844377517700195, -0.0030502378940582275, -0.0029160380363464355, -0.0027818381786346436, -0.0026476383209228516, -0.0025134384632110596, -0.0023792386054992676, -0.0022450387477874756, -0.0021108388900756836, -0.0019766390323638916, -0.0018424391746520996, -0.0017082393169403076, -0.0015740394592285156, -0.0014398396015167236, -0.0013056397438049316, -0.0011714398860931396, -0.0010372400283813477, -0.0009030401706695557, -0.0007688403129577637, -0.0006346404552459717, -0.0005004405975341797, -0.0003662407398223877, -0.0002320408821105957, -9.784102439880371e-05, 3.635883331298828e-05, 0.00017055869102478027, 0.00030475854873657227, 0.00043895840644836426, 0.0005731582641601562, 0.0007073581218719482, 0.0008415579795837402, 0.0009757578372955322, 0.0011099576950073242, 0.0012441575527191162, 0.0013783574104309082, 0.0015125572681427002, 0.0016467571258544922, 0.0017809569835662842, 0.0019151568412780762, 0.002049356698989868, 0.00218355655670166, 0.002317756414413452, 0.002451956272125244, 0.002586156129837036, 0.002720355987548828, 0.00285455584526062, 0.002988755702972412, 0.003122955560684204, 0.003257155418395996, 0.003391355276107788, 0.00352555513381958, 0.003659754991531372, 0.003793954849243164, 0.003928154706954956, 0.004062354564666748, 0.00419655442237854, 0.004330754280090332, 0.004464954137802124, 0.004599153995513916, 0.004733353853225708, 0.0048675537109375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 9.0, 10.0, 11.0, 12.0, 7.0, 19.0, 23.0, 16.0, 36.0, 31.0, 36.0, 48.0, 55.0, 45.0, 49.0, 51.0, 47.0, 55.0, 61.0, 54.0, 52.0, 41.0, 32.0, 32.0, 28.0, 20.0, 20.0, 22.0, 13.0, 14.0, 9.0, 10.0, 10.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0011882781982421875, -0.0011550411581993103, -0.001121804118156433, -0.001088567078113556, -0.0010553300380706787, -0.0010220929980278015, -0.0009888559579849243, -0.0009556189179420471, -0.0009223818778991699, -0.0008891448378562927, -0.0008559077978134155, -0.0008226707577705383, -0.0007894337177276611, -0.0007561966776847839, -0.0007229596376419067, -0.0006897225975990295, -0.0006564855575561523, -0.0006232485175132751, -0.000590011477470398, -0.0005567744374275208, -0.0005235373973846436, -0.0004903003573417664, -0.00045706331729888916, -0.00042382627725601196, -0.00039058923721313477, -0.00035735219717025757, -0.00032411515712738037, -0.0002908781170845032, -0.000257641077041626, -0.00022440403699874878, -0.00019116699695587158, -0.00015792995691299438, -0.0001246929168701172, -9.145587682723999e-05, -5.821883678436279e-05, -2.4981796741485596e-05, 8.255243301391602e-06, 4.14922833442688e-05, 7.4729323387146e-05, 0.0001079663634300232, 0.0001412034034729004, 0.0001744404435157776, 0.00020767748355865479, 0.00024091452360153198, 0.0002741515636444092, 0.0003073886036872864, 0.0003406256437301636, 0.00037386268377304077, 0.00040709972381591797, 0.00044033676385879517, 0.00047357380390167236, 0.0005068108439445496, 0.0005400478839874268, 0.000573284924030304, 0.0006065219640731812, 0.0006397590041160583, 0.0006729960441589355, 0.0007062330842018127, 0.0007394701242446899, 0.0007727071642875671, 0.0008059442043304443, 0.0008391812443733215, 0.0008724182844161987, 0.0009056553244590759, 0.0009388923645019531]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 8.0, 14.0, 15.0, 10.0, 27.0, 33.0, 51.0, 76.0, 137.0, 199.0, 363.0, 667.0, 1332.0, 2963.0, 7389.0, 23965.0, 123743.0, 741519.0, 110814.0, 22439.0, 7055.0, 2773.0, 1344.0, 632.0, 397.0, 217.0, 153.0, 67.0, 48.0, 38.0, 24.0, 9.0, 15.0, 5.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001703500747680664, -0.0001647602766752243, -0.0001591704785823822, -0.0001535806804895401, -0.000147990882396698, -0.0001424010843038559, -0.0001368112862110138, -0.0001312214881181717, -0.0001256316900253296, -0.00012004189193248749, -0.00011445209383964539, -0.00010886229574680328, -0.00010327249765396118, -9.768269956111908e-05, -9.209290146827698e-05, -8.650310337543488e-05, -8.091330528259277e-05, -7.532350718975067e-05, -6.973370909690857e-05, -6.414391100406647e-05, -5.8554112911224365e-05, -5.296431481838226e-05, -4.737451672554016e-05, -4.178471863269806e-05, -3.619492053985596e-05, -3.0605122447013855e-05, -2.5015324354171753e-05, -1.942552626132965e-05, -1.3835728168487549e-05, -8.245930075645447e-06, -2.6561319828033447e-06, 2.9336661100387573e-06, 8.52346420288086e-06, 1.4113262295722961e-05, 1.9703060388565063e-05, 2.5292858481407166e-05, 3.088265657424927e-05, 3.647245466709137e-05, 4.206225275993347e-05, 4.7652050852775574e-05, 5.3241848945617676e-05, 5.883164703845978e-05, 6.442144513130188e-05, 7.001124322414398e-05, 7.560104131698608e-05, 8.119083940982819e-05, 8.678063750267029e-05, 9.237043559551239e-05, 9.796023368835449e-05, 0.0001035500317811966, 0.0001091398298740387, 0.0001147296279668808, 0.0001203194260597229, 0.000125909224152565, 0.0001314990222454071, 0.0001370888203382492, 0.0001426786184310913, 0.0001482684165239334, 0.0001538582146167755, 0.00015944801270961761, 0.00016503781080245972, 0.00017062760889530182, 0.00017621740698814392, 0.00018180720508098602, 0.00018739700317382812]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 8.0, 8.0, 9.0, 16.0, 21.0, 30.0, 41.0, 84.0, 69.0, 126.0, 208.0, 114.0, 75.0, 48.0, 32.0, 24.0, 19.0, 7.0, 9.0, 9.0, 8.0, 3.0, 9.0, 1.0, 2.0, 2.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.569789886474609e-06, -7.372349500656128e-06, -7.1749091148376465e-06, -6.977468729019165e-06, -6.780028343200684e-06, -6.582587957382202e-06, -6.385147571563721e-06, -6.187707185745239e-06, -5.990266799926758e-06, -5.792826414108276e-06, -5.595386028289795e-06, -5.3979456424713135e-06, -5.200505256652832e-06, -5.003064870834351e-06, -4.805624485015869e-06, -4.608184099197388e-06, -4.410743713378906e-06, -4.213303327560425e-06, -4.015862941741943e-06, -3.818422555923462e-06, -3.6209821701049805e-06, -3.423541784286499e-06, -3.2261013984680176e-06, -3.028661012649536e-06, -2.8312206268310547e-06, -2.6337802410125732e-06, -2.436339855194092e-06, -2.2388994693756104e-06, -2.041459083557129e-06, -1.8440186977386475e-06, -1.646578311920166e-06, -1.4491379261016846e-06, -1.2516975402832031e-06, -1.0542571544647217e-06, -8.568167686462402e-07, -6.593763828277588e-07, -4.6193599700927734e-07, -2.644956111907959e-07, -6.705522537231445e-08, 1.30385160446167e-07, 3.2782554626464844e-07, 5.252659320831299e-07, 7.227063179016113e-07, 9.201467037200928e-07, 1.1175870895385742e-06, 1.3150274753570557e-06, 1.5124678611755371e-06, 1.7099082469940186e-06, 1.9073486328125e-06, 2.1047890186309814e-06, 2.302229404449463e-06, 2.4996697902679443e-06, 2.6971101760864258e-06, 2.8945505619049072e-06, 3.0919909477233887e-06, 3.28943133354187e-06, 3.4868717193603516e-06, 3.684312105178833e-06, 3.8817524909973145e-06, 4.079192876815796e-06, 4.276633262634277e-06, 4.474073648452759e-06, 4.67151403427124e-06, 4.868954420089722e-06, 5.066394805908203e-06]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 6.0, 9.0, 12.0, 22.0, 19.0, 31.0, 51.0, 70.0, 97.0, 184.0, 266.0, 448.0, 810.0, 1608.0, 3065.0, 5485.0, 10569.0, 21513.0, 52152.0, 146830.0, 446905.0, 232966.0, 68548.0, 28549.0, 13355.0, 7024.0, 3459.0, 1926.0, 1025.0, 606.0, 368.0, 209.0, 137.0, 75.0, 46.0, 25.0, 22.0, 14.0, 11.0, 7.0, 9.0, 6.0, 4.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0], "bins": [-5.429983139038086e-05, -5.2733346819877625e-05, -5.116686224937439e-05, -4.9600377678871155e-05, -4.803389310836792e-05, -4.6467408537864685e-05, -4.490092396736145e-05, -4.3334439396858215e-05, -4.176795482635498e-05, -4.0201470255851746e-05, -3.863498568534851e-05, -3.7068501114845276e-05, -3.550201654434204e-05, -3.3935531973838806e-05, -3.236904740333557e-05, -3.0802562832832336e-05, -2.92360782623291e-05, -2.7669593691825867e-05, -2.6103109121322632e-05, -2.4536624550819397e-05, -2.2970139980316162e-05, -2.1403655409812927e-05, -1.9837170839309692e-05, -1.8270686268806458e-05, -1.6704201698303223e-05, -1.5137717127799988e-05, -1.3571232557296753e-05, -1.2004747986793518e-05, -1.0438263416290283e-05, -8.871778845787048e-06, -7.3052942752838135e-06, -5.738809704780579e-06, -4.172325134277344e-06, -2.605840563774109e-06, -1.039355993270874e-06, 5.271285772323608e-07, 2.0936131477355957e-06, 3.6600977182388306e-06, 5.2265822887420654e-06, 6.7930668592453e-06, 8.359551429748535e-06, 9.92603600025177e-06, 1.1492520570755005e-05, 1.305900514125824e-05, 1.4625489711761475e-05, 1.619197428226471e-05, 1.7758458852767944e-05, 1.932494342327118e-05, 2.0891427993774414e-05, 2.245791256427765e-05, 2.4024397134780884e-05, 2.559088170528412e-05, 2.7157366275787354e-05, 2.872385084629059e-05, 3.0290335416793823e-05, 3.185681998729706e-05, 3.342330455780029e-05, 3.498978912830353e-05, 3.655627369880676e-05, 3.812275826931e-05, 3.968924283981323e-05, 4.125572741031647e-05, 4.28222119808197e-05, 4.438869655132294e-05, 4.595518112182617e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 8.0, 9.0, 3.0, 16.0, 12.0, 14.0, 15.0, 17.0, 21.0, 21.0, 40.0, 30.0, 35.0, 43.0, 32.0, 45.0, 47.0, 52.0, 56.0, 53.0, 56.0, 51.0, 42.0, 33.0, 42.0, 30.0, 22.0, 23.0, 19.0, 16.0, 16.0, 8.0, 11.0, 9.0, 6.0, 5.0, 3.0, 8.0, 10.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0371208190917969e-05, -1.0030344128608704e-05, -9.689480066299438e-06, -9.348616003990173e-06, -9.007751941680908e-06, -8.666887879371643e-06, -8.326023817062378e-06, -7.985159754753113e-06, -7.644295692443848e-06, -7.3034316301345825e-06, -6.962567567825317e-06, -6.621703505516052e-06, -6.280839443206787e-06, -5.939975380897522e-06, -5.599111318588257e-06, -5.258247256278992e-06, -4.9173831939697266e-06, -4.5765191316604614e-06, -4.235655069351196e-06, -3.894791007041931e-06, -3.553926944732666e-06, -3.213062882423401e-06, -2.8721988201141357e-06, -2.5313347578048706e-06, -2.1904706954956055e-06, -1.8496066331863403e-06, -1.5087425708770752e-06, -1.16787850856781e-06, -8.270144462585449e-07, -4.861503839492798e-07, -1.4528632164001465e-07, 1.955777406692505e-07, 5.364418029785156e-07, 8.773058652877808e-07, 1.218169927597046e-06, 1.559033989906311e-06, 1.8998980522155762e-06, 2.2407621145248413e-06, 2.5816261768341064e-06, 2.9224902391433716e-06, 3.2633543014526367e-06, 3.604218363761902e-06, 3.945082426071167e-06, 4.285946488380432e-06, 4.626810550689697e-06, 4.967674612998962e-06, 5.3085386753082275e-06, 5.649402737617493e-06, 5.990266799926758e-06, 6.331130862236023e-06, 6.671994924545288e-06, 7.012858986854553e-06, 7.353723049163818e-06, 7.694587111473083e-06, 8.035451173782349e-06, 8.376315236091614e-06, 8.717179298400879e-06, 9.058043360710144e-06, 9.39890742301941e-06, 9.739771485328674e-06, 1.008063554763794e-05, 1.0421499609947205e-05, 1.076236367225647e-05, 1.1103227734565735e-05, 1.1444091796875e-05]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 7.0, 7.0, 3.0, 8.0, 7.0, 17.0, 26.0, 38.0, 57.0, 73.0, 128.0, 180.0, 145.0, 94.0, 69.0, 37.0, 29.0, 19.0, 19.0, 10.0, 10.0, 11.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018735650228336453, -0.0017836415208876133, -0.0016937180189415812, -0.0016037945169955492, -0.0015138708986341953, -0.0014239473966881633, -0.0013340238947421312, -0.0012441002763807774, -0.0011541768908500671, -0.001064253388904035, -0.0009743298287503421, -0.0008844063268043101, -0.0007944827666506171, -0.0007045592647045851, -0.000614635762758553, -0.0005247122026048601, -0.0004347886424511671, -0.0003448651114013046, -0.0002549415803514421, -0.00016501807840541005, -7.509454735554755e-05, 1.4828983694314957e-05, 0.000104752485640347, 0.00019467604579403996, 0.000284599547740072, 0.0003745230787899345, 0.000464446609839797, 0.0005543701117858291, 0.0006442936137318611, 0.0007342171738855541, 0.0008241406758315861, 0.0009140642359852791, 0.0010039876215159893, 0.0010939111234620214, 0.0011838346254080534, 0.0012737582437694073, 0.0013636817457154393, 0.0014536052476614714, 0.0015435287496075034, 0.0016334522515535355, 0.0017233758699148893, 0.0018132993718609214, 0.0019032228738069534, 0.0019931464921683073, 0.0020830698776990175, 0.0021729934960603714, 0.0022629168815910816, 0.0023528404999524355, 0.0024427641183137894, 0.0025326877366751432, 0.0026226111222058535, 0.0027125347405672073, 0.0028024581260979176, 0.0028923817444592714, 0.0029823053628206253, 0.0030722287483513355, 0.0031621521338820457, 0.0032520757522433996, 0.00334199913777411, 0.0034319227561354637, 0.003521846141666174, 0.003611769760027528, 0.0037016933783888817, 0.003791616763919592, 0.0038815403822809458]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 3.0, 5.0, 7.0, 12.0, 5.0, 17.0, 8.0, 14.0, 17.0, 20.0, 20.0, 14.0, 20.0, 23.0, 34.0, 33.0, 27.0, 34.0, 43.0, 47.0, 54.0, 35.0, 33.0, 45.0, 31.0, 38.0, 37.0, 40.0, 29.0, 29.0, 31.0, 20.0, 18.0, 30.0, 27.0, 12.0, 21.0, 12.0, 9.0, 14.0, 8.0, 8.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0011978077236562967, -0.0011571773793548346, -0.0011165469186380506, -0.0010759165743365884, -0.0010352861136198044, -0.0009946557693183422, -0.0009540253668092191, -0.000913394964300096, -0.000872764561790973, -0.0008321341592818499, -0.0007915037567727268, -0.0007508733542636037, -0.0007102430099621415, -0.0006696125492453575, -0.0006289822049438953, -0.0005883518024347723, -0.0005477213999256492, -0.0005070909974165261, -0.000466460594907403, -0.00042583022150211036, -0.0003851998189929873, -0.0003445694164838642, -0.00030393904307857156, -0.00026330864056944847, -0.00022267823806032538, -0.0001820478355512023, -0.00014141744759399444, -0.00010078705236082897, -6.015665712766349e-05, -1.9526254618540406e-05, 2.1104133338667452e-05, 6.173452129587531e-05, 0.00010236480738967657, 0.00014299520989879966, 0.00018362559785600752, 0.00022425598581321537, 0.00026488638832233846, 0.00030551679083146155, 0.0003461471642367542, 0.00038677756674587727, 0.00042740796925500035, 0.00046803837176412344, 0.0005086687742732465, 0.0005492991767823696, 0.0005899295210838318, 0.0006305599818006158, 0.000671190326102078, 0.000711820728611201, 0.0007524511311203241, 0.0007930815336294472, 0.0008337119361385703, 0.0008743423386476934, 0.0009149727411568165, 0.0009556030854582787, 0.0009962335461750627, 0.0010368638904765248, 0.0010774943511933088, 0.001118124695494771, 0.001158755156211555, 0.0011993855005130172, 0.0012400159612298012, 0.0012806463055312634, 0.0013212767662480474, 0.0013619071105495095, 0.0014025374548509717]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 9.0, 3.0, 5.0, 15.0, 10.0, 17.0, 23.0, 32.0, 42.0, 52.0, 64.0, 82.0, 116.0, 161.0, 220.0, 288.0, 379.0, 636.0, 1022.0, 2033.0, 4382.0, 12322.0, 406891.0, 3738981.0, 15668.0, 5296.0, 2152.0, 1090.0, 678.0, 463.0, 319.0, 211.0, 175.0, 114.0, 89.0, 54.0, 42.0, 39.0, 28.0, 23.0, 19.0, 7.0, 12.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00701904296875, -0.006800293922424316, -0.006581544876098633, -0.006362795829772949, -0.006144046783447266, -0.005925297737121582, -0.0057065486907958984, -0.005487799644470215, -0.005269050598144531, -0.005050301551818848, -0.004831552505493164, -0.0046128034591674805, -0.004394054412841797, -0.004175305366516113, -0.00395655632019043, -0.003737807273864746, -0.0035190582275390625, -0.003300309181213379, -0.0030815601348876953, -0.0028628110885620117, -0.002644062042236328, -0.0024253129959106445, -0.002206563949584961, -0.0019878149032592773, -0.0017690658569335938, -0.0015503168106079102, -0.0013315677642822266, -0.001112818717956543, -0.0008940696716308594, -0.0006753206253051758, -0.0004565715789794922, -0.0002378225326538086, -1.9073486328125e-05, 0.0001996755599975586, 0.0004184246063232422, 0.0006371736526489258, 0.0008559226989746094, 0.001074671745300293, 0.0012934207916259766, 0.0015121698379516602, 0.0017309188842773438, 0.0019496679306030273, 0.002168416976928711, 0.0023871660232543945, 0.002605915069580078, 0.0028246641159057617, 0.0030434131622314453, 0.003262162208557129, 0.0034809112548828125, 0.003699660301208496, 0.00391840934753418, 0.004137158393859863, 0.004355907440185547, 0.0045746564865112305, 0.004793405532836914, 0.005012154579162598, 0.005230903625488281, 0.005449652671813965, 0.0056684017181396484, 0.005887150764465332, 0.006105899810791016, 0.006324648857116699, 0.006543397903442383, 0.006762146949768066, 0.00698089599609375]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 7.0, 5.0, 5.0, 8.0, 8.0, 9.0, 12.0, 8.0, 16.0, 14.0, 13.0, 22.0, 20.0, 16.0, 23.0, 28.0, 33.0, 36.0, 42.0, 44.0, 44.0, 40.0, 52.0, 36.0, 36.0, 43.0, 42.0, 30.0, 34.0, 27.0, 35.0, 26.0, 27.0, 26.0, 15.0, 22.0, 19.0, 18.0, 11.0, 13.0, 11.0, 8.0, 7.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0008516311645507812, -0.0008242130279541016, -0.0007967948913574219, -0.0007693767547607422, -0.0007419586181640625, -0.0007145404815673828, -0.0006871223449707031, -0.0006597042083740234, -0.0006322860717773438, -0.0006048679351806641, -0.0005774497985839844, -0.0005500316619873047, -0.000522613525390625, -0.0004951953887939453, -0.0004677772521972656, -0.00044035911560058594, -0.00041294097900390625, -0.00038552284240722656, -0.0003581047058105469, -0.0003306865692138672, -0.0003032684326171875, -0.0002758502960205078, -0.0002484321594238281, -0.00022101402282714844, -0.00019359588623046875, -0.00016617774963378906, -0.00013875961303710938, -0.00011134147644042969, -8.392333984375e-05, -5.650520324707031e-05, -2.9087066650390625e-05, -1.6689300537109375e-06, 2.574920654296875e-05, 5.316734313964844e-05, 8.058547973632812e-05, 0.00010800361633300781, 0.0001354217529296875, 0.0001628398895263672, 0.00019025802612304688, 0.00021767616271972656, 0.00024509429931640625, 0.00027251243591308594, 0.0002999305725097656, 0.0003273487091064453, 0.000354766845703125, 0.0003821849822998047, 0.0004096031188964844, 0.00043702125549316406, 0.00046443939208984375, 0.0004918575286865234, 0.0005192756652832031, 0.0005466938018798828, 0.0005741119384765625, 0.0006015300750732422, 0.0006289482116699219, 0.0006563663482666016, 0.0006837844848632812, 0.0007112026214599609, 0.0007386207580566406, 0.0007660388946533203, 0.00079345703125, 0.0008208751678466797, 0.0008482933044433594, 0.0008757114410400391, 0.0009031295776367188]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 5.0, 3.0, 7.0, 12.0, 21.0, 44.0, 65.0, 105.0, 214.0, 399.0, 999.0, 2807.0, 11236.0, 109095.0, 4027918.0, 32317.0, 5932.0, 1793.0, 693.0, 288.0, 145.0, 79.0, 40.0, 32.0, 8.0, 9.0, 9.0, 7.0, 0.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00958251953125, -0.009332239627838135, -0.00908195972442627, -0.008831679821014404, -0.008581399917602539, -0.008331120014190674, -0.008080840110778809, -0.007830560207366943, -0.007580280303955078, -0.007330000400543213, -0.007079720497131348, -0.006829440593719482, -0.006579160690307617, -0.006328880786895752, -0.006078600883483887, -0.0058283209800720215, -0.005578041076660156, -0.005327761173248291, -0.005077481269836426, -0.0048272013664245605, -0.004576921463012695, -0.00432664155960083, -0.004076361656188965, -0.0038260817527770996, -0.0035758018493652344, -0.003325521945953369, -0.003075242042541504, -0.0028249621391296387, -0.0025746822357177734, -0.002324402332305908, -0.002074122428894043, -0.0018238425254821777, -0.0015735626220703125, -0.0013232827186584473, -0.001073002815246582, -0.0008227229118347168, -0.0005724430084228516, -0.00032216310501098633, -7.18832015991211e-05, 0.00017839670181274414, 0.0004286766052246094, 0.0006789565086364746, 0.0009292364120483398, 0.001179516315460205, 0.0014297962188720703, 0.0016800761222839355, 0.0019303560256958008, 0.002180635929107666, 0.0024309158325195312, 0.0026811957359313965, 0.0029314756393432617, 0.003181755542755127, 0.003432035446166992, 0.0036823153495788574, 0.003932595252990723, 0.004182875156402588, 0.004433155059814453, 0.004683434963226318, 0.004933714866638184, 0.005183994770050049, 0.005434274673461914, 0.005684554576873779, 0.0059348344802856445, 0.00618511438369751, 0.006435394287109375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 12.0, 13.0, 13.0, 25.0, 48.0, 168.0, 1141.0, 2250.0, 202.0, 67.0, 35.0, 23.0, 15.0, 10.0, 14.0, 15.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008459091186523438, -0.000812143087387085, -0.0007783770561218262, -0.0007446110248565674, -0.0007108449935913086, -0.0006770789623260498, -0.000643312931060791, -0.0006095468997955322, -0.0005757808685302734, -0.0005420148372650146, -0.0005082488059997559, -0.00047448277473449707, -0.0004407167434692383, -0.0004069507122039795, -0.0003731846809387207, -0.0003394186496734619, -0.0003056526184082031, -0.00027188658714294434, -0.00023812055587768555, -0.00020435452461242676, -0.00017058849334716797, -0.00013682246208190918, -0.00010305643081665039, -6.92903995513916e-05, -3.552436828613281e-05, -1.7583370208740234e-06, 3.2007694244384766e-05, 6.577372550964355e-05, 9.953975677490234e-05, 0.00013330578804016113, 0.00016707181930541992, 0.0002008378505706787, 0.0002346038818359375, 0.0002683699131011963, 0.0003021359443664551, 0.00033590197563171387, 0.00036966800689697266, 0.00040343403816223145, 0.00043720006942749023, 0.000470966100692749, 0.0005047321319580078, 0.0005384981632232666, 0.0005722641944885254, 0.0006060302257537842, 0.000639796257019043, 0.0006735622882843018, 0.0007073283195495605, 0.0007410943508148193, 0.0007748603820800781, 0.0008086264133453369, 0.0008423924446105957, 0.0008761584758758545, 0.0009099245071411133, 0.0009436905384063721, 0.0009774565696716309, 0.0010112226009368896, 0.0010449886322021484, 0.0010787546634674072, 0.001112520694732666, 0.0011462867259979248, 0.0011800527572631836, 0.0012138187885284424, 0.0012475848197937012, 0.00128135085105896, 0.0013151168823242188]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 2.0, 1.0, 12.0, 16.0, 13.0, 16.0, 31.0, 38.0, 63.0, 86.0, 131.0, 155.0, 120.0, 96.0, 62.0, 37.0, 35.0, 26.0, 11.0, 15.0, 10.0, 3.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001821695826947689, -0.0017603172454982996, -0.0016989386640489101, -0.0016375600825995207, -0.001576181617565453, -0.0015148030361160636, -0.0014534244546666741, -0.0013920458732172847, -0.001330667408183217, -0.0012692888267338276, -0.0012079102452844381, -0.0011465316638350487, -0.001085153198800981, -0.0010237746173515916, -0.0009623960359022021, -0.0009010174544528127, -0.0008396388730034232, -0.0007782602915540338, -0.0007168817683123052, -0.0006555031868629158, -0.0005941246636211872, -0.0005327460821717978, -0.0004713675007224083, -0.0004099889483768493, -0.0003486103960312903, -0.0002872318436857313, -0.00022585327678825706, -0.00016447470989078283, -0.00010309615754522383, -4.171760519966483e-05, 1.9660976249724627e-05, 8.103952859528363e-05, 0.00014241808094084263, 0.00020379663328640163, 0.00026517518563196063, 0.0003265537670813501, 0.0003879323194269091, 0.0004493108717724681, 0.0005106894532218575, 0.000572068034671247, 0.0006334465579129755, 0.000694825139362365, 0.0007562036626040936, 0.000817582244053483, 0.0008789608255028725, 0.000940339348744601, 0.0010017179884016514, 0.001063096453435719, 0.0011244750348851085, 0.001185853616334498, 0.0012472321977838874, 0.001308610662817955, 0.0013699892442673445, 0.001431367825716734, 0.0014927464071661234, 0.0015541249886155128, 0.0016155035700649023, 0.0016768821515142918, 0.0017382607329636812, 0.0017996393144130707, 0.0018610177794471383, 0.0019223963608965278, 0.0019837748259305954, 0.002045153407379985, 0.0021065319888293743]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 8.0, 10.0, 8.0, 11.0, 15.0, 20.0, 19.0, 19.0, 16.0, 26.0, 29.0, 26.0, 35.0, 40.0, 33.0, 34.0, 31.0, 31.0, 49.0, 40.0, 34.0, 42.0, 44.0, 48.0, 47.0, 33.0, 35.0, 35.0, 39.0, 23.0, 15.0, 18.0, 15.0, 13.0, 15.0, 12.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.001021876814775169, -0.000990988570265472, -0.0009601004421710968, -0.0009292122558690608, -0.0008983240695670247, -0.0008674358250573277, -0.0008365476387552917, -0.0008056594524532557, -0.0007747712661512196, -0.0007438830798491836, -0.0007129948935471475, -0.0006821067072451115, -0.0006512184627354145, -0.0006203303346410394, -0.0005894420901313424, -0.0005585539038293064, -0.0005276657175272703, -0.0004967775312252343, -0.0004658893449231982, -0.0004350011295173317, -0.00040411294321529567, -0.0003732247569132596, -0.0003423365415073931, -0.0003114483552053571, -0.00028056016890332103, -0.000249671982601285, -0.0002187837817473337, -0.00018789558089338243, -0.00015700739459134638, -0.00012611920828931034, -9.523100743535906e-05, -6.434280658140779e-05, -3.345450386404991e-05, -2.5663102860562503e-06, 2.832188329193741e-05, 5.921007686993107e-05, 9.009827044792473e-05, 0.00012098645674996078, 0.00015187465760391206, 0.00018276285845786333, 0.00021365104475989938, 0.0002445392310619354, 0.00027542741736397147, 0.000306315632769838, 0.000337203819071874, 0.00036809200537391007, 0.0003989802207797766, 0.0004298684070818126, 0.00046075659338384867, 0.0004916447796858847, 0.0005225329659879208, 0.0005534211522899568, 0.0005843093385919929, 0.0006151975831016898, 0.0006460857694037259, 0.0006769739557057619, 0.000707862142007798, 0.000738750328309834, 0.00076963851461187, 0.0008005267009139061, 0.0008314149454236031, 0.0008623030735179782, 0.0008931913180276752, 0.0009240795043297112, 0.0009549676906317472]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 9.0, 18.0, 20.0, 43.0, 53.0, 72.0, 101.0, 132.0, 226.0, 342.0, 547.0, 845.0, 1190.0, 1820.0, 2963.0, 4430.0, 6915.0, 11002.0, 17349.0, 27900.0, 44831.0, 72868.0, 118189.0, 181005.0, 196762.0, 135527.0, 84006.0, 51775.0, 32256.0, 20080.0, 12812.0, 7944.0, 5194.0, 3133.0, 2086.0, 1333.0, 950.0, 597.0, 411.0, 286.0, 171.0, 107.0, 78.0, 59.0, 49.0, 31.0, 12.0, 13.0, 11.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006203651428222656, -0.0006004497408866882, -0.0005805343389511108, -0.0005606189370155334, -0.0005407035350799561, -0.0005207881331443787, -0.0005008727312088013, -0.0004809573292732239, -0.0004610419273376465, -0.0004411265254020691, -0.0004212111234664917, -0.0004012957215309143, -0.0003813803195953369, -0.0003614649176597595, -0.00034154951572418213, -0.00032163411378860474, -0.00030171871185302734, -0.00028180330991744995, -0.00026188790798187256, -0.00024197250604629517, -0.00022205710411071777, -0.00020214170217514038, -0.000182226300239563, -0.0001623108983039856, -0.0001423954963684082, -0.0001224800944328308, -0.00010256469249725342, -8.264929056167603e-05, -6.273388862609863e-05, -4.281848669052124e-05, -2.2903084754943848e-05, -2.987682819366455e-06, 1.6927719116210938e-05, 3.684312105178833e-05, 5.675852298736572e-05, 7.667392492294312e-05, 9.658932685852051e-05, 0.0001165047287940979, 0.0001364201307296753, 0.00015633553266525269, 0.00017625093460083008, 0.00019616633653640747, 0.00021608173847198486, 0.00023599714040756226, 0.00025591254234313965, 0.00027582794427871704, 0.00029574334621429443, 0.0003156587481498718, 0.0003355741500854492, 0.0003554895520210266, 0.000375404953956604, 0.0003953203558921814, 0.0004152357578277588, 0.0004351511597633362, 0.0004550665616989136, 0.00047498196363449097, 0.0004948973655700684, 0.0005148127675056458, 0.0005347281694412231, 0.0005546435713768005, 0.0005745589733123779, 0.0005944743752479553, 0.0006143897771835327, 0.0006343051791191101, 0.0006542205810546875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 2.0, 9.0, 11.0, 8.0, 14.0, 12.0, 12.0, 16.0, 21.0, 19.0, 25.0, 26.0, 36.0, 31.0, 32.0, 39.0, 36.0, 39.0, 40.0, 43.0, 48.0, 37.0, 52.0, 37.0, 52.0, 39.0, 41.0, 36.0, 39.0, 28.0, 20.0, 14.0, 15.0, 20.0, 13.0, 13.0, 10.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.001178741455078125, -0.00114402174949646, -0.001109302043914795, -0.0010745823383331299, -0.0010398626327514648, -0.0010051429271697998, -0.0009704232215881348, -0.0009357035160064697, -0.0009009838104248047, -0.0008662641048431396, -0.0008315443992614746, -0.0007968246936798096, -0.0007621049880981445, -0.0007273852825164795, -0.0006926655769348145, -0.0006579458713531494, -0.0006232261657714844, -0.0005885064601898193, -0.0005537867546081543, -0.0005190670490264893, -0.0004843473434448242, -0.0004496276378631592, -0.00041490793228149414, -0.0003801882266998291, -0.00034546852111816406, -0.000310748815536499, -0.000276029109954834, -0.00024130940437316895, -0.0002065896987915039, -0.00017186999320983887, -0.00013715028762817383, -0.00010243058204650879, -6.771087646484375e-05, -3.299117088317871e-05, 1.7285346984863281e-06, 3.644824028015137e-05, 7.11679458618164e-05, 0.00010588765144348145, 0.00014060735702514648, 0.00017532706260681152, 0.00021004676818847656, 0.0002447664737701416, 0.00027948617935180664, 0.0003142058849334717, 0.0003489255905151367, 0.00038364529609680176, 0.0004183650016784668, 0.00045308470726013184, 0.0004878044128417969, 0.0005225241184234619, 0.000557243824005127, 0.000591963529586792, 0.000626683235168457, 0.0006614029407501221, 0.0006961226463317871, 0.0007308423519134521, 0.0007655620574951172, 0.0008002817630767822, 0.0008350014686584473, 0.0008697211742401123, 0.0009044408798217773, 0.0009391605854034424, 0.0009738802909851074, 0.0010085999965667725, 0.0010433197021484375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 7.0, 10.0, 4.0, 15.0, 28.0, 32.0, 55.0, 53.0, 103.0, 157.0, 237.0, 321.0, 545.0, 813.0, 1257.0, 1980.0, 3041.0, 4810.0, 7797.0, 13354.0, 22565.0, 41223.0, 81300.0, 188748.0, 365193.0, 156492.0, 70325.0, 36241.0, 20470.0, 11789.0, 7116.0, 4582.0, 2762.0, 1761.0, 1119.0, 744.0, 503.0, 349.0, 200.0, 149.0, 106.0, 58.0, 47.0, 33.0, 16.0, 20.0, 12.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007748603820800781, -0.0007501840591430664, -0.0007255077362060547, -0.000700831413269043, -0.0006761550903320312, -0.0006514787673950195, -0.0006268024444580078, -0.0006021261215209961, -0.0005774497985839844, -0.0005527734756469727, -0.0005280971527099609, -0.0005034208297729492, -0.0004787445068359375, -0.0004540681838989258, -0.00042939186096191406, -0.00040471553802490234, -0.0003800392150878906, -0.0003553628921508789, -0.0003306865692138672, -0.00030601024627685547, -0.00028133392333984375, -0.00025665760040283203, -0.0002319812774658203, -0.0002073049545288086, -0.00018262863159179688, -0.00015795230865478516, -0.00013327598571777344, -0.00010859966278076172, -8.392333984375e-05, -5.924701690673828e-05, -3.457069396972656e-05, -9.894371032714844e-06, 1.4781951904296875e-05, 3.9458274841308594e-05, 6.413459777832031e-05, 8.881092071533203e-05, 0.00011348724365234375, 0.00013816356658935547, 0.0001628398895263672, 0.0001875162124633789, 0.00021219253540039062, 0.00023686885833740234, 0.00026154518127441406, 0.0002862215042114258, 0.0003108978271484375, 0.0003355741500854492, 0.00036025047302246094, 0.00038492679595947266, 0.0004096031188964844, 0.0004342794418334961, 0.0004589557647705078, 0.00048363208770751953, 0.0005083084106445312, 0.000532984733581543, 0.0005576610565185547, 0.0005823373794555664, 0.0006070137023925781, 0.0006316900253295898, 0.0006563663482666016, 0.0006810426712036133, 0.000705718994140625, 0.0007303953170776367, 0.0007550716400146484, 0.0007797479629516602, 0.0008044242858886719]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 3.0, 5.0, 8.0, 3.0, 7.0, 10.0, 21.0, 16.0, 10.0, 18.0, 26.0, 19.0, 29.0, 31.0, 31.0, 36.0, 36.0, 36.0, 35.0, 35.0, 51.0, 53.0, 46.0, 31.0, 55.0, 39.0, 42.0, 32.0, 24.0, 30.0, 16.0, 34.0, 27.0, 17.0, 17.0, 20.0, 9.0, 7.0, 4.0, 11.0, 7.0, 4.0, 1.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0007076263427734375, -0.0006864219903945923, -0.0006652176380157471, -0.0006440132856369019, -0.0006228089332580566, -0.0006016045808792114, -0.0005804002285003662, -0.000559195876121521, -0.0005379915237426758, -0.0005167871713638306, -0.0004955828189849854, -0.00047437846660614014, -0.0004531741142272949, -0.0004319697618484497, -0.0004107654094696045, -0.0003895610570907593, -0.00036835670471191406, -0.00034715235233306885, -0.00032594799995422363, -0.0003047436475753784, -0.0002835392951965332, -0.000262334942817688, -0.00024113059043884277, -0.00021992623805999756, -0.00019872188568115234, -0.00017751753330230713, -0.00015631318092346191, -0.0001351088285446167, -0.00011390447616577148, -9.270012378692627e-05, -7.149577140808105e-05, -5.029141902923584e-05, -2.9087066650390625e-05, -7.88271427154541e-06, 1.3321638107299805e-05, 3.452599048614502e-05, 5.5730342864990234e-05, 7.693469524383545e-05, 9.813904762268066e-05, 0.00011934340000152588, 0.0001405477523803711, 0.0001617521047592163, 0.00018295645713806152, 0.00020416080951690674, 0.00022536516189575195, 0.00024656951427459717, 0.0002677738666534424, 0.0002889782190322876, 0.0003101825714111328, 0.00033138692378997803, 0.00035259127616882324, 0.00037379562854766846, 0.00039499998092651367, 0.0004162043333053589, 0.0004374086856842041, 0.0004586130380630493, 0.00047981739044189453, 0.0005010217428207397, 0.000522226095199585, 0.0005434304475784302, 0.0005646347999572754, 0.0005858391523361206, 0.0006070435047149658, 0.000628247857093811, 0.0006494522094726562]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 14.0, 17.0, 23.0, 21.0, 42.0, 52.0, 78.0, 91.0, 143.0, 228.0, 338.0, 479.0, 671.0, 1034.0, 1771.0, 2945.0, 5452.0, 11416.0, 28760.0, 115333.0, 713835.0, 112475.0, 28837.0, 11159.0, 5434.0, 2947.0, 1680.0, 1117.0, 694.0, 437.0, 284.0, 209.0, 162.0, 101.0, 84.0, 63.0, 44.0, 24.0, 16.0, 7.0, 6.0, 9.0, 6.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001531839370727539, -0.00014816038310527802, -0.00014313682913780212, -0.00013811327517032623, -0.00013308972120285034, -0.00012806616723537445, -0.00012304261326789856, -0.00011801905930042267, -0.00011299550533294678, -0.00010797195136547089, -0.000102948397397995, -9.79248434305191e-05, -9.290128946304321e-05, -8.787773549556732e-05, -8.285418152809143e-05, -7.783062756061554e-05, -7.280707359313965e-05, -6.778351962566376e-05, -6.275996565818787e-05, -5.7736411690711975e-05, -5.2712857723236084e-05, -4.768930375576019e-05, -4.26657497882843e-05, -3.764219582080841e-05, -3.261864185333252e-05, -2.759508788585663e-05, -2.2571533918380737e-05, -1.7547979950904846e-05, -1.2524425983428955e-05, -7.500872015953064e-06, -2.477318048477173e-06, 2.5462359189987183e-06, 7.569789886474609e-06, 1.25933438539505e-05, 1.761689782142639e-05, 2.2640451788902283e-05, 2.7664005756378174e-05, 3.2687559723854065e-05, 3.7711113691329956e-05, 4.273466765880585e-05, 4.775822162628174e-05, 5.278177559375763e-05, 5.780532956123352e-05, 6.282888352870941e-05, 6.78524374961853e-05, 7.28759914636612e-05, 7.789954543113708e-05, 8.292309939861298e-05, 8.794665336608887e-05, 9.297020733356476e-05, 9.799376130104065e-05, 0.00010301731526851654, 0.00010804086923599243, 0.00011306442320346832, 0.00011808797717094421, 0.0001231115311384201, 0.000128135085105896, 0.0001331586390733719, 0.00013818219304084778, 0.00014320574700832367, 0.00014822930097579956, 0.00015325285494327545, 0.00015827640891075134, 0.00016329996287822723, 0.00016832351684570312]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 3.0, 4.0, 10.0, 9.0, 13.0, 7.0, 12.0, 18.0, 17.0, 13.0, 36.0, 41.0, 52.0, 80.0, 83.0, 119.0, 113.0, 91.0, 40.0, 57.0, 46.0, 30.0, 26.0, 9.0, 17.0, 10.0, 10.0, 8.0, 8.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.708766937255859e-06, -4.542991518974304e-06, -4.377216100692749e-06, -4.211440682411194e-06, -4.045665264129639e-06, -3.8798898458480835e-06, -3.7141144275665283e-06, -3.548339009284973e-06, -3.382563591003418e-06, -3.216788172721863e-06, -3.0510127544403076e-06, -2.8852373361587524e-06, -2.7194619178771973e-06, -2.553686499595642e-06, -2.387911081314087e-06, -2.2221356630325317e-06, -2.0563602447509766e-06, -1.8905848264694214e-06, -1.7248094081878662e-06, -1.559033989906311e-06, -1.3932585716247559e-06, -1.2274831533432007e-06, -1.0617077350616455e-06, -8.959323167800903e-07, -7.301568984985352e-07, -5.6438148021698e-07, -3.986060619354248e-07, -2.3283064365386963e-07, -6.705522537231445e-08, 9.872019290924072e-08, 2.644956111907959e-07, 4.302710294723511e-07, 5.960464477539062e-07, 7.618218660354614e-07, 9.275972843170166e-07, 1.0933727025985718e-06, 1.259148120880127e-06, 1.4249235391616821e-06, 1.5906989574432373e-06, 1.7564743757247925e-06, 1.9222497940063477e-06, 2.088025212287903e-06, 2.253800630569458e-06, 2.419576048851013e-06, 2.5853514671325684e-06, 2.7511268854141235e-06, 2.9169023036956787e-06, 3.082677721977234e-06, 3.248453140258789e-06, 3.4142285585403442e-06, 3.5800039768218994e-06, 3.7457793951034546e-06, 3.91155481338501e-06, 4.077330231666565e-06, 4.24310564994812e-06, 4.408881068229675e-06, 4.5746564865112305e-06, 4.740431904792786e-06, 4.906207323074341e-06, 5.071982741355896e-06, 5.237758159637451e-06, 5.403533577919006e-06, 5.5693089962005615e-06, 5.735084414482117e-06, 5.900859832763672e-06]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 1.0, 6.0, 4.0, 8.0, 6.0, 4.0, 5.0, 8.0, 15.0, 14.0, 15.0, 43.0, 72.0, 136.0, 280.0, 663.0, 1602.0, 4223.0, 12153.0, 49034.0, 563647.0, 360695.0, 39502.0, 10247.0, 3593.0, 1422.0, 600.0, 271.0, 94.0, 57.0, 38.0, 19.0, 11.0, 11.0, 10.0, 8.0, 6.0, 6.0, 6.0, 5.0, 2.0, 0.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0002560615539550781, -0.0002482850104570389, -0.00024050846695899963, -0.0002327319234609604, -0.00022495537996292114, -0.0002171788364648819, -0.00020940229296684265, -0.0002016257494688034, -0.00019384920597076416, -0.00018607266247272491, -0.00017829611897468567, -0.00017051957547664642, -0.00016274303197860718, -0.00015496648848056793, -0.0001471899449825287, -0.00013941340148448944, -0.0001316368579864502, -0.00012386031448841095, -0.0001160837709903717, -0.00010830722749233246, -0.00010053068399429321, -9.275414049625397e-05, -8.497759699821472e-05, -7.720105350017548e-05, -6.942451000213623e-05, -6.164796650409698e-05, -5.387142300605774e-05, -4.6094879508018494e-05, -3.831833600997925e-05, -3.054179251194e-05, -2.2765249013900757e-05, -1.4988705515861511e-05, -7.212162017822266e-06, 5.6438148021698e-07, 8.340924978256226e-06, 1.611746847629547e-05, 2.3894011974334717e-05, 3.167055547237396e-05, 3.944709897041321e-05, 4.7223642468452454e-05, 5.50001859664917e-05, 6.277672946453094e-05, 7.055327296257019e-05, 7.832981646060944e-05, 8.610635995864868e-05, 9.388290345668793e-05, 0.00010165944695472717, 0.00010943599045276642, 0.00011721253395080566, 0.0001249890774488449, 0.00013276562094688416, 0.0001405421644449234, 0.00014831870794296265, 0.0001560952514410019, 0.00016387179493904114, 0.00017164833843708038, 0.00017942488193511963, 0.00018720142543315887, 0.00019497796893119812, 0.00020275451242923737, 0.0002105310559272766, 0.00021830759942531586, 0.0002260841429233551, 0.00023386068642139435, 0.0002416372299194336]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 5.0, 4.0, 7.0, 3.0, 5.0, 7.0, 7.0, 9.0, 11.0, 17.0, 12.0, 20.0, 26.0, 36.0, 37.0, 51.0, 62.0, 84.0, 80.0, 73.0, 75.0, 65.0, 47.0, 53.0, 45.0, 32.0, 24.0, 19.0, 12.0, 10.0, 7.0, 12.0, 5.0, 6.0, 8.0, 4.0, 5.0, 5.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.771615982055664e-05, -2.6827678084373474e-05, -2.5939196348190308e-05, -2.505071461200714e-05, -2.4162232875823975e-05, -2.3273751139640808e-05, -2.238526940345764e-05, -2.1496787667274475e-05, -2.060830593109131e-05, -1.9719824194908142e-05, -1.8831342458724976e-05, -1.794286072254181e-05, -1.7054378986358643e-05, -1.6165897250175476e-05, -1.527741551399231e-05, -1.4388933777809143e-05, -1.3500452041625977e-05, -1.261197030544281e-05, -1.1723488569259644e-05, -1.0835006833076477e-05, -9.94652509689331e-06, -9.058043360710144e-06, -8.169561624526978e-06, -7.281079888343811e-06, -6.3925981521606445e-06, -5.504116415977478e-06, -4.6156346797943115e-06, -3.727152943611145e-06, -2.8386712074279785e-06, -1.950189471244812e-06, -1.0617077350616455e-06, -1.73225998878479e-07, 7.152557373046875e-07, 1.603737473487854e-06, 2.4922192096710205e-06, 3.380700945854187e-06, 4.2691826820373535e-06, 5.15766441822052e-06, 6.0461461544036865e-06, 6.934627890586853e-06, 7.82310962677002e-06, 8.711591362953186e-06, 9.600073099136353e-06, 1.0488554835319519e-05, 1.1377036571502686e-05, 1.2265518307685852e-05, 1.3154000043869019e-05, 1.4042481780052185e-05, 1.4930963516235352e-05, 1.5819445252418518e-05, 1.6707926988601685e-05, 1.759640872478485e-05, 1.8484890460968018e-05, 1.9373372197151184e-05, 2.026185393333435e-05, 2.1150335669517517e-05, 2.2038817405700684e-05, 2.292729914188385e-05, 2.3815780878067017e-05, 2.4704262614250183e-05, 2.559274435043335e-05, 2.6481226086616516e-05, 2.7369707822799683e-05, 2.825818955898285e-05, 2.9146671295166016e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 15.0, 12.0, 27.0, 26.0, 51.0, 85.0, 129.0, 205.0, 136.0, 93.0, 57.0, 51.0, 32.0, 20.0, 17.0, 12.0, 6.0, 2.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020623677410185337, -0.0019905937369912863, -0.0019188195001333952, -0.0018470454961061478, -0.0017752713756635785, -0.0017034972552210093, -0.0016317232511937618, -0.0015599491307511926, -0.0014881750103086233, -0.001416400889866054, -0.0013446267694234848, -0.0012728527653962374, -0.0012010786449536681, -0.0011293045245110989, -0.0010575305204838514, -0.0009857564000412822, -0.0009139822795987129, -0.0008422081591561437, -0.0007704340969212353, -0.000698660034686327, -0.0006268859142437577, -0.0005551117938011885, -0.0004833377315662801, -0.0004115636693313718, -0.00033978954888880253, -0.00026801545755006373, -0.00019624136621132493, -0.00012446727487258613, -5.269318353384733e-05, 1.9080907804891467e-05, 9.085499914363027e-05, 0.0001626290613785386, 0.0002344029489904642, 0.000306177040329203, 0.0003779511316679418, 0.0004497252230066806, 0.0005214993143454194, 0.0005932734347879887, 0.000665047497022897, 0.0007368215592578053, 0.0008085956797003746, 0.0008803698001429439, 0.0009521438623778522, 0.0010239179246127605, 0.0010956920450553298, 0.001167466165497899, 0.0012392401695251465, 0.0013110142899677157, 0.001382788410410285, 0.0014545625308528543, 0.0015263366512954235, 0.001598110655322671, 0.0016698847757652402, 0.0017416588962078094, 0.0018134329002350569, 0.0018852070206776261, 0.0019569811411201954, 0.002028755145147443, 0.002100529382005334, 0.0021723033860325813, 0.0022440776228904724, 0.00231585162691772, 0.0023876256309449673, 0.0024593998678028584, 0.0025311738718301058]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 7.0, 6.0, 11.0, 11.0, 15.0, 16.0, 25.0, 12.0, 18.0, 25.0, 22.0, 35.0, 28.0, 42.0, 36.0, 32.0, 29.0, 35.0, 44.0, 41.0, 41.0, 35.0, 47.0, 41.0, 52.0, 35.0, 38.0, 34.0, 37.0, 24.0, 22.0, 14.0, 15.0, 15.0, 14.0, 12.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0010442022467032075, -0.0010128474095836282, -0.0009814925724640489, -0.0009501376771368086, -0.0009187828400172293, -0.0008874279446899891, -0.0008560731075704098, -0.0008247182704508305, -0.0007933634333312511, -0.0007620085962116718, -0.0007306537008844316, -0.0006992988637648523, -0.000667944026645273, -0.0006365891313180327, -0.0006052342941984534, -0.0005738794570788741, -0.0005425245617516339, -0.0005111697246320546, -0.0004798148584086448, -0.000448459992185235, -0.0004171051550656557, -0.00038575028884224594, -0.00035439542261883616, -0.00032304058549925685, -0.0002916857192758471, -0.0002603308530524373, -0.000228976015932858, -0.00019762114970944822, -0.00016626629803795367, -0.00013491144636645913, -0.00010355658014304936, -7.220172847155482e-05, -4.084687680006027e-05, -9.492021490586922e-06, 2.186283381888643e-05, 5.321769276633859e-05, 8.457254443783313e-05, 0.00011592739610932767, 0.00014728226233273745, 0.000178637114004232, 0.00020999196567572653, 0.00024134681734722108, 0.0002727016690187156, 0.0003040565352421254, 0.00033541140146553516, 0.0003667662385851145, 0.00039812110480852425, 0.000429475971031934, 0.00046083080815151334, 0.0004921856452710927, 0.0005235405405983329, 0.0005548953777179122, 0.0005862502148374915, 0.0006176050519570708, 0.0006489599472843111, 0.0006803147844038904, 0.0007116696797311306, 0.0007430245168507099, 0.0007743794121779501, 0.0008057342492975295, 0.0008370890864171088, 0.000868443981744349, 0.0008997988188639283, 0.0009311536559835076, 0.000962508493103087]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 11.0, 12.0, 22.0, 38.0, 56.0, 72.0, 121.0, 193.0, 345.0, 565.0, 925.0, 1639.0, 2802.0, 5172.0, 10051.0, 19683.0, 40645.0, 96546.0, 268465.0, 355498.0, 137510.0, 54738.0, 25329.0, 12755.0, 6734.0, 3713.0, 2038.0, 1135.0, 702.0, 381.0, 233.0, 148.0, 91.0, 49.0, 41.0, 28.0, 22.0, 9.0, 12.0, 6.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.003391265869140625, -0.0032920539379119873, -0.0031928420066833496, -0.003093630075454712, -0.0029944181442260742, -0.0028952062129974365, -0.002795994281768799, -0.002696782350540161, -0.0025975704193115234, -0.0024983584880828857, -0.002399146556854248, -0.0022999346256256104, -0.0022007226943969727, -0.002101510763168335, -0.0020022988319396973, -0.0019030869007110596, -0.0018038749694824219, -0.0017046630382537842, -0.0016054511070251465, -0.0015062391757965088, -0.001407027244567871, -0.0013078153133392334, -0.0012086033821105957, -0.001109391450881958, -0.0010101795196533203, -0.0009109675884246826, -0.0008117556571960449, -0.0007125437259674072, -0.0006133317947387695, -0.0005141198635101318, -0.00041490793228149414, -0.00031569600105285645, -0.00021648406982421875, -0.00011727213859558105, -1.806020736694336e-05, 8.115172386169434e-05, 0.00018036365509033203, 0.0002795755863189697, 0.0003787875175476074, 0.0004779994487762451, 0.0005772113800048828, 0.0006764233112335205, 0.0007756352424621582, 0.0008748471736907959, 0.0009740591049194336, 0.0010732710361480713, 0.001172482967376709, 0.0012716948986053467, 0.0013709068298339844, 0.001470118761062622, 0.0015693306922912598, 0.0016685426235198975, 0.0017677545547485352, 0.0018669664859771729, 0.0019661784172058105, 0.0020653903484344482, 0.002164602279663086, 0.0022638142108917236, 0.0023630261421203613, 0.002462238073348999, 0.0025614500045776367, 0.0026606619358062744, 0.002759873867034912, 0.00285908579826355, 0.0029582977294921875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 1.0, 7.0, 13.0, 13.0, 9.0, 14.0, 15.0, 20.0, 28.0, 37.0, 40.0, 43.0, 42.0, 51.0, 66.0, 46.0, 41.0, 62.0, 55.0, 66.0, 62.0, 40.0, 36.0, 55.0, 34.0, 25.0, 22.0, 25.0, 11.0, 7.0, 9.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0009555816650390625, -0.0009302571415901184, -0.0009049326181411743, -0.0008796080946922302, -0.0008542835712432861, -0.000828959047794342, -0.000803634524345398, -0.0007783100008964539, -0.0007529854774475098, -0.0007276609539985657, -0.0007023364305496216, -0.0006770119071006775, -0.0006516873836517334, -0.0006263628602027893, -0.0006010383367538452, -0.0005757138133049011, -0.000550389289855957, -0.0005250647664070129, -0.0004997402429580688, -0.00047441571950912476, -0.00044909119606018066, -0.00042376667261123657, -0.0003984421491622925, -0.0003731176257133484, -0.0003477931022644043, -0.0003224685788154602, -0.0002971440553665161, -0.000271819531917572, -0.00024649500846862793, -0.00022117048501968384, -0.00019584596157073975, -0.00017052143812179565, -0.00014519691467285156, -0.00011987239122390747, -9.454786777496338e-05, -6.922334432601929e-05, -4.3898820877075195e-05, -1.8574297428131104e-05, 6.750226020812988e-06, 3.207474946975708e-05, 5.739927291870117e-05, 8.272379636764526e-05, 0.00010804831981658936, 0.00013337284326553345, 0.00015869736671447754, 0.00018402189016342163, 0.00020934641361236572, 0.00023467093706130981, 0.0002599954605102539, 0.000285319983959198, 0.0003106445074081421, 0.0003359690308570862, 0.0003612935543060303, 0.00038661807775497437, 0.00041194260120391846, 0.00043726712465286255, 0.00046259164810180664, 0.00048791617155075073, 0.0005132406949996948, 0.0005385652184486389, 0.000563889741897583, 0.0005892142653465271, 0.0006145387887954712, 0.0006398633122444153, 0.0006651878356933594]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 2.0, 5.0, 8.0, 3.0, 13.0, 21.0, 34.0, 41.0, 61.0, 90.0, 128.0, 234.0, 379.0, 712.0, 1329.0, 2733.0, 5706.0, 12249.0, 29191.0, 76744.0, 252866.0, 430803.0, 148630.0, 49618.0, 19912.0, 8604.0, 4043.0, 1957.0, 1050.0, 535.0, 309.0, 195.0, 96.0, 61.0, 46.0, 30.0, 33.0, 20.0, 19.0, 12.0, 4.0, 8.0, 4.0, 7.0, 1.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0023403167724609375, -0.0022545456886291504, -0.0021687746047973633, -0.002083003520965576, -0.001997232437133789, -0.001911461353302002, -0.0018256902694702148, -0.0017399191856384277, -0.0016541481018066406, -0.0015683770179748535, -0.0014826059341430664, -0.0013968348503112793, -0.0013110637664794922, -0.001225292682647705, -0.001139521598815918, -0.0010537505149841309, -0.0009679794311523438, -0.0008822083473205566, -0.0007964372634887695, -0.0007106661796569824, -0.0006248950958251953, -0.0005391240119934082, -0.0004533529281616211, -0.000367581844329834, -0.0002818107604980469, -0.00019603967666625977, -0.00011026859283447266, -2.4497509002685547e-05, 6.127357482910156e-05, 0.00014704465866088867, 0.00023281574249267578, 0.0003185868263244629, 0.00040435791015625, 0.0004901289939880371, 0.0005759000778198242, 0.0006616711616516113, 0.0007474422454833984, 0.0008332133293151855, 0.0009189844131469727, 0.0010047554969787598, 0.0010905265808105469, 0.001176297664642334, 0.001262068748474121, 0.0013478398323059082, 0.0014336109161376953, 0.0015193819999694824, 0.0016051530838012695, 0.0016909241676330566, 0.0017766952514648438, 0.0018624663352966309, 0.001948237419128418, 0.002034008502960205, 0.002119779586791992, 0.0022055506706237793, 0.0022913217544555664, 0.0023770928382873535, 0.0024628639221191406, 0.0025486350059509277, 0.002634406089782715, 0.002720177173614502, 0.002805948257446289, 0.002891719341278076, 0.0029774904251098633, 0.0030632615089416504, 0.0031490325927734375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 4.0, 6.0, 7.0, 11.0, 9.0, 14.0, 14.0, 16.0, 19.0, 19.0, 21.0, 37.0, 46.0, 36.0, 42.0, 40.0, 42.0, 45.0, 47.0, 46.0, 43.0, 50.0, 41.0, 50.0, 40.0, 38.0, 33.0, 29.0, 20.0, 25.0, 22.0, 23.0, 12.0, 14.0, 12.0, 8.0, 5.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0006413459777832031, -0.0006240308284759521, -0.0006067156791687012, -0.0005894005298614502, -0.0005720853805541992, -0.0005547702312469482, -0.0005374550819396973, -0.0005201399326324463, -0.0005028247833251953, -0.00048550963401794434, -0.00046819448471069336, -0.0004508793354034424, -0.0004335641860961914, -0.00041624903678894043, -0.00039893388748168945, -0.0003816187381744385, -0.0003643035888671875, -0.0003469884395599365, -0.00032967329025268555, -0.00031235814094543457, -0.0002950429916381836, -0.0002777278423309326, -0.00026041269302368164, -0.00024309754371643066, -0.0002257823944091797, -0.0002084672451019287, -0.00019115209579467773, -0.00017383694648742676, -0.00015652179718017578, -0.0001392066478729248, -0.00012189149856567383, -0.00010457634925842285, -8.726119995117188e-05, -6.99460506439209e-05, -5.263090133666992e-05, -3.5315752029418945e-05, -1.800060272216797e-05, -6.854534149169922e-07, 1.6629695892333984e-05, 3.394484519958496e-05, 5.125999450683594e-05, 6.857514381408691e-05, 8.589029312133789e-05, 0.00010320544242858887, 0.00012052059173583984, 0.00013783574104309082, 0.0001551508903503418, 0.00017246603965759277, 0.00018978118896484375, 0.00020709633827209473, 0.0002244114875793457, 0.00024172663688659668, 0.00025904178619384766, 0.00027635693550109863, 0.0002936720848083496, 0.0003109872341156006, 0.00032830238342285156, 0.00034561753273010254, 0.0003629326820373535, 0.0003802478313446045, 0.00039756298065185547, 0.00041487812995910645, 0.0004321932792663574, 0.0004495084285736084, 0.0004668235778808594]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 8.0, 4.0, 8.0, 10.0, 20.0, 12.0, 15.0, 18.0, 23.0, 31.0, 44.0, 71.0, 105.0, 167.0, 318.0, 438.0, 729.0, 1345.0, 2556.0, 5915.0, 16044.0, 58367.0, 565628.0, 327931.0, 45423.0, 12948.0, 5060.0, 2370.0, 1175.0, 641.0, 363.0, 208.0, 159.0, 101.0, 76.0, 76.0, 44.0, 37.0, 20.0, 13.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.594989776611328e-05, -8.316896855831146e-05, -8.038803935050964e-05, -7.760711014270782e-05, -7.4826180934906e-05, -7.204525172710419e-05, -6.926432251930237e-05, -6.648339331150055e-05, -6.370246410369873e-05, -6.092153489589691e-05, -5.814060568809509e-05, -5.5359676480293274e-05, -5.2578747272491455e-05, -4.9797818064689636e-05, -4.701688885688782e-05, -4.4235959649086e-05, -4.145503044128418e-05, -3.867410123348236e-05, -3.589317202568054e-05, -3.311224281787872e-05, -3.0331313610076904e-05, -2.7550384402275085e-05, -2.4769455194473267e-05, -2.1988525986671448e-05, -1.920759677886963e-05, -1.642666757106781e-05, -1.3645738363265991e-05, -1.0864809155464172e-05, -8.083879947662354e-06, -5.302950739860535e-06, -2.522021532058716e-06, 2.5890767574310303e-07, 3.039836883544922e-06, 5.820766091346741e-06, 8.60169529914856e-06, 1.1382624506950378e-05, 1.4163553714752197e-05, 1.6944482922554016e-05, 1.9725412130355835e-05, 2.2506341338157654e-05, 2.5287270545959473e-05, 2.806819975376129e-05, 3.084912896156311e-05, 3.363005816936493e-05, 3.641098737716675e-05, 3.919191658496857e-05, 4.1972845792770386e-05, 4.4753775000572205e-05, 4.7534704208374023e-05, 5.031563341617584e-05, 5.309656262397766e-05, 5.587749183177948e-05, 5.86584210395813e-05, 6.143935024738312e-05, 6.422027945518494e-05, 6.700120866298676e-05, 6.978213787078857e-05, 7.256306707859039e-05, 7.534399628639221e-05, 7.812492549419403e-05, 8.090585470199585e-05, 8.368678390979767e-05, 8.646771311759949e-05, 8.92486423254013e-05, 9.202957153320312e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 9.0, 21.0, 32.0, 51.0, 67.0, 177.0, 164.0, 188.0, 127.0, 45.0, 46.0, 21.0, 18.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.635883331298828e-06, -3.482215106487274e-06, -3.3285468816757202e-06, -3.1748786568641663e-06, -3.0212104320526123e-06, -2.8675422072410583e-06, -2.7138739824295044e-06, -2.5602057576179504e-06, -2.4065375328063965e-06, -2.2528693079948425e-06, -2.0992010831832886e-06, -1.9455328583717346e-06, -1.7918646335601807e-06, -1.6381964087486267e-06, -1.4845281839370728e-06, -1.3308599591255188e-06, -1.1771917343139648e-06, -1.0235235095024109e-06, -8.698552846908569e-07, -7.16187059879303e-07, -5.62518835067749e-07, -4.0885061025619507e-07, -2.551823854446411e-07, -1.0151416063308716e-07, 5.21540641784668e-08, 2.0582228899002075e-07, 3.594905138015747e-07, 5.131587386131287e-07, 6.668269634246826e-07, 8.204951882362366e-07, 9.741634130477905e-07, 1.1278316378593445e-06, 1.2814998626708984e-06, 1.4351680874824524e-06, 1.5888363122940063e-06, 1.7425045371055603e-06, 1.8961727619171143e-06, 2.0498409867286682e-06, 2.203509211540222e-06, 2.357177436351776e-06, 2.51084566116333e-06, 2.664513885974884e-06, 2.818182110786438e-06, 2.971850335597992e-06, 3.125518560409546e-06, 3.2791867852211e-06, 3.432855010032654e-06, 3.5865232348442078e-06, 3.7401914596557617e-06, 3.893859684467316e-06, 4.04752790927887e-06, 4.201196134090424e-06, 4.3548643589019775e-06, 4.5085325837135315e-06, 4.6622008085250854e-06, 4.815869033336639e-06, 4.969537258148193e-06, 5.123205482959747e-06, 5.276873707771301e-06, 5.430541932582855e-06, 5.584210157394409e-06, 5.737878382205963e-06, 5.891546607017517e-06, 6.045214831829071e-06, 6.198883056640625e-06]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 4.0, 5.0, 7.0, 16.0, 22.0, 35.0, 52.0, 55.0, 86.0, 121.0, 236.0, 454.0, 740.0, 1287.0, 2675.0, 5458.0, 11838.0, 31494.0, 90037.0, 397685.0, 369863.0, 84251.0, 30000.0, 11397.0, 5130.0, 2543.0, 1338.0, 696.0, 363.0, 220.0, 153.0, 109.0, 63.0, 45.0, 25.0, 16.0, 10.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-3.999471664428711e-05, -3.88510525226593e-05, -3.7707388401031494e-05, -3.6563724279403687e-05, -3.542006015777588e-05, -3.427639603614807e-05, -3.3132731914520264e-05, -3.1989067792892456e-05, -3.084540367126465e-05, -2.970173954963684e-05, -2.8558075428009033e-05, -2.7414411306381226e-05, -2.6270747184753418e-05, -2.512708306312561e-05, -2.3983418941497803e-05, -2.2839754819869995e-05, -2.1696090698242188e-05, -2.055242657661438e-05, -1.9408762454986572e-05, -1.8265098333358765e-05, -1.7121434211730957e-05, -1.597777009010315e-05, -1.4834105968475342e-05, -1.3690441846847534e-05, -1.2546777725219727e-05, -1.1403113603591919e-05, -1.0259449481964111e-05, -9.115785360336304e-06, -7.972121238708496e-06, -6.8284571170806885e-06, -5.684792995452881e-06, -4.541128873825073e-06, -3.3974647521972656e-06, -2.253800630569458e-06, -1.1101365089416504e-06, 3.3527612686157227e-08, 1.1771917343139648e-06, 2.3208558559417725e-06, 3.46451997756958e-06, 4.608184099197388e-06, 5.751848220825195e-06, 6.895512342453003e-06, 8.03917646408081e-06, 9.182840585708618e-06, 1.0326504707336426e-05, 1.1470168828964233e-05, 1.2613832950592041e-05, 1.3757497072219849e-05, 1.4901161193847656e-05, 1.6044825315475464e-05, 1.718848943710327e-05, 1.833215355873108e-05, 1.9475817680358887e-05, 2.0619481801986694e-05, 2.1763145923614502e-05, 2.290681004524231e-05, 2.4050474166870117e-05, 2.5194138288497925e-05, 2.6337802410125732e-05, 2.748146653175354e-05, 2.8625130653381348e-05, 2.9768794775009155e-05, 3.091245889663696e-05, 3.205612301826477e-05, 3.319978713989258e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 6.0, 12.0, 11.0, 21.0, 20.0, 21.0, 17.0, 27.0, 27.0, 46.0, 43.0, 51.0, 70.0, 69.0, 63.0, 55.0, 61.0, 73.0, 49.0, 45.0, 38.0, 37.0, 27.0, 14.0, 16.0, 9.0, 20.0, 4.0, 13.0, 9.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.450580596923828e-06, -7.199123501777649e-06, -6.94766640663147e-06, -6.6962093114852905e-06, -6.444752216339111e-06, -6.193295121192932e-06, -5.941838026046753e-06, -5.690380930900574e-06, -5.4389238357543945e-06, -5.187466740608215e-06, -4.936009645462036e-06, -4.684552550315857e-06, -4.433095455169678e-06, -4.1816383600234985e-06, -3.930181264877319e-06, -3.67872416973114e-06, -3.427267074584961e-06, -3.1758099794387817e-06, -2.9243528842926025e-06, -2.6728957891464233e-06, -2.421438694000244e-06, -2.169981598854065e-06, -1.9185245037078857e-06, -1.6670674085617065e-06, -1.4156103134155273e-06, -1.1641532182693481e-06, -9.126961231231689e-07, -6.612390279769897e-07, -4.0978193283081055e-07, -1.5832483768463135e-07, 9.313225746154785e-08, 3.4458935260772705e-07, 5.960464477539062e-07, 8.475035429000854e-07, 1.0989606380462646e-06, 1.3504177331924438e-06, 1.601874828338623e-06, 1.8533319234848022e-06, 2.1047890186309814e-06, 2.3562461137771606e-06, 2.60770320892334e-06, 2.859160304069519e-06, 3.1106173992156982e-06, 3.3620744943618774e-06, 3.6135315895080566e-06, 3.864988684654236e-06, 4.116445779800415e-06, 4.367902874946594e-06, 4.6193599700927734e-06, 4.870817065238953e-06, 5.122274160385132e-06, 5.373731255531311e-06, 5.62518835067749e-06, 5.8766454458236694e-06, 6.128102540969849e-06, 6.379559636116028e-06, 6.631016731262207e-06, 6.882473826408386e-06, 7.1339309215545654e-06, 7.385388016700745e-06, 7.636845111846924e-06, 7.888302206993103e-06, 8.139759302139282e-06, 8.391216397285461e-06, 8.64267349243164e-06]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 6.0, 3.0, 3.0, 7.0, 13.0, 14.0, 18.0, 27.0, 26.0, 37.0, 52.0, 91.0, 119.0, 140.0, 129.0, 88.0, 66.0, 36.0, 31.0, 26.0, 13.0, 18.0, 12.0, 10.0, 3.0, 4.0, 2.0, 3.0, 0.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013049495173618197, -0.0012673933524638414, -0.001229837303981185, -0.0011922811390832067, -0.0011547249741852283, -0.00111716880928725, -0.0010796126443892717, -0.0010420565959066153, -0.001004500431008637, -0.0009669442661106586, -0.0009293881594203413, -0.0008918320527300239, -0.0008542758878320456, -0.0008167197229340672, -0.0007791636162437499, -0.0007416075095534325, -0.0007040513446554542, -0.0006664951797574759, -0.0006289390730671585, -0.0005913829663768411, -0.0005538268014788628, -0.0005162706365808845, -0.00047871452989056706, -0.0004411583940964192, -0.00040360225830227137, -0.0003660461225081235, -0.00032848998671397567, -0.0002909338509198278, -0.00025337771512567997, -0.00021582157933153212, -0.00017826544353738427, -0.00014070930774323642, -0.00010315317194908857, -6.559703615494072e-05, -2.8040900360792875e-05, 9.515235433354974e-06, 4.707137122750282e-05, 8.462750702165067e-05, 0.00012218364281579852, 0.00015973977860994637, 0.00019729591440409422, 0.00023485205019824207, 0.0002724081859923899, 0.00030996432178653777, 0.0003475204575806856, 0.00038507659337483346, 0.0004226327291689813, 0.00046018886496312916, 0.000497745000757277, 0.0005353011656552553, 0.0005728572723455727, 0.0006104133790358901, 0.0006479695439338684, 0.0006855257088318467, 0.0007230818155221641, 0.0007606379222124815, 0.0007981940871104598, 0.0008357502520084381, 0.0008733063586987555, 0.0009108624653890729, 0.0009484186302870512, 0.0009859747951850295, 0.0010235309600830078, 0.0010610870085656643, 0.0010986431734636426]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 3.0, 8.0, 6.0, 12.0, 10.0, 14.0, 14.0, 18.0, 25.0, 28.0, 32.0, 30.0, 36.0, 33.0, 52.0, 33.0, 67.0, 55.0, 58.0, 55.0, 50.0, 41.0, 38.0, 33.0, 31.0, 35.0, 32.0, 36.0, 25.0, 26.0, 11.0, 11.0, 11.0, 10.0, 8.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008757420000620186, -0.0008501416887156665, -0.0008245413191616535, -0.0007989410078153014, -0.0007733406382612884, -0.0007477403269149363, -0.0007221399573609233, -0.0006965396460145712, -0.0006709393346682191, -0.000645339023321867, -0.000619738653767854, -0.0005941383424215019, -0.0005685379728674889, -0.0005429376615211368, -0.0005173373501747847, -0.0004917369806207716, -0.0004661366401705891, -0.00044053629972040653, -0.000414935959270224, -0.0003893356188200414, -0.0003637353074736893, -0.00033813496702350676, -0.0003125346265733242, -0.0002869343152269721, -0.0002613339456729591, -0.00023573360522277653, -0.0002101332793245092, -0.00018453293887432665, -0.00015893261297605932, -0.00013333227252587676, -0.0001077319320756942, -8.213160617742687e-05, -5.6531280279159546e-05, -3.09309471049346e-05, -5.330610292730853e-06, 2.0269726519472897e-05, 4.587005969369784e-05, 7.147039286792278e-05, 9.707073331810534e-05, 0.00012267105921637267, 0.00014827139966655523, 0.00017387174011673778, 0.0001994720660150051, 0.00022507240646518767, 0.0002506727469153702, 0.0002762730582617223, 0.00030187342781573534, 0.00032747373916208744, 0.00035307407961227, 0.00037867442006245255, 0.0004042747605126351, 0.00042987510096281767, 0.00045547541230916977, 0.0004810757527593523, 0.0005066760932095349, 0.000532276404555887, 0.0005578767741099, 0.0005834770854562521, 0.0006090774550102651, 0.0006346777663566172, 0.0006602781359106302, 0.0006858784472569823, 0.0007114787586033344, 0.0007370791281573474, 0.0007626794395036995]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 0.0, 1.0, 4.0, 5.0, 4.0, 4.0, 4.0, 4.0, 13.0, 8.0, 12.0, 20.0, 25.0, 38.0, 47.0, 61.0, 68.0, 112.0, 178.0, 318.0, 606.0, 1225.0, 2717.0, 7099.0, 25069.0, 3875084.0, 255093.0, 16526.0, 5512.0, 2145.0, 962.0, 520.0, 269.0, 165.0, 88.0, 63.0, 41.0, 31.0, 24.0, 28.0, 21.0, 18.0, 9.0, 4.0, 7.0, 6.0, 8.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0041961669921875, -0.004068434238433838, -0.003940701484680176, -0.0038129687309265137, -0.0036852359771728516, -0.0035575032234191895, -0.0034297704696655273, -0.0033020377159118652, -0.003174304962158203, -0.003046572208404541, -0.002918839454650879, -0.002791106700897217, -0.0026633739471435547, -0.0025356411933898926, -0.0024079084396362305, -0.0022801756858825684, -0.0021524429321289062, -0.002024710178375244, -0.001896977424621582, -0.00176924467086792, -0.0016415119171142578, -0.0015137791633605957, -0.0013860464096069336, -0.0012583136558532715, -0.0011305809020996094, -0.0010028481483459473, -0.0008751153945922852, -0.000747382640838623, -0.0006196498870849609, -0.0004919171333312988, -0.0003641843795776367, -0.0002364516258239746, -0.0001087188720703125, 1.901388168334961e-05, 0.00014674663543701172, 0.00027447938919067383, 0.00040221214294433594, 0.000529944896697998, 0.0006576776504516602, 0.0007854104042053223, 0.0009131431579589844, 0.0010408759117126465, 0.0011686086654663086, 0.0012963414192199707, 0.0014240741729736328, 0.001551806926727295, 0.001679539680480957, 0.0018072724342346191, 0.0019350051879882812, 0.0020627379417419434, 0.0021904706954956055, 0.0023182034492492676, 0.0024459362030029297, 0.002573668956756592, 0.002701401710510254, 0.002829134464263916, 0.002956867218017578, 0.0030845999717712402, 0.0032123327255249023, 0.0033400654792785645, 0.0034677982330322266, 0.0035955309867858887, 0.0037232637405395508, 0.003850996494293213, 0.003978729248046875]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 7.0, 5.0, 4.0, 6.0, 4.0, 15.0, 6.0, 7.0, 18.0, 20.0, 25.0, 22.0, 30.0, 21.0, 29.0, 30.0, 29.0, 40.0, 34.0, 34.0, 38.0, 47.0, 47.0, 40.0, 32.0, 47.0, 28.0, 32.0, 37.0, 26.0, 24.0, 25.0, 26.0, 23.0, 18.0, 20.0, 19.0, 22.0, 14.0, 9.0, 5.0, 11.0, 5.0, 4.0, 10.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0003619194030761719, -0.0003508441150188446, -0.00033976882696151733, -0.00032869353890419006, -0.0003176182508468628, -0.0003065429627895355, -0.00029546767473220825, -0.000284392386674881, -0.0002733170986175537, -0.00026224181056022644, -0.00025116652250289917, -0.0002400912344455719, -0.00022901594638824463, -0.00021794065833091736, -0.0002068653702735901, -0.00019579008221626282, -0.00018471479415893555, -0.00017363950610160828, -0.000162564218044281, -0.00015148892998695374, -0.00014041364192962646, -0.0001293383538722992, -0.00011826306581497192, -0.00010718777775764465, -9.611248970031738e-05, -8.503720164299011e-05, -7.396191358566284e-05, -6.288662552833557e-05, -5.18113374710083e-05, -4.073604941368103e-05, -2.966076135635376e-05, -1.858547329902649e-05, -7.510185241699219e-06, 3.5651028156280518e-06, 1.4640390872955322e-05, 2.5715678930282593e-05, 3.679096698760986e-05, 4.7866255044937134e-05, 5.8941543102264404e-05, 7.001683115959167e-05, 8.109211921691895e-05, 9.216740727424622e-05, 0.00010324269533157349, 0.00011431798338890076, 0.00012539327144622803, 0.0001364685595035553, 0.00014754384756088257, 0.00015861913561820984, 0.0001696944236755371, 0.00018076971173286438, 0.00019184499979019165, 0.00020292028784751892, 0.0002139955759048462, 0.00022507086396217346, 0.00023614615201950073, 0.000247221440076828, 0.0002582967281341553, 0.00026937201619148254, 0.0002804473042488098, 0.0002915225923061371, 0.00030259788036346436, 0.0003136731684207916, 0.0003247484564781189, 0.00033582374453544617, 0.00034689903259277344]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 7.0, 13.0, 15.0, 27.0, 30.0, 39.0, 77.0, 146.0, 308.0, 709.0, 1682.0, 4783.0, 16803.0, 137653.0, 3958485.0, 57095.0, 10646.0, 3431.0, 1259.0, 506.0, 242.0, 133.0, 84.0, 42.0, 18.0, 23.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00432586669921875, -0.004199892282485962, -0.004073917865753174, -0.003947943449020386, -0.0038219690322875977, -0.0036959946155548096, -0.0035700201988220215, -0.0034440457820892334, -0.0033180713653564453, -0.0031920969486236572, -0.003066122531890869, -0.002940148115158081, -0.002814173698425293, -0.002688199281692505, -0.002562224864959717, -0.0024362504482269287, -0.0023102760314941406, -0.0021843016147613525, -0.0020583271980285645, -0.0019323527812957764, -0.0018063783645629883, -0.0016804039478302002, -0.0015544295310974121, -0.001428455114364624, -0.001302480697631836, -0.0011765062808990479, -0.0010505318641662598, -0.0009245574474334717, -0.0007985830307006836, -0.0006726086139678955, -0.0005466341972351074, -0.00042065978050231934, -0.00029468536376953125, -0.00016871094703674316, -4.273653030395508e-05, 8.323788642883301e-05, 0.0002092123031616211, 0.0003351867198944092, 0.00046116113662719727, 0.0005871355533599854, 0.0007131099700927734, 0.0008390843868255615, 0.0009650588035583496, 0.0010910332202911377, 0.0012170076370239258, 0.0013429820537567139, 0.001468956470489502, 0.00159493088722229, 0.0017209053039550781, 0.0018468797206878662, 0.0019728541374206543, 0.0020988285541534424, 0.0022248029708862305, 0.0023507773876190186, 0.0024767518043518066, 0.0026027262210845947, 0.002728700637817383, 0.002854675054550171, 0.002980649471282959, 0.003106623888015747, 0.003232598304748535, 0.0033585727214813232, 0.0034845471382141113, 0.0036105215549468994, 0.0037364959716796875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 2.0, 5.0, 8.0, 9.0, 6.0, 14.0, 20.0, 29.0, 48.0, 62.0, 151.0, 803.0, 2289.0, 367.0, 102.0, 53.0, 31.0, 14.0, 18.0, 11.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000507354736328125, -0.0004887580871582031, -0.00047016143798828125, -0.0004515647888183594, -0.0004329681396484375, -0.0004143714904785156, -0.00039577484130859375, -0.0003771781921386719, -0.00035858154296875, -0.0003399848937988281, -0.00032138824462890625, -0.0003027915954589844, -0.0002841949462890625, -0.0002655982971191406, -0.00024700164794921875, -0.00022840499877929688, -0.000209808349609375, -0.00019121170043945312, -0.00017261505126953125, -0.00015401840209960938, -0.0001354217529296875, -0.00011682510375976562, -9.822845458984375e-05, -7.963180541992188e-05, -6.103515625e-05, -4.2438507080078125e-05, -2.384185791015625e-05, -5.245208740234375e-06, 1.33514404296875e-05, 3.1948089599609375e-05, 5.054473876953125e-05, 6.914138793945312e-05, 8.7738037109375e-05, 0.00010633468627929688, 0.00012493133544921875, 0.00014352798461914062, 0.0001621246337890625, 0.00018072128295898438, 0.00019931793212890625, 0.00021791458129882812, 0.00023651123046875, 0.0002551078796386719, 0.00027370452880859375, 0.0002923011779785156, 0.0003108978271484375, 0.0003294944763183594, 0.00034809112548828125, 0.0003666877746582031, 0.000385284423828125, 0.0004038810729980469, 0.00042247772216796875, 0.0004410743713378906, 0.0004596710205078125, 0.0004782676696777344, 0.0004968643188476562, 0.0005154609680175781, 0.0005340576171875, 0.0005526542663574219, 0.0005712509155273438, 0.0005898475646972656, 0.0006084442138671875, 0.0006270408630371094, 0.0006456375122070312, 0.0006642341613769531, 0.000682830810546875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 7.0, 10.0, 12.0, 17.0, 19.0, 22.0, 29.0, 44.0, 48.0, 82.0, 108.0, 111.0, 134.0, 85.0, 74.0, 59.0, 27.0, 27.0, 23.0, 12.0, 12.0, 8.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008328738622367382, -0.0008082307176664472, -0.000783587631303817, -0.0007589445449411869, -0.0007343014003708959, -0.0007096582558006048, -0.0006850151694379747, -0.0006603720830753446, -0.0006357289385050535, -0.0006110857939347625, -0.0005864427075721323, -0.0005617996212095022, -0.0005371564766392112, -0.0005125133320689201, -0.00048787024570629, -0.0004632271302398294, -0.00043858401477336884, -0.00041394089930690825, -0.00038929778384044766, -0.0003646546683739871, -0.0003400115529075265, -0.0003153684374410659, -0.0002907253219746053, -0.00026608220650814474, -0.00024143909104168415, -0.00021679597557522357, -0.00019215286010876298, -0.0001675097446423024, -0.0001428666291758418, -0.00011822351370938122, -9.358039824292064e-05, -6.893728277646005e-05, -4.429422551766038e-05, -1.9651110051199794e-05, 4.992005415260792e-06, 2.9635120881721377e-05, 5.427823634818196e-05, 7.892135181464255e-05, 0.00010356446728110313, 0.00012820758274756372, 0.0001528506982140243, 0.0001774938136804849, 0.00020213692914694548, 0.00022678004461340606, 0.00025142316007986665, 0.00027606627554632723, 0.0003007093910127878, 0.0003253525064792484, 0.000349995621945709, 0.0003746387374121696, 0.00039928185287863016, 0.00042392496834509075, 0.00044856808381155133, 0.0004732111992780119, 0.0004978543147444725, 0.0005224974593147635, 0.0005471405456773937, 0.0005717836320400238, 0.0005964267766103148, 0.0006210699211806059, 0.000645713007543236, 0.0006703560939058661, 0.0006949992384761572, 0.0007196423830464482, 0.0007442854694090784]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 10.0, 4.0, 3.0, 5.0, 7.0, 6.0, 14.0, 8.0, 13.0, 18.0, 20.0, 25.0, 29.0, 33.0, 26.0, 35.0, 32.0, 46.0, 37.0, 45.0, 33.0, 32.0, 45.0, 29.0, 36.0, 40.0, 43.0, 35.0, 24.0, 33.0, 32.0, 20.0, 31.0, 27.0, 15.0, 18.0, 22.0, 14.0, 15.0, 8.0, 8.0, 7.0, 10.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00046326310257427394, -0.0004498352063819766, -0.0004364072810858488, -0.00042297938489355147, -0.00040955145959742367, -0.00039612356340512633, -0.00038269563810899854, -0.0003692677419167012, -0.00035583984572440386, -0.0003424119495321065, -0.0003289840242359787, -0.0003155561280436814, -0.0003021282027475536, -0.00028870030655525625, -0.0002752724103629589, -0.0002618444850668311, -0.0002484165597707033, -0.00023498864902649075, -0.00022156073828227818, -0.00020813284208998084, -0.00019470493134576827, -0.0001812770206015557, -0.00016784910985734314, -0.00015442119911313057, -0.00014099330292083323, -0.00012756539217662066, -0.00011413748870836571, -0.00010070957796415314, -8.728167449589819e-05, -7.385376375168562e-05, -6.042585300747305e-05, -4.69979495392181e-05, -3.3570046070963144e-05, -2.0142138964729384e-05, -6.714230039506219e-06, 6.713678885716945e-06, 2.0141585991950706e-05, 3.3569493098184466e-05, 4.6997403842397034e-05, 6.042530731065199e-05, 7.385321805486456e-05, 8.728112879907712e-05, 0.00010070903226733208, 0.00011413694301154464, 0.0001275648537557572, 0.00014099274994805455, 0.00015442067524418235, 0.0001678485714364797, 0.00018127648218069226, 0.00019470439292490482, 0.0002081323036691174, 0.00022156021441332996, 0.0002349881106056273, 0.0002484160359017551, 0.00026184393209405243, 0.0002752718282863498, 0.00028869975358247757, 0.0003021276497747749, 0.0003155555750709027, 0.00032898347126320004, 0.00034241139655932784, 0.0003558392927516252, 0.0003692671889439225, 0.0003826951142400503, 0.00039612301043234766]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 10.0, 12.0, 19.0, 24.0, 41.0, 56.0, 83.0, 121.0, 154.0, 229.0, 380.0, 496.0, 739.0, 1186.0, 1871.0, 2723.0, 4317.0, 6659.0, 10590.0, 16304.0, 25679.0, 41185.0, 66749.0, 109349.0, 175303.0, 207363.0, 144159.0, 87307.0, 53925.0, 33074.0, 20545.0, 13090.0, 8743.0, 5463.0, 3567.0, 2353.0, 1524.0, 1013.0, 702.0, 457.0, 324.0, 206.0, 135.0, 90.0, 72.0, 42.0, 34.0, 32.0, 18.0, 10.0, 4.0, 10.0, 3.0, 5.0, 1.0, 2.0], "bins": [-0.00035452842712402344, -0.00034387409687042236, -0.0003332197666168213, -0.0003225654363632202, -0.00031191110610961914, -0.00030125677585601807, -0.000290602445602417, -0.0002799481153488159, -0.00026929378509521484, -0.00025863945484161377, -0.0002479851245880127, -0.00023733079433441162, -0.00022667646408081055, -0.00021602213382720947, -0.0002053678035736084, -0.00019471347332000732, -0.00018405914306640625, -0.00017340481281280518, -0.0001627504825592041, -0.00015209615230560303, -0.00014144182205200195, -0.00013078749179840088, -0.0001201331615447998, -0.00010947883129119873, -9.882450103759766e-05, -8.817017078399658e-05, -7.751584053039551e-05, -6.686151027679443e-05, -5.620718002319336e-05, -4.5552849769592285e-05, -3.489851951599121e-05, -2.4244189262390137e-05, -1.3589859008789062e-05, -2.9355287551879883e-06, 7.718801498413086e-06, 1.837313175201416e-05, 2.9027462005615234e-05, 3.968179225921631e-05, 5.033612251281738e-05, 6.099045276641846e-05, 7.164478302001953e-05, 8.22991132736206e-05, 9.295344352722168e-05, 0.00010360777378082275, 0.00011426210403442383, 0.0001249164342880249, 0.00013557076454162598, 0.00014622509479522705, 0.00015687942504882812, 0.0001675337553024292, 0.00017818808555603027, 0.00018884241580963135, 0.00019949674606323242, 0.0002101510763168335, 0.00022080540657043457, 0.00023145973682403564, 0.00024211406707763672, 0.0002527683973312378, 0.00026342272758483887, 0.00027407705783843994, 0.000284731388092041, 0.0002953857183456421, 0.00030604004859924316, 0.00031669437885284424, 0.0003273487091064453]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 6.0, 12.0, 7.0, 18.0, 11.0, 10.0, 16.0, 19.0, 20.0, 33.0, 21.0, 24.0, 43.0, 36.0, 38.0, 32.0, 45.0, 32.0, 36.0, 30.0, 43.0, 32.0, 34.0, 38.0, 32.0, 34.0, 32.0, 24.0, 31.0, 26.0, 26.0, 24.0, 22.0, 13.0, 19.0, 12.0, 9.0, 9.0, 7.0, 8.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.00046062469482421875, -0.0004469528794288635, -0.0004332810640335083, -0.0004196092486381531, -0.00040593743324279785, -0.0003922656178474426, -0.0003785938024520874, -0.0003649219870567322, -0.00035125017166137695, -0.00033757835626602173, -0.0003239065408706665, -0.0003102347254753113, -0.00029656291007995605, -0.00028289109468460083, -0.0002692192792892456, -0.0002555474638938904, -0.00024187564849853516, -0.00022820383310317993, -0.0002145320177078247, -0.00020086020231246948, -0.00018718838691711426, -0.00017351657152175903, -0.0001598447561264038, -0.00014617294073104858, -0.00013250112533569336, -0.00011882930994033813, -0.00010515749454498291, -9.148567914962769e-05, -7.781386375427246e-05, -6.414204835891724e-05, -5.047023296356201e-05, -3.679841756820679e-05, -2.3126602172851562e-05, -9.454786777496338e-06, 4.217028617858887e-06, 1.788884401321411e-05, 3.1560659408569336e-05, 4.523247480392456e-05, 5.8904290199279785e-05, 7.257610559463501e-05, 8.624792098999023e-05, 9.991973638534546e-05, 0.00011359155178070068, 0.0001272633671760559, 0.00014093518257141113, 0.00015460699796676636, 0.00016827881336212158, 0.0001819506287574768, 0.00019562244415283203, 0.00020929425954818726, 0.00022296607494354248, 0.0002366378903388977, 0.00025030970573425293, 0.00026398152112960815, 0.0002776533365249634, 0.0002913251519203186, 0.00030499696731567383, 0.00031866878271102905, 0.0003323405981063843, 0.0003460124135017395, 0.0003596842288970947, 0.00037335604429244995, 0.0003870278596878052, 0.0004006996750831604, 0.0004143714904785156]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 11.0, 11.0, 16.0, 21.0, 18.0, 24.0, 44.0, 59.0, 75.0, 122.0, 146.0, 220.0, 367.0, 517.0, 813.0, 1168.0, 1865.0, 2924.0, 4683.0, 7879.0, 14048.0, 26513.0, 54671.0, 130514.0, 395004.0, 235918.0, 84910.0, 38497.0, 20035.0, 10743.0, 6213.0, 3753.0, 2312.0, 1495.0, 968.0, 640.0, 398.0, 316.0, 210.0, 117.0, 88.0, 55.0, 49.0, 39.0, 19.0, 17.0, 12.0, 4.0, 7.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.0005035400390625, -0.000488627701997757, -0.0004737153649330139, -0.0004588030278682709, -0.00044389069080352783, -0.0004289783537387848, -0.00041406601667404175, -0.0003991536796092987, -0.00038424134254455566, -0.0003693290054798126, -0.0003544166684150696, -0.00033950433135032654, -0.0003245919942855835, -0.00030967965722084045, -0.0002947673201560974, -0.00027985498309135437, -0.00026494264602661133, -0.0002500303089618683, -0.00023511797189712524, -0.0002202056348323822, -0.00020529329776763916, -0.00019038096070289612, -0.00017546862363815308, -0.00016055628657341003, -0.000145643949508667, -0.00013073161244392395, -0.00011581927537918091, -0.00010090693831443787, -8.599460124969482e-05, -7.108226418495178e-05, -5.616992712020874e-05, -4.12575900554657e-05, -2.6345252990722656e-05, -1.1432915925979614e-05, 3.4794211387634277e-06, 1.839175820350647e-05, 3.330409526824951e-05, 4.8216432332992554e-05, 6.31287693977356e-05, 7.804110646247864e-05, 9.295344352722168e-05, 0.00010786578059196472, 0.00012277811765670776, 0.0001376904547214508, 0.00015260279178619385, 0.0001675151288509369, 0.00018242746591567993, 0.00019733980298042297, 0.00021225214004516602, 0.00022716447710990906, 0.0002420768141746521, 0.00025698915123939514, 0.0002719014883041382, 0.0002868138253688812, 0.00030172616243362427, 0.0003166384994983673, 0.00033155083656311035, 0.0003464631736278534, 0.00036137551069259644, 0.0003762878477573395, 0.0003912001848220825, 0.00040611252188682556, 0.0004210248589515686, 0.00043593719601631165, 0.0004508495330810547]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 6.0, 2.0, 6.0, 11.0, 12.0, 10.0, 14.0, 10.0, 20.0, 20.0, 20.0, 31.0, 25.0, 24.0, 35.0, 24.0, 31.0, 32.0, 36.0, 39.0, 41.0, 41.0, 44.0, 47.0, 28.0, 36.0, 34.0, 31.0, 23.0, 26.0, 28.0, 31.0, 28.0, 22.0, 22.0, 27.0, 20.0, 15.0, 13.0, 6.0, 8.0, 4.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0002880096435546875, -0.00027915462851524353, -0.00027029961347579956, -0.0002614445984363556, -0.0002525895833969116, -0.00024373456835746765, -0.00023487955331802368, -0.0002260245382785797, -0.00021716952323913574, -0.00020831450819969177, -0.0001994594931602478, -0.00019060447812080383, -0.00018174946308135986, -0.0001728944480419159, -0.00016403943300247192, -0.00015518441796302795, -0.00014632940292358398, -0.00013747438788414001, -0.00012861937284469604, -0.00011976435780525208, -0.0001109093427658081, -0.00010205432772636414, -9.319931268692017e-05, -8.43442976474762e-05, -7.548928260803223e-05, -6.663426756858826e-05, -5.777925252914429e-05, -4.892423748970032e-05, -4.006922245025635e-05, -3.121420741081238e-05, -2.2359192371368408e-05, -1.3504177331924438e-05, -4.649162292480469e-06, 4.205852746963501e-06, 1.306086778640747e-05, 2.191588282585144e-05, 3.077089786529541e-05, 3.962591290473938e-05, 4.848092794418335e-05, 5.733594298362732e-05, 6.619095802307129e-05, 7.504597306251526e-05, 8.390098810195923e-05, 9.27560031414032e-05, 0.00010161101818084717, 0.00011046603322029114, 0.00011932104825973511, 0.00012817606329917908, 0.00013703107833862305, 0.00014588609337806702, 0.00015474110841751099, 0.00016359612345695496, 0.00017245113849639893, 0.0001813061535358429, 0.00019016116857528687, 0.00019901618361473083, 0.0002078711986541748, 0.00021672621369361877, 0.00022558122873306274, 0.00023443624377250671, 0.00024329125881195068, 0.00025214627385139465, 0.0002610012888908386, 0.0002698563039302826, 0.00027871131896972656]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 5.0, 21.0, 18.0, 18.0, 41.0, 52.0, 63.0, 110.0, 170.0, 254.0, 399.0, 671.0, 1315.0, 2418.0, 5176.0, 13040.0, 43772.0, 640888.0, 285857.0, 33896.0, 10927.0, 4443.0, 2097.0, 1115.0, 661.0, 405.0, 227.0, 148.0, 111.0, 75.0, 38.0, 33.0, 19.0, 20.0, 15.0, 6.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.26716423034668e-05, -7.990747690200806e-05, -7.714331150054932e-05, -7.437914609909058e-05, -7.161498069763184e-05, -6.88508152961731e-05, -6.608664989471436e-05, -6.332248449325562e-05, -6.0558319091796875e-05, -5.7794153690338135e-05, -5.5029988288879395e-05, -5.2265822887420654e-05, -4.9501657485961914e-05, -4.6737492084503174e-05, -4.3973326683044434e-05, -4.120916128158569e-05, -3.844499588012695e-05, -3.568083047866821e-05, -3.291666507720947e-05, -3.0152499675750732e-05, -2.7388334274291992e-05, -2.4624168872833252e-05, -2.1860003471374512e-05, -1.909583806991577e-05, -1.633167266845703e-05, -1.3567507266998291e-05, -1.080334186553955e-05, -8.03917646408081e-06, -5.27501106262207e-06, -2.51084566116333e-06, 2.5331974029541016e-07, 3.0174851417541504e-06, 5.781650543212891e-06, 8.545815944671631e-06, 1.1309981346130371e-05, 1.4074146747589111e-05, 1.683831214904785e-05, 1.9602477550506592e-05, 2.2366642951965332e-05, 2.5130808353424072e-05, 2.7894973754882812e-05, 3.065913915634155e-05, 3.342330455780029e-05, 3.618746995925903e-05, 3.8951635360717773e-05, 4.1715800762176514e-05, 4.4479966163635254e-05, 4.7244131565093994e-05, 5.0008296966552734e-05, 5.2772462368011475e-05, 5.5536627769470215e-05, 5.8300793170928955e-05, 6.10649585723877e-05, 6.382912397384644e-05, 6.659328937530518e-05, 6.935745477676392e-05, 7.212162017822266e-05, 7.48857855796814e-05, 7.764995098114014e-05, 8.041411638259888e-05, 8.317828178405762e-05, 8.594244718551636e-05, 8.87066125869751e-05, 9.147077798843384e-05, 9.423494338989258e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 3.0, 3.0, 7.0, 2.0, 7.0, 5.0, 14.0, 5.0, 11.0, 14.0, 16.0, 25.0, 10.0, 47.0, 30.0, 61.0, 41.0, 38.0, 73.0, 51.0, 85.0, 48.0, 103.0, 28.0, 63.0, 22.0, 19.0, 49.0, 18.0, 24.0, 12.0, 15.0, 7.0, 7.0, 9.0, 2.0, 7.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.9206275939941406e-06, -2.8349459171295166e-06, -2.7492642402648926e-06, -2.6635825634002686e-06, -2.5779008865356445e-06, -2.4922192096710205e-06, -2.4065375328063965e-06, -2.3208558559417725e-06, -2.2351741790771484e-06, -2.1494925022125244e-06, -2.0638108253479004e-06, -1.9781291484832764e-06, -1.8924474716186523e-06, -1.8067657947540283e-06, -1.7210841178894043e-06, -1.6354024410247803e-06, -1.5497207641601562e-06, -1.4640390872955322e-06, -1.3783574104309082e-06, -1.2926757335662842e-06, -1.2069940567016602e-06, -1.1213123798370361e-06, -1.0356307029724121e-06, -9.499490261077881e-07, -8.642673492431641e-07, -7.7858567237854e-07, -6.92903995513916e-07, -6.07222318649292e-07, -5.21540641784668e-07, -4.3585896492004395e-07, -3.501772880554199e-07, -2.644956111907959e-07, -1.7881393432617188e-07, -9.313225746154785e-08, -7.450580596923828e-09, 7.82310962677002e-08, 1.6391277313232422e-07, 2.4959444999694824e-07, 3.3527612686157227e-07, 4.209578037261963e-07, 5.066394805908203e-07, 5.923211574554443e-07, 6.780028343200684e-07, 7.636845111846924e-07, 8.493661880493164e-07, 9.350478649139404e-07, 1.0207295417785645e-06, 1.1064112186431885e-06, 1.1920928955078125e-06, 1.2777745723724365e-06, 1.3634562492370605e-06, 1.4491379261016846e-06, 1.5348196029663086e-06, 1.6205012798309326e-06, 1.7061829566955566e-06, 1.7918646335601807e-06, 1.8775463104248047e-06, 1.9632279872894287e-06, 2.0489096641540527e-06, 2.1345913410186768e-06, 2.2202730178833008e-06, 2.305954694747925e-06, 2.391636371612549e-06, 2.477318048477173e-06, 2.562999725341797e-06]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 8.0, 13.0, 16.0, 38.0, 41.0, 74.0, 120.0, 240.0, 376.0, 725.0, 1775.0, 4547.0, 15575.0, 76621.0, 782749.0, 133343.0, 21989.0, 6172.0, 2152.0, 904.0, 481.0, 270.0, 134.0, 64.0, 41.0, 23.0, 22.0, 13.0, 8.0, 7.0, 3.0, 8.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001175999641418457, -0.00011376012116670609, -0.00010992027819156647, -0.00010608043521642685, -0.00010224059224128723, -9.840074926614761e-05, -9.4560906291008e-05, -9.072106331586838e-05, -8.688122034072876e-05, -8.304137736558914e-05, -7.920153439044952e-05, -7.53616914153099e-05, -7.152184844017029e-05, -6.768200546503067e-05, -6.384216248989105e-05, -6.0002319514751434e-05, -5.6162476539611816e-05, -5.23226335644722e-05, -4.848279058933258e-05, -4.464294761419296e-05, -4.0803104639053345e-05, -3.696326166391373e-05, -3.312341868877411e-05, -2.928357571363449e-05, -2.5443732738494873e-05, -2.1603889763355255e-05, -1.7764046788215637e-05, -1.392420381307602e-05, -1.0084360837936401e-05, -6.2445178627967834e-06, -2.4046748876571655e-06, 1.4351680874824524e-06, 5.27501106262207e-06, 9.114854037761688e-06, 1.2954697012901306e-05, 1.6794539988040924e-05, 2.0634382963180542e-05, 2.447422593832016e-05, 2.8314068913459778e-05, 3.2153911888599396e-05, 3.5993754863739014e-05, 3.983359783887863e-05, 4.367344081401825e-05, 4.751328378915787e-05, 5.1353126764297485e-05, 5.51929697394371e-05, 5.903281271457672e-05, 6.287265568971634e-05, 6.671249866485596e-05, 7.055234163999557e-05, 7.439218461513519e-05, 7.823202759027481e-05, 8.207187056541443e-05, 8.591171354055405e-05, 8.975155651569366e-05, 9.359139949083328e-05, 9.74312424659729e-05, 0.00010127108544111252, 0.00010511092841625214, 0.00010895077139139175, 0.00011279061436653137, 0.00011663045734167099, 0.00012047030031681061, 0.00012431014329195023, 0.00012814998626708984]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 9.0, 13.0, 21.0, 20.0, 32.0, 37.0, 45.0, 80.0, 104.0, 121.0, 116.0, 105.0, 77.0, 54.0, 33.0, 27.0, 19.0, 17.0, 12.0, 11.0, 9.0, 8.0, 4.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9669532775878906e-05, -1.9091181457042694e-05, -1.8512830138206482e-05, -1.793447881937027e-05, -1.7356127500534058e-05, -1.6777776181697845e-05, -1.6199424862861633e-05, -1.562107354402542e-05, -1.5042722225189209e-05, -1.4464370906352997e-05, -1.3886019587516785e-05, -1.3307668268680573e-05, -1.272931694984436e-05, -1.2150965631008148e-05, -1.1572614312171936e-05, -1.0994262993335724e-05, -1.0415911674499512e-05, -9.8375603556633e-06, -9.259209036827087e-06, -8.680857717990875e-06, -8.102506399154663e-06, -7.524155080318451e-06, -6.945803761482239e-06, -6.367452442646027e-06, -5.7891011238098145e-06, -5.210749804973602e-06, -4.63239848613739e-06, -4.054047167301178e-06, -3.475695848464966e-06, -2.8973445296287537e-06, -2.3189932107925415e-06, -1.7406418919563293e-06, -1.1622905731201172e-06, -5.83939254283905e-07, -5.587935447692871e-09, 5.727633833885193e-07, 1.1511147022247314e-06, 1.7294660210609436e-06, 2.3078173398971558e-06, 2.886168658733368e-06, 3.46451997756958e-06, 4.042871296405792e-06, 4.621222615242004e-06, 5.1995739340782166e-06, 5.777925252914429e-06, 6.356276571750641e-06, 6.934627890586853e-06, 7.512979209423065e-06, 8.091330528259277e-06, 8.66968184709549e-06, 9.248033165931702e-06, 9.826384484767914e-06, 1.0404735803604126e-05, 1.0983087122440338e-05, 1.156143844127655e-05, 1.2139789760112762e-05, 1.2718141078948975e-05, 1.3296492397785187e-05, 1.3874843716621399e-05, 1.4453195035457611e-05, 1.5031546354293823e-05, 1.5609897673130035e-05, 1.6188248991966248e-05, 1.676660031080246e-05, 1.7344951629638672e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 5.0, 6.0, 20.0, 15.0, 13.0, 23.0, 34.0, 44.0, 61.0, 98.0, 135.0, 149.0, 125.0, 79.0, 49.0, 30.0, 25.0, 20.0, 19.0, 7.0, 8.0, 9.0, 8.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000950415211264044, -0.0009234037133865058, -0.0008963921573013067, -0.0008693806594237685, -0.0008423691615462303, -0.0008153576054610312, -0.000788346107583493, -0.0007613345514982939, -0.0007343230536207557, -0.0007073115557432175, -0.0006802999996580184, -0.0006532885017804801, -0.000626276945695281, -0.0005992654478177428, -0.0005722539499402046, -0.0005452424520626664, -0.0005182308959774673, -0.0004912193980999291, -0.00046420784201473, -0.00043719634413719177, -0.0004101848171558231, -0.00038317329017445445, -0.00035616179229691625, -0.0003291502653155476, -0.0003021387383341789, -0.00027512721135281026, -0.0002481156843714416, -0.0002211041864939034, -0.00019409265951253474, -0.00016708113253116608, -0.00014006962010171264, -0.00011305810767225921, -8.604663889855146e-05, -5.903511919314042e-05, -3.202359948772937e-05, -5.012079782318324e-06, 2.1999439923092723e-05, 4.9010966904461384e-05, 7.602247933391482e-05, 0.00010303399176336825, 0.0001300455187447369, 0.00015705704572610557, 0.000184068558155559, 0.00021108007058501244, 0.0002380915975663811, 0.00026510312454774976, 0.00029211462242528796, 0.0003191261494066566, 0.0003461376763880253, 0.00037314920336939394, 0.0004001607303507626, 0.0004271722282283008, 0.00045418375520966947, 0.00048119528219103813, 0.0005082067800685763, 0.0005352182779461145, 0.0005622298340313137, 0.0005892413319088519, 0.000616252887994051, 0.0006432643858715892, 0.0006702758837491274, 0.0006972874398343265, 0.0007242989377118647, 0.0007513104937970638, 0.000778321991674602]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 1.0, 3.0, 0.0, 8.0, 4.0, 5.0, 4.0, 7.0, 6.0, 12.0, 9.0, 13.0, 14.0, 22.0, 25.0, 23.0, 39.0, 25.0, 31.0, 29.0, 49.0, 43.0, 37.0, 37.0, 33.0, 39.0, 36.0, 30.0, 42.0, 38.0, 40.0, 27.0, 26.0, 38.0, 24.0, 26.0, 28.0, 19.0, 17.0, 21.0, 17.0, 11.0, 12.0, 9.0, 6.0, 8.0, 7.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00047075634938664734, -0.00045718150795437396, -0.00044360666652210057, -0.0004300318250898272, -0.00041645695455372334, -0.00040288211312144995, -0.00038930727168917656, -0.00037573243025690317, -0.0003621575888246298, -0.0003485827473923564, -0.000335007905960083, -0.0003214330645278096, -0.00030785822309553623, -0.00029428338166326284, -0.000280708511127159, -0.0002671336696948856, -0.0002535588282626122, -0.00023998398683033884, -0.00022640914539806545, -0.00021283428941387683, -0.00019925944798160344, -0.00018568460654933006, -0.00017210975056514144, -0.00015853490913286805, -0.00014496006770059466, -0.00013138522626832128, -0.00011781037756009027, -0.00010423552885185927, -9.066068741958588e-05, -7.70858459873125e-05, -6.35109972790815e-05, -4.993614857085049e-05, -3.6361307138577104e-05, -2.278646206832491e-05, -9.211616998072714e-06, 4.363228072179481e-06, 1.7938073142431676e-05, 3.1512914574705064e-05, 4.5087763282936066e-05, 5.866261199116707e-05, 7.223745342344046e-05, 8.581229485571384e-05, 9.938714356394485e-05, 0.00011296199227217585, 0.00012653683370444924, 0.00014011167513672262, 0.00015368653112091124, 0.00016726137255318463, 0.00018083621398545802, 0.0001944110554177314, 0.0002079858968500048, 0.0002215607528341934, 0.0002351355942664668, 0.0002487104502506554, 0.0002622852916829288, 0.0002758601331152022, 0.0002894349745474756, 0.00030300981597974896, 0.00031658465741202235, 0.00033015949884429574, 0.00034373434027656913, 0.0003573091817088425, 0.00037088405224494636, 0.00038445889367721975, 0.00039803373510949314]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 8.0, 19.0, 23.0, 30.0, 65.0, 105.0, 139.0, 213.0, 383.0, 607.0, 971.0, 1615.0, 2504.0, 4036.0, 6798.0, 11723.0, 20797.0, 37894.0, 73291.0, 148214.0, 282437.0, 225137.0, 108173.0, 54493.0, 29025.0, 16301.0, 9353.0, 5511.0, 3291.0, 2111.0, 1186.0, 733.0, 479.0, 321.0, 184.0, 121.0, 86.0, 68.0, 34.0, 21.0, 17.0, 12.0, 7.0, 6.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.0011816024780273438, -0.0011485815048217773, -0.001115560531616211, -0.0010825395584106445, -0.0010495185852050781, -0.0010164976119995117, -0.0009834766387939453, -0.0009504556655883789, -0.0009174346923828125, -0.0008844137191772461, -0.0008513927459716797, -0.0008183717727661133, -0.0007853507995605469, -0.0007523298263549805, -0.0007193088531494141, -0.0006862878799438477, -0.0006532669067382812, -0.0006202459335327148, -0.0005872249603271484, -0.000554203987121582, -0.0005211830139160156, -0.0004881620407104492, -0.0004551410675048828, -0.0004221200942993164, -0.00038909912109375, -0.0003560781478881836, -0.0003230571746826172, -0.0002900362014770508, -0.0002570152282714844, -0.00022399425506591797, -0.00019097328186035156, -0.00015795230865478516, -0.00012493133544921875, -9.191036224365234e-05, -5.888938903808594e-05, -2.586841583251953e-05, 7.152557373046875e-06, 4.017353057861328e-05, 7.319450378417969e-05, 0.0001062154769897461, 0.0001392364501953125, 0.0001722574234008789, 0.0002052783966064453, 0.00023829936981201172, 0.0002713203430175781, 0.00030434131622314453, 0.00033736228942871094, 0.00037038326263427734, 0.00040340423583984375, 0.00043642520904541016, 0.00046944618225097656, 0.000502467155456543, 0.0005354881286621094, 0.0005685091018676758, 0.0006015300750732422, 0.0006345510482788086, 0.000667572021484375, 0.0007005929946899414, 0.0007336139678955078, 0.0007666349411010742, 0.0007996559143066406, 0.000832676887512207, 0.0008656978607177734, 0.0008987188339233398, 0.0009317398071289062]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 2.0, 4.0, 5.0, 5.0, 3.0, 11.0, 9.0, 14.0, 17.0, 14.0, 35.0, 34.0, 25.0, 25.0, 42.0, 40.0, 47.0, 40.0, 45.0, 49.0, 38.0, 41.0, 35.0, 33.0, 42.0, 38.0, 26.0, 42.0, 44.0, 27.0, 26.0, 25.0, 16.0, 24.0, 16.0, 16.0, 7.0, 11.0, 6.0, 6.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0003437995910644531, -0.0003345273435115814, -0.0003252550959587097, -0.000315982848405838, -0.0003067106008529663, -0.0002974383533000946, -0.0002881661057472229, -0.0002788938581943512, -0.0002696216106414795, -0.0002603493630886078, -0.0002510771155357361, -0.00024180486798286438, -0.00023253262042999268, -0.00022326037287712097, -0.00021398812532424927, -0.00020471587777137756, -0.00019544363021850586, -0.00018617138266563416, -0.00017689913511276245, -0.00016762688755989075, -0.00015835464000701904, -0.00014908239245414734, -0.00013981014490127563, -0.00013053789734840393, -0.00012126564979553223, -0.00011199340224266052, -0.00010272115468978882, -9.344890713691711e-05, -8.417665958404541e-05, -7.49044120311737e-05, -6.5632164478302e-05, -5.63599169254303e-05, -4.7087669372558594e-05, -3.781542181968689e-05, -2.8543174266815186e-05, -1.927092671394348e-05, -9.998679161071777e-06, -7.264316082000732e-07, 8.545815944671631e-06, 1.7818063497543335e-05, 2.709031105041504e-05, 3.636255860328674e-05, 4.563480615615845e-05, 5.490705370903015e-05, 6.417930126190186e-05, 7.345154881477356e-05, 8.272379636764526e-05, 9.199604392051697e-05, 0.00010126829147338867, 0.00011054053902626038, 0.00011981278657913208, 0.00012908503413200378, 0.0001383572816848755, 0.0001476295292377472, 0.0001569017767906189, 0.0001661740243434906, 0.0001754462718963623, 0.000184718519449234, 0.0001939907670021057, 0.00020326301455497742, 0.00021253526210784912, 0.00022180750966072083, 0.00023107975721359253, 0.00024035200476646423, 0.00024962425231933594]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 13.0, 11.0, 24.0, 18.0, 21.0, 28.0, 26.0, 51.0, 53.0, 96.0, 102.0, 138.0, 262.0, 454.0, 832.0, 1685.0, 3294.0, 7559.0, 18095.0, 48877.0, 164767.0, 474296.0, 225000.0, 62790.0, 22591.0, 9138.0, 4030.0, 1953.0, 899.0, 454.0, 299.0, 194.0, 122.0, 68.0, 63.0, 58.0, 39.0, 26.0, 21.0, 22.0, 13.0, 10.0, 12.0, 11.0, 7.0, 8.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 3.0], "bins": [-0.0016031265258789062, -0.0015524178743362427, -0.001501709222793579, -0.0014510005712509155, -0.001400291919708252, -0.0013495832681655884, -0.0012988746166229248, -0.0012481659650802612, -0.0011974573135375977, -0.001146748661994934, -0.0010960400104522705, -0.001045331358909607, -0.0009946227073669434, -0.0009439140558242798, -0.0008932054042816162, -0.0008424967527389526, -0.0007917881011962891, -0.0007410794496536255, -0.0006903707981109619, -0.0006396621465682983, -0.0005889534950256348, -0.0005382448434829712, -0.0004875361919403076, -0.00043682754039764404, -0.00038611888885498047, -0.0003354102373123169, -0.0002847015857696533, -0.00023399293422698975, -0.00018328428268432617, -0.0001325756311416626, -8.186697959899902e-05, -3.115832805633545e-05, 1.9550323486328125e-05, 7.02589750289917e-05, 0.00012096762657165527, 0.00017167627811431885, 0.00022238492965698242, 0.000273093581199646, 0.00032380223274230957, 0.00037451088428497314, 0.0004252195358276367, 0.0004759281873703003, 0.0005266368389129639, 0.0005773454904556274, 0.000628054141998291, 0.0006787627935409546, 0.0007294714450836182, 0.0007801800966262817, 0.0008308887481689453, 0.0008815973997116089, 0.0009323060512542725, 0.000983014702796936, 0.0010337233543395996, 0.0010844320058822632, 0.0011351406574249268, 0.0011858493089675903, 0.001236557960510254, 0.0012872666120529175, 0.001337975263595581, 0.0013886839151382446, 0.0014393925666809082, 0.0014901012182235718, 0.0015408098697662354, 0.001591518521308899, 0.0016422271728515625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 6.0, 6.0, 4.0, 7.0, 10.0, 14.0, 13.0, 9.0, 18.0, 18.0, 18.0, 35.0, 30.0, 36.0, 37.0, 24.0, 37.0, 36.0, 39.0, 42.0, 45.0, 57.0, 38.0, 42.0, 39.0, 52.0, 25.0, 36.0, 33.0, 21.0, 22.0, 19.0, 18.0, 22.0, 19.0, 9.0, 6.0, 8.0, 9.0, 11.0, 7.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002751350402832031, -0.00026667118072509766, -0.0002582073211669922, -0.0002497434616088867, -0.00024127960205078125, -0.00023281574249267578, -0.0002243518829345703, -0.00021588802337646484, -0.00020742416381835938, -0.0001989603042602539, -0.00019049644470214844, -0.00018203258514404297, -0.0001735687255859375, -0.00016510486602783203, -0.00015664100646972656, -0.0001481771469116211, -0.00013971328735351562, -0.00013124942779541016, -0.0001227855682373047, -0.00011432170867919922, -0.00010585784912109375, -9.739398956298828e-05, -8.893013000488281e-05, -8.046627044677734e-05, -7.200241088867188e-05, -6.35385513305664e-05, -5.507469177246094e-05, -4.661083221435547e-05, -3.814697265625e-05, -2.968311309814453e-05, -2.1219253540039062e-05, -1.2755393981933594e-05, -4.291534423828125e-06, 4.172325134277344e-06, 1.2636184692382812e-05, 2.110004425048828e-05, 2.956390380859375e-05, 3.802776336669922e-05, 4.649162292480469e-05, 5.4955482482910156e-05, 6.341934204101562e-05, 7.18832015991211e-05, 8.034706115722656e-05, 8.881092071533203e-05, 9.72747802734375e-05, 0.00010573863983154297, 0.00011420249938964844, 0.0001226663589477539, 0.00013113021850585938, 0.00013959407806396484, 0.0001480579376220703, 0.00015652179718017578, 0.00016498565673828125, 0.00017344951629638672, 0.0001819133758544922, 0.00019037723541259766, 0.00019884109497070312, 0.0002073049545288086, 0.00021576881408691406, 0.00022423267364501953, 0.000232696533203125, 0.00024116039276123047, 0.00024962425231933594, 0.0002580881118774414, 0.0002665519714355469]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 7.0, 5.0, 17.0, 22.0, 24.0, 30.0, 42.0, 62.0, 123.0, 211.0, 373.0, 665.0, 1432.0, 3290.0, 9967.0, 43708.0, 498326.0, 434483.0, 40133.0, 9522.0, 3302.0, 1352.0, 607.0, 328.0, 207.0, 104.0, 77.0, 41.0, 31.0, 20.0, 17.0, 7.0, 10.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.635883331298828e-05, -3.5103410482406616e-05, -3.384798765182495e-05, -3.2592564821243286e-05, -3.133714199066162e-05, -3.0081719160079956e-05, -2.882629632949829e-05, -2.7570873498916626e-05, -2.631545066833496e-05, -2.5060027837753296e-05, -2.380460500717163e-05, -2.2549182176589966e-05, -2.12937593460083e-05, -2.0038336515426636e-05, -1.878291368484497e-05, -1.7527490854263306e-05, -1.627206802368164e-05, -1.5016645193099976e-05, -1.376122236251831e-05, -1.2505799531936646e-05, -1.125037670135498e-05, -9.994953870773315e-06, -8.73953104019165e-06, -7.484108209609985e-06, -6.22868537902832e-06, -4.973262548446655e-06, -3.7178397178649902e-06, -2.462416887283325e-06, -1.2069940567016602e-06, 4.842877388000488e-08, 1.30385160446167e-06, 2.559274435043335e-06, 3.814697265625e-06, 5.070120096206665e-06, 6.32554292678833e-06, 7.580965757369995e-06, 8.83638858795166e-06, 1.0091811418533325e-05, 1.134723424911499e-05, 1.2602657079696655e-05, 1.385807991027832e-05, 1.5113502740859985e-05, 1.636892557144165e-05, 1.7624348402023315e-05, 1.887977123260498e-05, 2.0135194063186646e-05, 2.139061689376831e-05, 2.2646039724349976e-05, 2.390146255493164e-05, 2.5156885385513306e-05, 2.641230821609497e-05, 2.7667731046676636e-05, 2.89231538772583e-05, 3.0178576707839966e-05, 3.143399953842163e-05, 3.2689422369003296e-05, 3.394484519958496e-05, 3.5200268030166626e-05, 3.645569086074829e-05, 3.7711113691329956e-05, 3.896653652191162e-05, 4.0221959352493286e-05, 4.147738218307495e-05, 4.2732805013656616e-05, 4.398822784423828e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 6.0, 5.0, 13.0, 5.0, 19.0, 15.0, 11.0, 54.0, 23.0, 94.0, 146.0, 74.0, 185.0, 127.0, 42.0, 69.0, 38.0, 12.0, 16.0, 12.0, 7.0, 8.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4570693969726562e-06, -3.3583492040634155e-06, -3.259629011154175e-06, -3.160908818244934e-06, -3.0621886253356934e-06, -2.9634684324264526e-06, -2.864748239517212e-06, -2.766028046607971e-06, -2.6673078536987305e-06, -2.5685876607894897e-06, -2.469867467880249e-06, -2.3711472749710083e-06, -2.2724270820617676e-06, -2.173706889152527e-06, -2.074986696243286e-06, -1.9762665033340454e-06, -1.8775463104248047e-06, -1.778826117515564e-06, -1.6801059246063232e-06, -1.5813857316970825e-06, -1.4826655387878418e-06, -1.383945345878601e-06, -1.2852251529693604e-06, -1.1865049600601196e-06, -1.087784767150879e-06, -9.890645742416382e-07, -8.903443813323975e-07, -7.916241884231567e-07, -6.92903995513916e-07, -5.941838026046753e-07, -4.954636096954346e-07, -3.9674341678619385e-07, -2.980232238769531e-07, -1.993030309677124e-07, -1.0058283805847168e-07, -1.862645149230957e-09, 9.685754776000977e-08, 1.955777406692505e-07, 2.942979335784912e-07, 3.9301812648773193e-07, 4.917383193969727e-07, 5.904585123062134e-07, 6.891787052154541e-07, 7.878988981246948e-07, 8.866190910339355e-07, 9.853392839431763e-07, 1.084059476852417e-06, 1.1827796697616577e-06, 1.2814998626708984e-06, 1.3802200555801392e-06, 1.4789402484893799e-06, 1.5776604413986206e-06, 1.6763806343078613e-06, 1.775100827217102e-06, 1.8738210201263428e-06, 1.9725412130355835e-06, 2.0712614059448242e-06, 2.169981598854065e-06, 2.2687017917633057e-06, 2.3674219846725464e-06, 2.466142177581787e-06, 2.564862370491028e-06, 2.6635825634002686e-06, 2.7623027563095093e-06, 2.86102294921875e-06]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 5.0, 6.0, 6.0, 8.0, 15.0, 16.0, 29.0, 41.0, 41.0, 58.0, 116.0, 181.0, 305.0, 597.0, 1128.0, 2585.0, 6243.0, 17676.0, 74318.0, 459798.0, 392782.0, 63563.0, 17615.0, 6361.0, 2556.0, 1144.0, 587.0, 285.0, 179.0, 112.0, 56.0, 29.0, 23.0, 31.0, 19.0, 9.0, 3.0, 10.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.4378299713134766e-05, -2.3661181330680847e-05, -2.294406294822693e-05, -2.222694456577301e-05, -2.1509826183319092e-05, -2.0792707800865173e-05, -2.0075589418411255e-05, -1.9358471035957336e-05, -1.8641352653503418e-05, -1.79242342710495e-05, -1.720711588859558e-05, -1.6489997506141663e-05, -1.5772879123687744e-05, -1.5055760741233826e-05, -1.4338642358779907e-05, -1.3621523976325989e-05, -1.290440559387207e-05, -1.2187287211418152e-05, -1.1470168828964233e-05, -1.0753050446510315e-05, -1.0035932064056396e-05, -9.318813681602478e-06, -8.60169529914856e-06, -7.884576916694641e-06, -7.167458534240723e-06, -6.450340151786804e-06, -5.733221769332886e-06, -5.016103386878967e-06, -4.298985004425049e-06, -3.5818666219711304e-06, -2.864748239517212e-06, -2.1476298570632935e-06, -1.430511474609375e-06, -7.133930921554565e-07, 3.725290298461914e-09, 7.208436727523804e-07, 1.4379620552062988e-06, 2.1550804376602173e-06, 2.8721988201141357e-06, 3.589317202568054e-06, 4.306435585021973e-06, 5.023553967475891e-06, 5.7406723499298096e-06, 6.457790732383728e-06, 7.1749091148376465e-06, 7.892027497291565e-06, 8.609145879745483e-06, 9.326264262199402e-06, 1.004338264465332e-05, 1.0760501027107239e-05, 1.1477619409561157e-05, 1.2194737792015076e-05, 1.2911856174468994e-05, 1.3628974556922913e-05, 1.4346092939376831e-05, 1.506321132183075e-05, 1.5780329704284668e-05, 1.6497448086738586e-05, 1.7214566469192505e-05, 1.7931684851646423e-05, 1.8648803234100342e-05, 1.936592161655426e-05, 2.008303999900818e-05, 2.0800158381462097e-05, 2.1517276763916016e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 4.0, 7.0, 14.0, 18.0, 16.0, 23.0, 26.0, 36.0, 49.0, 29.0, 58.0, 61.0, 76.0, 59.0, 35.0, 71.0, 56.0, 71.0, 38.0, 37.0, 27.0, 38.0, 27.0, 12.0, 23.0, 12.0, 10.0, 12.0, 11.0, 9.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-06, -3.460794687271118e-06, -3.345310688018799e-06, -3.2298266887664795e-06, -3.11434268951416e-06, -2.998858690261841e-06, -2.8833746910095215e-06, -2.767890691757202e-06, -2.652406692504883e-06, -2.5369226932525635e-06, -2.421438694000244e-06, -2.305954694747925e-06, -2.1904706954956055e-06, -2.074986696243286e-06, -1.959502696990967e-06, -1.8440186977386475e-06, -1.7285346984863281e-06, -1.6130506992340088e-06, -1.4975666999816895e-06, -1.3820827007293701e-06, -1.2665987014770508e-06, -1.1511147022247314e-06, -1.0356307029724121e-06, -9.201467037200928e-07, -8.046627044677734e-07, -6.891787052154541e-07, -5.736947059631348e-07, -4.5821070671081543e-07, -3.427267074584961e-07, -2.2724270820617676e-07, -1.1175870895385742e-07, 3.725290298461914e-09, 1.1920928955078125e-07, 2.3469328880310059e-07, 3.501772880554199e-07, 4.6566128730773926e-07, 5.811452865600586e-07, 6.966292858123779e-07, 8.121132850646973e-07, 9.275972843170166e-07, 1.043081283569336e-06, 1.1585652828216553e-06, 1.2740492820739746e-06, 1.389533281326294e-06, 1.5050172805786133e-06, 1.6205012798309326e-06, 1.735985279083252e-06, 1.8514692783355713e-06, 1.9669532775878906e-06, 2.08243727684021e-06, 2.1979212760925293e-06, 2.3134052753448486e-06, 2.428889274597168e-06, 2.5443732738494873e-06, 2.6598572731018066e-06, 2.775341272354126e-06, 2.8908252716064453e-06, 3.0063092708587646e-06, 3.121793270111084e-06, 3.2372772693634033e-06, 3.3527612686157227e-06, 3.468245267868042e-06, 3.5837292671203613e-06, 3.6992132663726807e-06, 3.814697265625e-06]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 10.0, 9.0, 15.0, 25.0, 40.0, 73.0, 104.0, 191.0, 174.0, 157.0, 70.0, 43.0, 25.0, 24.0, 14.0, 4.0, 6.0, 8.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006963840569369495, -0.0006664912216365337, -0.000636598386336118, -0.0006067055510357022, -0.0005768126575276256, -0.0005469198804348707, -0.000517026986926794, -0.0004871341516263783, -0.00045724131632596254, -0.0004273484810255468, -0.00039745564572513103, -0.0003675627813208848, -0.00033766994602046907, -0.0003077771107200533, -0.0002778842463158071, -0.00024799141101539135, -0.0002180985757149756, -0.00018820574041455984, -0.00015831289056222886, -0.00012842004070989788, -9.852720540948212e-05, -6.863437010906637e-05, -3.8741520256735384e-05, -8.848670404404402e-06, 2.1044164896011353e-05, 5.093700747238472e-05, 8.082985004875809e-05, 0.00011072269262513146, 0.00014061553520150483, 0.00017050837050192058, 0.00020040122035425156, 0.00023029407020658255, 0.0002601868472993374, 0.00029007968259975314, 0.0003199725179001689, 0.0003498653823044151, 0.00037975821760483086, 0.0004096510529052466, 0.0004395439173094928, 0.0004694367526099086, 0.0004993295879103243, 0.0005292224232107401, 0.0005591152585111558, 0.0005890080938115716, 0.0006189009873196483, 0.0006487937644124031, 0.0006786866579204798, 0.0007085794932208955, 0.0007384723285213113, 0.000768365163821727, 0.0007982579991221428, 0.0008281508344225585, 0.0008580436697229743, 0.000887936563231051, 0.0009178293985314667, 0.0009477222338318825, 0.0009776151273399591, 0.0010075080208480358, 0.0010374007979407907, 0.0010672936914488673, 0.0010971864685416222, 0.0011270793620496988, 0.0011569721391424537, 0.0011868650326505303, 0.0012167578097432852]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 4.0, 4.0, 8.0, 12.0, 16.0, 15.0, 17.0, 19.0, 25.0, 30.0, 29.0, 32.0, 36.0, 46.0, 32.0, 37.0, 47.0, 39.0, 44.0, 32.0, 46.0, 43.0, 48.0, 32.0, 35.0, 28.0, 31.0, 34.0, 22.0, 30.0, 25.0, 14.0, 19.0, 15.0, 11.0, 9.0, 6.0, 10.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0004140892706345767, -0.00040227468707598746, -0.0003904600744135678, -0.00037864549085497856, -0.0003668308781925589, -0.00035501629463396966, -0.00034320168197155, -0.00033138709841296077, -0.00031957251485437155, -0.00030775793129578233, -0.00029594331863336265, -0.00028412873507477343, -0.00027231412241235375, -0.00026049953885376453, -0.0002486849552951753, -0.00023687034263275564, -0.00022505572997033596, -0.0002132411318598315, -0.00020142653374932706, -0.00018961195019073784, -0.00017779733752831817, -0.00016598275396972895, -0.0001541681558592245, -0.00014235355774872005, -0.0001305389596382156, -0.00011872436152771115, -0.0001069097634172067, -9.509517258265987e-05, -8.328057447215542e-05, -7.146597636165097e-05, -5.965138552710414e-05, -4.783678741659969e-05, -3.602218930609524e-05, -2.4207593014580198e-05, -1.2392996723065153e-05, -5.784022505395114e-07, 1.1236195859964937e-05, 2.3050793970469385e-05, 3.486538480501622e-05, 4.667998291552067e-05, 5.8494581026025116e-05, 7.030917913652956e-05, 8.212377724703401e-05, 9.393836808158085e-05, 0.0001057529661920853, 0.00011756756430258974, 0.00012938215513713658, 0.00014119675324764103, 0.00015301135135814548, 0.00016482594946864992, 0.00017664054757915437, 0.0001884551311377436, 0.00020026974380016327, 0.0002120843273587525, 0.00022389892546925694, 0.00023571352357976139, 0.00024752813624218106, 0.0002593427198007703, 0.00027115733246318996, 0.0002829719160217792, 0.00029478652868419886, 0.0003066011122427881, 0.0003184156958013773, 0.000330230308463797, 0.0003420448920223862]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 11.0, 13.0, 14.0, 23.0, 18.0, 32.0, 48.0, 67.0, 102.0, 128.0, 156.0, 224.0, 376.0, 595.0, 1005.0, 1833.0, 3962.0, 12016.0, 3793389.0, 365540.0, 7593.0, 3039.0, 1603.0, 878.0, 476.0, 326.0, 211.0, 169.0, 120.0, 85.0, 68.0, 37.0, 31.0, 29.0, 16.0, 13.0, 8.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0015764236450195312, -0.0015298426151275635, -0.0014832615852355957, -0.001436680555343628, -0.0013900995254516602, -0.0013435184955596924, -0.0012969374656677246, -0.0012503564357757568, -0.001203775405883789, -0.0011571943759918213, -0.0011106133460998535, -0.0010640323162078857, -0.001017451286315918, -0.0009708702564239502, -0.0009242892265319824, -0.0008777081966400146, -0.0008311271667480469, -0.0007845461368560791, -0.0007379651069641113, -0.0006913840770721436, -0.0006448030471801758, -0.000598222017288208, -0.0005516409873962402, -0.0005050599575042725, -0.0004584789276123047, -0.0004118978977203369, -0.00036531686782836914, -0.00031873583793640137, -0.0002721548080444336, -0.00022557377815246582, -0.00017899274826049805, -0.00013241171836853027, -8.58306884765625e-05, -3.9249658584594727e-05, 7.331371307373047e-06, 5.391240119934082e-05, 0.0001004934310913086, 0.00014707446098327637, 0.00019365549087524414, 0.00024023652076721191, 0.0002868175506591797, 0.00033339858055114746, 0.00037997961044311523, 0.000426560640335083, 0.0004731416702270508, 0.0005197227001190186, 0.0005663037300109863, 0.0006128847599029541, 0.0006594657897949219, 0.0007060468196868896, 0.0007526278495788574, 0.0007992088794708252, 0.000845789909362793, 0.0008923709392547607, 0.0009389519691467285, 0.0009855329990386963, 0.001032114028930664, 0.0010786950588226318, 0.0011252760887145996, 0.0011718571186065674, 0.0012184381484985352, 0.001265019178390503, 0.0013116002082824707, 0.0013581812381744385, 0.0014047622680664062]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 3.0, 7.0, 7.0, 10.0, 13.0, 5.0, 20.0, 22.0, 23.0, 31.0, 34.0, 35.0, 37.0, 43.0, 36.0, 55.0, 41.0, 61.0, 42.0, 44.0, 42.0, 35.0, 48.0, 40.0, 28.0, 36.0, 31.0, 34.0, 20.0, 25.0, 19.0, 14.0, 11.0, 13.0, 8.0, 10.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003581047058105469, -0.00034708529710769653, -0.0003360658884048462, -0.00032504647970199585, -0.0003140270709991455, -0.00030300766229629517, -0.0002919882535934448, -0.0002809688448905945, -0.00026994943618774414, -0.0002589300274848938, -0.00024791061878204346, -0.00023689121007919312, -0.00022587180137634277, -0.00021485239267349243, -0.0002038329839706421, -0.00019281357526779175, -0.0001817941665649414, -0.00017077475786209106, -0.00015975534915924072, -0.00014873594045639038, -0.00013771653175354004, -0.0001266971230506897, -0.00011567771434783936, -0.00010465830564498901, -9.363889694213867e-05, -8.261948823928833e-05, -7.160007953643799e-05, -6.0580670833587646e-05, -4.9561262130737305e-05, -3.854185342788696e-05, -2.752244472503662e-05, -1.650303602218628e-05, -5.4836273193359375e-06, 5.535781383514404e-06, 1.6555190086364746e-05, 2.7574598789215088e-05, 3.859400749206543e-05, 4.961341619491577e-05, 6.063282489776611e-05, 7.165223360061646e-05, 8.26716423034668e-05, 9.369105100631714e-05, 0.00010471045970916748, 0.00011572986841201782, 0.00012674927711486816, 0.0001377686858177185, 0.00014878809452056885, 0.0001598075032234192, 0.00017082691192626953, 0.00018184632062911987, 0.00019286572933197021, 0.00020388513803482056, 0.0002149045467376709, 0.00022592395544052124, 0.00023694336414337158, 0.0002479627728462219, 0.00025898218154907227, 0.0002700015902519226, 0.00028102099895477295, 0.0002920404076576233, 0.00030305981636047363, 0.000314079225063324, 0.0003250986337661743, 0.00033611804246902466, 0.000347137451171875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 10.0, 7.0, 17.0, 26.0, 44.0, 75.0, 112.0, 236.0, 667.0, 2237.0, 10806.0, 789391.0, 3374404.0, 12576.0, 2561.0, 644.0, 219.0, 100.0, 50.0, 38.0, 22.0, 13.0, 9.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020160675048828125, -0.0019321739673614502, -0.0018482804298400879, -0.0017643868923187256, -0.0016804933547973633, -0.001596599817276001, -0.0015127062797546387, -0.0014288127422332764, -0.001344919204711914, -0.0012610256671905518, -0.0011771321296691895, -0.0010932385921478271, -0.0010093450546264648, -0.0009254515171051025, -0.0008415579795837402, -0.0007576644420623779, -0.0006737709045410156, -0.0005898773670196533, -0.000505983829498291, -0.0004220902919769287, -0.0003381967544555664, -0.0002543032169342041, -0.0001704096794128418, -8.651614189147949e-05, -2.6226043701171875e-06, 8.127093315124512e-05, 0.00016516447067260742, 0.0002490580081939697, 0.00033295154571533203, 0.00041684508323669434, 0.0005007386207580566, 0.0005846321582794189, 0.0006685256958007812, 0.0007524192333221436, 0.0008363127708435059, 0.0009202063083648682, 0.0010040998458862305, 0.0010879933834075928, 0.001171886920928955, 0.0012557804584503174, 0.0013396739959716797, 0.001423567533493042, 0.0015074610710144043, 0.0015913546085357666, 0.001675248146057129, 0.0017591416835784912, 0.0018430352210998535, 0.0019269287586212158, 0.002010822296142578, 0.0020947158336639404, 0.0021786093711853027, 0.002262502908706665, 0.0023463964462280273, 0.0024302899837493896, 0.002514183521270752, 0.0025980770587921143, 0.0026819705963134766, 0.002765864133834839, 0.002849757671356201, 0.0029336512088775635, 0.0030175447463989258, 0.003101438283920288, 0.0031853318214416504, 0.0032692253589630127, 0.003353118896484375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 11.0, 14.0, 26.0, 57.0, 172.0, 500.0, 2414.0, 533.0, 169.0, 62.0, 23.0, 12.0, 13.0, 10.0, 8.0, 5.0, 7.0, 8.0, 7.0, 4.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0003228187561035156, -0.00031505152583122253, -0.00030728429555892944, -0.00029951706528663635, -0.00029174983501434326, -0.00028398260474205017, -0.0002762153744697571, -0.000268448144197464, -0.0002606809139251709, -0.0002529136836528778, -0.0002451464533805847, -0.00023737922310829163, -0.00022961199283599854, -0.00022184476256370544, -0.00021407753229141235, -0.00020631030201911926, -0.00019854307174682617, -0.00019077584147453308, -0.00018300861120224, -0.0001752413809299469, -0.0001674741506576538, -0.00015970692038536072, -0.00015193969011306763, -0.00014417245984077454, -0.00013640522956848145, -0.00012863799929618835, -0.00012087076902389526, -0.00011310353875160217, -0.00010533630847930908, -9.756907820701599e-05, -8.98018479347229e-05, -8.203461766242981e-05, -7.426738739013672e-05, -6.650015711784363e-05, -5.873292684555054e-05, -5.0965696573257446e-05, -4.3198466300964355e-05, -3.5431236028671265e-05, -2.7664005756378174e-05, -1.9896775484085083e-05, -1.2129545211791992e-05, -4.362314939498901e-06, 3.4049153327941895e-06, 1.117214560508728e-05, 1.893937587738037e-05, 2.6706606149673462e-05, 3.447383642196655e-05, 4.2241066694259644e-05, 5.0008296966552734e-05, 5.7775527238845825e-05, 6.554275751113892e-05, 7.330998778343201e-05, 8.10772180557251e-05, 8.884444832801819e-05, 9.661167860031128e-05, 0.00010437890887260437, 0.00011214613914489746, 0.00011991336941719055, 0.00012768059968948364, 0.00013544782996177673, 0.00014321506023406982, 0.00015098229050636292, 0.000158749520778656, 0.0001665167510509491, 0.0001742839813232422]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 13.0, 14.0, 21.0, 27.0, 48.0, 60.0, 99.0, 132.0, 165.0, 143.0, 77.0, 59.0, 41.0, 24.0, 21.0, 12.0, 11.0, 12.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005120275309309363, -0.0004919788334518671, -0.0004719301941804588, -0.00045188152580522, -0.00043183285742998123, -0.00041178418905474246, -0.0003917355206795037, -0.00037168682320043445, -0.0003516381839290261, -0.00033158951555378735, -0.0003115408471785486, -0.0002914921788033098, -0.000271443510428071, -0.00025139484205283225, -0.00023134615912567824, -0.00021129749075043947, -0.00019124880782328546, -0.00017120013944804668, -0.0001511514710728079, -0.00013110280269756913, -0.00011105412704637274, -9.100545867113397e-05, -7.095678301993757e-05, -5.09081146446988e-05, -3.085944626946002e-05, -1.0810776075231843e-05, 9.237894118996337e-06, 2.928656613221392e-05, 4.9335234507452697e-05, 6.938390288269147e-05, 8.943257853388786e-05, 0.00010948124690912664, 0.00012952991528436542, 0.0001495785836596042, 0.00016962725203484297, 0.00018967592041008174, 0.00020972458878532052, 0.0002297732571605593, 0.00024982192553579807, 0.0002698706230148673, 0.0002899192622862756, 0.0003099679306615144, 0.0003300165990367532, 0.00035006526741199195, 0.00037011393578723073, 0.0003901626041624695, 0.0004102112725377083, 0.0004302599700167775, 0.0004503086383920163, 0.00047035730676725507, 0.0004904060042463243, 0.0005104546435177326, 0.0005305033409968019, 0.0005505519802682102, 0.0005706006777472794, 0.0005906493170186877, 0.000610698014497757, 0.0006307467119768262, 0.0006507953512482345, 0.0006708440487273037, 0.0006908926879987121, 0.0007109413854777813, 0.0007309900247491896, 0.0007510387222282588, 0.0007710873614996672]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 8.0, 9.0, 18.0, 8.0, 25.0, 14.0, 17.0, 20.0, 36.0, 22.0, 35.0, 31.0, 38.0, 38.0, 41.0, 36.0, 42.0, 41.0, 54.0, 47.0, 34.0, 34.0, 32.0, 37.0, 39.0, 29.0, 32.0, 30.0, 18.0, 33.0, 12.0, 22.0, 13.0, 3.0, 6.0, 10.0, 6.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002929807815235108, -0.0002834897313732654, -0.0002739987103268504, -0.000264507660176605, -0.00025501663913019, -0.0002455255889799446, -0.00023603456793352962, -0.0002265435177832842, -0.00021705249673686922, -0.00020756146113853902, -0.00019807042554020882, -0.00018857938994187862, -0.00017908835434354842, -0.00016959731874521822, -0.00016010628314688802, -0.0001506152329966426, -0.0001411241973983124, -0.0001316331617999822, -0.000122142126201652, -0.00011265109060332179, -0.00010316005500499159, -9.366901940666139e-05, -8.417797653237358e-05, -7.468694093404338e-05, -6.519590533571318e-05, -5.570486973738298e-05, -4.621383413905278e-05, -3.672279490274377e-05, -2.7231759304413572e-05, -1.7740723706083372e-05, -8.249684469774365e-06, 1.2413511285558343e-06, 1.0732386726886034e-05, 2.0223422325216234e-05, 2.9714459742535837e-05, 3.920549715985544e-05, 4.869653275818564e-05, 5.818756835651584e-05, 6.767860759282485e-05, 7.716964319115505e-05, 8.666067878948525e-05, 9.615171438781545e-05, 0.00010564274998614565, 0.00011513379286043346, 0.00012462482845876366, 0.00013411586405709386, 0.00014360689965542406, 0.00015309793525375426, 0.00016258897085208446, 0.00017208000645041466, 0.00018157104204874486, 0.00019106207764707506, 0.00020055311324540526, 0.00021004414884373546, 0.00021953519899398088, 0.00022902622004039586, 0.00023851727019064128, 0.0002480083203408867, 0.0002574993413873017, 0.0002669903915375471, 0.0002764814125839621, 0.0002859724627342075, 0.0002954634837806225, 0.0003049545339308679, 0.0003144455549772829]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 7.0, 13.0, 27.0, 41.0, 46.0, 77.0, 107.0, 165.0, 248.0, 408.0, 663.0, 1046.0, 1853.0, 3111.0, 5337.0, 9072.0, 15629.0, 27342.0, 46782.0, 81542.0, 138795.0, 223788.0, 203173.0, 120966.0, 71157.0, 40779.0, 23510.0, 13435.0, 7838.0, 4760.0, 2728.0, 1619.0, 961.0, 534.0, 354.0, 219.0, 146.0, 90.0, 64.0, 39.0, 26.0, 17.0, 9.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00021922588348388672, -0.0002123471349477768, -0.00020546838641166687, -0.00019858963787555695, -0.00019171088933944702, -0.0001848321408033371, -0.00017795339226722717, -0.00017107464373111725, -0.00016419589519500732, -0.0001573171466588974, -0.00015043839812278748, -0.00014355964958667755, -0.00013668090105056763, -0.0001298021525144577, -0.00012292340397834778, -0.00011604465544223785, -0.00010916590690612793, -0.000102287158370018, -9.540840983390808e-05, -8.852966129779816e-05, -8.165091276168823e-05, -7.477216422557831e-05, -6.789341568946838e-05, -6.101466715335846e-05, -5.4135918617248535e-05, -4.725717008113861e-05, -4.0378421545028687e-05, -3.349967300891876e-05, -2.6620924472808838e-05, -1.9742175936698914e-05, -1.286342740058899e-05, -5.984678864479065e-06, 8.940696716308594e-07, 7.772818207740784e-06, 1.4651566743850708e-05, 2.1530315279960632e-05, 2.8409063816070557e-05, 3.528781235218048e-05, 4.2166560888290405e-05, 4.904530942440033e-05, 5.5924057960510254e-05, 6.280280649662018e-05, 6.96815550327301e-05, 7.656030356884003e-05, 8.343905210494995e-05, 9.031780064105988e-05, 9.71965491771698e-05, 0.00010407529771327972, 0.00011095404624938965, 0.00011783279478549957, 0.0001247115433216095, 0.00013159029185771942, 0.00013846904039382935, 0.00014534778892993927, 0.0001522265374660492, 0.00015910528600215912, 0.00016598403453826904, 0.00017286278307437897, 0.0001797415316104889, 0.00018662028014659882, 0.00019349902868270874, 0.00020037777721881866, 0.0002072565257549286, 0.0002141352742910385, 0.00022101402282714844]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 11.0, 6.0, 12.0, 11.0, 15.0, 17.0, 20.0, 19.0, 20.0, 27.0, 21.0, 35.0, 45.0, 37.0, 38.0, 47.0, 42.0, 43.0, 44.0, 46.0, 48.0, 33.0, 43.0, 29.0, 43.0, 28.0, 25.0, 26.0, 25.0, 18.0, 20.0, 16.0, 18.0, 15.0, 9.0, 8.0, 9.0, 4.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003268718719482422, -0.0003171674907207489, -0.0003074631094932556, -0.00029775872826576233, -0.00028805434703826904, -0.00027834996581077576, -0.00026864558458328247, -0.0002589412033557892, -0.0002492368221282959, -0.0002395324409008026, -0.00022982805967330933, -0.00022012367844581604, -0.00021041929721832275, -0.00020071491599082947, -0.00019101053476333618, -0.0001813061535358429, -0.0001716017723083496, -0.00016189739108085632, -0.00015219300985336304, -0.00014248862862586975, -0.00013278424739837646, -0.00012307986617088318, -0.00011337548494338989, -0.0001036711037158966, -9.396672248840332e-05, -8.426234126091003e-05, -7.455796003341675e-05, -6.485357880592346e-05, -5.5149197578430176e-05, -4.544481635093689e-05, -3.5740435123443604e-05, -2.6036053895950317e-05, -1.633167266845703e-05, -6.627291440963745e-06, 3.077089786529541e-06, 1.2781471014022827e-05, 2.2485852241516113e-05, 3.21902334690094e-05, 4.1894614696502686e-05, 5.159899592399597e-05, 6.130337715148926e-05, 7.100775837898254e-05, 8.071213960647583e-05, 9.041652083396912e-05, 0.0001001209020614624, 0.00010982528328895569, 0.00011952966451644897, 0.00012923404574394226, 0.00013893842697143555, 0.00014864280819892883, 0.00015834718942642212, 0.0001680515706539154, 0.0001777559518814087, 0.00018746033310890198, 0.00019716471433639526, 0.00020686909556388855, 0.00021657347679138184, 0.00022627785801887512, 0.0002359822392463684, 0.0002456866204738617, 0.000255391001701355, 0.00026509538292884827, 0.00027479976415634155, 0.00028450414538383484, 0.0002942085266113281]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 14.0, 20.0, 24.0, 32.0, 38.0, 78.0, 125.0, 158.0, 242.0, 351.0, 689.0, 1015.0, 1711.0, 2854.0, 5102.0, 9311.0, 18325.0, 38956.0, 94421.0, 318730.0, 366462.0, 104849.0, 42291.0, 19627.0, 9937.0, 5399.0, 3044.0, 1828.0, 1043.0, 732.0, 421.0, 214.0, 147.0, 136.0, 79.0, 54.0, 26.0, 21.0, 12.0, 10.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003046989440917969, -0.00029455870389938354, -0.0002844184637069702, -0.0002742782235145569, -0.00026413798332214355, -0.0002539977431297302, -0.0002438575029373169, -0.00023371726274490356, -0.00022357702255249023, -0.0002134367823600769, -0.00020329654216766357, -0.00019315630197525024, -0.00018301606178283691, -0.00017287582159042358, -0.00016273558139801025, -0.00015259534120559692, -0.0001424551010131836, -0.00013231486082077026, -0.00012217462062835693, -0.0001120343804359436, -0.00010189414024353027, -9.175390005111694e-05, -8.161365985870361e-05, -7.147341966629028e-05, -6.133317947387695e-05, -5.119293928146362e-05, -4.105269908905029e-05, -3.091245889663696e-05, -2.0772218704223633e-05, -1.0631978511810303e-05, -4.917383193969727e-07, 9.648501873016357e-06, 1.9788742065429688e-05, 2.9928982257843018e-05, 4.006922245025635e-05, 5.020946264266968e-05, 6.034970283508301e-05, 7.048994302749634e-05, 8.063018321990967e-05, 9.0770423412323e-05, 0.00010091066360473633, 0.00011105090379714966, 0.00012119114398956299, 0.00013133138418197632, 0.00014147162437438965, 0.00015161186456680298, 0.0001617521047592163, 0.00017189234495162964, 0.00018203258514404297, 0.0001921728253364563, 0.00020231306552886963, 0.00021245330572128296, 0.0002225935459136963, 0.00023273378610610962, 0.00024287402629852295, 0.0002530142664909363, 0.0002631545066833496, 0.00027329474687576294, 0.00028343498706817627, 0.0002935752272605896, 0.00030371546745300293, 0.00031385570764541626, 0.0003239959478378296, 0.0003341361880302429, 0.00034427642822265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 7.0, 5.0, 5.0, 15.0, 11.0, 10.0, 15.0, 28.0, 19.0, 27.0, 31.0, 38.0, 42.0, 34.0, 40.0, 45.0, 50.0, 52.0, 51.0, 50.0, 46.0, 58.0, 34.0, 42.0, 39.0, 28.0, 34.0, 17.0, 20.0, 22.0, 23.0, 13.0, 14.0, 5.0, 11.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019073486328125, -0.0001837611198425293, -0.0001767873764038086, -0.0001698136329650879, -0.0001628398895263672, -0.00015586614608764648, -0.00014889240264892578, -0.00014191865921020508, -0.00013494491577148438, -0.00012797117233276367, -0.00012099742889404297, -0.00011402368545532227, -0.00010704994201660156, -0.00010007619857788086, -9.310245513916016e-05, -8.612871170043945e-05, -7.915496826171875e-05, -7.218122482299805e-05, -6.520748138427734e-05, -5.823373794555664e-05, -5.125999450683594e-05, -4.4286251068115234e-05, -3.731250762939453e-05, -3.0338764190673828e-05, -2.3365020751953125e-05, -1.6391277313232422e-05, -9.417533874511719e-06, -2.4437904357910156e-06, 4.5299530029296875e-06, 1.150369644165039e-05, 1.8477439880371094e-05, 2.5451183319091797e-05, 3.24249267578125e-05, 3.93986701965332e-05, 4.6372413635253906e-05, 5.334615707397461e-05, 6.031990051269531e-05, 6.729364395141602e-05, 7.426738739013672e-05, 8.124113082885742e-05, 8.821487426757812e-05, 9.518861770629883e-05, 0.00010216236114501953, 0.00010913610458374023, 0.00011610984802246094, 0.00012308359146118164, 0.00013005733489990234, 0.00013703107833862305, 0.00014400482177734375, 0.00015097856521606445, 0.00015795230865478516, 0.00016492605209350586, 0.00017189979553222656, 0.00017887353897094727, 0.00018584728240966797, 0.00019282102584838867, 0.00019979476928710938, 0.00020676851272583008, 0.00021374225616455078, 0.00022071599960327148, 0.0002276897430419922, 0.0002346634864807129, 0.0002416372299194336, 0.0002486109733581543, 0.000255584716796875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 9.0, 7.0, 13.0, 14.0, 29.0, 32.0, 52.0, 66.0, 80.0, 129.0, 188.0, 235.0, 365.0, 562.0, 951.0, 1481.0, 2472.0, 4135.0, 8505.0, 18915.0, 55283.0, 389099.0, 468071.0, 56685.0, 20729.0, 8998.0, 4481.0, 2578.0, 1521.0, 955.0, 561.0, 400.0, 282.0, 218.0, 154.0, 91.0, 42.0, 52.0, 31.0, 30.0, 16.0, 13.0, 7.0, 4.0, 6.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.552436828613281e-05, -3.4341588616371155e-05, -3.31588089466095e-05, -3.197602927684784e-05, -3.079324960708618e-05, -2.9610469937324524e-05, -2.8427690267562866e-05, -2.724491059780121e-05, -2.606213092803955e-05, -2.4879351258277893e-05, -2.3696571588516235e-05, -2.2513791918754578e-05, -2.133101224899292e-05, -2.0148232579231262e-05, -1.8965452909469604e-05, -1.7782673239707947e-05, -1.659989356994629e-05, -1.541711390018463e-05, -1.4234334230422974e-05, -1.3051554560661316e-05, -1.1868774890899658e-05, -1.0685995221138e-05, -9.503215551376343e-06, -8.320435881614685e-06, -7.137656211853027e-06, -5.95487654209137e-06, -4.772096872329712e-06, -3.589317202568054e-06, -2.4065375328063965e-06, -1.2237578630447388e-06, -4.0978193283081055e-08, 1.1418014764785767e-06, 2.3245811462402344e-06, 3.507360816001892e-06, 4.69014048576355e-06, 5.8729201555252075e-06, 7.055699825286865e-06, 8.238479495048523e-06, 9.42125916481018e-06, 1.0604038834571838e-05, 1.1786818504333496e-05, 1.2969598174095154e-05, 1.4152377843856812e-05, 1.533515751361847e-05, 1.6517937183380127e-05, 1.7700716853141785e-05, 1.8883496522903442e-05, 2.00662761926651e-05, 2.1249055862426758e-05, 2.2431835532188416e-05, 2.3614615201950073e-05, 2.479739487171173e-05, 2.598017454147339e-05, 2.7162954211235046e-05, 2.8345733880996704e-05, 2.9528513550758362e-05, 3.071129322052002e-05, 3.189407289028168e-05, 3.3076852560043335e-05, 3.425963222980499e-05, 3.544241189956665e-05, 3.662519156932831e-05, 3.7807971239089966e-05, 3.8990750908851624e-05, 4.017353057861328e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 10.0, 17.0, 10.0, 22.0, 26.0, 29.0, 56.0, 58.0, 80.0, 89.0, 94.0, 57.0, 106.0, 87.0, 68.0, 61.0, 45.0, 21.0, 19.0, 11.0, 7.0, 10.0, 4.0, 5.0, 1.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0531158447265625e-06, -3.94042581319809e-06, -3.827735781669617e-06, -3.715045750141144e-06, -3.602355718612671e-06, -3.489665687084198e-06, -3.376975655555725e-06, -3.264285624027252e-06, -3.1515955924987793e-06, -3.0389055609703064e-06, -2.9262155294418335e-06, -2.8135254979133606e-06, -2.7008354663848877e-06, -2.588145434856415e-06, -2.475455403327942e-06, -2.362765371799469e-06, -2.250075340270996e-06, -2.137385308742523e-06, -2.0246952772140503e-06, -1.9120052456855774e-06, -1.7993152141571045e-06, -1.6866251826286316e-06, -1.5739351511001587e-06, -1.4612451195716858e-06, -1.3485550880432129e-06, -1.23586505651474e-06, -1.123175024986267e-06, -1.0104849934577942e-06, -8.977949619293213e-07, -7.851049304008484e-07, -6.724148988723755e-07, -5.597248673439026e-07, -4.470348358154297e-07, -3.343448042869568e-07, -2.2165477275848389e-07, -1.0896474123001099e-07, 3.725290298461914e-09, 1.1641532182693481e-07, 2.2910535335540771e-07, 3.417953848838806e-07, 4.544854164123535e-07, 5.671754479408264e-07, 6.798654794692993e-07, 7.925555109977722e-07, 9.052455425262451e-07, 1.017935574054718e-06, 1.130625605583191e-06, 1.2433156371116638e-06, 1.3560056686401367e-06, 1.4686957001686096e-06, 1.5813857316970825e-06, 1.6940757632255554e-06, 1.8067657947540283e-06, 1.9194558262825012e-06, 2.032145857810974e-06, 2.144835889339447e-06, 2.25752592086792e-06, 2.370215952396393e-06, 2.4829059839248657e-06, 2.5955960154533386e-06, 2.7082860469818115e-06, 2.8209760785102844e-06, 2.9336661100387573e-06, 3.0463561415672302e-06, 3.159046173095703e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 4.0, 10.0, 2.0, 6.0, 11.0, 26.0, 34.0, 57.0, 119.0, 297.0, 1059.0, 5855.0, 113964.0, 905343.0, 18690.0, 2171.0, 535.0, 176.0, 72.0, 49.0, 26.0, 18.0, 8.0, 10.0, 8.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015211105346679688, -0.0001469086855649948, -0.00014170631766319275, -0.00013650394976139069, -0.00013130158185958862, -0.00012609921395778656, -0.0001208968460559845, -0.00011569447815418243, -0.00011049211025238037, -0.00010528974235057831, -0.00010008737444877625, -9.488500654697418e-05, -8.968263864517212e-05, -8.448027074337006e-05, -7.927790284156799e-05, -7.407553493976593e-05, -6.887316703796387e-05, -6.36707991361618e-05, -5.846843123435974e-05, -5.326606333255768e-05, -4.8063695430755615e-05, -4.286132752895355e-05, -3.765895962715149e-05, -3.2456591725349426e-05, -2.7254223823547363e-05, -2.20518559217453e-05, -1.6849488019943237e-05, -1.1647120118141174e-05, -6.444752216339111e-06, -1.2423843145370483e-06, 3.959983587265015e-06, 9.162351489067078e-06, 1.436471939086914e-05, 1.9567087292671204e-05, 2.4769455194473267e-05, 2.997182309627533e-05, 3.517419099807739e-05, 4.0376558899879456e-05, 4.557892680168152e-05, 5.078129470348358e-05, 5.5983662605285645e-05, 6.118603050708771e-05, 6.638839840888977e-05, 7.159076631069183e-05, 7.67931342124939e-05, 8.199550211429596e-05, 8.719787001609802e-05, 9.240023791790009e-05, 9.760260581970215e-05, 0.00010280497372150421, 0.00010800734162330627, 0.00011320970952510834, 0.0001184120774269104, 0.00012361444532871246, 0.00012881681323051453, 0.0001340191811323166, 0.00013922154903411865, 0.00014442391693592072, 0.00014962628483772278, 0.00015482865273952484, 0.0001600310206413269, 0.00016523338854312897, 0.00017043575644493103, 0.0001756381243467331, 0.00018084049224853516]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 8.0, 3.0, 6.0, 7.0, 7.0, 9.0, 15.0, 25.0, 32.0, 35.0, 36.0, 71.0, 99.0, 148.0, 144.0, 103.0, 67.0, 43.0, 35.0, 24.0, 21.0, 23.0, 15.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2874603271484375e-05, -1.2506730854511261e-05, -1.2138858437538147e-05, -1.1770986020565033e-05, -1.1403113603591919e-05, -1.1035241186618805e-05, -1.0667368769645691e-05, -1.0299496352672577e-05, -9.931623935699463e-06, -9.563751518726349e-06, -9.195879101753235e-06, -8.828006684780121e-06, -8.460134267807007e-06, -8.092261850833893e-06, -7.724389433860779e-06, -7.356517016887665e-06, -6.988644599914551e-06, -6.620772182941437e-06, -6.252899765968323e-06, -5.885027348995209e-06, -5.517154932022095e-06, -5.149282515048981e-06, -4.781410098075867e-06, -4.413537681102753e-06, -4.045665264129639e-06, -3.6777928471565247e-06, -3.3099204301834106e-06, -2.9420480132102966e-06, -2.5741755962371826e-06, -2.2063031792640686e-06, -1.8384307622909546e-06, -1.4705583453178406e-06, -1.1026859283447266e-06, -7.348135113716125e-07, -3.6694109439849854e-07, 9.313225746154785e-10, 3.688037395477295e-07, 7.366761565208435e-07, 1.1045485734939575e-06, 1.4724209904670715e-06, 1.8402934074401855e-06, 2.2081658244132996e-06, 2.5760382413864136e-06, 2.9439106583595276e-06, 3.3117830753326416e-06, 3.6796554923057556e-06, 4.04752790927887e-06, 4.415400326251984e-06, 4.783272743225098e-06, 5.151145160198212e-06, 5.519017577171326e-06, 5.88688999414444e-06, 6.254762411117554e-06, 6.622634828090668e-06, 6.990507245063782e-06, 7.358379662036896e-06, 7.72625207901001e-06, 8.094124495983124e-06, 8.461996912956238e-06, 8.829869329929352e-06, 9.197741746902466e-06, 9.56561416387558e-06, 9.933486580848694e-06, 1.0301358997821808e-05, 1.0669231414794922e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 8.0, 13.0, 10.0, 13.0, 18.0, 15.0, 23.0, 32.0, 53.0, 64.0, 92.0, 120.0, 132.0, 94.0, 77.0, 69.0, 34.0, 30.0, 20.0, 16.0, 14.0, 8.0, 11.0, 12.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00035475450567901134, -0.00033955014077946544, -0.00032434574677608907, -0.00030914138187654316, -0.0002939369878731668, -0.0002787326229736209, -0.000263528258074075, -0.0002483238640706986, -0.0002331194991711527, -0.00021791511971969157, -0.00020271074026823044, -0.00018750637536868453, -0.0001723019959172234, -0.00015709761646576226, -0.00014189323701430112, -0.00012668885756283998, -0.00011148447811137885, -9.628009865991771e-05, -8.107572648441419e-05, -6.587134703295305e-05, -5.0666971219470724e-05, -3.5462595405988395e-05, -2.025821595452726e-05, -5.053843779023737e-06, 1.01505356724374e-05, 2.535491148591973e-05, 4.055928729940206e-05, 5.5763666750863194e-05, 7.096804620232433e-05, 8.617241837782785e-05, 0.00010137679782928899, 0.00011658117000479251, 0.00013178554945625365, 0.00014698992890771478, 0.00016219430835917592, 0.00017739867325872183, 0.00019260305271018296, 0.0002078074321616441, 0.00022301181161310524, 0.00023821619106456637, 0.0002534205559641123, 0.0002686249208636582, 0.00028382931486703455, 0.00029903367976658046, 0.00031423807376995683, 0.00032944243866950274, 0.00034464680356904864, 0.000359851197572425, 0.00037505559157580137, 0.0003902599564753473, 0.00040546435047872365, 0.00042066871537826955, 0.0004358731093816459, 0.0004510774742811918, 0.00046628183918073773, 0.0004814862331841141, 0.0004966905689798295, 0.0005118949338793755, 0.0005270992987789214, 0.0005423037218861282, 0.0005575080867856741, 0.00057271245168522, 0.0005879168165847659, 0.0006031211814843118, 0.0006183256045915186]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 10.0, 12.0, 14.0, 13.0, 15.0, 20.0, 17.0, 18.0, 32.0, 24.0, 36.0, 27.0, 39.0, 38.0, 39.0, 41.0, 34.0, 40.0, 46.0, 53.0, 34.0, 36.0, 26.0, 40.0, 40.0, 31.0, 35.0, 25.0, 23.0, 29.0, 19.0, 15.0, 20.0, 6.0, 4.0, 9.0, 10.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00027677451726049185, -0.0002678056189324707, -0.0002588367206044495, -0.00024986782227642834, -0.00024089892394840717, -0.000231930025620386, -0.00022296114184428006, -0.0002139922435162589, -0.00020502334518823773, -0.00019605444686021656, -0.0001870855485321954, -0.00017811665020417422, -0.00016914776642806828, -0.0001601788681000471, -0.00015120996977202594, -0.00014224107144400477, -0.0001332721731159836, -0.00012430327478796244, -0.00011533437645994127, -0.00010636548540787771, -9.739658707985654e-05, -8.842768875183538e-05, -7.945879769977182e-05, -7.048989937175065e-05, -6.152100104372948e-05, -5.2552102715708315e-05, -4.3583208025665954e-05, -3.461431333562359e-05, -2.5645415007602423e-05, -1.6676516679581255e-05, -7.707621989538893e-06, 1.2612727005034685e-06, 1.0230200132355094e-05, 1.919909664138686e-05, 2.8167993150418624e-05, 3.7136887840460986e-05, 4.6105786168482155e-05, 5.507468449650332e-05, 6.404357554856688e-05, 7.301247387658805e-05, 8.198137220460922e-05, 9.095027053263038e-05, 9.991916886065155e-05, 0.00010888805991271511, 0.00011785695824073628, 0.00012682584929279983, 0.000135794747620821, 0.00014476364594884217, 0.00015373254427686334, 0.0001627014426048845, 0.00017167034093290567, 0.00018063923926092684, 0.000189608137588948, 0.00019857703591696918, 0.00020754591969307512, 0.0002165148180210963, 0.00022548371634911746, 0.00023445261467713863, 0.0002434215130051598, 0.00025239039678126574, 0.0002613592951092869, 0.0002703281934373081, 0.00027929709176532924, 0.0002882659900933504, 0.0002972348884213716]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 10.0, 21.0, 25.0, 33.0, 47.0, 68.0, 112.0, 159.0, 205.0, 305.0, 494.0, 706.0, 1094.0, 1607.0, 2608.0, 3811.0, 5800.0, 9298.0, 14728.0, 23392.0, 38831.0, 67839.0, 125819.0, 221106.0, 225261.0, 129253.0, 69749.0, 40158.0, 24109.0, 15082.0, 9369.0, 6015.0, 3865.0, 2471.0, 1632.0, 1136.0, 776.0, 483.0, 334.0, 214.0, 156.0, 124.0, 80.0, 52.0, 40.0, 19.0, 18.0, 12.0, 11.0, 4.0, 4.0, 2.0, 3.0, 3.0], "bins": [-0.0006251335144042969, -0.0006067603826522827, -0.0005883872509002686, -0.0005700141191482544, -0.0005516409873962402, -0.0005332678556442261, -0.0005148947238922119, -0.0004965215921401978, -0.0004781484603881836, -0.00045977532863616943, -0.0004414021968841553, -0.0004230290651321411, -0.00040465593338012695, -0.0003862828016281128, -0.00036790966987609863, -0.00034953653812408447, -0.0003311634063720703, -0.00031279027462005615, -0.000294417142868042, -0.00027604401111602783, -0.00025767087936401367, -0.0002392977476119995, -0.00022092461585998535, -0.0002025514841079712, -0.00018417835235595703, -0.00016580522060394287, -0.0001474320888519287, -0.00012905895709991455, -0.00011068582534790039, -9.231269359588623e-05, -7.393956184387207e-05, -5.556643009185791e-05, -3.719329833984375e-05, -1.882016658782959e-05, -4.470348358154297e-07, 1.792609691619873e-05, 3.629922866821289e-05, 5.467236042022705e-05, 7.304549217224121e-05, 9.141862392425537e-05, 0.00010979175567626953, 0.0001281648874282837, 0.00014653801918029785, 0.000164911150932312, 0.00018328428268432617, 0.00020165741443634033, 0.0002200305461883545, 0.00023840367794036865, 0.0002567768096923828, 0.00027514994144439697, 0.00029352307319641113, 0.0003118962049484253, 0.00033026933670043945, 0.0003486424684524536, 0.0003670156002044678, 0.00038538873195648193, 0.0004037618637084961, 0.00042213499546051025, 0.0004405081272125244, 0.0004588812589645386, 0.00047725439071655273, 0.0004956275224685669, 0.0005140006542205811, 0.0005323737859725952, 0.0005507469177246094]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 9.0, 5.0, 7.0, 12.0, 16.0, 12.0, 15.0, 25.0, 24.0, 29.0, 42.0, 28.0, 41.0, 39.0, 32.0, 47.0, 44.0, 55.0, 39.0, 55.0, 60.0, 39.0, 33.0, 42.0, 37.0, 28.0, 34.0, 25.0, 24.0, 24.0, 19.0, 18.0, 9.0, 10.0, 5.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002453327178955078, -0.00023745372891426086, -0.00022957473993301392, -0.00022169575095176697, -0.00021381676197052002, -0.00020593777298927307, -0.00019805878400802612, -0.00019017979502677917, -0.00018230080604553223, -0.00017442181706428528, -0.00016654282808303833, -0.00015866383910179138, -0.00015078485012054443, -0.00014290586113929749, -0.00013502687215805054, -0.0001271478831768036, -0.00011926889419555664, -0.00011138990521430969, -0.00010351091623306274, -9.56319272518158e-05, -8.775293827056885e-05, -7.98739492893219e-05, -7.199496030807495e-05, -6.4115971326828e-05, -5.6236982345581055e-05, -4.8357993364334106e-05, -4.047900438308716e-05, -3.260001540184021e-05, -2.4721026420593262e-05, -1.6842037439346313e-05, -8.963048458099365e-06, -1.084059476852417e-06, 6.794929504394531e-06, 1.467391848564148e-05, 2.2552907466888428e-05, 3.0431896448135376e-05, 3.8310885429382324e-05, 4.618987441062927e-05, 5.406886339187622e-05, 6.194785237312317e-05, 6.982684135437012e-05, 7.770583033561707e-05, 8.558481931686401e-05, 9.346380829811096e-05, 0.00010134279727935791, 0.00010922178626060486, 0.0001171007752418518, 0.00012497976422309875, 0.0001328587532043457, 0.00014073774218559265, 0.0001486167311668396, 0.00015649572014808655, 0.0001643747091293335, 0.00017225369811058044, 0.0001801326870918274, 0.00018801167607307434, 0.0001958906650543213, 0.00020376965403556824, 0.00021164864301681519, 0.00021952763199806213, 0.00022740662097930908, 0.00023528560996055603, 0.00024316459894180298, 0.0002510435879230499, 0.0002589225769042969]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 9.0, 10.0, 15.0, 16.0, 35.0, 44.0, 63.0, 67.0, 100.0, 144.0, 227.0, 393.0, 594.0, 1037.0, 2042.0, 3893.0, 7887.0, 16916.0, 39973.0, 105597.0, 316020.0, 351383.0, 120665.0, 44355.0, 18961.0, 8668.0, 4262.0, 2162.0, 1127.0, 659.0, 435.0, 230.0, 144.0, 116.0, 67.0, 56.0, 41.0, 42.0, 24.0, 20.0, 13.0, 4.0, 5.0, 3.0, 6.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0009002685546875, -0.0008712857961654663, -0.0008423030376434326, -0.0008133202791213989, -0.0007843375205993652, -0.0007553547620773315, -0.0007263720035552979, -0.0006973892450332642, -0.0006684064865112305, -0.0006394237279891968, -0.0006104409694671631, -0.0005814582109451294, -0.0005524754524230957, -0.000523492693901062, -0.0004945099353790283, -0.00046552717685699463, -0.00043654441833496094, -0.00040756165981292725, -0.00037857890129089355, -0.00034959614276885986, -0.00032061338424682617, -0.0002916306257247925, -0.0002626478672027588, -0.0002336651086807251, -0.0002046823501586914, -0.00017569959163665771, -0.00014671683311462402, -0.00011773407459259033, -8.875131607055664e-05, -5.976855754852295e-05, -3.078579902648926e-05, -1.8030405044555664e-06, 2.7179718017578125e-05, 5.6162476539611816e-05, 8.514523506164551e-05, 0.0001141279935836792, 0.0001431107521057129, 0.00017209351062774658, 0.00020107626914978027, 0.00023005902767181396, 0.00025904178619384766, 0.00028802454471588135, 0.00031700730323791504, 0.00034599006175994873, 0.0003749728202819824, 0.0004039555788040161, 0.0004329383373260498, 0.0004619210958480835, 0.0004909038543701172, 0.0005198866128921509, 0.0005488693714141846, 0.0005778521299362183, 0.000606834888458252, 0.0006358176469802856, 0.0006648004055023193, 0.000693783164024353, 0.0007227659225463867, 0.0007517486810684204, 0.0007807314395904541, 0.0008097141981124878, 0.0008386969566345215, 0.0008676797151565552, 0.0008966624736785889, 0.0009256452322006226, 0.0009546279907226562]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 5.0, 9.0, 14.0, 9.0, 10.0, 13.0, 12.0, 18.0, 29.0, 38.0, 24.0, 26.0, 27.0, 38.0, 37.0, 53.0, 49.0, 53.0, 42.0, 51.0, 47.0, 52.0, 46.0, 29.0, 44.0, 37.0, 22.0, 27.0, 31.0, 20.0, 12.0, 17.0, 13.0, 7.0, 9.0, 9.0, 4.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00020503997802734375, -0.00019873306155204773, -0.0001924261450767517, -0.0001861192286014557, -0.00017981231212615967, -0.00017350539565086365, -0.00016719847917556763, -0.0001608915627002716, -0.00015458464622497559, -0.00014827772974967957, -0.00014197081327438354, -0.00013566389679908752, -0.0001293569803237915, -0.00012305006384849548, -0.00011674314737319946, -0.00011043623089790344, -0.00010412931442260742, -9.78223979473114e-05, -9.151548147201538e-05, -8.520856499671936e-05, -7.890164852142334e-05, -7.259473204612732e-05, -6.62878155708313e-05, -5.998089909553528e-05, -5.367398262023926e-05, -4.736706614494324e-05, -4.106014966964722e-05, -3.4753233194351196e-05, -2.8446316719055176e-05, -2.2139400243759155e-05, -1.5832483768463135e-05, -9.525567293167114e-06, -3.2186508178710938e-06, 3.0882656574249268e-06, 9.395182132720947e-06, 1.5702098608016968e-05, 2.2009015083312988e-05, 2.831593155860901e-05, 3.462284803390503e-05, 4.092976450920105e-05, 4.723668098449707e-05, 5.354359745979309e-05, 5.985051393508911e-05, 6.615743041038513e-05, 7.246434688568115e-05, 7.877126336097717e-05, 8.50781798362732e-05, 9.138509631156921e-05, 9.769201278686523e-05, 0.00010399892926216125, 0.00011030584573745728, 0.0001166127622127533, 0.00012291967868804932, 0.00012922659516334534, 0.00013553351163864136, 0.00014184042811393738, 0.0001481473445892334, 0.00015445426106452942, 0.00016076117753982544, 0.00016706809401512146, 0.00017337501049041748, 0.0001796819269657135, 0.00018598884344100952, 0.00019229575991630554, 0.00019860267639160156]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 25.0, 24.0, 46.0, 52.0, 117.0, 196.0, 296.0, 777.0, 1553.0, 3859.0, 13227.0, 59534.0, 681061.0, 244086.0, 31190.0, 7341.0, 2734.0, 1259.0, 496.0, 308.0, 133.0, 92.0, 45.0, 33.0, 18.0, 13.0, 11.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.118680953979492e-05, -4.009716212749481e-05, -3.90075147151947e-05, -3.791786730289459e-05, -3.682821989059448e-05, -3.573857247829437e-05, -3.464892506599426e-05, -3.355927765369415e-05, -3.246963024139404e-05, -3.137998282909393e-05, -3.0290335416793823e-05, -2.9200688004493713e-05, -2.8111040592193604e-05, -2.7021393179893494e-05, -2.5931745767593384e-05, -2.4842098355293274e-05, -2.3752450942993164e-05, -2.2662803530693054e-05, -2.1573156118392944e-05, -2.0483508706092834e-05, -1.9393861293792725e-05, -1.8304213881492615e-05, -1.7214566469192505e-05, -1.6124919056892395e-05, -1.5035271644592285e-05, -1.3945624232292175e-05, -1.2855976819992065e-05, -1.1766329407691956e-05, -1.0676681995391846e-05, -9.587034583091736e-06, -8.497387170791626e-06, -7.407739758491516e-06, -6.318092346191406e-06, -5.228444933891296e-06, -4.1387975215911865e-06, -3.0491501092910767e-06, -1.959502696990967e-06, -8.698552846908569e-07, 2.1979212760925293e-07, 1.3094395399093628e-06, 2.3990869522094727e-06, 3.4887343645095825e-06, 4.578381776809692e-06, 5.668029189109802e-06, 6.757676601409912e-06, 7.847324013710022e-06, 8.936971426010132e-06, 1.0026618838310242e-05, 1.1116266250610352e-05, 1.2205913662910461e-05, 1.3295561075210571e-05, 1.4385208487510681e-05, 1.547485589981079e-05, 1.65645033121109e-05, 1.765415072441101e-05, 1.874379813671112e-05, 1.983344554901123e-05, 2.092309296131134e-05, 2.201274037361145e-05, 2.310238778591156e-05, 2.419203519821167e-05, 2.528168261051178e-05, 2.637133002281189e-05, 2.7460977435112e-05, 2.855062484741211e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 2.0, 7.0, 3.0, 18.0, 7.0, 19.0, 27.0, 23.0, 77.0, 62.0, 135.0, 89.0, 176.0, 135.0, 57.0, 50.0, 27.0, 25.0, 10.0, 15.0, 7.0, 10.0, 5.0, 0.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.635883331298828e-06, -3.5427510738372803e-06, -3.4496188163757324e-06, -3.3564865589141846e-06, -3.2633543014526367e-06, -3.170222043991089e-06, -3.077089786529541e-06, -2.983957529067993e-06, -2.8908252716064453e-06, -2.7976930141448975e-06, -2.7045607566833496e-06, -2.6114284992218018e-06, -2.518296241760254e-06, -2.425163984298706e-06, -2.332031726837158e-06, -2.2388994693756104e-06, -2.1457672119140625e-06, -2.0526349544525146e-06, -1.959502696990967e-06, -1.866370439529419e-06, -1.773238182067871e-06, -1.6801059246063232e-06, -1.5869736671447754e-06, -1.4938414096832275e-06, -1.4007091522216797e-06, -1.3075768947601318e-06, -1.214444637298584e-06, -1.1213123798370361e-06, -1.0281801223754883e-06, -9.350478649139404e-07, -8.419156074523926e-07, -7.487833499908447e-07, -6.556510925292969e-07, -5.62518835067749e-07, -4.6938657760620117e-07, -3.762543201446533e-07, -2.8312206268310547e-07, -1.8998980522155762e-07, -9.685754776000977e-08, -3.725290298461914e-09, 8.940696716308594e-08, 1.825392246246338e-07, 2.7567148208618164e-07, 3.688037395477295e-07, 4.6193599700927734e-07, 5.550682544708252e-07, 6.48200511932373e-07, 7.413327693939209e-07, 8.344650268554688e-07, 9.275972843170166e-07, 1.0207295417785645e-06, 1.1138617992401123e-06, 1.2069940567016602e-06, 1.300126314163208e-06, 1.3932585716247559e-06, 1.4863908290863037e-06, 1.5795230865478516e-06, 1.6726553440093994e-06, 1.7657876014709473e-06, 1.8589198589324951e-06, 1.952052116394043e-06, 2.045184373855591e-06, 2.1383166313171387e-06, 2.2314488887786865e-06, 2.3245811462402344e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 11.0, 9.0, 17.0, 20.0, 21.0, 29.0, 70.0, 116.0, 193.0, 326.0, 654.0, 1347.0, 2758.0, 5929.0, 17034.0, 64797.0, 483489.0, 390429.0, 55674.0, 15322.0, 5454.0, 2325.0, 1136.0, 634.0, 342.0, 167.0, 98.0, 49.0, 31.0, 20.0, 21.0, 9.0, 8.0, 2.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.913309097290039e-05, -1.8534250557422638e-05, -1.7935410141944885e-05, -1.7336569726467133e-05, -1.673772931098938e-05, -1.6138888895511627e-05, -1.5540048480033875e-05, -1.4941208064556122e-05, -1.4342367649078369e-05, -1.3743527233600616e-05, -1.3144686818122864e-05, -1.2545846402645111e-05, -1.1947005987167358e-05, -1.1348165571689606e-05, -1.0749325156211853e-05, -1.01504847407341e-05, -9.551644325256348e-06, -8.952803909778595e-06, -8.353963494300842e-06, -7.75512307882309e-06, -7.156282663345337e-06, -6.557442247867584e-06, -5.9586018323898315e-06, -5.359761416912079e-06, -4.760921001434326e-06, -4.1620805859565735e-06, -3.563240170478821e-06, -2.964399755001068e-06, -2.3655593395233154e-06, -1.7667189240455627e-06, -1.16787850856781e-06, -5.690380930900574e-07, 2.9802322387695312e-08, 6.28642737865448e-07, 1.2274831533432007e-06, 1.8263235688209534e-06, 2.425163984298706e-06, 3.0240043997764587e-06, 3.6228448152542114e-06, 4.221685230731964e-06, 4.820525646209717e-06, 5.4193660616874695e-06, 6.018206477165222e-06, 6.617046892642975e-06, 7.2158873081207275e-06, 7.81472772359848e-06, 8.413568139076233e-06, 9.012408554553986e-06, 9.611248970031738e-06, 1.0210089385509491e-05, 1.0808929800987244e-05, 1.1407770216464996e-05, 1.2006610631942749e-05, 1.2605451047420502e-05, 1.3204291462898254e-05, 1.3803131878376007e-05, 1.440197229385376e-05, 1.5000812709331512e-05, 1.5599653124809265e-05, 1.6198493540287018e-05, 1.679733395576477e-05, 1.7396174371242523e-05, 1.7995014786720276e-05, 1.859385520219803e-05, 1.919269561767578e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 7.0, 8.0, 25.0, 49.0, 33.0, 47.0, 72.0, 67.0, 109.0, 94.0, 85.0, 74.0, 67.0, 57.0, 44.0, 31.0, 37.0, 17.0, 14.0, 13.0, 7.0, 4.0, 5.0, 4.0, 3.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.933906555175781e-06, -3.8100406527519226e-06, -3.686174750328064e-06, -3.5623088479042053e-06, -3.4384429454803467e-06, -3.314577043056488e-06, -3.1907111406326294e-06, -3.0668452382087708e-06, -2.942979335784912e-06, -2.8191134333610535e-06, -2.695247530937195e-06, -2.571381628513336e-06, -2.4475157260894775e-06, -2.323649823665619e-06, -2.1997839212417603e-06, -2.0759180188179016e-06, -1.952052116394043e-06, -1.8281862139701843e-06, -1.7043203115463257e-06, -1.580454409122467e-06, -1.4565885066986084e-06, -1.3327226042747498e-06, -1.2088567018508911e-06, -1.0849907994270325e-06, -9.611248970031738e-07, -8.372589945793152e-07, -7.133930921554565e-07, -5.895271897315979e-07, -4.6566128730773926e-07, -3.417953848838806e-07, -2.1792948246002197e-07, -9.406358003616333e-08, 2.9802322387695312e-08, 1.5366822481155396e-07, 2.775341272354126e-07, 4.0140002965927124e-07, 5.252659320831299e-07, 6.491318345069885e-07, 7.729977369308472e-07, 8.968636393547058e-07, 1.0207295417785645e-06, 1.144595444202423e-06, 1.2684613466262817e-06, 1.3923272490501404e-06, 1.516193151473999e-06, 1.6400590538978577e-06, 1.7639249563217163e-06, 1.887790858745575e-06, 2.0116567611694336e-06, 2.1355226635932922e-06, 2.259388566017151e-06, 2.3832544684410095e-06, 2.507120370864868e-06, 2.630986273288727e-06, 2.7548521757125854e-06, 2.878718078136444e-06, 3.0025839805603027e-06, 3.1264498829841614e-06, 3.25031578540802e-06, 3.3741816878318787e-06, 3.4980475902557373e-06, 3.621913492679596e-06, 3.7457793951034546e-06, 3.869645297527313e-06, 3.993511199951172e-06]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 15.0, 9.0, 17.0, 23.0, 32.0, 63.0, 142.0, 155.0, 187.0, 131.0, 76.0, 46.0, 37.0, 19.0, 15.0, 18.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006392365321516991, -0.0006205920944921672, -0.0006019477150402963, -0.0005833032773807645, -0.0005646588397212327, -0.0005460144020617008, -0.0005273700226098299, -0.0005087255849502981, -0.0004900811472907662, -0.00047143673873506486, -0.00045279230107553303, -0.00043414789251983166, -0.0004155034548602998, -0.00039685904630459845, -0.0003782146377488971, -0.00035957020008936524, -0.00034092579153366387, -0.0003222813829779625, -0.00030363694531843066, -0.0002849925367627293, -0.00026634809910319746, -0.0002477036905474961, -0.00022905926743987948, -0.00021041484433226287, -0.00019177042122464627, -0.00017312599811702967, -0.00015448157500941306, -0.00013583715190179646, -0.00011719273607013747, -9.854831296252087e-05, -7.990389713086188e-05, -6.125947402324528e-05, -4.261505091562867e-05, -2.3970629627001472e-05, -5.326208338374272e-06, 1.3318211131263524e-05, 3.196263423888013e-05, 5.060705734649673e-05, 6.925147317815572e-05, 8.789589628577232e-05, 0.00010654031939338893, 0.00012518474250100553, 0.00014382916560862213, 0.00016247358871623874, 0.0001811179972719401, 0.00019976243493147194, 0.00021840684348717332, 0.00023705126659478992, 0.0002556956897024065, 0.0002743400982581079, 0.00029298453591763973, 0.0003116289444733411, 0.00033027338213287294, 0.0003489177906885743, 0.00036756222834810615, 0.0003862066369038075, 0.0004048510454595089, 0.00042349545401521027, 0.0004421398916747421, 0.0004607843002304435, 0.0004794287378899753, 0.0004980731755495071, 0.0005167175550013781, 0.0005353619926609099, 0.0005540064303204417]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 9.0, 7.0, 12.0, 13.0, 11.0, 15.0, 23.0, 15.0, 21.0, 19.0, 27.0, 37.0, 32.0, 31.0, 32.0, 44.0, 41.0, 56.0, 56.0, 39.0, 38.0, 46.0, 45.0, 38.0, 35.0, 47.0, 34.0, 28.0, 19.0, 31.0, 20.0, 20.0, 16.0, 7.0, 13.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002710241242311895, -0.00026337685994803905, -0.00025572956656105816, -0.00024808230227790773, -0.00024043500889092684, -0.00023278773005586118, -0.0002251404512207955, -0.00021749318693764508, -0.0002098458935506642, -0.00020219861471559852, -0.00019455133588053286, -0.0001869040570454672, -0.00017925677821040154, -0.00017160949937533587, -0.0001639622205402702, -0.00015631495625711977, -0.0001486676774220541, -0.00014102039858698845, -0.00013337311975192279, -0.00012572584091685712, -0.00011807856208179146, -0.0001104312832467258, -0.00010278401168761775, -9.513673285255209e-05, -8.748945401748642e-05, -7.984217518242076e-05, -7.21948963473551e-05, -6.454762478824705e-05, -5.690034231520258e-05, -4.9253063480136916e-05, -4.160578828305006e-05, -3.39585094479844e-05, -2.6311230612918735e-05, -1.866395177785307e-05, -1.1016674761776812e-05, -3.369397745700553e-06, 4.27788108936511e-06, 1.1925159924430773e-05, 1.957243512151763e-05, 2.721971395658329e-05, 3.4866992791648954e-05, 4.251427162671462e-05, 5.016155046178028e-05, 5.7808825658867136e-05, 6.545610085595399e-05, 7.310337969101965e-05, 8.075065852608532e-05, 8.839793736115098e-05, 9.604521619621664e-05, 0.0001036924950312823, 0.00011133977386634797, 0.00011898705270141363, 0.0001266343315364793, 0.00013428161037154496, 0.0001419288746546954, 0.00014957616804167628, 0.00015722343232482672, 0.00016487071115989238, 0.00017251798999495804, 0.0001801652688300237, 0.00018781254766508937, 0.00019545982650015503, 0.0002031071053352207, 0.00021075436961837113, 0.00021840166300535202]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 8.0, 9.0, 11.0, 11.0, 21.0, 15.0, 36.0, 49.0, 51.0, 56.0, 104.0, 135.0, 207.0, 339.0, 506.0, 817.0, 1486.0, 3335.0, 13207.0, 4029282.0, 133338.0, 5848.0, 2337.0, 1185.0, 698.0, 397.0, 233.0, 174.0, 118.0, 76.0, 43.0, 44.0, 33.0, 20.0, 16.0, 8.0, 9.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009760856628417969, -0.0009479820728302002, -0.0009198784828186035, -0.0008917748928070068, -0.0008636713027954102, -0.0008355677127838135, -0.0008074641227722168, -0.0007793605327606201, -0.0007512569427490234, -0.0007231533527374268, -0.0006950497627258301, -0.0006669461727142334, -0.0006388425827026367, -0.00061073899269104, -0.0005826354026794434, -0.0005545318126678467, -0.00052642822265625, -0.0004983246326446533, -0.00047022104263305664, -0.00044211745262145996, -0.0004140138626098633, -0.0003859102725982666, -0.0003578066825866699, -0.00032970309257507324, -0.00030159950256347656, -0.0002734959125518799, -0.0002453923225402832, -0.00021728873252868652, -0.00018918514251708984, -0.00016108155250549316, -0.00013297796249389648, -0.0001048743724822998, -7.677078247070312e-05, -4.8667192459106445e-05, -2.0563602447509766e-05, 7.539987564086914e-06, 3.5643577575683594e-05, 6.374716758728027e-05, 9.185075759887695e-05, 0.00011995434761047363, 0.0001480579376220703, 0.000176161527633667, 0.00020426511764526367, 0.00023236870765686035, 0.00026047229766845703, 0.0002885758876800537, 0.0003166794776916504, 0.00034478306770324707, 0.00037288665771484375, 0.00040099024772644043, 0.0004290938377380371, 0.0004571974277496338, 0.00048530101776123047, 0.0005134046077728271, 0.0005415081977844238, 0.0005696117877960205, 0.0005977153778076172, 0.0006258189678192139, 0.0006539225578308105, 0.0006820261478424072, 0.0007101297378540039, 0.0007382333278656006, 0.0007663369178771973, 0.0007944405078887939, 0.0008225440979003906]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 6.0, 7.0, 13.0, 9.0, 18.0, 23.0, 14.0, 13.0, 27.0, 25.0, 31.0, 35.0, 33.0, 40.0, 39.0, 55.0, 45.0, 58.0, 49.0, 36.0, 57.0, 42.0, 44.0, 38.0, 44.0, 36.0, 32.0, 22.0, 16.0, 20.0, 15.0, 12.0, 14.0, 4.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0002428293228149414, -0.00023598037660121918, -0.00022913143038749695, -0.00022228248417377472, -0.0002154335379600525, -0.00020858459174633026, -0.00020173564553260803, -0.0001948866993188858, -0.00018803775310516357, -0.00018118880689144135, -0.00017433986067771912, -0.0001674909144639969, -0.00016064196825027466, -0.00015379302203655243, -0.0001469440758228302, -0.00014009512960910797, -0.00013324618339538574, -0.0001263972371816635, -0.00011954829096794128, -0.00011269934475421906, -0.00010585039854049683, -9.90014523267746e-05, -9.215250611305237e-05, -8.530355989933014e-05, -7.845461368560791e-05, -7.160566747188568e-05, -6.475672125816345e-05, -5.790777504444122e-05, -5.1058828830718994e-05, -4.4209882616996765e-05, -3.7360936403274536e-05, -3.0511990189552307e-05, -2.3663043975830078e-05, -1.681409776210785e-05, -9.96515154838562e-06, -3.116205334663391e-06, 3.732740879058838e-06, 1.0581687092781067e-05, 1.7430633306503296e-05, 2.4279579520225525e-05, 3.1128525733947754e-05, 3.797747194766998e-05, 4.482641816139221e-05, 5.167536437511444e-05, 5.852431058883667e-05, 6.53732568025589e-05, 7.222220301628113e-05, 7.907114923000336e-05, 8.592009544372559e-05, 9.276904165744781e-05, 9.961798787117004e-05, 0.00010646693408489227, 0.0001133158802986145, 0.00012016482651233673, 0.00012701377272605896, 0.0001338627189397812, 0.00014071166515350342, 0.00014756061136722565, 0.00015440955758094788, 0.0001612585037946701, 0.00016810745000839233, 0.00017495639622211456, 0.0001818053424358368, 0.00018865428864955902, 0.00019550323486328125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 11.0, 16.0, 33.0, 80.0, 229.0, 770.0, 2430.0, 10215.0, 3910791.0, 259107.0, 7694.0, 1961.0, 592.0, 194.0, 70.0, 37.0, 16.0, 11.0, 8.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014514923095703125, -0.0013932287693023682, -0.0013349652290344238, -0.0012767016887664795, -0.0012184381484985352, -0.0011601746082305908, -0.0011019110679626465, -0.0010436475276947021, -0.0009853839874267578, -0.0009271204471588135, -0.0008688569068908691, -0.0008105933666229248, -0.0007523298263549805, -0.0006940662860870361, -0.0006358027458190918, -0.0005775392055511475, -0.0005192756652832031, -0.0004610121250152588, -0.00040274858474731445, -0.0003444850444793701, -0.0002862215042114258, -0.00022795796394348145, -0.0001696944236755371, -0.00011143088340759277, -5.316734313964844e-05, 5.0961971282958984e-06, 6.335973739624023e-05, 0.00012162327766418457, 0.0001798868179321289, 0.00023815035820007324, 0.0002964138984680176, 0.0003546774387359619, 0.00041294097900390625, 0.0004712045192718506, 0.0005294680595397949, 0.0005877315998077393, 0.0006459951400756836, 0.0007042586803436279, 0.0007625222206115723, 0.0008207857608795166, 0.0008790493011474609, 0.0009373128414154053, 0.0009955763816833496, 0.001053839921951294, 0.0011121034622192383, 0.0011703670024871826, 0.001228630542755127, 0.0012868940830230713, 0.0013451576232910156, 0.00140342116355896, 0.0014616847038269043, 0.0015199482440948486, 0.001578211784362793, 0.0016364753246307373, 0.0016947388648986816, 0.001753002405166626, 0.0018112659454345703, 0.0018695294857025146, 0.001927793025970459, 0.0019860565662384033, 0.0020443201065063477, 0.002102583646774292, 0.0021608471870422363, 0.0022191107273101807, 0.002277374267578125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 8.0, 4.0, 9.0, 14.0, 11.0, 34.0, 96.0, 358.0, 2673.0, 567.0, 159.0, 55.0, 22.0, 15.0, 6.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016438961029052734, -0.00015977956354618073, -0.0001551695168018341, -0.0001505594700574875, -0.00014594942331314087, -0.00014133937656879425, -0.00013672932982444763, -0.000132119283080101, -0.0001275092363357544, -0.00012289918959140778, -0.00011828914284706116, -0.00011367909610271454, -0.00010906904935836792, -0.0001044590026140213, -9.984895586967468e-05, -9.523890912532806e-05, -9.062886238098145e-05, -8.601881563663483e-05, -8.140876889228821e-05, -7.679872214794159e-05, -7.218867540359497e-05, -6.757862865924835e-05, -6.296858191490173e-05, -5.8358535170555115e-05, -5.3748488426208496e-05, -4.913844168186188e-05, -4.452839493751526e-05, -3.991834819316864e-05, -3.530830144882202e-05, -3.06982547044754e-05, -2.6088207960128784e-05, -2.1478161215782166e-05, -1.6868114471435547e-05, -1.2258067727088928e-05, -7.64802098274231e-06, -3.037974238395691e-06, 1.5720725059509277e-06, 6.182119250297546e-06, 1.0792165994644165e-05, 1.5402212738990784e-05, 2.0012259483337402e-05, 2.462230622768402e-05, 2.923235297203064e-05, 3.384239971637726e-05, 3.845244646072388e-05, 4.3062493205070496e-05, 4.7672539949417114e-05, 5.228258669376373e-05, 5.689263343811035e-05, 6.150268018245697e-05, 6.611272692680359e-05, 7.072277367115021e-05, 7.533282041549683e-05, 7.994286715984344e-05, 8.455291390419006e-05, 8.916296064853668e-05, 9.37730073928833e-05, 9.838305413722992e-05, 0.00010299310088157654, 0.00010760314762592316, 0.00011221319437026978, 0.0001168232411146164, 0.00012143328785896301, 0.00012604333460330963, 0.00013065338134765625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 7.0, 13.0, 8.0, 14.0, 26.0, 25.0, 41.0, 79.0, 107.0, 137.0, 154.0, 114.0, 78.0, 58.0, 39.0, 30.0, 17.0, 22.0, 13.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003063292824663222, -0.00029379501938819885, -0.00028126072720624506, -0.00026872646412812173, -0.00025619217194616795, -0.00024365790886804461, -0.00023112364578992128, -0.00021858936815988272, -0.00020605509052984416, -0.0001935208128998056, -0.00018098653526976705, -0.00016845227219164371, -0.00015591799456160516, -0.0001433837169315666, -0.00013084945385344326, -0.0001183151762234047, -0.00010578089859336615, -9.324662096332759e-05, -8.071235060924664e-05, -6.81780802551657e-05, -5.564380262512714e-05, -4.310952499508858e-05, -3.057525464100763e-05, -1.8040984286926687e-05, -5.506706656888127e-06, 7.027567335171625e-06, 1.9561841327231377e-05, 3.209611531929113e-05, 4.463038931135088e-05, 5.716466694138944e-05, 6.969893729547039e-05, 8.223320764955133e-05, 9.476748527958989e-05, 0.00010730176290962845, 0.0001198360332637094, 0.00013237030361779034, 0.0001449045812478289, 0.00015743885887786746, 0.0001699731219559908, 0.00018250739958602935, 0.0001950416772160679, 0.00020757595484610647, 0.00022011023247614503, 0.00023264449555426836, 0.0002451787586323917, 0.0002577130508143455, 0.0002702473138924688, 0.0002827816060744226, 0.00029531586915254593, 0.00030785013223066926, 0.00032038442441262305, 0.0003329186874907464, 0.00034545297967270017, 0.0003579872427508235, 0.00037052150582894683, 0.00038305576890707016, 0.00039559006108902395, 0.0004081243241671473, 0.00042065861634910107, 0.0004331928794272244, 0.00044572714250534773, 0.0004582614346873015, 0.00047079569776542485, 0.00048332998994737864, 0.000495864253025502]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 0.0, 5.0, 4.0, 9.0, 7.0, 12.0, 19.0, 17.0, 16.0, 19.0, 25.0, 27.0, 32.0, 27.0, 38.0, 41.0, 33.0, 47.0, 25.0, 43.0, 49.0, 47.0, 52.0, 43.0, 45.0, 34.0, 38.0, 31.0, 50.0, 33.0, 24.0, 19.0, 16.0, 13.0, 14.0, 17.0, 8.0, 7.0, 0.0, 5.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.00023552111815661192, -0.00022920728952158242, -0.00022289346088655293, -0.00021657963225152344, -0.00021026580361649394, -0.00020395197498146445, -0.00019763814634643495, -0.00019132431771140546, -0.00018501048907637596, -0.00017869666044134647, -0.00017238283180631697, -0.00016606900317128748, -0.00015975517453625798, -0.0001534413459012285, -0.000147127517266199, -0.0001408136886311695, -0.00013449985999614, -0.0001281860313611105, -0.00012187220272608101, -0.00011555837409105152, -0.00010924454545602202, -0.00010293071682099253, -9.661688818596303e-05, -9.030305955093354e-05, -8.398923091590405e-05, -7.767540228087455e-05, -7.136157364584506e-05, -6.504774501081556e-05, -5.8733916375786066e-05, -5.242008774075657e-05, -4.6106259105727077e-05, -3.979243047069758e-05, -3.347858728375286e-05, -2.7164758648723364e-05, -2.085093001369387e-05, -1.4537101378664374e-05, -8.22327274363488e-06, -1.909444108605385e-06, 4.40438452642411e-06, 1.0718213161453605e-05, 1.70320417964831e-05, 2.3345870431512594e-05, 2.965969906654209e-05, 3.5973527701571584e-05, 4.228735633660108e-05, 4.860118497163057e-05, 5.491501360666007e-05, 6.122884224168956e-05, 6.754267087671906e-05, 7.385649951174855e-05, 8.017032814677805e-05, 8.648415678180754e-05, 9.279798541683704e-05, 9.911181405186653e-05, 0.00010542564268689603, 0.00011173947132192552, 0.00011805329995695502, 0.0001243671285919845, 0.000130680957227014, 0.0001369947858620435, 0.000143308614497073, 0.0001496224431321025, 0.00015593627176713198, 0.00016225010040216148, 0.00016856392903719097]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 15.0, 19.0, 34.0, 36.0, 54.0, 98.0, 117.0, 177.0, 302.0, 449.0, 706.0, 1206.0, 1868.0, 3294.0, 5593.0, 9848.0, 18664.0, 34790.0, 66829.0, 137520.0, 277122.0, 243061.0, 119670.0, 58882.0, 30379.0, 16306.0, 8963.0, 4952.0, 2911.0, 1671.0, 1114.0, 651.0, 461.0, 269.0, 172.0, 100.0, 81.0, 51.0, 34.0, 33.0, 13.0, 13.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.000179290771484375, -0.00017348863184452057, -0.00016768649220466614, -0.0001618843525648117, -0.00015608221292495728, -0.00015028007328510284, -0.0001444779336452484, -0.00013867579400539398, -0.00013287365436553955, -0.00012707151472568512, -0.00012126937508583069, -0.00011546723544597626, -0.00010966509580612183, -0.0001038629561662674, -9.806081652641296e-05, -9.225867688655853e-05, -8.64565372467041e-05, -8.065439760684967e-05, -7.485225796699524e-05, -6.905011832714081e-05, -6.324797868728638e-05, -5.7445839047431946e-05, -5.1643699407577515e-05, -4.5841559767723083e-05, -4.003942012786865e-05, -3.423728048801422e-05, -2.843514084815979e-05, -2.263300120830536e-05, -1.6830861568450928e-05, -1.1028721928596497e-05, -5.2265822887420654e-06, 5.755573511123657e-07, 6.377696990966797e-06, 1.2179836630821228e-05, 1.798197627067566e-05, 2.378411591053009e-05, 2.958625555038452e-05, 3.538839519023895e-05, 4.1190534830093384e-05, 4.6992674469947815e-05, 5.2794814109802246e-05, 5.859695374965668e-05, 6.439909338951111e-05, 7.020123302936554e-05, 7.600337266921997e-05, 8.18055123090744e-05, 8.760765194892883e-05, 9.340979158878326e-05, 9.92119312286377e-05, 0.00010501407086849213, 0.00011081621050834656, 0.00011661835014820099, 0.00012242048978805542, 0.00012822262942790985, 0.00013402476906776428, 0.0001398269087076187, 0.00014562904834747314, 0.00015143118798732758, 0.000157233327627182, 0.00016303546726703644, 0.00016883760690689087, 0.0001746397465467453, 0.00018044188618659973, 0.00018624402582645416, 0.0001920461654663086]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 10.0, 8.0, 13.0, 17.0, 6.0, 12.0, 17.0, 21.0, 31.0, 28.0, 25.0, 35.0, 36.0, 36.0, 35.0, 39.0, 38.0, 51.0, 37.0, 44.0, 43.0, 40.0, 48.0, 36.0, 27.0, 38.0, 29.0, 32.0, 34.0, 34.0, 20.0, 13.0, 8.0, 11.0, 8.0, 7.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0002105236053466797, -0.000204429030418396, -0.0001983344554901123, -0.0001922398805618286, -0.00018614530563354492, -0.00018005073070526123, -0.00017395615577697754, -0.00016786158084869385, -0.00016176700592041016, -0.00015567243099212646, -0.00014957785606384277, -0.00014348328113555908, -0.0001373887062072754, -0.0001312941312789917, -0.000125199556350708, -0.00011910498142242432, -0.00011301040649414062, -0.00010691583156585693, -0.00010082125663757324, -9.472668170928955e-05, -8.863210678100586e-05, -8.253753185272217e-05, -7.644295692443848e-05, -7.034838199615479e-05, -6.42538070678711e-05, -5.81592321395874e-05, -5.206465721130371e-05, -4.597008228302002e-05, -3.987550735473633e-05, -3.378093242645264e-05, -2.7686357498168945e-05, -2.1591782569885254e-05, -1.5497207641601562e-05, -9.402632713317871e-06, -3.3080577850341797e-06, 2.7865171432495117e-06, 8.881092071533203e-06, 1.4975666999816895e-05, 2.1070241928100586e-05, 2.7164816856384277e-05, 3.325939178466797e-05, 3.935396671295166e-05, 4.544854164123535e-05, 5.154311656951904e-05, 5.7637691497802734e-05, 6.373226642608643e-05, 6.982684135437012e-05, 7.592141628265381e-05, 8.20159912109375e-05, 8.811056613922119e-05, 9.420514106750488e-05, 0.00010029971599578857, 0.00010639429092407227, 0.00011248886585235596, 0.00011858344078063965, 0.00012467801570892334, 0.00013077259063720703, 0.00013686716556549072, 0.00014296174049377441, 0.0001490563154220581, 0.0001551508903503418, 0.0001612454652786255, 0.00016734004020690918, 0.00017343461513519287, 0.00017952919006347656]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 10.0, 6.0, 10.0, 16.0, 19.0, 24.0, 42.0, 49.0, 101.0, 140.0, 186.0, 311.0, 444.0, 740.0, 1127.0, 1876.0, 3152.0, 5526.0, 10251.0, 20989.0, 48206.0, 138898.0, 496412.0, 201997.0, 63528.0, 26196.0, 12330.0, 6394.0, 3658.0, 2190.0, 1370.0, 849.0, 520.0, 341.0, 207.0, 149.0, 89.0, 61.0, 43.0, 26.0, 30.0, 18.0, 9.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024890899658203125, -0.0002410411834716797, -0.00023317337036132812, -0.00022530555725097656, -0.000217437744140625, -0.00020956993103027344, -0.00020170211791992188, -0.0001938343048095703, -0.00018596649169921875, -0.0001780986785888672, -0.00017023086547851562, -0.00016236305236816406, -0.0001544952392578125, -0.00014662742614746094, -0.00013875961303710938, -0.0001308917999267578, -0.00012302398681640625, -0.00011515617370605469, -0.00010728836059570312, -9.942054748535156e-05, -9.1552734375e-05, -8.368492126464844e-05, -7.581710815429688e-05, -6.794929504394531e-05, -6.008148193359375e-05, -5.221366882324219e-05, -4.4345855712890625e-05, -3.647804260253906e-05, -2.86102294921875e-05, -2.0742416381835938e-05, -1.2874603271484375e-05, -5.0067901611328125e-06, 2.86102294921875e-06, 1.0728836059570312e-05, 1.8596649169921875e-05, 2.6464462280273438e-05, 3.4332275390625e-05, 4.220008850097656e-05, 5.0067901611328125e-05, 5.793571472167969e-05, 6.580352783203125e-05, 7.367134094238281e-05, 8.153915405273438e-05, 8.940696716308594e-05, 9.72747802734375e-05, 0.00010514259338378906, 0.00011301040649414062, 0.00012087821960449219, 0.00012874603271484375, 0.0001366138458251953, 0.00014448165893554688, 0.00015234947204589844, 0.00016021728515625, 0.00016808509826660156, 0.00017595291137695312, 0.0001838207244873047, 0.00019168853759765625, 0.0001995563507080078, 0.00020742416381835938, 0.00021529197692871094, 0.0002231597900390625, 0.00023102760314941406, 0.00023889541625976562, 0.0002467632293701172, 0.00025463104248046875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 9.0, 5.0, 9.0, 10.0, 11.0, 16.0, 17.0, 20.0, 21.0, 33.0, 26.0, 22.0, 32.0, 25.0, 31.0, 31.0, 37.0, 40.0, 41.0, 60.0, 35.0, 29.0, 34.0, 39.0, 33.0, 40.0, 23.0, 39.0, 27.0, 21.0, 28.0, 17.0, 26.0, 20.0, 17.0, 15.0, 14.0, 7.0, 9.0, 5.0, 4.0, 6.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000118255615234375, -0.00011470075696706772, -0.00011114589869976044, -0.00010759104043245316, -0.00010403618216514587, -0.00010048132389783859, -9.692646563053131e-05, -9.337160736322403e-05, -8.981674909591675e-05, -8.626189082860947e-05, -8.270703256130219e-05, -7.91521742939949e-05, -7.559731602668762e-05, -7.204245775938034e-05, -6.848759949207306e-05, -6.493274122476578e-05, -6.13778829574585e-05, -5.7823024690151215e-05, -5.426816642284393e-05, -5.071330815553665e-05, -4.715844988822937e-05, -4.360359162092209e-05, -4.004873335361481e-05, -3.6493875086307526e-05, -3.2939016819000244e-05, -2.9384158551692963e-05, -2.582930028438568e-05, -2.22744420170784e-05, -1.8719583749771118e-05, -1.5164725482463837e-05, -1.1609867215156555e-05, -8.055008947849274e-06, -4.500150680541992e-06, -9.452924132347107e-07, 2.609565854072571e-06, 6.164424121379852e-06, 9.719282388687134e-06, 1.3274140655994415e-05, 1.6828998923301697e-05, 2.0383857190608978e-05, 2.393871545791626e-05, 2.749357372522354e-05, 3.104843199253082e-05, 3.4603290259838104e-05, 3.8158148527145386e-05, 4.171300679445267e-05, 4.526786506175995e-05, 4.882272332906723e-05, 5.237758159637451e-05, 5.593243986368179e-05, 5.9487298130989075e-05, 6.304215639829636e-05, 6.659701466560364e-05, 7.015187293291092e-05, 7.37067312002182e-05, 7.726158946752548e-05, 8.081644773483276e-05, 8.437130600214005e-05, 8.792616426944733e-05, 9.148102253675461e-05, 9.503588080406189e-05, 9.859073907136917e-05, 0.00010214559733867645, 0.00010570045560598373, 0.00010925531387329102]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 11.0, 10.0, 5.0, 13.0, 16.0, 17.0, 42.0, 72.0, 94.0, 116.0, 141.0, 228.0, 357.0, 538.0, 897.0, 1347.0, 2052.0, 3633.0, 7536.0, 15708.0, 49745.0, 507591.0, 387904.0, 40965.0, 13959.0, 6687.0, 3313.0, 1977.0, 1244.0, 746.0, 470.0, 370.0, 246.0, 158.0, 102.0, 68.0, 46.0, 49.0, 22.0, 26.0, 11.0, 7.0, 6.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7179718017578125e-05, -2.6328489184379578e-05, -2.547726035118103e-05, -2.4626031517982483e-05, -2.3774802684783936e-05, -2.2923573851585388e-05, -2.207234501838684e-05, -2.1221116185188293e-05, -2.0369887351989746e-05, -1.95186585187912e-05, -1.866742968559265e-05, -1.7816200852394104e-05, -1.6964972019195557e-05, -1.611374318599701e-05, -1.5262514352798462e-05, -1.4411285519599915e-05, -1.3560056686401367e-05, -1.270882785320282e-05, -1.1857599020004272e-05, -1.1006370186805725e-05, -1.0155141353607178e-05, -9.30391252040863e-06, -8.452683687210083e-06, -7.601454854011536e-06, -6.750226020812988e-06, -5.898997187614441e-06, -5.0477683544158936e-06, -4.196539521217346e-06, -3.345310688018799e-06, -2.4940818548202515e-06, -1.642853021621704e-06, -7.916241884231567e-07, 5.960464477539063e-08, 9.10833477973938e-07, 1.7620623111724854e-06, 2.6132911443710327e-06, 3.46451997756958e-06, 4.3157488107681274e-06, 5.166977643966675e-06, 6.018206477165222e-06, 6.8694353103637695e-06, 7.720664143562317e-06, 8.571892976760864e-06, 9.423121809959412e-06, 1.0274350643157959e-05, 1.1125579476356506e-05, 1.1976808309555054e-05, 1.2828037142753601e-05, 1.3679265975952148e-05, 1.4530494809150696e-05, 1.5381723642349243e-05, 1.623295247554779e-05, 1.7084181308746338e-05, 1.7935410141944885e-05, 1.8786638975143433e-05, 1.963786780834198e-05, 2.0489096641540527e-05, 2.1340325474739075e-05, 2.2191554307937622e-05, 2.304278314113617e-05, 2.3894011974334717e-05, 2.4745240807533264e-05, 2.559646964073181e-05, 2.644769847393036e-05, 2.7298927307128906e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 5.0, 0.0, 8.0, 15.0, 15.0, 16.0, 18.0, 28.0, 0.0, 25.0, 37.0, 40.0, 60.0, 53.0, 0.0, 71.0, 70.0, 61.0, 63.0, 61.0, 0.0, 53.0, 48.0, 41.0, 50.0, 36.0, 16.0, 0.0, 24.0, 12.0, 18.0, 14.0, 4.0, 0.0, 7.0, 7.0, 4.0, 4.0, 3.0, 4.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.3802200555801392e-06, -1.3299286365509033e-06, -1.2796372175216675e-06, -1.2293457984924316e-06, -1.1790543794631958e-06, -1.12876296043396e-06, -1.0784715414047241e-06, -1.0281801223754883e-06, -9.778887033462524e-07, -9.275972843170166e-07, -8.773058652877808e-07, -8.270144462585449e-07, -7.767230272293091e-07, -7.264316082000732e-07, -6.761401891708374e-07, -6.258487701416016e-07, -5.755573511123657e-07, -5.252659320831299e-07, -4.7497451305389404e-07, -4.246830940246582e-07, -3.7439167499542236e-07, -3.241002559661865e-07, -2.738088369369507e-07, -2.2351741790771484e-07, -1.73225998878479e-07, -1.2293457984924316e-07, -7.264316082000732e-08, -2.2351741790771484e-08, 2.7939677238464355e-08, 7.82310962677002e-08, 1.2852251529693604e-07, 1.7881393432617188e-07, 2.2910535335540771e-07, 2.7939677238464355e-07, 3.296881914138794e-07, 3.7997961044311523e-07, 4.302710294723511e-07, 4.805624485015869e-07, 5.308538675308228e-07, 5.811452865600586e-07, 6.314367055892944e-07, 6.817281246185303e-07, 7.320195436477661e-07, 7.82310962677002e-07, 8.326023817062378e-07, 8.828938007354736e-07, 9.331852197647095e-07, 9.834766387939453e-07, 1.0337680578231812e-06, 1.084059476852417e-06, 1.1343508958816528e-06, 1.1846423149108887e-06, 1.2349337339401245e-06, 1.2852251529693604e-06, 1.3355165719985962e-06, 1.385807991027832e-06, 1.4360994100570679e-06, 1.4863908290863037e-06, 1.5366822481155396e-06, 1.5869736671447754e-06, 1.6372650861740112e-06, 1.687556505203247e-06, 1.737847924232483e-06, 1.7881393432617188e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 2.0, 8.0, 12.0, 10.0, 19.0, 19.0, 28.0, 48.0, 53.0, 131.0, 208.0, 450.0, 979.0, 2461.0, 7509.0, 27428.0, 269343.0, 679079.0, 44863.0, 10265.0, 3236.0, 1250.0, 517.0, 273.0, 112.0, 70.0, 42.0, 29.0, 19.0, 24.0, 9.0, 7.0, 5.0, 6.0, 5.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.7816505432128906e-05, -5.6170858442783356e-05, -5.4525211453437805e-05, -5.2879564464092255e-05, -5.1233917474746704e-05, -4.9588270485401154e-05, -4.79426234960556e-05, -4.629697650671005e-05, -4.46513295173645e-05, -4.300568252801895e-05, -4.13600355386734e-05, -3.971438854932785e-05, -3.80687415599823e-05, -3.642309457063675e-05, -3.47774475812912e-05, -3.313180059194565e-05, -3.14861536026001e-05, -2.9840506613254547e-05, -2.8194859623908997e-05, -2.6549212634563446e-05, -2.4903565645217896e-05, -2.3257918655872345e-05, -2.1612271666526794e-05, -1.9966624677181244e-05, -1.8320977687835693e-05, -1.6675330698490143e-05, -1.5029683709144592e-05, -1.3384036719799042e-05, -1.1738389730453491e-05, -1.009274274110794e-05, -8.44709575176239e-06, -6.80144876241684e-06, -5.155801773071289e-06, -3.5101547837257385e-06, -1.864507794380188e-06, -2.1886080503463745e-07, 1.426786184310913e-06, 3.0724331736564636e-06, 4.718080163002014e-06, 6.363727152347565e-06, 8.009374141693115e-06, 9.655021131038666e-06, 1.1300668120384216e-05, 1.2946315109729767e-05, 1.4591962099075317e-05, 1.6237609088420868e-05, 1.788325607776642e-05, 1.952890306711197e-05, 2.117455005645752e-05, 2.282019704580307e-05, 2.446584403514862e-05, 2.611149102449417e-05, 2.775713801383972e-05, 2.9402785003185272e-05, 3.104843199253082e-05, 3.269407898187637e-05, 3.4339725971221924e-05, 3.5985372960567474e-05, 3.7631019949913025e-05, 3.9276666939258575e-05, 4.0922313928604126e-05, 4.2567960917949677e-05, 4.421360790729523e-05, 4.585925489664078e-05, 4.750490188598633e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 7.0, 6.0, 9.0, 9.0, 9.0, 13.0, 20.0, 14.0, 23.0, 35.0, 47.0, 51.0, 76.0, 90.0, 125.0, 117.0, 71.0, 67.0, 46.0, 25.0, 32.0, 14.0, 17.0, 9.0, 9.0, 8.0, 9.0, 8.0, 8.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.781650543212891e-06, -5.602836608886719e-06, -5.424022674560547e-06, -5.245208740234375e-06, -5.066394805908203e-06, -4.887580871582031e-06, -4.708766937255859e-06, -4.5299530029296875e-06, -4.351139068603516e-06, -4.172325134277344e-06, -3.993511199951172e-06, -3.814697265625e-06, -3.635883331298828e-06, -3.4570693969726562e-06, -3.2782554626464844e-06, -3.0994415283203125e-06, -2.9206275939941406e-06, -2.7418136596679688e-06, -2.562999725341797e-06, -2.384185791015625e-06, -2.205371856689453e-06, -2.0265579223632812e-06, -1.8477439880371094e-06, -1.6689300537109375e-06, -1.4901161193847656e-06, -1.3113021850585938e-06, -1.1324882507324219e-06, -9.5367431640625e-07, -7.748603820800781e-07, -5.960464477539062e-07, -4.172325134277344e-07, -2.384185791015625e-07, -5.960464477539063e-08, 1.1920928955078125e-07, 2.980232238769531e-07, 4.76837158203125e-07, 6.556510925292969e-07, 8.344650268554688e-07, 1.0132789611816406e-06, 1.1920928955078125e-06, 1.3709068298339844e-06, 1.5497207641601562e-06, 1.7285346984863281e-06, 1.9073486328125e-06, 2.086162567138672e-06, 2.2649765014648438e-06, 2.4437904357910156e-06, 2.6226043701171875e-06, 2.8014183044433594e-06, 2.9802322387695312e-06, 3.159046173095703e-06, 3.337860107421875e-06, 3.516674041748047e-06, 3.6954879760742188e-06, 3.874301910400391e-06, 4.0531158447265625e-06, 4.231929779052734e-06, 4.410743713378906e-06, 4.589557647705078e-06, 4.76837158203125e-06, 4.947185516357422e-06, 5.125999450683594e-06, 5.304813385009766e-06, 5.4836273193359375e-06, 5.662441253662109e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 4.0, 12.0, 16.0, 27.0, 30.0, 28.0, 77.0, 86.0, 142.0, 168.0, 108.0, 82.0, 59.0, 55.0, 30.0, 23.0, 16.0, 9.0, 10.0, 8.0, 1.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030368362786248326, -0.00029128786991350353, -0.0002788921119645238, -0.0002664963249117136, -0.00025410056696273386, -0.00024170480901375413, -0.0002293090510647744, -0.00021691329311579466, -0.0002045175206148997, -0.00019212176266591996, -0.000179725990165025, -0.00016733023221604526, -0.00015493447426706553, -0.00014253870176617056, -0.00013014294381719083, -0.00011774717859225348, -0.00010535141336731613, -9.295564814237878e-05, -8.055988291744143e-05, -6.816412496846169e-05, -5.576835974352434e-05, -4.337259451858699e-05, -3.097683656960726e-05, -1.8581071344669908e-05, -6.185306119732559e-06, 6.210457286215387e-06, 1.8606220692163333e-05, 3.1001982279121876e-05, 4.3397747504059225e-05, 5.5793512728996575e-05, 6.818927067797631e-05, 8.058503590291366e-05, 9.298080112785101e-05, 0.00010537656635278836, 0.00011777233157772571, 0.00013016808952670544, 0.0001425638620276004, 0.00015495961997658014, 0.00016735537792555988, 0.00017975113587453961, 0.00019214690837543458, 0.0002045426663244143, 0.00021693843882530928, 0.000229334196774289, 0.00024172995472326875, 0.00025412574177607894, 0.0002665214706212282, 0.0002789172576740384, 0.00029131301562301815, 0.0003037087735719979, 0.0003161045315209776, 0.00032850028946995735, 0.00034089607652276754, 0.0003532918344717473, 0.000365687592420727, 0.00037808335036970675, 0.0003904791083186865, 0.0004028748662676662, 0.00041527062421664596, 0.00042766641126945615, 0.0004400621692184359, 0.0004524579271674156, 0.00046485368511639535, 0.0004772494430653751, 0.0004896452301181853]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 4.0, 8.0, 2.0, 10.0, 18.0, 15.0, 13.0, 20.0, 25.0, 17.0, 26.0, 33.0, 30.0, 25.0, 47.0, 36.0, 38.0, 35.0, 39.0, 44.0, 48.0, 54.0, 39.0, 47.0, 42.0, 31.0, 38.0, 41.0, 28.0, 34.0, 17.0, 16.0, 14.0, 17.0, 18.0, 9.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.00022094410087447613, -0.00021504303731489927, -0.00020914195920340717, -0.0002032408956438303, -0.00019733983208425343, -0.00019143876852467656, -0.00018553769041318446, -0.0001796366268536076, -0.0001737355487421155, -0.00016783448518253863, -0.00016193340707104653, -0.00015603234351146966, -0.0001501312799518928, -0.0001442302018404007, -0.00013832913828082383, -0.00013242807472124696, -0.0001265270111616701, -0.0001206259403261356, -0.00011472487676655874, -0.00010882380593102425, -0.00010292274237144738, -9.70216715359129e-05, -9.112060070037842e-05, -8.521953714080155e-05, -7.931846630526707e-05, -7.341739546973258e-05, -6.751633191015571e-05, -6.161526107462123e-05, -5.5714193877065554e-05, -4.981312667950988e-05, -4.3912055843975395e-05, -3.801098864641972e-05, -3.210993600077927e-05, -2.6208868803223595e-05, -2.0307799786678515e-05, -1.4406730770133436e-05, -8.50566357257776e-06, -2.6045963750220835e-06, 3.2964744605123997e-06, 9.197541658068076e-06, 1.5098608855623752e-05, 2.0999676053179428e-05, 2.6900745069724508e-05, 3.280181408626959e-05, 3.870288128382526e-05, 4.460394848138094e-05, 5.050501931691542e-05, 5.64060865144711e-05, 6.230715371202677e-05, 6.820822454756126e-05, 7.410928810713813e-05, 8.001035894267261e-05, 8.591142250224948e-05, 9.181249333778396e-05, 9.771356417331845e-05, 0.00010361462773289531, 0.0001095156985684298, 0.00011541676940396428, 0.00012131783296354115, 0.00012721889652311802, 0.00013311997463461012, 0.00013902103819418699, 0.00014492211630567908, 0.00015082317986525595, 0.00015672424342483282]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 10.0, 10.0, 10.0, 16.0, 20.0, 30.0, 59.0, 78.0, 139.0, 218.0, 323.0, 466.0, 736.0, 1265.0, 2117.0, 3531.0, 6154.0, 11354.0, 20764.0, 39711.0, 78166.0, 169433.0, 302385.0, 210062.0, 97409.0, 47919.0, 24936.0, 13490.0, 7324.0, 4152.0, 2392.0, 1417.0, 905.0, 561.0, 310.0, 220.0, 155.0, 84.0, 55.0, 50.0, 32.0, 28.0, 17.0, 12.0, 7.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00044155120849609375, -0.00042613595724105835, -0.00041072070598602295, -0.00039530545473098755, -0.00037989020347595215, -0.00036447495222091675, -0.00034905970096588135, -0.00033364444971084595, -0.00031822919845581055, -0.00030281394720077515, -0.00028739869594573975, -0.00027198344469070435, -0.00025656819343566895, -0.00024115294218063354, -0.00022573769092559814, -0.00021032243967056274, -0.00019490718841552734, -0.00017949193716049194, -0.00016407668590545654, -0.00014866143465042114, -0.00013324618339538574, -0.00011783093214035034, -0.00010241568088531494, -8.700042963027954e-05, -7.158517837524414e-05, -5.616992712020874e-05, -4.075467586517334e-05, -2.533942461013794e-05, -9.924173355102539e-06, 5.491077899932861e-06, 2.0906329154968262e-05, 3.632158041000366e-05, 5.173683166503906e-05, 6.715208292007446e-05, 8.256733417510986e-05, 9.798258543014526e-05, 0.00011339783668518066, 0.00012881308794021606, 0.00014422833919525146, 0.00015964359045028687, 0.00017505884170532227, 0.00019047409296035767, 0.00020588934421539307, 0.00022130459547042847, 0.00023671984672546387, 0.00025213509798049927, 0.00026755034923553467, 0.00028296560049057007, 0.00029838085174560547, 0.00031379610300064087, 0.00032921135425567627, 0.00034462660551071167, 0.00036004185676574707, 0.00037545710802078247, 0.00039087235927581787, 0.00040628761053085327, 0.00042170286178588867, 0.00043711811304092407, 0.00045253336429595947, 0.0004679486155509949, 0.0004833638668060303, 0.0004987791180610657, 0.0005141943693161011, 0.0005296096205711365, 0.0005450248718261719]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 11.0, 4.0, 9.0, 16.0, 15.0, 18.0, 18.0, 22.0, 31.0, 31.0, 39.0, 37.0, 35.0, 52.0, 45.0, 50.0, 54.0, 50.0, 59.0, 45.0, 44.0, 44.0, 35.0, 37.0, 32.0, 29.0, 28.0, 16.0, 23.0, 23.0, 13.0, 11.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0002129077911376953, -0.0002072993665933609, -0.0002016909420490265, -0.00019608251750469208, -0.00019047409296035767, -0.00018486566841602325, -0.00017925724387168884, -0.00017364881932735443, -0.00016804039478302002, -0.0001624319702386856, -0.0001568235456943512, -0.00015121512115001678, -0.00014560669660568237, -0.00013999827206134796, -0.00013438984751701355, -0.00012878142297267914, -0.00012317299842834473, -0.00011756457388401031, -0.0001119561493396759, -0.00010634772479534149, -0.00010073930025100708, -9.513087570667267e-05, -8.952245116233826e-05, -8.391402661800385e-05, -7.830560207366943e-05, -7.269717752933502e-05, -6.708875298500061e-05, -6.14803284406662e-05, -5.587190389633179e-05, -5.0263479351997375e-05, -4.4655054807662964e-05, -3.904663026332855e-05, -3.343820571899414e-05, -2.782978117465973e-05, -2.2221356630325317e-05, -1.6612932085990906e-05, -1.1004507541656494e-05, -5.3960829973220825e-06, 2.123415470123291e-07, 5.820766091346741e-06, 1.1429190635681152e-05, 1.7037615180015564e-05, 2.2646039724349976e-05, 2.8254464268684387e-05, 3.38628888130188e-05, 3.947131335735321e-05, 4.507973790168762e-05, 5.0688162446022034e-05, 5.6296586990356445e-05, 6.190501153469086e-05, 6.751343607902527e-05, 7.312186062335968e-05, 7.873028516769409e-05, 8.43387097120285e-05, 8.994713425636292e-05, 9.555555880069733e-05, 0.00010116398334503174, 0.00010677240788936615, 0.00011238083243370056, 0.00011798925697803497, 0.00012359768152236938, 0.0001292061060667038, 0.0001348145306110382, 0.00014042295515537262, 0.00014603137969970703]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 15.0, 7.0, 14.0, 22.0, 41.0, 49.0, 102.0, 129.0, 239.0, 479.0, 964.0, 2035.0, 4930.0, 12287.0, 35732.0, 124833.0, 444619.0, 304505.0, 78060.0, 24017.0, 8741.0, 3557.0, 1508.0, 716.0, 384.0, 191.0, 117.0, 85.0, 50.0, 38.0, 21.0, 19.0, 16.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008115768432617188, -0.0007868483662605286, -0.0007621198892593384, -0.0007373914122581482, -0.000712662935256958, -0.0006879344582557678, -0.0006632059812545776, -0.0006384775042533875, -0.0006137490272521973, -0.0005890205502510071, -0.0005642920732498169, -0.0005395635962486267, -0.0005148351192474365, -0.0004901066422462463, -0.00046537816524505615, -0.00044064968824386597, -0.0004159212112426758, -0.0003911927342414856, -0.0003664642572402954, -0.0003417357802391052, -0.00031700730323791504, -0.00029227882623672485, -0.00026755034923553467, -0.00024282187223434448, -0.0002180933952331543, -0.0001933649182319641, -0.00016863644123077393, -0.00014390796422958374, -0.00011917948722839355, -9.445101022720337e-05, -6.972253322601318e-05, -4.4994056224823e-05, -2.0265579223632812e-05, 4.462897777557373e-06, 2.919137477874756e-05, 5.3919851779937744e-05, 7.864832878112793e-05, 0.00010337680578231812, 0.0001281052827835083, 0.00015283375978469849, 0.00017756223678588867, 0.00020229071378707886, 0.00022701919078826904, 0.00025174766778945923, 0.0002764761447906494, 0.0003012046217918396, 0.0003259330987930298, 0.00035066157579421997, 0.00037539005279541016, 0.00040011852979660034, 0.00042484700679779053, 0.0004495754837989807, 0.0004743039608001709, 0.0004990324378013611, 0.0005237609148025513, 0.0005484893918037415, 0.0005732178688049316, 0.0005979463458061218, 0.000622674822807312, 0.0006474032998085022, 0.0006721317768096924, 0.0006968602538108826, 0.0007215887308120728, 0.0007463172078132629, 0.0007710456848144531]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 2.0, 4.0, 11.0, 12.0, 11.0, 9.0, 24.0, 16.0, 21.0, 23.0, 34.0, 37.0, 34.0, 46.0, 40.0, 51.0, 52.0, 46.0, 42.0, 47.0, 51.0, 49.0, 46.0, 64.0, 31.0, 31.0, 40.0, 26.0, 17.0, 17.0, 15.0, 10.0, 6.0, 8.0, 7.0, 4.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013124942779541016, -0.00012680701911449432, -0.0001223646104335785, -0.00011792220175266266, -0.00011347979307174683, -0.000109037384390831, -0.00010459497570991516, -0.00010015256702899933, -9.57101583480835e-05, -9.126774966716766e-05, -8.682534098625183e-05, -8.2382932305336e-05, -7.794052362442017e-05, -7.349811494350433e-05, -6.90557062625885e-05, -6.461329758167267e-05, -6.0170888900756836e-05, -5.5728480219841003e-05, -5.128607153892517e-05, -4.684366285800934e-05, -4.2401254177093506e-05, -3.795884549617767e-05, -3.351643681526184e-05, -2.9074028134346008e-05, -2.4631619453430176e-05, -2.0189210772514343e-05, -1.574680209159851e-05, -1.1304393410682678e-05, -6.861984729766846e-06, -2.419576048851013e-06, 2.0228326320648193e-06, 6.465241312980652e-06, 1.0907649993896484e-05, 1.5350058674812317e-05, 1.979246735572815e-05, 2.4234876036643982e-05, 2.8677284717559814e-05, 3.311969339847565e-05, 3.756210207939148e-05, 4.200451076030731e-05, 4.6446919441223145e-05, 5.088932812213898e-05, 5.533173680305481e-05, 5.977414548397064e-05, 6.421655416488647e-05, 6.865896284580231e-05, 7.310137152671814e-05, 7.754378020763397e-05, 8.19861888885498e-05, 8.642859756946564e-05, 9.087100625038147e-05, 9.53134149312973e-05, 9.975582361221313e-05, 0.00010419823229312897, 0.0001086406409740448, 0.00011308304965496063, 0.00011752545833587646, 0.0001219678670167923, 0.00012641027569770813, 0.00013085268437862396, 0.0001352950930595398, 0.00013973750174045563, 0.00014417991042137146, 0.0001486223191022873, 0.00015306472778320312]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 9.0, 17.0, 20.0, 33.0, 36.0, 56.0, 109.0, 135.0, 227.0, 334.0, 667.0, 1139.0, 1923.0, 4426.0, 11480.0, 37776.0, 139763.0, 651708.0, 149401.0, 28694.0, 11469.0, 4498.0, 1904.0, 1124.0, 659.0, 362.0, 186.0, 145.0, 92.0, 49.0, 33.0, 25.0, 19.0, 7.0, 10.0, 10.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.537799835205078e-05, -1.4978460967540741e-05, -1.45789235830307e-05, -1.417938619852066e-05, -1.377984881401062e-05, -1.338031142950058e-05, -1.298077404499054e-05, -1.25812366604805e-05, -1.2181699275970459e-05, -1.1782161891460419e-05, -1.1382624506950378e-05, -1.0983087122440338e-05, -1.0583549737930298e-05, -1.0184012353420258e-05, -9.784474968910217e-06, -9.384937584400177e-06, -8.985400199890137e-06, -8.585862815380096e-06, -8.186325430870056e-06, -7.786788046360016e-06, -7.387250661849976e-06, -6.987713277339935e-06, -6.588175892829895e-06, -6.188638508319855e-06, -5.7891011238098145e-06, -5.389563739299774e-06, -4.990026354789734e-06, -4.590488970279694e-06, -4.190951585769653e-06, -3.791414201259613e-06, -3.3918768167495728e-06, -2.9923394322395325e-06, -2.592802047729492e-06, -2.193264663219452e-06, -1.7937272787094116e-06, -1.3941898941993713e-06, -9.94652509689331e-07, -5.951151251792908e-07, -1.955777406692505e-07, 2.039596438407898e-07, 6.034970283508301e-07, 1.0030344128608704e-06, 1.4025717973709106e-06, 1.802109181880951e-06, 2.201646566390991e-06, 2.6011839509010315e-06, 3.0007213354110718e-06, 3.400258719921112e-06, 3.7997961044311523e-06, 4.199333488941193e-06, 4.598870873451233e-06, 4.998408257961273e-06, 5.3979456424713135e-06, 5.797483026981354e-06, 6.197020411491394e-06, 6.596557796001434e-06, 6.996095180511475e-06, 7.395632565021515e-06, 7.795169949531555e-06, 8.194707334041595e-06, 8.594244718551636e-06, 8.993782103061676e-06, 9.393319487571716e-06, 9.792856872081757e-06, 1.0192394256591797e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 3.0, 7.0, 0.0, 4.0, 10.0, 7.0, 12.0, 26.0, 0.0, 29.0, 33.0, 73.0, 107.0, 123.0, 0.0, 143.0, 145.0, 91.0, 63.0, 34.0, 0.0, 29.0, 19.0, 18.0, 10.0, 6.0, 0.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.940696716308594e-07, -8.44709575176239e-07, -7.953494787216187e-07, -7.459893822669983e-07, -6.966292858123779e-07, -6.472691893577576e-07, -5.979090929031372e-07, -5.485489964485168e-07, -4.991888999938965e-07, -4.498288035392761e-07, -4.0046870708465576e-07, -3.511086106300354e-07, -3.0174851417541504e-07, -2.523884177207947e-07, -2.0302832126617432e-07, -1.5366822481155396e-07, -1.043081283569336e-07, -5.494803190231323e-08, -5.587935447692871e-09, 4.377216100692749e-08, 9.313225746154785e-08, 1.424923539161682e-07, 1.9185245037078857e-07, 2.4121254682540894e-07, 2.905726432800293e-07, 3.3993273973464966e-07, 3.8929283618927e-07, 4.386529326438904e-07, 4.880130290985107e-07, 5.373731255531311e-07, 5.867332220077515e-07, 6.360933184623718e-07, 6.854534149169922e-07, 7.348135113716125e-07, 7.841736078262329e-07, 8.335337042808533e-07, 8.828938007354736e-07, 9.32253897190094e-07, 9.816139936447144e-07, 1.0309740900993347e-06, 1.080334186553955e-06, 1.1296942830085754e-06, 1.1790543794631958e-06, 1.2284144759178162e-06, 1.2777745723724365e-06, 1.3271346688270569e-06, 1.3764947652816772e-06, 1.4258548617362976e-06, 1.475214958190918e-06, 1.5245750546455383e-06, 1.5739351511001587e-06, 1.623295247554779e-06, 1.6726553440093994e-06, 1.7220154404640198e-06, 1.7713755369186401e-06, 1.8207356333732605e-06, 1.8700957298278809e-06, 1.9194558262825012e-06, 1.9688159227371216e-06, 2.018176019191742e-06, 2.0675361156463623e-06, 2.1168962121009827e-06, 2.166256308555603e-06, 2.2156164050102234e-06, 2.2649765014648438e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 9.0, 20.0, 19.0, 43.0, 55.0, 66.0, 107.0, 189.0, 250.0, 539.0, 1056.0, 1384.0, 3742.0, 8522.0, 13728.0, 44711.0, 93586.0, 431039.0, 323586.0, 67178.0, 34432.0, 13262.0, 4719.0, 3048.0, 1471.0, 628.0, 443.0, 181.0, 183.0, 104.0, 56.0, 45.0, 49.0, 25.0, 20.0, 16.0, 7.0, 7.0, 10.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.258487701416016e-06, -6.041489541530609e-06, -5.824491381645203e-06, -5.607493221759796e-06, -5.39049506187439e-06, -5.173496901988983e-06, -4.956498742103577e-06, -4.73950058221817e-06, -4.522502422332764e-06, -4.305504262447357e-06, -4.088506102561951e-06, -3.871507942676544e-06, -3.6545097827911377e-06, -3.437511622905731e-06, -3.2205134630203247e-06, -3.0035153031349182e-06, -2.7865171432495117e-06, -2.5695189833641052e-06, -2.3525208234786987e-06, -2.1355226635932922e-06, -1.9185245037078857e-06, -1.7015263438224792e-06, -1.4845281839370728e-06, -1.2675300240516663e-06, -1.0505318641662598e-06, -8.335337042808533e-07, -6.165355443954468e-07, -3.995373845100403e-07, -1.825392246246338e-07, 3.4458935260772705e-08, 2.514570951461792e-07, 4.684552550315857e-07, 6.854534149169922e-07, 9.024515748023987e-07, 1.1194497346878052e-06, 1.3364478945732117e-06, 1.5534460544586182e-06, 1.7704442143440247e-06, 1.987442374229431e-06, 2.2044405341148376e-06, 2.421438694000244e-06, 2.6384368538856506e-06, 2.855435013771057e-06, 3.0724331736564636e-06, 3.28943133354187e-06, 3.5064294934272766e-06, 3.723427653312683e-06, 3.94042581319809e-06, 4.157423973083496e-06, 4.374422132968903e-06, 4.591420292854309e-06, 4.8084184527397156e-06, 5.025416612625122e-06, 5.2424147725105286e-06, 5.459412932395935e-06, 5.6764110922813416e-06, 5.893409252166748e-06, 6.1104074120521545e-06, 6.327405571937561e-06, 6.5444037318229675e-06, 6.761401891708374e-06, 6.9784000515937805e-06, 7.195398211479187e-06, 7.4123963713645935e-06, 7.62939453125e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 10.0, 0.0, 6.0, 8.0, 8.0, 15.0, 0.0, 18.0, 14.0, 32.0, 24.0, 0.0, 29.0, 46.0, 43.0, 75.0, 0.0, 78.0, 73.0, 71.0, 57.0, 0.0, 65.0, 61.0, 58.0, 45.0, 0.0, 42.0, 40.0, 26.0, 12.0, 0.0, 16.0, 17.0, 8.0, 6.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-06, -1.5022233128547668e-06, -1.4547258615493774e-06, -1.407228410243988e-06, -1.3597309589385986e-06, -1.3122335076332092e-06, -1.2647360563278198e-06, -1.2172386050224304e-06, -1.169741153717041e-06, -1.1222437024116516e-06, -1.0747462511062622e-06, -1.0272487998008728e-06, -9.797513484954834e-07, -9.32253897190094e-07, -8.847564458847046e-07, -8.372589945793152e-07, -7.897615432739258e-07, -7.422640919685364e-07, -6.94766640663147e-07, -6.472691893577576e-07, -5.997717380523682e-07, -5.522742867469788e-07, -5.047768354415894e-07, -4.5727938413619995e-07, -4.0978193283081055e-07, -3.6228448152542114e-07, -3.1478703022003174e-07, -2.6728957891464233e-07, -2.1979212760925293e-07, -1.7229467630386353e-07, -1.2479722499847412e-07, -7.729977369308472e-08, -2.9802322387695312e-08, 1.7695128917694092e-08, 6.51925802230835e-08, 1.126900315284729e-07, 1.601874828338623e-07, 2.076849341392517e-07, 2.551823854446411e-07, 3.026798367500305e-07, 3.501772880554199e-07, 3.976747393608093e-07, 4.4517219066619873e-07, 4.926696419715881e-07, 5.401670932769775e-07, 5.876645445823669e-07, 6.351619958877563e-07, 6.826594471931458e-07, 7.301568984985352e-07, 7.776543498039246e-07, 8.25151801109314e-07, 8.726492524147034e-07, 9.201467037200928e-07, 9.676441550254822e-07, 1.0151416063308716e-06, 1.062639057636261e-06, 1.1101365089416504e-06, 1.1576339602470398e-06, 1.2051314115524292e-06, 1.2526288628578186e-06, 1.300126314163208e-06, 1.3476237654685974e-06, 1.3951212167739868e-06, 1.4426186680793762e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 5.0, 8.0, 11.0, 12.0, 11.0, 20.0, 23.0, 33.0, 49.0, 82.0, 97.0, 113.0, 137.0, 123.0, 77.0, 56.0, 32.0, 26.0, 23.0, 15.0, 10.0, 9.0, 7.0, 9.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001612284977454692, -0.0001533331669634208, -0.0001454378361813724, -0.000137542505399324, -0.0001296471746172756, -0.00012175183655926958, -0.00011385649850126356, -0.00010596116771921515, -9.806583693716675e-05, -9.017050615511835e-05, -8.227517537306994e-05, -7.437983731506392e-05, -6.648450653301552e-05, -5.8589175750967115e-05, -5.0693841330939904e-05, -4.279850691091269e-05, -3.490317612886429e-05, -2.700784352782648e-05, -1.9112510926788673e-05, -1.1217178325750865e-05, -3.3218457247130573e-06, 4.573485057335347e-06, 1.2468819477362558e-05, 2.036415389738977e-05, 2.8259484679438174e-05, 3.615481546148658e-05, 4.405014988151379e-05, 5.1945484301541e-05, 5.9840815083589405e-05, 6.773614586563781e-05, 7.563148392364383e-05, 8.352681470569223e-05, 9.142217459157109e-05, 9.93175053736195e-05, 0.0001072128361556679, 0.00011510817421367392, 0.0001230034977197647, 0.00013089884305372834, 0.00013879417383577675, 0.00014668950461782515, 0.00015458483539987355, 0.00016248016618192196, 0.00017037549696397036, 0.00017827082774601877, 0.0001861661730799824, 0.00019406148931011558, 0.0002019568346440792, 0.0002098521654261276, 0.00021774749620817602, 0.00022564282699022442, 0.00023353815777227283, 0.00024143348855432123, 0.00024932881933636963, 0.00025722416467033327, 0.00026511948090046644, 0.0002730148262344301, 0.0002809101715683937, 0.00028880551690235734, 0.0002967008331324905, 0.00030459617846645415, 0.0003124914946965873, 0.00032038684003055096, 0.00032828215626068413, 0.00033617750159464777, 0.00034407281782478094]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 6.0, 7.0, 12.0, 17.0, 21.0, 23.0, 21.0, 18.0, 21.0, 32.0, 32.0, 34.0, 27.0, 41.0, 54.0, 40.0, 46.0, 40.0, 52.0, 47.0, 53.0, 38.0, 42.0, 31.0, 20.0, 19.0, 28.0, 30.0, 19.0, 25.0, 18.0, 20.0, 13.0, 13.0, 8.0, 8.0, 7.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.00018265857943333685, -0.0001780151651473716, -0.0001733717363094911, -0.00016872832202352583, -0.00016408489318564534, -0.00015944147889968008, -0.00015479806461371481, -0.00015015463577583432, -0.00014551122148986906, -0.0001408678072039038, -0.0001362243783660233, -0.00013158096408005804, -0.00012693753524217755, -0.00012229412095621228, -0.0001176506993942894, -0.00011300727783236653, -0.00010836385627044365, -0.00010372043470852077, -9.907701314659789e-05, -9.443359158467501e-05, -8.979017729870975e-05, -8.514675573678687e-05, -8.0503334174864e-05, -7.585991988889873e-05, -7.121649105101824e-05, -6.657306948909536e-05, -6.192964792717248e-05, -5.728623000322841e-05, -5.264281207928434e-05, -4.799939051736146e-05, -4.3355968955438584e-05, -3.871255103149451e-05, -3.406912583159283e-05, -2.9425706088659354e-05, -2.478228634572588e-05, -2.0138864783803e-05, -1.5495445040869527e-05, -1.0852025297936052e-05, -6.208603736013174e-06, -1.5651858120691031e-06, 3.078235749853775e-06, 7.72165549278725e-06, 1.2365076145215426e-05, 1.7008496797643602e-05, 2.1651916540577076e-05, 2.629533628351055e-05, 3.093875784543343e-05, 3.55821757693775e-05, 4.022559733130038e-05, 4.4869018893223256e-05, 4.951243681716733e-05, 5.4155858379090205e-05, 5.8799276303034276e-05, 6.344269786495715e-05, 6.808611942688003e-05, 7.272954098880291e-05, 7.737295527476817e-05, 8.201637683669105e-05, 8.665979839861393e-05, 9.13032126845792e-05, 9.594663424650207e-05, 0.00010059005580842495, 0.00010523347737034783, 0.0001098768989322707, 0.00011452032049419358]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 3.0, 10.0, 10.0, 14.0, 20.0, 21.0, 31.0, 31.0, 49.0, 59.0, 92.0, 110.0, 152.0, 172.0, 270.0, 361.0, 520.0, 709.0, 1033.0, 1534.0, 3358.0, 39521.0, 3967610.0, 164492.0, 7785.0, 2027.0, 1227.0, 862.0, 634.0, 425.0, 281.0, 212.0, 175.0, 127.0, 75.0, 67.0, 53.0, 47.0, 34.0, 21.0, 20.0, 8.0, 8.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003345012664794922, -0.0003248639404773712, -0.00031522661447525024, -0.00030558928847312927, -0.0002959519624710083, -0.00028631463646888733, -0.00027667731046676636, -0.0002670399844646454, -0.0002574026584625244, -0.00024776533246040344, -0.00023812800645828247, -0.0002284906804561615, -0.00021885335445404053, -0.00020921602845191956, -0.00019957870244979858, -0.0001899413764476776, -0.00018030405044555664, -0.00017066672444343567, -0.0001610293984413147, -0.00015139207243919373, -0.00014175474643707275, -0.00013211742043495178, -0.0001224800944328308, -0.00011284276843070984, -0.00010320544242858887, -9.35681164264679e-05, -8.393079042434692e-05, -7.429346442222595e-05, -6.465613842010498e-05, -5.501881241798401e-05, -4.538148641586304e-05, -3.5744160413742065e-05, -2.6106834411621094e-05, -1.6469508409500122e-05, -6.83218240737915e-06, 2.8051435947418213e-06, 1.2442469596862793e-05, 2.2079795598983765e-05, 3.1717121601104736e-05, 4.135444760322571e-05, 5.099177360534668e-05, 6.062909960746765e-05, 7.026642560958862e-05, 7.99037516117096e-05, 8.954107761383057e-05, 9.917840361595154e-05, 0.00010881572961807251, 0.00011845305562019348, 0.00012809038162231445, 0.00013772770762443542, 0.0001473650336265564, 0.00015700235962867737, 0.00016663968563079834, 0.0001762770116329193, 0.00018591433763504028, 0.00019555166363716125, 0.00020518898963928223, 0.0002148263156414032, 0.00022446364164352417, 0.00023410096764564514, 0.0002437382936477661, 0.0002533756196498871, 0.00026301294565200806, 0.00027265027165412903, 0.00028228759765625]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 7.0, 10.0, 14.0, 19.0, 16.0, 19.0, 22.0, 33.0, 35.0, 37.0, 28.0, 42.0, 51.0, 66.0, 59.0, 59.0, 50.0, 57.0, 57.0, 51.0, 31.0, 41.0, 28.0, 25.0, 23.0, 27.0, 21.0, 18.0, 11.0, 8.0, 9.0, 5.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019550323486328125, -0.00019014254212379456, -0.00018478184938430786, -0.00017942115664482117, -0.00017406046390533447, -0.00016869977116584778, -0.00016333907842636108, -0.0001579783856868744, -0.0001526176929473877, -0.000147257000207901, -0.0001418963074684143, -0.0001365356147289276, -0.00013117492198944092, -0.00012581422924995422, -0.00012045353651046753, -0.00011509284377098083, -0.00010973215103149414, -0.00010437145829200745, -9.901076555252075e-05, -9.365007281303406e-05, -8.828938007354736e-05, -8.292868733406067e-05, -7.756799459457397e-05, -7.220730185508728e-05, -6.684660911560059e-05, -6.148591637611389e-05, -5.61252236366272e-05, -5.07645308971405e-05, -4.540383815765381e-05, -4.0043145418167114e-05, -3.468245267868042e-05, -2.9321759939193726e-05, -2.396106719970703e-05, -1.8600374460220337e-05, -1.3239681720733643e-05, -7.878988981246948e-06, -2.518296241760254e-06, 2.8423964977264404e-06, 8.203089237213135e-06, 1.3563781976699829e-05, 1.8924474716186523e-05, 2.4285167455673218e-05, 2.9645860195159912e-05, 3.5006552934646606e-05, 4.03672456741333e-05, 4.5727938413619995e-05, 5.108863115310669e-05, 5.6449323892593384e-05, 6.181001663208008e-05, 6.717070937156677e-05, 7.253140211105347e-05, 7.789209485054016e-05, 8.325278759002686e-05, 8.861348032951355e-05, 9.397417306900024e-05, 9.933486580848694e-05, 0.00010469555854797363, 0.00011005625128746033, 0.00011541694402694702, 0.00012077763676643372, 0.0001261383295059204, 0.0001314990222454071, 0.0001368597149848938, 0.0001422204077243805, 0.0001475811004638672]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 6.0, 18.0, 27.0, 61.0, 142.0, 296.0, 742.0, 2355.0, 14066.0, 4150867.0, 21404.0, 2785.0, 845.0, 363.0, 150.0, 70.0, 37.0, 19.0, 12.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008587837219238281, -0.0008297339081764221, -0.0008006840944290161, -0.0007716342806816101, -0.0007425844669342041, -0.0007135346531867981, -0.0006844848394393921, -0.0006554350256919861, -0.0006263852119445801, -0.0005973353981971741, -0.0005682855844497681, -0.0005392357707023621, -0.0005101859569549561, -0.00048113614320755005, -0.00045208632946014404, -0.00042303651571273804, -0.00039398670196533203, -0.000364936888217926, -0.00033588707447052, -0.000306837260723114, -0.000277787446975708, -0.000248737633228302, -0.000219687819480896, -0.00019063800573349, -0.00016158819198608398, -0.00013253837823867798, -0.00010348856449127197, -7.443875074386597e-05, -4.538893699645996e-05, -1.6339123249053955e-05, 1.271069049835205e-05, 4.176050424575806e-05, 7.081031799316406e-05, 9.986013174057007e-05, 0.00012890994548797607, 0.00015795975923538208, 0.00018700957298278809, 0.0002160593867301941, 0.0002451092004776001, 0.0002741590142250061, 0.0003032088279724121, 0.0003322586417198181, 0.0003613084554672241, 0.0003903582692146301, 0.00041940808296203613, 0.00044845789670944214, 0.00047750771045684814, 0.0005065575242042542, 0.0005356073379516602, 0.0005646571516990662, 0.0005937069654464722, 0.0006227567791938782, 0.0006518065929412842, 0.0006808564066886902, 0.0007099062204360962, 0.0007389560341835022, 0.0007680058479309082, 0.0007970556616783142, 0.0008261054754257202, 0.0008551552891731262, 0.0008842051029205322, 0.0009132549166679382, 0.0009423047304153442, 0.0009713545441627502, 0.0010004043579101562]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 16.0, 61.0, 177.0, 2531.0, 989.0, 175.0, 58.0, 22.0, 14.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.189678192138672e-05, -7.90674239397049e-05, -7.623806595802307e-05, -7.340870797634125e-05, -7.057934999465942e-05, -6.77499920129776e-05, -6.492063403129578e-05, -6.209127604961395e-05, -5.926191806793213e-05, -5.6432560086250305e-05, -5.360320210456848e-05, -5.077384412288666e-05, -4.7944486141204834e-05, -4.511512815952301e-05, -4.2285770177841187e-05, -3.945641219615936e-05, -3.662705421447754e-05, -3.3797696232795715e-05, -3.096833825111389e-05, -2.8138980269432068e-05, -2.5309622287750244e-05, -2.248026430606842e-05, -1.9650906324386597e-05, -1.6821548342704773e-05, -1.399219036102295e-05, -1.1162832379341125e-05, -8.333474397659302e-06, -5.504116415977478e-06, -2.6747584342956543e-06, 1.5459954738616943e-07, 2.983957529067993e-06, 5.813315510749817e-06, 8.64267349243164e-06, 1.1472031474113464e-05, 1.4301389455795288e-05, 1.7130747437477112e-05, 1.9960105419158936e-05, 2.278946340084076e-05, 2.5618821382522583e-05, 2.8448179364204407e-05, 3.127753734588623e-05, 3.4106895327568054e-05, 3.693625330924988e-05, 3.97656112909317e-05, 4.2594969272613525e-05, 4.542432725429535e-05, 4.825368523597717e-05, 5.1083043217658997e-05, 5.391240119934082e-05, 5.6741759181022644e-05, 5.957111716270447e-05, 6.240047514438629e-05, 6.522983312606812e-05, 6.805919110774994e-05, 7.088854908943176e-05, 7.371790707111359e-05, 7.654726505279541e-05, 7.937662303447723e-05, 8.220598101615906e-05, 8.503533899784088e-05, 8.78646969795227e-05, 9.069405496120453e-05, 9.352341294288635e-05, 9.635277092456818e-05, 9.918212890625e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 5.0, 8.0, 7.0, 8.0, 11.0, 21.0, 20.0, 22.0, 29.0, 54.0, 75.0, 86.0, 117.0, 135.0, 97.0, 84.0, 57.0, 42.0, 20.0, 26.0, 19.0, 11.0, 11.0, 10.0, 9.0, 3.0, 2.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001673589868005365, -0.00016079442866612226, -0.00015422985597979277, -0.00014766529784537852, -0.00014110073971096426, -0.00013453618157655, -0.00012797160889022052, -0.00012140705075580627, -0.0001148424853454344, -0.00010827791993506253, -0.00010171336180064827, -9.51487963902764e-05, -8.858423097990453e-05, -8.201967284549028e-05, -7.545510743511841e-05, -6.889054202474654e-05, -6.232598389033228e-05, -5.576142211793922e-05, -4.9196860345546156e-05, -4.2632294935174286e-05, -3.6067733162781224e-05, -2.950317139038816e-05, -2.293860598001629e-05, -1.637404420762323e-05, -9.809482435230166e-06, -3.2449197533424012e-06, 3.3196429285453632e-06, 9.88420651992783e-06, 1.6448768292320892e-05, 2.3013330064713955e-05, 2.9577895475085825e-05, 3.614245724747889e-05, 4.270701901987195e-05, 4.927158079226501e-05, 5.5836142564658076e-05, 6.240070797502995e-05, 6.89652661094442e-05, 7.552983151981607e-05, 8.209439693018794e-05, 8.86589550646022e-05, 9.522352047497407e-05, 0.00010178808588534594, 0.00010835264401976019, 0.00011491720943013206, 0.00012148177484050393, 0.0001280463329749182, 0.00013461089110933244, 0.00014117546379566193, 0.00014774002193007618, 0.00015430458006449044, 0.00016086915275081992, 0.00016743371088523418, 0.00017399826901964843, 0.00018056284170597792, 0.00018712739984039217, 0.00019369195797480643, 0.0002002565306611359, 0.00020682108879555017, 0.00021338566148187965, 0.0002199502196162939, 0.00022651477775070816, 0.00023307933588512242, 0.0002396439085714519, 0.0002462084812577814, 0.0002527730248402804]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 16.0, 10.0, 21.0, 21.0, 14.0, 20.0, 26.0, 31.0, 27.0, 31.0, 45.0, 42.0, 56.0, 38.0, 45.0, 58.0, 47.0, 61.0, 48.0, 47.0, 37.0, 30.0, 38.0, 38.0, 31.0, 26.0, 16.0, 17.0, 12.0, 9.0, 10.0, 7.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00018814783834386617, -0.0001833651913329959, -0.00017858255887404084, -0.00017379991186317056, -0.00016901726485230029, -0.00016423461784143, -0.00015945198538247496, -0.00015466933837160468, -0.0001498866913607344, -0.00014510404434986413, -0.00014032141189090908, -0.0001355387648800388, -0.00013075611786916852, -0.00012597347085829824, -0.00012119083839934319, -0.00011640819138847291, -0.00011162555165356025, -0.00010684291191864759, -0.00010206026490777731, -9.727762517286465e-05, -9.249497816199437e-05, -8.77123384270817e-05, -8.292969141621143e-05, -7.814705168129876e-05, -7.33644119463861e-05, -6.858177221147344e-05, -6.379912520060316e-05, -5.9016485465690494e-05, -5.4233838454820216e-05, -4.945119871990755e-05, -4.466855534701608e-05, -3.988591197412461e-05, -3.510325768729672e-05, -3.0320614314405248e-05, -2.5537970941513777e-05, -2.075532938761171e-05, -1.597268601472024e-05, -1.1190042641828768e-05, -6.407401087926701e-06, -1.62475771503523e-06, 3.157885657856241e-06, 7.940529030747712e-06, 1.272317149414448e-05, 1.750581395754125e-05, 2.228845733043272e-05, 2.707110070332419e-05, 3.185374225722626e-05, 3.663638563011773e-05, 4.14190290030092e-05, 4.620167237590067e-05, 5.098431574879214e-05, 5.5766955483704805e-05, 6.054960249457508e-05, 6.533224222948775e-05, 7.011488196440041e-05, 7.489752897527069e-05, 7.968017598614097e-05, 8.446281572105363e-05, 8.924546273192391e-05, 9.402810246683657e-05, 9.881074947770685e-05, 0.00010359338921261951, 0.00010837602894753218, 0.00011315867595840245, 0.00011794131569331512]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 8.0, 7.0, 13.0, 18.0, 20.0, 48.0, 59.0, 90.0, 136.0, 233.0, 304.0, 487.0, 758.0, 1172.0, 1776.0, 2995.0, 4937.0, 7998.0, 13643.0, 22950.0, 41653.0, 79167.0, 156941.0, 277670.0, 205246.0, 104332.0, 53995.0, 29582.0, 16665.0, 9835.0, 5954.0, 3681.0, 2207.0, 1476.0, 846.0, 512.0, 421.0, 232.0, 167.0, 103.0, 69.0, 57.0, 32.0, 23.0, 19.0, 6.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011861324310302734, -0.00011475011706352234, -0.00011088699102401733, -0.00010702386498451233, -0.00010316073894500732, -9.929761290550232e-05, -9.543448686599731e-05, -9.157136082649231e-05, -8.77082347869873e-05, -8.38451087474823e-05, -7.99819827079773e-05, -7.611885666847229e-05, -7.225573062896729e-05, -6.839260458946228e-05, -6.452947854995728e-05, -6.066635251045227e-05, -5.6803226470947266e-05, -5.294010043144226e-05, -4.9076974391937256e-05, -4.521384835243225e-05, -4.1350722312927246e-05, -3.748759627342224e-05, -3.3624470233917236e-05, -2.976134419441223e-05, -2.5898218154907227e-05, -2.203509211540222e-05, -1.8171966075897217e-05, -1.4308840036392212e-05, -1.0445713996887207e-05, -6.582587957382202e-06, -2.7194619178771973e-06, 1.1436641216278076e-06, 5.0067901611328125e-06, 8.869916200637817e-06, 1.2733042240142822e-05, 1.6596168279647827e-05, 2.0459294319152832e-05, 2.4322420358657837e-05, 2.8185546398162842e-05, 3.204867243766785e-05, 3.591179847717285e-05, 3.9774924516677856e-05, 4.363805055618286e-05, 4.7501176595687866e-05, 5.136430263519287e-05, 5.5227428674697876e-05, 5.909055471420288e-05, 6.295368075370789e-05, 6.681680679321289e-05, 7.06799328327179e-05, 7.45430588722229e-05, 7.84061849117279e-05, 8.226931095123291e-05, 8.613243699073792e-05, 8.999556303024292e-05, 9.385868906974792e-05, 9.772181510925293e-05, 0.00010158494114875793, 0.00010544806718826294, 0.00010931119322776794, 0.00011317431926727295, 0.00011703744530677795, 0.00012090057134628296, 0.00012476369738578796, 0.00012862682342529297]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 5.0, 12.0, 10.0, 10.0, 20.0, 17.0, 17.0, 26.0, 28.0, 34.0, 41.0, 36.0, 45.0, 50.0, 47.0, 46.0, 53.0, 57.0, 54.0, 42.0, 48.0, 45.0, 46.0, 30.0, 36.0, 26.0, 30.0, 18.0, 7.0, 12.0, 10.0, 11.0, 10.0, 2.0, 7.0, 3.0, 2.0, 5.0, 2.0], "bins": [-0.00019884109497070312, -0.00019404292106628418, -0.00018924474716186523, -0.0001844465732574463, -0.00017964839935302734, -0.0001748502254486084, -0.00017005205154418945, -0.0001652538776397705, -0.00016045570373535156, -0.00015565752983093262, -0.00015085935592651367, -0.00014606118202209473, -0.00014126300811767578, -0.00013646483421325684, -0.0001316666603088379, -0.00012686848640441895, -0.0001220703125, -0.00011727213859558105, -0.00011247396469116211, -0.00010767579078674316, -0.00010287761688232422, -9.807944297790527e-05, -9.328126907348633e-05, -8.848309516906738e-05, -8.368492126464844e-05, -7.888674736022949e-05, -7.408857345581055e-05, -6.92903995513916e-05, -6.449222564697266e-05, -5.969405174255371e-05, -5.4895877838134766e-05, -5.009770393371582e-05, -4.5299530029296875e-05, -4.050135612487793e-05, -3.5703182220458984e-05, -3.090500831604004e-05, -2.6106834411621094e-05, -2.130866050720215e-05, -1.6510486602783203e-05, -1.1712312698364258e-05, -6.9141387939453125e-06, -2.115964889526367e-06, 2.682209014892578e-06, 7.4803829193115234e-06, 1.2278556823730469e-05, 1.7076730728149414e-05, 2.187490463256836e-05, 2.6673078536987305e-05, 3.147125244140625e-05, 3.6269426345825195e-05, 4.106760025024414e-05, 4.5865774154663086e-05, 5.066394805908203e-05, 5.5462121963500977e-05, 6.026029586791992e-05, 6.505846977233887e-05, 6.985664367675781e-05, 7.465481758117676e-05, 7.94529914855957e-05, 8.425116539001465e-05, 8.90493392944336e-05, 9.384751319885254e-05, 9.864568710327148e-05, 0.00010344386100769043, 0.00010824203491210938]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 12.0, 18.0, 18.0, 24.0, 22.0, 40.0, 50.0, 83.0, 101.0, 178.0, 249.0, 331.0, 471.0, 749.0, 1100.0, 1707.0, 2748.0, 4478.0, 7588.0, 14129.0, 29063.0, 69810.0, 224619.0, 474676.0, 123830.0, 45307.0, 20622.0, 10455.0, 6034.0, 3424.0, 2305.0, 1406.0, 943.0, 581.0, 384.0, 297.0, 210.0, 137.0, 93.0, 71.0, 57.0, 40.0, 24.0, 16.0, 15.0, 13.0, 9.0, 5.0, 8.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0001652240753173828, -0.0001601036638021469, -0.000154983252286911, -0.0001498628407716751, -0.0001447424292564392, -0.0001396220177412033, -0.0001345016062259674, -0.0001293811947107315, -0.0001242607831954956, -0.0001191403716802597, -0.0001140199601650238, -0.0001088995486497879, -0.000103779137134552, -9.86587256193161e-05, -9.35383141040802e-05, -8.84179025888443e-05, -8.32974910736084e-05, -7.81770795583725e-05, -7.30566680431366e-05, -6.79362565279007e-05, -6.28158450126648e-05, -5.7695433497428894e-05, -5.257502198219299e-05, -4.745461046695709e-05, -4.233419895172119e-05, -3.721378743648529e-05, -3.209337592124939e-05, -2.697296440601349e-05, -2.1852552890777588e-05, -1.6732141375541687e-05, -1.1611729860305786e-05, -6.491318345069885e-06, -1.3709068298339844e-06, 3.7495046854019165e-06, 8.869916200637817e-06, 1.3990327715873718e-05, 1.911073923110962e-05, 2.423115074634552e-05, 2.935156226158142e-05, 3.447197377681732e-05, 3.959238529205322e-05, 4.4712796807289124e-05, 4.9833208322525024e-05, 5.4953619837760925e-05, 6.0074031352996826e-05, 6.519444286823273e-05, 7.031485438346863e-05, 7.543526589870453e-05, 8.055567741394043e-05, 8.567608892917633e-05, 9.079650044441223e-05, 9.591691195964813e-05, 0.00010103732347488403, 0.00010615773499011993, 0.00011127814650535583, 0.00011639855802059174, 0.00012151896953582764, 0.00012663938105106354, 0.00013175979256629944, 0.00013688020408153534, 0.00014200061559677124, 0.00014712102711200714, 0.00015224143862724304, 0.00015736185014247894, 0.00016248226165771484]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 9.0, 9.0, 13.0, 19.0, 18.0, 14.0, 24.0, 32.0, 30.0, 30.0, 32.0, 42.0, 30.0, 35.0, 39.0, 49.0, 43.0, 41.0, 51.0, 50.0, 42.0, 45.0, 36.0, 38.0, 24.0, 21.0, 27.0, 19.0, 21.0, 13.0, 29.0, 10.0, 8.0, 7.0, 6.0, 8.0, 6.0, 3.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.677078247070312e-05, -7.411371916532516e-05, -7.14566558599472e-05, -6.879959255456924e-05, -6.614252924919128e-05, -6.348546594381332e-05, -6.0828402638435364e-05, -5.8171339333057404e-05, -5.551427602767944e-05, -5.285721272230148e-05, -5.020014941692352e-05, -4.754308611154556e-05, -4.48860228061676e-05, -4.222895950078964e-05, -3.957189619541168e-05, -3.691483289003372e-05, -3.425776958465576e-05, -3.16007062792778e-05, -2.894364297389984e-05, -2.628657966852188e-05, -2.362951636314392e-05, -2.097245305776596e-05, -1.8315389752388e-05, -1.565832644701004e-05, -1.300126314163208e-05, -1.034419983625412e-05, -7.68713653087616e-06, -5.0300732254981995e-06, -2.3730099201202393e-06, 2.8405338525772095e-07, 2.941116690635681e-06, 5.598179996013641e-06, 8.255243301391602e-06, 1.0912306606769562e-05, 1.3569369912147522e-05, 1.6226433217525482e-05, 1.8883496522903442e-05, 2.1540559828281403e-05, 2.4197623133659363e-05, 2.6854686439037323e-05, 2.9511749744415283e-05, 3.2168813049793243e-05, 3.4825876355171204e-05, 3.7482939660549164e-05, 4.0140002965927124e-05, 4.2797066271305084e-05, 4.5454129576683044e-05, 4.8111192882061005e-05, 5.0768256187438965e-05, 5.3425319492816925e-05, 5.6082382798194885e-05, 5.8739446103572845e-05, 6.13965094089508e-05, 6.405357271432877e-05, 6.671063601970673e-05, 6.936769932508469e-05, 7.202476263046265e-05, 7.46818259358406e-05, 7.733888924121857e-05, 7.999595254659653e-05, 8.265301585197449e-05, 8.531007915735245e-05, 8.796714246273041e-05, 9.062420576810837e-05, 9.328126907348633e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 3.0, 4.0, 10.0, 12.0, 21.0, 24.0, 30.0, 41.0, 58.0, 85.0, 113.0, 172.0, 221.0, 368.0, 515.0, 866.0, 1416.0, 2950.0, 5911.0, 18390.0, 86563.0, 768777.0, 125072.0, 21620.0, 7967.0, 3006.0, 1651.0, 955.0, 510.0, 417.0, 226.0, 147.0, 117.0, 92.0, 55.0, 58.0, 39.0, 24.0, 13.0, 11.0, 9.0, 3.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.384185791015625e-05, -2.3152679204940796e-05, -2.2463500499725342e-05, -2.1774321794509888e-05, -2.1085143089294434e-05, -2.039596438407898e-05, -1.9706785678863525e-05, -1.901760697364807e-05, -1.8328428268432617e-05, -1.7639249563217163e-05, -1.695007085800171e-05, -1.6260892152786255e-05, -1.55717134475708e-05, -1.4882534742355347e-05, -1.4193356037139893e-05, -1.3504177331924438e-05, -1.2814998626708984e-05, -1.212581992149353e-05, -1.1436641216278076e-05, -1.0747462511062622e-05, -1.0058283805847168e-05, -9.369105100631714e-06, -8.67992639541626e-06, -7.990747690200806e-06, -7.3015689849853516e-06, -6.6123902797698975e-06, -5.923211574554443e-06, -5.234032869338989e-06, -4.544854164123535e-06, -3.855675458908081e-06, -3.166496753692627e-06, -2.477318048477173e-06, -1.7881393432617188e-06, -1.0989606380462646e-06, -4.0978193283081055e-07, 2.7939677238464355e-07, 9.685754776000977e-07, 1.6577541828155518e-06, 2.346932888031006e-06, 3.03611159324646e-06, 3.725290298461914e-06, 4.414469003677368e-06, 5.103647708892822e-06, 5.792826414108276e-06, 6.4820051193237305e-06, 7.1711838245391846e-06, 7.860362529754639e-06, 8.549541234970093e-06, 9.238719940185547e-06, 9.927898645401001e-06, 1.0617077350616455e-05, 1.130625605583191e-05, 1.1995434761047363e-05, 1.2684613466262817e-05, 1.3373792171478271e-05, 1.4062970876693726e-05, 1.475214958190918e-05, 1.5441328287124634e-05, 1.6130506992340088e-05, 1.6819685697555542e-05, 1.7508864402770996e-05, 1.819804310798645e-05, 1.8887221813201904e-05, 1.957640051841736e-05, 2.0265579223632812e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 0.0, 11.0, 0.0, 5.0, 13.0, 0.0, 17.0, 23.0, 0.0, 24.0, 0.0, 29.0, 36.0, 0.0, 61.0, 72.0, 0.0, 75.0, 0.0, 89.0, 71.0, 0.0, 71.0, 80.0, 0.0, 69.0, 0.0, 54.0, 41.0, 0.0, 34.0, 27.0, 0.0, 16.0, 0.0, 24.0, 14.0, 0.0, 10.0, 8.0, 0.0, 8.0, 0.0, 7.0, 5.0, 0.0, 5.0, 5.0, 0.0, 1.0, 1.0], "bins": [-1.2516975402832031e-06, -1.214444637298584e-06, -1.1771917343139648e-06, -1.1399388313293457e-06, -1.1026859283447266e-06, -1.0654330253601074e-06, -1.0281801223754883e-06, -9.909272193908691e-07, -9.5367431640625e-07, -9.164214134216309e-07, -8.791685104370117e-07, -8.419156074523926e-07, -8.046627044677734e-07, -7.674098014831543e-07, -7.301568984985352e-07, -6.92903995513916e-07, -6.556510925292969e-07, -6.183981895446777e-07, -5.811452865600586e-07, -5.438923835754395e-07, -5.066394805908203e-07, -4.6938657760620117e-07, -4.3213367462158203e-07, -3.948807716369629e-07, -3.5762786865234375e-07, -3.203749656677246e-07, -2.8312206268310547e-07, -2.4586915969848633e-07, -2.086162567138672e-07, -1.7136335372924805e-07, -1.341104507446289e-07, -9.685754776000977e-08, -5.960464477539063e-08, -2.2351741790771484e-08, 1.4901161193847656e-08, 5.21540641784668e-08, 8.940696716308594e-08, 1.2665987014770508e-07, 1.6391277313232422e-07, 2.0116567611694336e-07, 2.384185791015625e-07, 2.7567148208618164e-07, 3.129243850708008e-07, 3.501772880554199e-07, 3.8743019104003906e-07, 4.246830940246582e-07, 4.6193599700927734e-07, 4.991888999938965e-07, 5.364418029785156e-07, 5.736947059631348e-07, 6.109476089477539e-07, 6.48200511932373e-07, 6.854534149169922e-07, 7.227063179016113e-07, 7.599592208862305e-07, 7.972121238708496e-07, 8.344650268554688e-07, 8.717179298400879e-07, 9.08970832824707e-07, 9.462237358093262e-07, 9.834766387939453e-07, 1.0207295417785645e-06, 1.0579824447631836e-06, 1.0952353477478027e-06, 1.1324882507324219e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 3.0, 9.0, 7.0, 14.0, 16.0, 14.0, 36.0, 70.0, 102.0, 186.0, 466.0, 1058.0, 3383.0, 14834.0, 120291.0, 831279.0, 63618.0, 9122.0, 2386.0, 930.0, 321.0, 160.0, 91.0, 50.0, 34.0, 21.0, 14.0, 9.0, 8.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0], "bins": [-4.649162292480469e-05, -4.527997225522995e-05, -4.406832158565521e-05, -4.2856670916080475e-05, -4.164502024650574e-05, -4.0433369576931e-05, -3.922171890735626e-05, -3.8010068237781525e-05, -3.679841756820679e-05, -3.558676689863205e-05, -3.437511622905731e-05, -3.3163465559482574e-05, -3.195181488990784e-05, -3.07401642203331e-05, -2.9528513550758362e-05, -2.8316862881183624e-05, -2.7105212211608887e-05, -2.589356154203415e-05, -2.468191087245941e-05, -2.3470260202884674e-05, -2.2258609533309937e-05, -2.10469588637352e-05, -1.983530819416046e-05, -1.8623657524585724e-05, -1.7412006855010986e-05, -1.620035618543625e-05, -1.4988705515861511e-05, -1.3777054846286774e-05, -1.2565404176712036e-05, -1.1353753507137299e-05, -1.0142102837562561e-05, -8.930452167987823e-06, -7.718801498413086e-06, -6.507150828838348e-06, -5.295500159263611e-06, -4.083849489688873e-06, -2.8721988201141357e-06, -1.6605481505393982e-06, -4.4889748096466064e-07, 7.627531886100769e-07, 1.9744038581848145e-06, 3.186054527759552e-06, 4.3977051973342896e-06, 5.609355866909027e-06, 6.821006536483765e-06, 8.032657206058502e-06, 9.24430787563324e-06, 1.0455958545207977e-05, 1.1667609214782715e-05, 1.2879259884357452e-05, 1.409091055393219e-05, 1.5302561223506927e-05, 1.6514211893081665e-05, 1.7725862562656403e-05, 1.893751323223114e-05, 2.0149163901805878e-05, 2.1360814571380615e-05, 2.2572465240955353e-05, 2.378411591053009e-05, 2.4995766580104828e-05, 2.6207417249679565e-05, 2.7419067919254303e-05, 2.863071858882904e-05, 2.9842369258403778e-05, 3.1054019927978516e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 4.0, 2.0, 5.0, 5.0, 7.0, 14.0, 15.0, 13.0, 17.0, 38.0, 38.0, 65.0, 78.0, 107.0, 121.0, 121.0, 78.0, 64.0, 53.0, 33.0, 40.0, 19.0, 14.0, 9.0, 5.0, 13.0, 4.0, 4.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2186508178710938e-06, -3.0975788831710815e-06, -2.9765069484710693e-06, -2.855435013771057e-06, -2.734363079071045e-06, -2.6132911443710327e-06, -2.4922192096710205e-06, -2.3711472749710083e-06, -2.250075340270996e-06, -2.129003405570984e-06, -2.0079314708709717e-06, -1.8868595361709595e-06, -1.7657876014709473e-06, -1.644715666770935e-06, -1.5236437320709229e-06, -1.4025717973709106e-06, -1.2814998626708984e-06, -1.1604279279708862e-06, -1.039355993270874e-06, -9.182840585708618e-07, -7.972121238708496e-07, -6.761401891708374e-07, -5.550682544708252e-07, -4.33996319770813e-07, -3.129243850708008e-07, -1.9185245037078857e-07, -7.078051567077637e-08, 5.029141902923584e-08, 1.7136335372924805e-07, 2.9243528842926025e-07, 4.1350722312927246e-07, 5.345791578292847e-07, 6.556510925292969e-07, 7.767230272293091e-07, 8.977949619293213e-07, 1.0188668966293335e-06, 1.1399388313293457e-06, 1.261010766029358e-06, 1.3820827007293701e-06, 1.5031546354293823e-06, 1.6242265701293945e-06, 1.7452985048294067e-06, 1.866370439529419e-06, 1.987442374229431e-06, 2.1085143089294434e-06, 2.2295862436294556e-06, 2.3506581783294678e-06, 2.47173011302948e-06, 2.592802047729492e-06, 2.7138739824295044e-06, 2.8349459171295166e-06, 2.956017851829529e-06, 3.077089786529541e-06, 3.1981617212295532e-06, 3.3192336559295654e-06, 3.4403055906295776e-06, 3.56137752532959e-06, 3.682449460029602e-06, 3.8035213947296143e-06, 3.9245933294296265e-06, 4.045665264129639e-06, 4.166737198829651e-06, 4.287809133529663e-06, 4.408881068229675e-06, 4.5299530029296875e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 9.0, 5.0, 15.0, 12.0, 20.0, 29.0, 27.0, 50.0, 59.0, 95.0, 118.0, 133.0, 93.0, 80.0, 65.0, 37.0, 25.0, 29.0, 17.0, 16.0, 13.0, 9.0, 6.0, 8.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00015652990259695798, -0.00015037144476082176, -0.00014421300147660077, -0.00013805454364046454, -0.00013189608580432832, -0.0001257376279681921, -0.00011957918468397111, -0.00011342072684783489, -0.00010726227628765628, -0.00010110382572747767, -9.494536789134145e-05, -8.878691733116284e-05, -8.262846677098423e-05, -7.647000893484801e-05, -7.03115583746694e-05, -6.41531078144908e-05, -5.799464997835457e-05, -5.183619578019716e-05, -4.5677741582039744e-05, -3.9519291021861136e-05, -3.336083682370372e-05, -2.7202382625546306e-05, -2.10439320653677e-05, -1.4885477867210284e-05, -8.727023669052869e-06, -2.568570380390156e-06, 3.589882908272557e-06, 9.748335287440568e-06, 1.5906789485597983e-05, 2.2065243683755398e-05, 2.8223694243934005e-05, 3.438214844209142e-05, 4.0540602640248835e-05, 4.669905683840625e-05, 5.2857511036563665e-05, 5.901596159674227e-05, 6.51744194328785e-05, 7.13328699930571e-05, 7.749132055323571e-05, 8.364977838937193e-05, 8.980822894955054e-05, 9.596667950972915e-05, 0.00010212513734586537, 0.00010828358790604398, 0.00011444203846622258, 0.0001206004963023588, 0.0001267589395865798, 0.00013291739742271602, 0.00013907585525885224, 0.00014523431309498847, 0.00015139275637920946, 0.00015755121421534568, 0.0001637096720514819, 0.0001698681153357029, 0.00017602657317183912, 0.00018218503100797534, 0.00018834348884411156, 0.00019450194668024778, 0.00020066038996446878, 0.000206818847800605, 0.00021297730563674122, 0.00021913574892096221, 0.00022529420675709844, 0.00023145266459323466, 0.00023761110787745565]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 10.0, 15.0, 14.0, 23.0, 14.0, 21.0, 22.0, 30.0, 29.0, 28.0, 38.0, 42.0, 47.0, 48.0, 42.0, 51.0, 59.0, 58.0, 44.0, 52.0, 44.0, 32.0, 33.0, 39.0, 31.0, 27.0, 25.0, 16.0, 16.0, 8.0, 13.0, 6.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0001744865148793906, -0.00017000085790641606, -0.00016551520093344152, -0.00016102954396046698, -0.00015654388698749244, -0.00015205821546260267, -0.00014757255848962814, -0.0001430869015166536, -0.00013860124454367906, -0.00013411558757070452, -0.00012962993059772998, -0.00012514427362475544, -0.00012065860937582329, -0.00011617295240284875, -0.0001116872881539166, -0.00010720163118094206, -0.00010271597420796752, -9.823031723499298e-05, -9.374466026201844e-05, -8.925899601308629e-05, -8.477333904011175e-05, -8.028768206713721e-05, -7.580201781820506e-05, -7.131636084523052e-05, -6.683070387225598e-05, -6.234504689928144e-05, -5.7859386288328096e-05, -5.337372567737475e-05, -4.888806870440021e-05, -4.440241173142567e-05, -3.991675112047233e-05, -3.543109050951898e-05, -3.094542626058683e-05, -2.6459767468622886e-05, -2.1974108676658943e-05, -1.7488449884695e-05, -1.3002791092731059e-05, -8.517132300767116e-06, -4.031473508803174e-06, 4.54187102150172e-07, 4.939844075124711e-06, 9.425502867088653e-06, 1.3911161659052595e-05, 1.8396820451016538e-05, 2.288247924298048e-05, 2.7368138034944423e-05, 3.1853796826908365e-05, 3.633945743786171e-05, 4.082511441083625e-05, 4.531077138381079e-05, 4.9796431994764134e-05, 5.428209260571748e-05, 5.876774957869202e-05, 6.325340655166656e-05, 6.77390635246411e-05, 7.222472777357325e-05, 7.671038474654779e-05, 8.119604171952233e-05, 8.568170596845448e-05, 9.016736294142902e-05, 9.465301991440356e-05, 9.91386768873781e-05, 0.00010362433386035264, 0.00010810999810928479, 0.00011259565508225933]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 10.0, 16.0, 23.0, 22.0, 43.0, 54.0, 94.0, 155.0, 237.0, 395.0, 659.0, 1150.0, 2111.0, 3679.0, 6480.0, 12279.0, 22642.0, 44952.0, 99492.0, 242302.0, 326727.0, 151759.0, 65384.0, 31433.0, 16359.0, 8752.0, 4820.0, 2656.0, 1525.0, 924.0, 529.0, 290.0, 196.0, 119.0, 89.0, 62.0, 47.0, 27.0, 16.0, 15.0, 10.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0004246234893798828, -0.0004118494689464569, -0.000399075448513031, -0.0003863014280796051, -0.0003735274076461792, -0.0003607533872127533, -0.0003479793667793274, -0.0003352053463459015, -0.0003224313259124756, -0.0003096573054790497, -0.0002968832850456238, -0.0002841092646121979, -0.00027133524417877197, -0.00025856122374534607, -0.00024578720331192017, -0.00023301318287849426, -0.00022023916244506836, -0.00020746514201164246, -0.00019469112157821655, -0.00018191710114479065, -0.00016914308071136475, -0.00015636906027793884, -0.00014359503984451294, -0.00013082101941108704, -0.00011804699897766113, -0.00010527297854423523, -9.249895811080933e-05, -7.972493767738342e-05, -6.695091724395752e-05, -5.4176896810531616e-05, -4.140287637710571e-05, -2.862885594367981e-05, -1.5854835510253906e-05, -3.080815076828003e-06, 9.6932053565979e-06, 2.2467225790023804e-05, 3.524124622344971e-05, 4.801526665687561e-05, 6.0789287090301514e-05, 7.356330752372742e-05, 8.633732795715332e-05, 9.911134839057922e-05, 0.00011188536882400513, 0.00012465938925743103, 0.00013743340969085693, 0.00015020743012428284, 0.00016298145055770874, 0.00017575547099113464, 0.00018852949142456055, 0.00020130351185798645, 0.00021407753229141235, 0.00022685155272483826, 0.00023962557315826416, 0.00025239959359169006, 0.00026517361402511597, 0.00027794763445854187, 0.0002907216548919678, 0.0003034956753253937, 0.0003162696957588196, 0.0003290437161922455, 0.0003418177366256714, 0.0003545917570590973, 0.0003673657774925232, 0.0003801397979259491, 0.000392913818359375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 10.0, 12.0, 16.0, 17.0, 19.0, 22.0, 24.0, 32.0, 20.0, 36.0, 55.0, 41.0, 35.0, 56.0, 55.0, 61.0, 56.0, 59.0, 49.0, 42.0, 36.0, 35.0, 33.0, 22.0, 30.0, 18.0, 29.0, 15.0, 12.0, 9.0, 10.0, 9.0, 2.0, 3.0, 4.0, 5.0, 0.0, 1.0, 2.0], "bins": [-0.00017511844635009766, -0.00017077568918466568, -0.0001664329320192337, -0.00016209017485380173, -0.00015774741768836975, -0.00015340466052293777, -0.0001490619033575058, -0.00014471914619207382, -0.00014037638902664185, -0.00013603363186120987, -0.0001316908746957779, -0.00012734811753034592, -0.00012300536036491394, -0.00011866260319948196, -0.00011431984603404999, -0.00010997708886861801, -0.00010563433170318604, -0.00010129157453775406, -9.694881737232208e-05, -9.26060602068901e-05, -8.826330304145813e-05, -8.392054587602615e-05, -7.957778871059418e-05, -7.52350315451622e-05, -7.089227437973022e-05, -6.654951721429825e-05, -6.220676004886627e-05, -5.7864002883434296e-05, -5.352124571800232e-05, -4.917848855257034e-05, -4.483573138713837e-05, -4.049297422170639e-05, -3.6150217056274414e-05, -3.180745989084244e-05, -2.746470272541046e-05, -2.3121945559978485e-05, -1.877918839454651e-05, -1.4436431229114532e-05, -1.0093674063682556e-05, -5.75091689825058e-06, -1.4081597328186035e-06, 2.934597432613373e-06, 7.277354598045349e-06, 1.1620111763477325e-05, 1.5962868928909302e-05, 2.0305626094341278e-05, 2.4648383259773254e-05, 2.899114042520523e-05, 3.333389759063721e-05, 3.767665475606918e-05, 4.201941192150116e-05, 4.6362169086933136e-05, 5.070492625236511e-05, 5.504768341779709e-05, 5.9390440583229065e-05, 6.373319774866104e-05, 6.807595491409302e-05, 7.2418712079525e-05, 7.676146924495697e-05, 8.110422641038895e-05, 8.544698357582092e-05, 8.97897407412529e-05, 9.413249790668488e-05, 9.847525507211685e-05, 0.00010281801223754883]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 9.0, 7.0, 5.0, 9.0, 19.0, 19.0, 35.0, 66.0, 76.0, 137.0, 255.0, 548.0, 1111.0, 2684.0, 6845.0, 18505.0, 60001.0, 256499.0, 510819.0, 134485.0, 36180.0, 12031.0, 4471.0, 1974.0, 832.0, 408.0, 206.0, 112.0, 70.0, 36.0, 32.0, 14.0, 20.0, 11.0, 15.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004260540008544922, -0.00040604546666145325, -0.0003860369324684143, -0.00036602839827537537, -0.0003460198640823364, -0.0003260113298892975, -0.00030600279569625854, -0.0002859942615032196, -0.00026598572731018066, -0.0002459771931171417, -0.00022596865892410278, -0.00020596012473106384, -0.0001859515905380249, -0.00016594305634498596, -0.00014593452215194702, -0.00012592598795890808, -0.00010591745376586914, -8.59089195728302e-05, -6.590038537979126e-05, -4.589185118675232e-05, -2.588331699371338e-05, -5.8747828006744385e-06, 1.4133751392364502e-05, 3.414228558540344e-05, 5.415081977844238e-05, 7.415935397148132e-05, 9.416788816452026e-05, 0.0001141764223575592, 0.00013418495655059814, 0.00015419349074363708, 0.00017420202493667603, 0.00019421055912971497, 0.0002142190933227539, 0.00023422762751579285, 0.0002542361617088318, 0.00027424469590187073, 0.00029425323009490967, 0.0003142617642879486, 0.00033427029848098755, 0.0003542788326740265, 0.00037428736686706543, 0.00039429590106010437, 0.0004143044352531433, 0.00043431296944618225, 0.0004543215036392212, 0.00047433003783226013, 0.0004943385720252991, 0.000514347106218338, 0.000534355640411377, 0.0005543641746044159, 0.0005743727087974548, 0.0005943812429904938, 0.0006143897771835327, 0.0006343983113765717, 0.0006544068455696106, 0.0006744153797626495, 0.0006944239139556885, 0.0007144324481487274, 0.0007344409823417664, 0.0007544495165348053, 0.0007744580507278442, 0.0007944665849208832, 0.0008144751191139221, 0.0008344836533069611, 0.0008544921875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 9.0, 3.0, 7.0, 10.0, 7.0, 11.0, 19.0, 17.0, 22.0, 28.0, 20.0, 43.0, 47.0, 48.0, 45.0, 53.0, 53.0, 41.0, 43.0, 54.0, 53.0, 38.0, 50.0, 43.0, 45.0, 26.0, 23.0, 28.0, 25.0, 21.0, 16.0, 16.0, 14.0, 8.0, 5.0, 7.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.00014925003051757812, -0.00014560576528310776, -0.0001419615000486374, -0.00013831723481416702, -0.00013467296957969666, -0.0001310287043452263, -0.00012738443911075592, -0.00012374017387628555, -0.00012009590864181519, -0.00011645164340734482, -0.00011280737817287445, -0.00010916311293840408, -0.00010551884770393372, -0.00010187458246946335, -9.823031723499298e-05, -9.458605200052261e-05, -9.094178676605225e-05, -8.729752153158188e-05, -8.365325629711151e-05, -8.000899106264114e-05, -7.636472582817078e-05, -7.272046059370041e-05, -6.907619535923004e-05, -6.543193012475967e-05, -6.17876648902893e-05, -5.814339965581894e-05, -5.449913442134857e-05, -5.0854869186878204e-05, -4.721060395240784e-05, -4.356633871793747e-05, -3.99220734834671e-05, -3.6277808248996735e-05, -3.263354301452637e-05, -2.8989277780056e-05, -2.5345012545585632e-05, -2.1700747311115265e-05, -1.8056482076644897e-05, -1.441221684217453e-05, -1.0767951607704163e-05, -7.123686373233795e-06, -3.4794211387634277e-06, 1.648440957069397e-07, 3.809109330177307e-06, 7.4533745646476746e-06, 1.1097639799118042e-05, 1.474190503358841e-05, 1.8386170268058777e-05, 2.2030435502529144e-05, 2.5674700736999512e-05, 2.931896597146988e-05, 3.2963231205940247e-05, 3.6607496440410614e-05, 4.025176167488098e-05, 4.389602690935135e-05, 4.7540292143821716e-05, 5.1184557378292084e-05, 5.482882261276245e-05, 5.847308784723282e-05, 6.211735308170319e-05, 6.576161831617355e-05, 6.940588355064392e-05, 7.305014878511429e-05, 7.669441401958466e-05, 8.033867925405502e-05, 8.398294448852539e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 1.0, 8.0, 15.0, 15.0, 21.0, 35.0, 46.0, 56.0, 103.0, 155.0, 287.0, 465.0, 908.0, 1899.0, 3352.0, 9076.0, 28784.0, 153372.0, 692409.0, 118338.0, 24461.0, 7296.0, 3646.0, 1711.0, 893.0, 455.0, 284.0, 161.0, 99.0, 60.0, 39.0, 34.0, 23.0, 13.0, 17.0, 3.0, 3.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-05, -1.145247370004654e-05, -1.0984018445014954e-05, -1.0515563189983368e-05, -1.0047107934951782e-05, -9.578652679920197e-06, -9.11019742488861e-06, -8.641742169857025e-06, -8.17328691482544e-06, -7.704831659793854e-06, -7.236376404762268e-06, -6.767921149730682e-06, -6.299465894699097e-06, -5.831010639667511e-06, -5.362555384635925e-06, -4.89410012960434e-06, -4.425644874572754e-06, -3.957189619541168e-06, -3.4887343645095825e-06, -3.020279109477997e-06, -2.551823854446411e-06, -2.0833685994148254e-06, -1.6149133443832397e-06, -1.146458089351654e-06, -6.780028343200684e-07, -2.0954757928848267e-07, 2.5890767574310303e-07, 7.273629307746887e-07, 1.1958181858062744e-06, 1.6642734408378601e-06, 2.132728695869446e-06, 2.6011839509010315e-06, 3.069639205932617e-06, 3.538094460964203e-06, 4.0065497159957886e-06, 4.475004971027374e-06, 4.94346022605896e-06, 5.411915481090546e-06, 5.880370736122131e-06, 6.348825991153717e-06, 6.817281246185303e-06, 7.2857365012168884e-06, 7.754191756248474e-06, 8.22264701128006e-06, 8.691102266311646e-06, 9.159557521343231e-06, 9.628012776374817e-06, 1.0096468031406403e-05, 1.0564923286437988e-05, 1.1033378541469574e-05, 1.150183379650116e-05, 1.1970289051532745e-05, 1.2438744306564331e-05, 1.2907199561595917e-05, 1.3375654816627502e-05, 1.3844110071659088e-05, 1.4312565326690674e-05, 1.478102058172226e-05, 1.5249475836753845e-05, 1.571793109178543e-05, 1.6186386346817017e-05, 1.6654841601848602e-05, 1.7123296856880188e-05, 1.7591752111911774e-05, 1.806020736694336e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 6.0, 7.0, 2.0, 11.0, 8.0, 10.0, 14.0, 54.0, 38.0, 76.0, 89.0, 242.0, 106.0, 100.0, 71.0, 77.0, 26.0, 21.0, 20.0, 3.0, 0.0, 5.0, 8.0, 3.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.159046173095703e-06, -3.0836090445518494e-06, -3.0081719160079956e-06, -2.932734787464142e-06, -2.857297658920288e-06, -2.7818605303764343e-06, -2.7064234018325806e-06, -2.630986273288727e-06, -2.555549144744873e-06, -2.4801120162010193e-06, -2.4046748876571655e-06, -2.3292377591133118e-06, -2.253800630569458e-06, -2.1783635020256042e-06, -2.1029263734817505e-06, -2.0274892449378967e-06, -1.952052116394043e-06, -1.8766149878501892e-06, -1.8011778593063354e-06, -1.7257407307624817e-06, -1.650303602218628e-06, -1.5748664736747742e-06, -1.4994293451309204e-06, -1.4239922165870667e-06, -1.3485550880432129e-06, -1.2731179594993591e-06, -1.1976808309555054e-06, -1.1222437024116516e-06, -1.0468065738677979e-06, -9.71369445323944e-07, -8.959323167800903e-07, -8.204951882362366e-07, -7.450580596923828e-07, -6.69620931148529e-07, -5.941838026046753e-07, -5.187466740608215e-07, -4.4330954551696777e-07, -3.67872416973114e-07, -2.9243528842926025e-07, -2.169981598854065e-07, -1.4156103134155273e-07, -6.612390279769897e-08, 9.313225746154785e-09, 8.475035429000854e-08, 1.601874828338623e-07, 2.3562461137771606e-07, 3.110617399215698e-07, 3.864988684654236e-07, 4.6193599700927734e-07, 5.373731255531311e-07, 6.128102540969849e-07, 6.882473826408386e-07, 7.636845111846924e-07, 8.391216397285461e-07, 9.145587682723999e-07, 9.899958968162537e-07, 1.0654330253601074e-06, 1.1408701539039612e-06, 1.216307282447815e-06, 1.2917444109916687e-06, 1.3671815395355225e-06, 1.4426186680793762e-06, 1.51805579662323e-06, 1.5934929251670837e-06, 1.6689300537109375e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 6.0, 12.0, 21.0, 28.0, 52.0, 83.0, 111.0, 231.0, 310.0, 817.0, 1652.0, 4545.0, 23890.0, 185989.0, 757267.0, 57450.0, 11059.0, 2689.0, 1111.0, 507.0, 303.0, 148.0, 94.0, 54.0, 43.0, 25.0, 26.0, 5.0, 8.0, 7.0, 2.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.728534698486328e-05, -1.6780570149421692e-05, -1.6275793313980103e-05, -1.5771016478538513e-05, -1.5266239643096924e-05, -1.4761462807655334e-05, -1.4256685972213745e-05, -1.3751909136772156e-05, -1.3247132301330566e-05, -1.2742355465888977e-05, -1.2237578630447388e-05, -1.1732801795005798e-05, -1.1228024959564209e-05, -1.072324812412262e-05, -1.021847128868103e-05, -9.713694453239441e-06, -9.208917617797852e-06, -8.704140782356262e-06, -8.199363946914673e-06, -7.694587111473083e-06, -7.189810276031494e-06, -6.685033440589905e-06, -6.1802566051483154e-06, -5.675479769706726e-06, -5.170702934265137e-06, -4.665926098823547e-06, -4.161149263381958e-06, -3.6563724279403687e-06, -3.1515955924987793e-06, -2.64681875705719e-06, -2.1420419216156006e-06, -1.6372650861740112e-06, -1.1324882507324219e-06, -6.277114152908325e-07, -1.2293457984924316e-07, 3.818422555923462e-07, 8.866190910339355e-07, 1.391395926475525e-06, 1.8961727619171143e-06, 2.4009495973587036e-06, 2.905726432800293e-06, 3.4105032682418823e-06, 3.915280103683472e-06, 4.420056939125061e-06, 4.92483377456665e-06, 5.42961061000824e-06, 5.934387445449829e-06, 6.4391642808914185e-06, 6.943941116333008e-06, 7.448717951774597e-06, 7.953494787216187e-06, 8.458271622657776e-06, 8.963048458099365e-06, 9.467825293540955e-06, 9.972602128982544e-06, 1.0477378964424133e-05, 1.0982155799865723e-05, 1.1486932635307312e-05, 1.1991709470748901e-05, 1.249648630619049e-05, 1.300126314163208e-05, 1.350603997707367e-05, 1.4010816812515259e-05, 1.4515593647956848e-05, 1.5020370483398438e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 17.0, 27.0, 15.0, 38.0, 71.0, 101.0, 138.0, 73.0, 131.0, 127.0, 92.0, 65.0, 26.0, 28.0, 19.0, 11.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2186508178710938e-06, -3.1115487217903137e-06, -3.0044466257095337e-06, -2.8973445296287537e-06, -2.7902424335479736e-06, -2.6831403374671936e-06, -2.5760382413864136e-06, -2.4689361453056335e-06, -2.3618340492248535e-06, -2.2547319531440735e-06, -2.1476298570632935e-06, -2.0405277609825134e-06, -1.9334256649017334e-06, -1.8263235688209534e-06, -1.7192214727401733e-06, -1.6121193766593933e-06, -1.5050172805786133e-06, -1.3979151844978333e-06, -1.2908130884170532e-06, -1.1837109923362732e-06, -1.0766088962554932e-06, -9.695068001747131e-07, -8.624047040939331e-07, -7.553026080131531e-07, -6.48200511932373e-07, -5.41098415851593e-07, -4.33996319770813e-07, -3.2689422369003296e-07, -2.1979212760925293e-07, -1.126900315284729e-07, -5.587935447692871e-09, 1.0151416063308716e-07, 2.086162567138672e-07, 3.157183527946472e-07, 4.2282044887542725e-07, 5.299225449562073e-07, 6.370246410369873e-07, 7.441267371177673e-07, 8.512288331985474e-07, 9.583309292793274e-07, 1.0654330253601074e-06, 1.1725351214408875e-06, 1.2796372175216675e-06, 1.3867393136024475e-06, 1.4938414096832275e-06, 1.6009435057640076e-06, 1.7080456018447876e-06, 1.8151476979255676e-06, 1.9222497940063477e-06, 2.0293518900871277e-06, 2.1364539861679077e-06, 2.2435560822486877e-06, 2.3506581783294678e-06, 2.457760274410248e-06, 2.564862370491028e-06, 2.671964466571808e-06, 2.779066562652588e-06, 2.886168658733368e-06, 2.993270754814148e-06, 3.100372850894928e-06, 3.207474946975708e-06, 3.314577043056488e-06, 3.421679139137268e-06, 3.528781235218048e-06, 3.635883331298828e-06]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 2.0, 9.0, 17.0, 18.0, 29.0, 45.0, 52.0, 89.0, 150.0, 177.0, 138.0, 81.0, 64.0, 31.0, 27.0, 12.0, 21.0, 8.0, 10.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029821222415193915, -0.0002904866123571992, -0.0002827609714586288, -0.0002750353596638888, -0.00026730974786914885, -0.00025958410697057843, -0.00025185849517583847, -0.0002441328833810985, -0.00023640725703444332, -0.00022868163068778813, -0.00022095601889304817, -0.00021323039254639298, -0.0002055047661997378, -0.00019777915440499783, -0.00019005352805834264, -0.00018232790171168745, -0.00017460228991694748, -0.0001668766635702923, -0.00015915105177555233, -0.00015142542542889714, -0.00014369981363415718, -0.000135974187287502, -0.0001282485609408468, -0.00012052294187014922, -0.00011279732279945165, -0.00010507170372875407, -9.73460846580565e-05, -8.962045831140131e-05, -8.189483924070373e-05, -7.416922017000616e-05, -6.644359382335097e-05, -5.871797475265339e-05, -5.0992355681955814e-05, -4.326673661125824e-05, -3.5541113902581856e-05, -2.7815493012894876e-05, -2.0089872123207897e-05, -1.2364253052510321e-05, -4.638630343833938e-06, 3.0869923648424447e-06, 1.081261143554002e-05, 1.8538232325227e-05, 2.626385321491398e-05, 3.398947592359036e-05, 4.171509499428794e-05, 4.9440714064985514e-05, 5.7166336773661897e-05, 6.489195948233828e-05, 7.261757855303586e-05, 8.034319762373343e-05, 8.806881669443101e-05, 9.57944430410862e-05, 0.00010352006211178377, 0.00011124568118248135, 0.00011897130752913654, 0.0001266969193238765, 0.0001344225456705317, 0.00014214817201718688, 0.00014987378381192684, 0.00015759941015858203, 0.00016532503650523722, 0.00017305064829997718, 0.00018077627464663237, 0.00018850190099328756, 0.00019622751278802752]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 16.0, 21.0, 7.0, 19.0, 21.0, 23.0, 26.0, 25.0, 41.0, 49.0, 38.0, 45.0, 52.0, 57.0, 57.0, 57.0, 53.0, 34.0, 55.0, 44.0, 34.0, 40.0, 27.0, 32.0, 30.0, 18.0, 17.0, 14.0, 5.0, 13.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00017491601465735584, -0.0001703561283648014, -0.00016579622752033174, -0.0001612363412277773, -0.00015667644038330764, -0.0001521165540907532, -0.00014755665324628353, -0.0001429967669537291, -0.00013843686610925943, -0.000133876979816705, -0.00012931707897223532, -0.00012475719267968088, -0.00012019729183521122, -0.00011563739826669917, -0.00011107750469818711, -0.00010651761840563267, -0.00010195772483712062, -9.739783126860857e-05, -9.283793770009652e-05, -8.827804413158447e-05, -8.371815056307241e-05, -7.915825699456036e-05, -7.459837070200592e-05, -7.003846985753626e-05, -6.547858356498182e-05, -6.0918689996469766e-05, -5.6358796427957714e-05, -5.179890285944566e-05, -4.723900929093361e-05, -4.267911572242156e-05, -3.811922579188831e-05, -3.355933222337626e-05, -2.89994350168854e-05, -2.4439541448373348e-05, -1.9879647879861295e-05, -1.5319756130338646e-05, -1.0759862561826594e-05, -6.199968993314542e-06, -1.6400772437918931e-06, 2.919816324720159e-06, 7.4797098932322115e-06, 1.2039603461744264e-05, 1.6599497030256316e-05, 2.1159388779778965e-05, 2.5719282348291017e-05, 3.027917591680307e-05, 3.483906766632572e-05, 3.939896123483777e-05, 4.395885480334982e-05, 4.8518748371861875e-05, 5.307864194037393e-05, 5.763853550888598e-05, 6.219842907739803e-05, 6.675832264591008e-05, 7.131820893846452e-05, 7.587810978293419e-05, 8.043799607548863e-05, 8.499788964400068e-05, 8.955778321251273e-05, 9.411767678102478e-05, 9.867757034953684e-05, 0.00010323746391804889, 0.00010779735748656094, 0.00011235724377911538, 0.00011691714462358505]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 11.0, 9.0, 21.0, 19.0, 31.0, 49.0, 55.0, 77.0, 126.0, 174.0, 266.0, 426.0, 758.0, 1910.0, 53713.0, 4106368.0, 26527.0, 1914.0, 693.0, 382.0, 245.0, 127.0, 127.0, 74.0, 47.0, 45.0, 28.0, 16.0, 15.0, 11.0, 8.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004246234893798828, -0.00041384994983673096, -0.0004030764102935791, -0.00039230287075042725, -0.0003815293312072754, -0.00037075579166412354, -0.0003599822521209717, -0.0003492087125778198, -0.00033843517303466797, -0.0003276616334915161, -0.00031688809394836426, -0.0003061145544052124, -0.00029534101486206055, -0.0002845674753189087, -0.00027379393577575684, -0.000263020396232605, -0.0002522468566894531, -0.00024147331714630127, -0.00023069977760314941, -0.00021992623805999756, -0.0002091526985168457, -0.00019837915897369385, -0.000187605619430542, -0.00017683207988739014, -0.00016605854034423828, -0.00015528500080108643, -0.00014451146125793457, -0.00013373792171478271, -0.00012296438217163086, -0.000112190842628479, -0.00010141730308532715, -9.064376354217529e-05, -7.987022399902344e-05, -6.909668445587158e-05, -5.8323144912719727e-05, -4.754960536956787e-05, -3.6776065826416016e-05, -2.600252628326416e-05, -1.5228986740112305e-05, -4.455447196960449e-06, 6.318092346191406e-06, 1.7091631889343262e-05, 2.7865171432495117e-05, 3.863871097564697e-05, 4.941225051879883e-05, 6.0185790061950684e-05, 7.095932960510254e-05, 8.17328691482544e-05, 9.250640869140625e-05, 0.0001032799482345581, 0.00011405348777770996, 0.00012482702732086182, 0.00013560056686401367, 0.00014637410640716553, 0.00015714764595031738, 0.00016792118549346924, 0.0001786947250366211, 0.00018946826457977295, 0.0002002418041229248, 0.00021101534366607666, 0.00022178888320922852, 0.00023256242275238037, 0.00024333596229553223, 0.0002541095018386841, 0.00026488304138183594]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 7.0, 6.0, 11.0, 13.0, 12.0, 14.0, 21.0, 22.0, 30.0, 28.0, 40.0, 39.0, 55.0, 57.0, 49.0, 51.0, 54.0, 58.0, 50.0, 54.0, 54.0, 46.0, 44.0, 42.0, 29.0, 24.0, 25.0, 21.0, 12.0, 8.0, 11.0, 10.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00018358230590820312, -0.0001789713278412819, -0.00017436034977436066, -0.00016974937170743942, -0.0001651383936405182, -0.00016052741557359695, -0.00015591643750667572, -0.00015130545943975449, -0.00014669448137283325, -0.00014208350330591202, -0.00013747252523899078, -0.00013286154717206955, -0.00012825056910514832, -0.00012363959103822708, -0.00011902861297130585, -0.00011441763490438461, -0.00010980665683746338, -0.00010519567877054214, -0.00010058470070362091, -9.597372263669968e-05, -9.136274456977844e-05, -8.675176650285721e-05, -8.214078843593597e-05, -7.752981036901474e-05, -7.29188323020935e-05, -6.830785423517227e-05, -6.369687616825104e-05, -5.9085898101329803e-05, -5.447492003440857e-05, -4.9863941967487335e-05, -4.52529639005661e-05, -4.064198583364487e-05, -3.603100776672363e-05, -3.14200296998024e-05, -2.6809051632881165e-05, -2.219807356595993e-05, -1.7587095499038696e-05, -1.2976117432117462e-05, -8.365139365196228e-06, -3.754161298274994e-06, 8.568167686462402e-07, 5.467794835567474e-06, 1.0078772902488708e-05, 1.4689750969409943e-05, 1.9300729036331177e-05, 2.391170710325241e-05, 2.8522685170173645e-05, 3.313366323709488e-05, 3.774464130401611e-05, 4.235561937093735e-05, 4.696659743785858e-05, 5.1577575504779816e-05, 5.618855357170105e-05, 6.0799531638622284e-05, 6.541050970554352e-05, 7.002148777246475e-05, 7.463246583938599e-05, 7.924344390630722e-05, 8.385442197322845e-05, 8.846540004014969e-05, 9.307637810707092e-05, 9.768735617399216e-05, 0.00010229833424091339, 0.00010690931230783463, 0.00011152029037475586]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 9.0, 23.0, 31.0, 54.0, 140.0, 241.0, 596.0, 1749.0, 19709.0, 4157703.0, 11550.0, 1492.0, 519.0, 214.0, 106.0, 64.0, 27.0, 19.0, 15.0, 3.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.0010118484497070312, -0.000990055501461029, -0.0009682625532150269, -0.0009464696049690247, -0.0009246766567230225, -0.0009028837084770203, -0.0008810907602310181, -0.0008592978119850159, -0.0008375048637390137, -0.0008157119154930115, -0.0007939189672470093, -0.0007721260190010071, -0.0007503330707550049, -0.0007285401225090027, -0.0007067471742630005, -0.0006849542260169983, -0.0006631612777709961, -0.0006413683295249939, -0.0006195753812789917, -0.0005977824330329895, -0.0005759894847869873, -0.0005541965365409851, -0.0005324035882949829, -0.0005106106400489807, -0.0004888176918029785, -0.0004670247435569763, -0.0004452317953109741, -0.0004234388470649719, -0.0004016458988189697, -0.00037985295057296753, -0.00035806000232696533, -0.00033626705408096313, -0.00031447410583496094, -0.00029268115758895874, -0.00027088820934295654, -0.00024909526109695435, -0.00022730231285095215, -0.00020550936460494995, -0.00018371641635894775, -0.00016192346811294556, -0.00014013051986694336, -0.00011833757162094116, -9.654462337493896e-05, -7.475167512893677e-05, -5.295872688293457e-05, -3.116577863693237e-05, -9.372830390930176e-06, 1.2420117855072021e-05, 3.421306610107422e-05, 5.6006014347076416e-05, 7.779896259307861e-05, 9.959191083908081e-05, 0.00012138485908508301, 0.0001431778073310852, 0.0001649707555770874, 0.0001867637038230896, 0.0002085566520690918, 0.000230349600315094, 0.0002521425485610962, 0.0002739354968070984, 0.0002957284450531006, 0.0003175213932991028, 0.000339314341545105, 0.0003611072897911072, 0.0003829002380371094]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 12.0, 11.0, 28.0, 75.0, 204.0, 2953.0, 517.0, 150.0, 52.0, 27.0, 14.0, 12.0, 7.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.349781036376953e-05, -3.171246498823166e-05, -2.9927119612693787e-05, -2.8141774237155914e-05, -2.6356428861618042e-05, -2.457108348608017e-05, -2.2785738110542297e-05, -2.1000392735004425e-05, -1.9215047359466553e-05, -1.742970198392868e-05, -1.5644356608390808e-05, -1.3859011232852936e-05, -1.2073665857315063e-05, -1.0288320481777191e-05, -8.502975106239319e-06, -6.7176297307014465e-06, -4.932284355163574e-06, -3.146938979625702e-06, -1.3615936040878296e-06, 4.237517714500427e-07, 2.209097146987915e-06, 3.994442522525787e-06, 5.77978789806366e-06, 7.565133273601532e-06, 9.350478649139404e-06, 1.1135824024677277e-05, 1.2921169400215149e-05, 1.4706514775753021e-05, 1.6491860151290894e-05, 1.8277205526828766e-05, 2.0062550902366638e-05, 2.184789627790451e-05, 2.3633241653442383e-05, 2.5418587028980255e-05, 2.7203932404518127e-05, 2.8989277780056e-05, 3.077462315559387e-05, 3.2559968531131744e-05, 3.434531390666962e-05, 3.613065928220749e-05, 3.791600465774536e-05, 3.9701350033283234e-05, 4.1486695408821106e-05, 4.327204078435898e-05, 4.505738615989685e-05, 4.684273153543472e-05, 4.8628076910972595e-05, 5.041342228651047e-05, 5.219876766204834e-05, 5.398411303758621e-05, 5.5769458413124084e-05, 5.755480378866196e-05, 5.934014916419983e-05, 6.11254945397377e-05, 6.291083991527557e-05, 6.469618529081345e-05, 6.648153066635132e-05, 6.826687604188919e-05, 7.005222141742706e-05, 7.183756679296494e-05, 7.362291216850281e-05, 7.540825754404068e-05, 7.719360291957855e-05, 7.897894829511642e-05, 8.07642936706543e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 7.0, 6.0, 6.0, 19.0, 17.0, 28.0, 45.0, 59.0, 95.0, 142.0, 171.0, 133.0, 81.0, 60.0, 39.0, 23.0, 13.0, 11.0, 14.0, 11.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002212283870903775, -0.00021463185839820653, -0.00020803532970603555, -0.00020143880101386458, -0.00019484228687360883, -0.00018824575818143785, -0.00018164922948926687, -0.0001750527007970959, -0.00016845617210492492, -0.00016185964341275394, -0.00015526311472058296, -0.00014866658602841198, -0.000142070057336241, -0.00013547352864407003, -0.00012887701450381428, -0.0001222804858116433, -0.00011568395711947232, -0.00010908742842730135, -0.00010249089973513037, -9.5894378318917e-05, -8.929784962674603e-05, -8.270132093457505e-05, -7.610479951836169e-05, -6.950827082619071e-05, -6.291174213401973e-05, -5.6315213441848755e-05, -4.9718688387656584e-05, -4.3122163333464414e-05, -3.6525634641293436e-05, -2.992910594912246e-05, -2.3332580894930288e-05, -1.6736055840738118e-05, -1.0139541700482368e-05, -3.5430148273007944e-06, 3.0535120458807796e-06, 9.650038919062354e-06, 1.6246565792243928e-05, 2.2843094484414905e-05, 2.9439619538607076e-05, 3.6036144592799246e-05, 4.2632673284970224e-05, 4.92292019771412e-05, 5.582572703133337e-05, 6.242225208552554e-05, 6.901878077769652e-05, 7.56153094698675e-05, 8.221183088608086e-05, 8.880835957825184e-05, 9.540488827042282e-05, 0.0001020014169625938, 0.00010859794565476477, 0.00011519446707097813, 0.00012179099576314911, 0.0001283875317312777, 0.00013498404587153345, 0.00014158057456370443, 0.0001481771032558754, 0.00015477363194804639, 0.00016137016064021736, 0.00016796668933238834, 0.0001745632034726441, 0.00018115973216481507, 0.00018775626085698605, 0.00019435278954915702, 0.000200949318241328]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 7.0, 14.0, 14.0, 18.0, 22.0, 13.0, 23.0, 24.0, 35.0, 50.0, 36.0, 48.0, 41.0, 54.0, 51.0, 46.0, 55.0, 54.0, 57.0, 44.0, 46.0, 29.0, 34.0, 36.0, 27.0, 29.0, 19.0, 17.0, 12.0, 15.0, 12.0, 6.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.00017124858277384192, -0.00016712701471988112, -0.00016300544666592032, -0.00015888387861195952, -0.00015476231055799872, -0.00015064074250403792, -0.00014651917445007712, -0.00014239762094803154, -0.00013827605289407074, -0.00013415448484010994, -0.00013003291678614914, -0.00012591134873218834, -0.00012178978067822754, -0.00011766821262426674, -0.00011354665184626356, -0.00010942508379230276, -0.00010530350846238434, -0.00010118194040842354, -9.706037235446274e-05, -9.293880430050194e-05, -8.881723624654114e-05, -8.469566819258034e-05, -8.057410741457716e-05, -7.645253936061636e-05, -7.233097130665556e-05, -6.820940325269476e-05, -6.408783519873396e-05, -5.996627078275196e-05, -5.584470272879116e-05, -5.172313467483036e-05, -4.760157025884837e-05, -4.348000220488757e-05, -3.935844142688438e-05, -3.523687337292358e-05, -3.111530531896278e-05, -2.699374090298079e-05, -2.287217284901999e-05, -1.875060479505919e-05, -1.4629038560087793e-05, -1.0507472325116396e-05, -6.385904271155596e-06, -2.2643371266894974e-06, 1.857230017776601e-06, 5.978797162242699e-06, 1.0100364306708798e-05, 1.4221932360669598e-05, 1.8343498595640995e-05, 2.246506483061239e-05, 2.658663288457319e-05, 3.070820093853399e-05, 3.482976899249479e-05, 3.8951333408476785e-05, 4.3072901462437585e-05, 4.7194469516398385e-05, 5.131603393238038e-05, 5.543760198634118e-05, 5.955917004030198e-05, 6.368073809426278e-05, 6.780230614822358e-05, 7.192387420218438e-05, 7.604544225614518e-05, 8.016701031010598e-05, 8.428857108810917e-05, 8.841013914206997e-05, 9.253170719603077e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 6.0, 11.0, 14.0, 33.0, 39.0, 72.0, 101.0, 165.0, 258.0, 458.0, 783.0, 1192.0, 2042.0, 3536.0, 5755.0, 10660.0, 18614.0, 36999.0, 74772.0, 166325.0, 308370.0, 218060.0, 98986.0, 47146.0, 23650.0, 12939.0, 7198.0, 4132.0, 2507.0, 1452.0, 901.0, 566.0, 296.0, 181.0, 112.0, 81.0, 53.0, 38.0, 16.0, 9.0, 13.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.655952453613281e-05, -9.307079017162323e-05, -8.958205580711365e-05, -8.609332144260406e-05, -8.260458707809448e-05, -7.91158527135849e-05, -7.562711834907532e-05, -7.213838398456573e-05, -6.864964962005615e-05, -6.516091525554657e-05, -6.167218089103699e-05, -5.8183446526527405e-05, -5.469471216201782e-05, -5.120597779750824e-05, -4.771724343299866e-05, -4.4228509068489075e-05, -4.073977470397949e-05, -3.725104033946991e-05, -3.376230597496033e-05, -3.0273571610450745e-05, -2.6784837245941162e-05, -2.329610288143158e-05, -1.9807368516921997e-05, -1.6318634152412415e-05, -1.2829899787902832e-05, -9.34116542339325e-06, -5.852431058883667e-06, -2.3636966943740845e-06, 1.125037670135498e-06, 4.6137720346450806e-06, 8.102506399154663e-06, 1.1591240763664246e-05, 1.5079975128173828e-05, 1.856870949268341e-05, 2.2057443857192993e-05, 2.5546178221702576e-05, 2.9034912586212158e-05, 3.252364695072174e-05, 3.601238131523132e-05, 3.9501115679740906e-05, 4.298985004425049e-05, 4.647858440876007e-05, 4.996731877326965e-05, 5.3456053137779236e-05, 5.694478750228882e-05, 6.04335218667984e-05, 6.392225623130798e-05, 6.741099059581757e-05, 7.089972496032715e-05, 7.438845932483673e-05, 7.787719368934631e-05, 8.13659280538559e-05, 8.485466241836548e-05, 8.834339678287506e-05, 9.183213114738464e-05, 9.532086551189423e-05, 9.880959987640381e-05, 0.00010229833424091339, 0.00010578706860542297, 0.00010927580296993256, 0.00011276453733444214, 0.00011625327169895172, 0.0001197420060634613, 0.00012323074042797089, 0.00012671947479248047]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 8.0, 15.0, 14.0, 19.0, 18.0, 28.0, 28.0, 30.0, 42.0, 53.0, 60.0, 42.0, 56.0, 68.0, 52.0, 62.0, 49.0, 49.0, 56.0, 34.0, 34.0, 31.0, 27.0, 41.0, 17.0, 15.0, 10.0, 13.0, 11.0, 5.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.00018298625946044922, -0.00017864443361759186, -0.0001743026077747345, -0.00016996078193187714, -0.00016561895608901978, -0.00016127713024616241, -0.00015693530440330505, -0.0001525934785604477, -0.00014825165271759033, -0.00014390982687473297, -0.0001395680010318756, -0.00013522617518901825, -0.0001308843493461609, -0.00012654252350330353, -0.00012220069766044617, -0.0001178588718175888, -0.00011351704597473145, -0.00010917522013187408, -0.00010483339428901672, -0.00010049156844615936, -9.6149742603302e-05, -9.180791676044464e-05, -8.746609091758728e-05, -8.312426507472992e-05, -7.878243923187256e-05, -7.44406133890152e-05, -7.009878754615784e-05, -6.575696170330048e-05, -6.141513586044312e-05, -5.7073310017585754e-05, -5.2731484174728394e-05, -4.838965833187103e-05, -4.404783248901367e-05, -3.970600664615631e-05, -3.536418080329895e-05, -3.102235496044159e-05, -2.668052911758423e-05, -2.2338703274726868e-05, -1.7996877431869507e-05, -1.3655051589012146e-05, -9.313225746154785e-06, -4.971399903297424e-06, -6.295740604400635e-07, 3.7122517824172974e-06, 8.054077625274658e-06, 1.2395903468132019e-05, 1.673772931098938e-05, 2.107955515384674e-05, 2.54213809967041e-05, 2.9763206839561462e-05, 3.410503268241882e-05, 3.8446858525276184e-05, 4.2788684368133545e-05, 4.7130510210990906e-05, 5.1472336053848267e-05, 5.581416189670563e-05, 6.015598773956299e-05, 6.449781358242035e-05, 6.883963942527771e-05, 7.318146526813507e-05, 7.752329111099243e-05, 8.186511695384979e-05, 8.620694279670715e-05, 9.054876863956451e-05, 9.489059448242188e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 9.0, 6.0, 12.0, 16.0, 22.0, 20.0, 45.0, 63.0, 90.0, 153.0, 183.0, 296.0, 446.0, 669.0, 960.0, 1659.0, 2602.0, 4423.0, 8059.0, 15721.0, 34541.0, 97340.0, 448134.0, 300158.0, 74104.0, 28612.0, 13116.0, 6694.0, 3842.0, 2429.0, 1420.0, 879.0, 575.0, 396.0, 274.0, 193.0, 124.0, 71.0, 52.0, 39.0, 36.0, 28.0, 14.0, 11.0, 7.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.00014710426330566406, -0.0001427624374628067, -0.00013842061161994934, -0.00013407878577709198, -0.00012973695993423462, -0.00012539513409137726, -0.0001210533082485199, -0.00011671148240566254, -0.00011236965656280518, -0.00010802783071994781, -0.00010368600487709045, -9.93441790342331e-05, -9.500235319137573e-05, -9.066052734851837e-05, -8.631870150566101e-05, -8.197687566280365e-05, -7.763504981994629e-05, -7.329322397708893e-05, -6.895139813423157e-05, -6.46095722913742e-05, -6.0267746448516846e-05, -5.5925920605659485e-05, -5.1584094762802124e-05, -4.724226891994476e-05, -4.29004430770874e-05, -3.855861723423004e-05, -3.421679139137268e-05, -2.987496554851532e-05, -2.553313970565796e-05, -2.1191313862800598e-05, -1.6849488019943237e-05, -1.2507662177085876e-05, -8.165836334228516e-06, -3.824010491371155e-06, 5.178153514862061e-07, 4.859641194343567e-06, 9.201467037200928e-06, 1.3543292880058289e-05, 1.788511872291565e-05, 2.222694456577301e-05, 2.656877040863037e-05, 3.091059625148773e-05, 3.525242209434509e-05, 3.9594247937202454e-05, 4.3936073780059814e-05, 4.8277899622917175e-05, 5.2619725465774536e-05, 5.69615513086319e-05, 6.130337715148926e-05, 6.564520299434662e-05, 6.998702883720398e-05, 7.432885468006134e-05, 7.86706805229187e-05, 8.301250636577606e-05, 8.735433220863342e-05, 9.169615805149078e-05, 9.603798389434814e-05, 0.0001003798097372055, 0.00010472163558006287, 0.00010906346142292023, 0.00011340528726577759, 0.00011774711310863495, 0.0001220889389514923, 0.00012643076479434967, 0.00013077259063720703]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 16.0, 15.0, 16.0, 22.0, 24.0, 27.0, 32.0, 33.0, 33.0, 25.0, 42.0, 34.0, 48.0, 54.0, 43.0, 39.0, 57.0, 49.0, 51.0, 31.0, 35.0, 34.0, 35.0, 33.0, 22.0, 33.0, 23.0, 19.0, 10.0, 14.0, 9.0, 4.0, 9.0, 4.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.450580596923828e-05, -7.227901369333267e-05, -7.005222141742706e-05, -6.782542914152145e-05, -6.559863686561584e-05, -6.337184458971024e-05, -6.114505231380463e-05, -5.891826003789902e-05, -5.669146776199341e-05, -5.44646754860878e-05, -5.223788321018219e-05, -5.001109093427658e-05, -4.778429865837097e-05, -4.555750638246536e-05, -4.3330714106559753e-05, -4.1103921830654144e-05, -3.8877129554748535e-05, -3.6650337278842926e-05, -3.442354500293732e-05, -3.219675272703171e-05, -2.99699604511261e-05, -2.774316817522049e-05, -2.551637589931488e-05, -2.328958362340927e-05, -2.1062791347503662e-05, -1.8835999071598053e-05, -1.6609206795692444e-05, -1.4382414519786835e-05, -1.2155622243881226e-05, -9.928829967975616e-06, -7.702037692070007e-06, -5.475245416164398e-06, -3.248453140258789e-06, -1.02166086435318e-06, 1.2051314115524292e-06, 3.4319236874580383e-06, 5.6587159633636475e-06, 7.885508239269257e-06, 1.0112300515174866e-05, 1.2339092791080475e-05, 1.4565885066986084e-05, 1.6792677342891693e-05, 1.9019469618797302e-05, 2.124626189470291e-05, 2.347305417060852e-05, 2.569984644651413e-05, 2.792663872241974e-05, 3.0153430998325348e-05, 3.238022327423096e-05, 3.4607015550136566e-05, 3.6833807826042175e-05, 3.9060600101947784e-05, 4.1287392377853394e-05, 4.3514184653759e-05, 4.574097692966461e-05, 4.796776920557022e-05, 5.019456148147583e-05, 5.242135375738144e-05, 5.464814603328705e-05, 5.687493830919266e-05, 5.9101730585098267e-05, 6.132852286100388e-05, 6.355531513690948e-05, 6.57821074128151e-05, 6.80088996887207e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 7.0, 4.0, 8.0, 12.0, 19.0, 24.0, 45.0, 73.0, 69.0, 95.0, 166.0, 205.0, 287.0, 494.0, 607.0, 911.0, 1479.0, 2371.0, 4126.0, 6804.0, 13032.0, 32502.0, 101641.0, 698942.0, 121505.0, 30777.0, 13916.0, 7607.0, 3717.0, 2514.0, 1447.0, 958.0, 688.0, 435.0, 298.0, 221.0, 158.0, 130.0, 78.0, 37.0, 27.0, 33.0, 34.0, 30.0, 7.0, 3.0, 8.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.396106719970703e-05, -2.3224391043186188e-05, -2.2487714886665344e-05, -2.17510387301445e-05, -2.1014362573623657e-05, -2.0277686417102814e-05, -1.954101026058197e-05, -1.8804334104061127e-05, -1.8067657947540283e-05, -1.733098179101944e-05, -1.6594305634498596e-05, -1.5857629477977753e-05, -1.512095332145691e-05, -1.4384277164936066e-05, -1.3647601008415222e-05, -1.2910924851894379e-05, -1.2174248695373535e-05, -1.1437572538852692e-05, -1.0700896382331848e-05, -9.964220225811005e-06, -9.227544069290161e-06, -8.490867912769318e-06, -7.754191756248474e-06, -7.017515599727631e-06, -6.280839443206787e-06, -5.544163286685944e-06, -4.8074871301651e-06, -4.070810973644257e-06, -3.334134817123413e-06, -2.5974586606025696e-06, -1.860782504081726e-06, -1.1241063475608826e-06, -3.8743019104003906e-07, 3.4924596548080444e-07, 1.085922122001648e-06, 1.8225982785224915e-06, 2.559274435043335e-06, 3.2959505915641785e-06, 4.032626748085022e-06, 4.7693029046058655e-06, 5.505979061126709e-06, 6.2426552176475525e-06, 6.979331374168396e-06, 7.71600753068924e-06, 8.452683687210083e-06, 9.189359843730927e-06, 9.92603600025177e-06, 1.0662712156772614e-05, 1.1399388313293457e-05, 1.21360644698143e-05, 1.2872740626335144e-05, 1.3609416782855988e-05, 1.4346092939376831e-05, 1.5082769095897675e-05, 1.5819445252418518e-05, 1.655612140893936e-05, 1.7292797565460205e-05, 1.802947372198105e-05, 1.8766149878501892e-05, 1.9502826035022736e-05, 2.023950219154358e-05, 2.0976178348064423e-05, 2.1712854504585266e-05, 2.244953066110611e-05, 2.3186206817626953e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 0.0, 5.0, 1.0, 5.0, 0.0, 6.0, 10.0, 9.0, 0.0, 10.0, 6.0, 0.0, 12.0, 11.0, 15.0, 0.0, 25.0, 30.0, 44.0, 0.0, 55.0, 58.0, 69.0, 0.0, 81.0, 94.0, 0.0, 67.0, 82.0, 49.0, 0.0, 56.0, 46.0, 48.0, 0.0, 26.0, 25.0, 10.0, 0.0, 11.0, 9.0, 0.0, 10.0, 5.0, 5.0, 0.0, 6.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.430511474609375e-06, -1.3867393136024475e-06, -1.34296715259552e-06, -1.2991949915885925e-06, -1.255422830581665e-06, -1.2116506695747375e-06, -1.16787850856781e-06, -1.1241063475608826e-06, -1.080334186553955e-06, -1.0365620255470276e-06, -9.927898645401e-07, -9.490177035331726e-07, -9.052455425262451e-07, -8.614733815193176e-07, -8.177012205123901e-07, -7.739290595054626e-07, -7.301568984985352e-07, -6.863847374916077e-07, -6.426125764846802e-07, -5.988404154777527e-07, -5.550682544708252e-07, -5.112960934638977e-07, -4.675239324569702e-07, -4.237517714500427e-07, -3.7997961044311523e-07, -3.3620744943618774e-07, -2.9243528842926025e-07, -2.4866312742233276e-07, -2.0489096641540527e-07, -1.6111880540847778e-07, -1.1734664440155029e-07, -7.35744833946228e-08, -2.9802322387695312e-08, 1.3969838619232178e-08, 5.774199962615967e-08, 1.0151416063308716e-07, 1.4528632164001465e-07, 1.8905848264694214e-07, 2.3283064365386963e-07, 2.766028046607971e-07, 3.203749656677246e-07, 3.641471266746521e-07, 4.079192876815796e-07, 4.516914486885071e-07, 4.954636096954346e-07, 5.392357707023621e-07, 5.830079317092896e-07, 6.26780092716217e-07, 6.705522537231445e-07, 7.14324414730072e-07, 7.580965757369995e-07, 8.01868736743927e-07, 8.456408977508545e-07, 8.89413058757782e-07, 9.331852197647095e-07, 9.76957380771637e-07, 1.0207295417785645e-06, 1.064501702785492e-06, 1.1082738637924194e-06, 1.152046024799347e-06, 1.1958181858062744e-06, 1.239590346813202e-06, 1.2833625078201294e-06, 1.3271346688270569e-06, 1.3709068298339844e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 3.0, 8.0, 9.0, 15.0, 23.0, 17.0, 40.0, 58.0, 94.0, 208.0, 571.0, 1867.0, 7988.0, 61168.0, 858658.0, 102844.0, 11366.0, 2391.0, 673.0, 227.0, 118.0, 56.0, 30.0, 24.0, 22.0, 9.0, 12.0, 11.0, 4.0, 8.0, 3.0, 6.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.450580596923828e-05, -7.20703974366188e-05, -6.963498890399933e-05, -6.719958037137985e-05, -6.476417183876038e-05, -6.23287633061409e-05, -5.989335477352142e-05, -5.745794624090195e-05, -5.502253770828247e-05, -5.2587129175662994e-05, -5.015172064304352e-05, -4.771631211042404e-05, -4.5280903577804565e-05, -4.284549504518509e-05, -4.041008651256561e-05, -3.7974677979946136e-05, -3.553926944732666e-05, -3.3103860914707184e-05, -3.066845238208771e-05, -2.823304384946823e-05, -2.5797635316848755e-05, -2.336222678422928e-05, -2.0926818251609802e-05, -1.8491409718990326e-05, -1.605600118637085e-05, -1.3620592653751373e-05, -1.1185184121131897e-05, -8.74977558851242e-06, -6.314367055892944e-06, -3.878958523273468e-06, -1.4435499906539917e-06, 9.918585419654846e-07, 3.427267074584961e-06, 5.862675607204437e-06, 8.298084139823914e-06, 1.073349267244339e-05, 1.3168901205062866e-05, 1.5604309737682343e-05, 1.803971827030182e-05, 2.0475126802921295e-05, 2.291053533554077e-05, 2.5345943868160248e-05, 2.7781352400779724e-05, 3.02167609333992e-05, 3.265216946601868e-05, 3.508757799863815e-05, 3.752298653125763e-05, 3.9958395063877106e-05, 4.239380359649658e-05, 4.482921212911606e-05, 4.7264620661735535e-05, 4.970002919435501e-05, 5.213543772697449e-05, 5.4570846259593964e-05, 5.700625479221344e-05, 5.9441663324832916e-05, 6.187707185745239e-05, 6.431248039007187e-05, 6.674788892269135e-05, 6.918329745531082e-05, 7.16187059879303e-05, 7.405411452054977e-05, 7.648952305316925e-05, 7.892493158578873e-05, 8.13603401184082e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 8.0, 4.0, 10.0, 14.0, 14.0, 20.0, 20.0, 30.0, 33.0, 45.0, 53.0, 31.0, 65.0, 78.0, 78.0, 52.0, 70.0, 59.0, 59.0, 36.0, 37.0, 33.0, 23.0, 23.0, 18.0, 18.0, 13.0, 8.0, 7.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.020069122314453e-06, -5.846843123435974e-06, -5.673617124557495e-06, -5.500391125679016e-06, -5.327165126800537e-06, -5.153939127922058e-06, -4.980713129043579e-06, -4.8074871301651e-06, -4.634261131286621e-06, -4.461035132408142e-06, -4.287809133529663e-06, -4.114583134651184e-06, -3.941357135772705e-06, -3.768131136894226e-06, -3.594905138015747e-06, -3.421679139137268e-06, -3.248453140258789e-06, -3.07522714138031e-06, -2.902001142501831e-06, -2.728775143623352e-06, -2.555549144744873e-06, -2.382323145866394e-06, -2.209097146987915e-06, -2.035871148109436e-06, -1.862645149230957e-06, -1.689419150352478e-06, -1.516193151473999e-06, -1.34296715259552e-06, -1.169741153717041e-06, -9.96515154838562e-07, -8.23289155960083e-07, -6.50063157081604e-07, -4.76837158203125e-07, -3.03611159324646e-07, -1.30385160446167e-07, 4.284083843231201e-08, 2.1606683731079102e-07, 3.8929283618927e-07, 5.62518835067749e-07, 7.35744833946228e-07, 9.08970832824707e-07, 1.082196831703186e-06, 1.255422830581665e-06, 1.428648829460144e-06, 1.601874828338623e-06, 1.775100827217102e-06, 1.948326826095581e-06, 2.12155282497406e-06, 2.294778823852539e-06, 2.468004822731018e-06, 2.641230821609497e-06, 2.814456820487976e-06, 2.987682819366455e-06, 3.160908818244934e-06, 3.334134817123413e-06, 3.507360816001892e-06, 3.680586814880371e-06, 3.85381281375885e-06, 4.027038812637329e-06, 4.200264811515808e-06, 4.373490810394287e-06, 4.546716809272766e-06, 4.719942808151245e-06, 4.893168807029724e-06, 5.066394805908203e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 4.0, 9.0, 14.0, 19.0, 27.0, 38.0, 60.0, 71.0, 116.0, 144.0, 135.0, 103.0, 62.0, 45.0, 28.0, 23.0, 24.0, 14.0, 9.0, 7.0, 7.0, 9.0, 8.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014808820560574532, -0.0001427437673555687, -0.00013739931455347687, -0.00013205487630330026, -0.00012671043805312365, -0.00012136599252698943, -0.00011602154700085521, -0.0001106771087506786, -0.00010533267050050199, -9.998822497436777e-05, -9.464378672419116e-05, -8.929934119805694e-05, -8.395490294788033e-05, -7.86104574217461e-05, -7.326601189561188e-05, -6.792157364543527e-05, -6.257712811930105e-05, -5.7232686231145635e-05, -5.188824434299022e-05, -4.6543798816856e-05, -4.119936056667939e-05, -3.5854915040545166e-05, -3.051047315238975e-05, -2.5166031264234334e-05, -1.982158937607892e-05, -1.4477147487923503e-05, -9.132704690273385e-06, -3.788261892623268e-06, 1.5561799955321476e-06, 6.900621883687563e-06, 1.2245065590832382e-05, 1.7589507478987798e-05, 2.2933949367143214e-05, 2.827839125529863e-05, 3.3622833143454045e-05, 3.896727866958827e-05, 4.4311716919764876e-05, 4.96561624458991e-05, 5.5000604334054515e-05, 6.034504622220993e-05, 6.568948447238654e-05, 7.103392999852076e-05, 7.637836824869737e-05, 8.172281377483159e-05, 8.70672520250082e-05, 9.241169755114242e-05, 9.775614307727665e-05, 0.00010310058132745326, 0.00010844502685358748, 0.0001137894723797217, 0.00011913391062989831, 0.00012447834888007492, 0.00012982280168216676, 0.00013516723993234336, 0.00014051167818251997, 0.00014585611643269658, 0.00015120056923478842, 0.00015654500748496503, 0.00016188946028705686, 0.00016723389853723347, 0.00017257833678741008, 0.0001779227750375867, 0.00018326722783967853, 0.00018861166608985513, 0.00019395610434003174]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 7.0, 14.0, 17.0, 13.0, 24.0, 10.0, 26.0, 24.0, 35.0, 47.0, 48.0, 39.0, 50.0, 49.0, 53.0, 52.0, 56.0, 52.0, 52.0, 42.0, 52.0, 32.0, 34.0, 31.0, 32.0, 27.0, 21.0, 11.0, 14.0, 14.0, 8.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00015805740258656442, -0.0001542433601571247, -0.0001504293322796002, -0.00014661528985016048, -0.00014280124742072076, -0.00013898720499128103, -0.00013517317711375654, -0.00013135913468431681, -0.0001275450922548771, -0.00012373104982543737, -0.00011991701467195526, -0.00011610297951847315, -0.00011228893708903342, -0.00010847490193555132, -0.0001046608667820692, -0.00010084682435262948, -9.703279647510499e-05, -9.321876132162288e-05, -8.940471889218315e-05, -8.559068373870105e-05, -8.177664130926132e-05, -7.796260615577921e-05, -7.41485710022971e-05, -7.033452857285738e-05, -6.652049341937527e-05, -6.270645826589316e-05, -5.889241583645344e-05, -5.507838068297133e-05, -5.126434189151041e-05, -4.7450303100049496e-05, -4.3636267946567386e-05, -3.982222915510647e-05, -3.600818308768794e-05, -3.219414429622702e-05, -2.838010732375551e-05, -2.4566070351283997e-05, -2.075203155982308e-05, -1.6937992768362164e-05, -1.3123955795890652e-05, -9.309918823419139e-06, -5.495880031958222e-06, -1.6818421499920078e-06, 2.132195731974207e-06, 5.9462336139404215e-06, 9.760271495906636e-06, 1.3574310287367553e-05, 1.7388347259839065e-05, 2.1202384232310578e-05, 2.5016423023771495e-05, 2.883046181523241e-05, 3.264450060669333e-05, 3.645853576017544e-05, 4.027257455163635e-05, 4.408661334309727e-05, 4.790064849657938e-05, 5.1714687288040295e-05, 5.552872607950121e-05, 5.934276487096213e-05, 6.315680366242304e-05, 6.697083881590515e-05, 7.078488124534488e-05, 7.459891639882699e-05, 7.84129515523091e-05, 8.222699398174882e-05, 8.604102913523093e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 3.0, 3.0, 5.0, 7.0, 19.0, 18.0, 20.0, 27.0, 41.0, 65.0, 98.0, 135.0, 231.0, 426.0, 686.0, 1164.0, 2070.0, 3470.0, 5939.0, 10304.0, 18116.0, 32968.0, 63142.0, 132357.0, 276888.0, 254625.0, 117713.0, 57829.0, 30274.0, 16815.0, 9613.0, 5541.0, 3230.0, 1939.0, 1101.0, 640.0, 367.0, 237.0, 133.0, 89.0, 58.0, 44.0, 22.0, 22.0, 11.0, 14.0, 4.0, 7.0, 7.0, 4.0, 8.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.00029778480529785156, -0.0002890080213546753, -0.000280231237411499, -0.00027145445346832275, -0.0002626776695251465, -0.0002539008855819702, -0.00024512410163879395, -0.00023634731769561768, -0.0002275705337524414, -0.00021879374980926514, -0.00021001696586608887, -0.0002012401819229126, -0.00019246339797973633, -0.00018368661403656006, -0.0001749098300933838, -0.00016613304615020752, -0.00015735626220703125, -0.00014857947826385498, -0.0001398026943206787, -0.00013102591037750244, -0.00012224912643432617, -0.0001134723424911499, -0.00010469555854797363, -9.591877460479736e-05, -8.71419906616211e-05, -7.836520671844482e-05, -6.958842277526855e-05, -6.0811638832092285e-05, -5.2034854888916016e-05, -4.3258070945739746e-05, -3.4481287002563477e-05, -2.5704503059387207e-05, -1.6927719116210938e-05, -8.150935173034668e-06, 6.258487701416016e-07, 9.402632713317871e-06, 1.817941665649414e-05, 2.695620059967041e-05, 3.573298454284668e-05, 4.450976848602295e-05, 5.328655242919922e-05, 6.206333637237549e-05, 7.084012031555176e-05, 7.961690425872803e-05, 8.83936882019043e-05, 9.717047214508057e-05, 0.00010594725608825684, 0.0001147240400314331, 0.00012350082397460938, 0.00013227760791778564, 0.00014105439186096191, 0.00014983117580413818, 0.00015860795974731445, 0.00016738474369049072, 0.000176161527633667, 0.00018493831157684326, 0.00019371509552001953, 0.0002024918794631958, 0.00021126866340637207, 0.00022004544734954834, 0.0002288222312927246, 0.00023759901523590088, 0.00024637579917907715, 0.0002551525831222534, 0.0002639293670654297]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 10.0, 5.0, 12.0, 15.0, 12.0, 17.0, 17.0, 23.0, 29.0, 37.0, 45.0, 50.0, 47.0, 44.0, 56.0, 56.0, 65.0, 65.0, 42.0, 55.0, 44.0, 32.0, 37.0, 30.0, 28.0, 29.0, 20.0, 23.0, 18.0, 15.0, 7.0, 8.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00013446807861328125, -0.00013114232569932938, -0.0001278165727853775, -0.00012449081987142563, -0.00012116506695747375, -0.00011783931404352188, -0.00011451356112957001, -0.00011118780821561813, -0.00010786205530166626, -0.00010453630238771439, -0.00010121054947376251, -9.788479655981064e-05, -9.455904364585876e-05, -9.123329073190689e-05, -8.790753781795502e-05, -8.458178490400314e-05, -8.125603199005127e-05, -7.79302790760994e-05, -7.460452616214752e-05, -7.127877324819565e-05, -6.795302033424377e-05, -6.46272674202919e-05, -6.130151450634003e-05, -5.797576159238815e-05, -5.465000867843628e-05, -5.1324255764484406e-05, -4.799850285053253e-05, -4.467274993658066e-05, -4.1346997022628784e-05, -3.802124410867691e-05, -3.469549119472504e-05, -3.136973828077316e-05, -2.804398536682129e-05, -2.4718232452869415e-05, -2.139247953891754e-05, -1.8066726624965668e-05, -1.4740973711013794e-05, -1.141522079706192e-05, -8.089467883110046e-06, -4.763714969158173e-06, -1.4379620552062988e-06, 1.887790858745575e-06, 5.213543772697449e-06, 8.539296686649323e-06, 1.1865049600601196e-05, 1.519080251455307e-05, 1.8516555428504944e-05, 2.1842308342456818e-05, 2.516806125640869e-05, 2.8493814170360565e-05, 3.181956708431244e-05, 3.514531999826431e-05, 3.8471072912216187e-05, 4.179682582616806e-05, 4.5122578740119934e-05, 4.844833165407181e-05, 5.177408456802368e-05, 5.5099837481975555e-05, 5.842559039592743e-05, 6.17513433098793e-05, 6.507709622383118e-05, 6.840284913778305e-05, 7.172860205173492e-05, 7.50543549656868e-05, 7.838010787963867e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 8.0, 8.0, 8.0, 20.0, 23.0, 38.0, 67.0, 90.0, 103.0, 228.0, 351.0, 597.0, 1051.0, 1801.0, 2966.0, 5468.0, 9747.0, 18089.0, 35057.0, 73013.0, 175814.0, 356863.0, 201304.0, 82584.0, 38989.0, 19709.0, 10513.0, 5924.0, 3287.0, 1880.0, 1184.0, 663.0, 410.0, 248.0, 159.0, 110.0, 70.0, 49.0, 23.0, 11.0, 17.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025010108947753906, -0.0002419203519821167, -0.00023373961448669434, -0.00022555887699127197, -0.0002173781394958496, -0.00020919740200042725, -0.00020101666450500488, -0.00019283592700958252, -0.00018465518951416016, -0.0001764744520187378, -0.00016829371452331543, -0.00016011297702789307, -0.0001519322395324707, -0.00014375150203704834, -0.00013557076454162598, -0.0001273900270462036, -0.00011920928955078125, -0.00011102855205535889, -0.00010284781455993652, -9.466707706451416e-05, -8.64863395690918e-05, -7.830560207366943e-05, -7.012486457824707e-05, -6.194412708282471e-05, -5.3763389587402344e-05, -4.558265209197998e-05, -3.740191459655762e-05, -2.9221177101135254e-05, -2.104043960571289e-05, -1.2859702110290527e-05, -4.678964614868164e-06, 3.5017728805541992e-06, 1.1682510375976562e-05, 1.9863247871398926e-05, 2.804398536682129e-05, 3.622472286224365e-05, 4.4405460357666016e-05, 5.258619785308838e-05, 6.076693534851074e-05, 6.89476728439331e-05, 7.712841033935547e-05, 8.530914783477783e-05, 9.34898853302002e-05, 0.00010167062282562256, 0.00010985136032104492, 0.00011803209781646729, 0.00012621283531188965, 0.000134393572807312, 0.00014257431030273438, 0.00015075504779815674, 0.0001589357852935791, 0.00016711652278900146, 0.00017529726028442383, 0.0001834779977798462, 0.00019165873527526855, 0.00019983947277069092, 0.00020802021026611328, 0.00021620094776153564, 0.000224381685256958, 0.00023256242275238037, 0.00024074316024780273, 0.0002489238977432251, 0.00025710463523864746, 0.0002652853727340698, 0.0002734661102294922]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 9.0, 9.0, 23.0, 13.0, 17.0, 17.0, 30.0, 20.0, 26.0, 39.0, 39.0, 30.0, 32.0, 45.0, 39.0, 47.0, 54.0, 45.0, 46.0, 34.0, 46.0, 41.0, 30.0, 36.0, 27.0, 28.0, 26.0, 25.0, 19.0, 14.0, 17.0, 12.0, 10.0, 13.0, 7.0, 6.0, 6.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-7.444620132446289e-05, -7.22147524356842e-05, -6.998330354690552e-05, -6.775185465812683e-05, -6.552040576934814e-05, -6.328895688056946e-05, -6.105750799179077e-05, -5.8826059103012085e-05, -5.65946102142334e-05, -5.436316132545471e-05, -5.2131712436676025e-05, -4.990026354789734e-05, -4.766881465911865e-05, -4.5437365770339966e-05, -4.320591688156128e-05, -4.097446799278259e-05, -3.8743019104003906e-05, -3.651157021522522e-05, -3.428012132644653e-05, -3.204867243766785e-05, -2.981722354888916e-05, -2.7585774660110474e-05, -2.5354325771331787e-05, -2.31228768825531e-05, -2.0891427993774414e-05, -1.8659979104995728e-05, -1.642853021621704e-05, -1.4197081327438354e-05, -1.1965632438659668e-05, -9.734183549880981e-06, -7.502734661102295e-06, -5.271285772323608e-06, -3.039836883544922e-06, -8.083879947662354e-07, 1.4230608940124512e-06, 3.6545097827911377e-06, 5.885958671569824e-06, 8.11740756034851e-06, 1.0348856449127197e-05, 1.2580305337905884e-05, 1.481175422668457e-05, 1.7043203115463257e-05, 1.9274652004241943e-05, 2.150610089302063e-05, 2.3737549781799316e-05, 2.5968998670578003e-05, 2.820044755935669e-05, 3.0431896448135376e-05, 3.266334533691406e-05, 3.489479422569275e-05, 3.7126243114471436e-05, 3.935769200325012e-05, 4.158914089202881e-05, 4.3820589780807495e-05, 4.605203866958618e-05, 4.828348755836487e-05, 5.0514936447143555e-05, 5.274638533592224e-05, 5.497783422470093e-05, 5.7209283113479614e-05, 5.94407320022583e-05, 6.167218089103699e-05, 6.390362977981567e-05, 6.613507866859436e-05, 6.836652755737305e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 8.0, 10.0, 11.0, 19.0, 30.0, 49.0, 78.0, 98.0, 151.0, 228.0, 373.0, 596.0, 951.0, 1766.0, 3035.0, 6298.0, 14037.0, 38018.0, 152360.0, 612086.0, 152989.0, 38051.0, 13821.0, 6089.0, 3083.0, 1614.0, 1040.0, 674.0, 331.0, 207.0, 150.0, 83.0, 74.0, 34.0, 26.0, 27.0, 12.0, 17.0, 7.0, 8.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.0371208190917969e-05, -1.007039099931717e-05, -9.76957380771637e-06, -9.46875661611557e-06, -9.16793942451477e-06, -8.867122232913971e-06, -8.566305041313171e-06, -8.265487849712372e-06, -7.964670658111572e-06, -7.663853466510773e-06, -7.363036274909973e-06, -7.062219083309174e-06, -6.761401891708374e-06, -6.4605847001075745e-06, -6.159767508506775e-06, -5.858950316905975e-06, -5.558133125305176e-06, -5.257315933704376e-06, -4.956498742103577e-06, -4.655681550502777e-06, -4.3548643589019775e-06, -4.054047167301178e-06, -3.7532299757003784e-06, -3.452412784099579e-06, -3.1515955924987793e-06, -2.8507784008979797e-06, -2.54996120929718e-06, -2.2491440176963806e-06, -1.948326826095581e-06, -1.6475096344947815e-06, -1.346692442893982e-06, -1.0458752512931824e-06, -7.450580596923828e-07, -4.4424086809158325e-07, -1.434236764907837e-07, 1.5739351511001587e-07, 4.5821070671081543e-07, 7.59027898311615e-07, 1.0598450899124146e-06, 1.3606622815132141e-06, 1.6614794731140137e-06, 1.9622966647148132e-06, 2.263113856315613e-06, 2.5639310479164124e-06, 2.864748239517212e-06, 3.1655654311180115e-06, 3.466382622718811e-06, 3.7671998143196106e-06, 4.06801700592041e-06, 4.36883419752121e-06, 4.669651389122009e-06, 4.970468580722809e-06, 5.271285772323608e-06, 5.572102963924408e-06, 5.8729201555252075e-06, 6.173737347126007e-06, 6.474554538726807e-06, 6.775371730327606e-06, 7.076188921928406e-06, 7.377006113529205e-06, 7.677823305130005e-06, 7.978640496730804e-06, 8.279457688331604e-06, 8.580274879932404e-06, 8.881092071533203e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 5.0, 8.0, 10.0, 4.0, 8.0, 9.0, 17.0, 16.0, 13.0, 70.0, 51.0, 71.0, 81.0, 105.0, 98.0, 112.0, 78.0, 56.0, 48.0, 37.0, 25.0, 18.0, 21.0, 9.0, 9.0, 11.0, 5.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.384185791015625e-06, -2.3208558559417725e-06, -2.25752592086792e-06, -2.1941959857940674e-06, -2.130866050720215e-06, -2.0675361156463623e-06, -2.0042061805725098e-06, -1.9408762454986572e-06, -1.8775463104248047e-06, -1.8142163753509521e-06, -1.7508864402770996e-06, -1.687556505203247e-06, -1.6242265701293945e-06, -1.560896635055542e-06, -1.4975666999816895e-06, -1.434236764907837e-06, -1.3709068298339844e-06, -1.3075768947601318e-06, -1.2442469596862793e-06, -1.1809170246124268e-06, -1.1175870895385742e-06, -1.0542571544647217e-06, -9.909272193908691e-07, -9.275972843170166e-07, -8.642673492431641e-07, -8.009374141693115e-07, -7.37607479095459e-07, -6.742775440216064e-07, -6.109476089477539e-07, -5.476176738739014e-07, -4.842877388000488e-07, -4.209578037261963e-07, -3.5762786865234375e-07, -2.942979335784912e-07, -2.3096799850463867e-07, -1.6763806343078613e-07, -1.043081283569336e-07, -4.0978193283081055e-08, 2.2351741790771484e-08, 8.568167686462402e-08, 1.4901161193847656e-07, 2.123415470123291e-07, 2.7567148208618164e-07, 3.390014171600342e-07, 4.023313522338867e-07, 4.6566128730773926e-07, 5.289912223815918e-07, 5.923211574554443e-07, 6.556510925292969e-07, 7.189810276031494e-07, 7.82310962677002e-07, 8.456408977508545e-07, 9.08970832824707e-07, 9.723007678985596e-07, 1.0356307029724121e-06, 1.0989606380462646e-06, 1.1622905731201172e-06, 1.2256205081939697e-06, 1.2889504432678223e-06, 1.3522803783416748e-06, 1.4156103134155273e-06, 1.4789402484893799e-06, 1.5422701835632324e-06, 1.605600118637085e-06, 1.6689300537109375e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 3.0, 14.0, 22.0, 39.0, 44.0, 76.0, 111.0, 151.0, 273.0, 377.0, 786.0, 1119.0, 2604.0, 5013.0, 16362.0, 47251.0, 357504.0, 523002.0, 61140.0, 20254.0, 5958.0, 3136.0, 1252.0, 802.0, 435.0, 314.0, 159.0, 132.0, 77.0, 50.0, 37.0, 16.0, 20.0, 5.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0609626770019531e-05, -1.0279007256031036e-05, -9.948387742042542e-06, -9.617768228054047e-06, -9.287148714065552e-06, -8.956529200077057e-06, -8.625909686088562e-06, -8.295290172100067e-06, -7.964670658111572e-06, -7.634051144123077e-06, -7.3034316301345825e-06, -6.972812116146088e-06, -6.642192602157593e-06, -6.311573088169098e-06, -5.980953574180603e-06, -5.650334060192108e-06, -5.319714546203613e-06, -4.989095032215118e-06, -4.6584755182266235e-06, -4.327856004238129e-06, -3.997236490249634e-06, -3.666616976261139e-06, -3.335997462272644e-06, -3.005377948284149e-06, -2.6747584342956543e-06, -2.3441389203071594e-06, -2.0135194063186646e-06, -1.6828998923301697e-06, -1.3522803783416748e-06, -1.02166086435318e-06, -6.910413503646851e-07, -3.604218363761902e-07, -2.9802322387695312e-08, 3.0081719160079956e-07, 6.314367055892944e-07, 9.620562195777893e-07, 1.2926757335662842e-06, 1.623295247554779e-06, 1.953914761543274e-06, 2.284534275531769e-06, 2.6151537895202637e-06, 2.9457733035087585e-06, 3.2763928174972534e-06, 3.6070123314857483e-06, 3.937631845474243e-06, 4.268251359462738e-06, 4.598870873451233e-06, 4.929490387439728e-06, 5.260109901428223e-06, 5.5907294154167175e-06, 5.921348929405212e-06, 6.251968443393707e-06, 6.582587957382202e-06, 6.913207471370697e-06, 7.243826985359192e-06, 7.574446499347687e-06, 7.905066013336182e-06, 8.235685527324677e-06, 8.566305041313171e-06, 8.896924555301666e-06, 9.227544069290161e-06, 9.558163583278656e-06, 9.888783097267151e-06, 1.0219402611255646e-05, 1.055002212524414e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 4.0, 2.0, 5.0, 3.0, 11.0, 6.0, 31.0, 14.0, 67.0, 21.0, 99.0, 68.0, 62.0, 130.0, 79.0, 119.0, 63.0, 78.0, 29.0, 43.0, 13.0, 23.0, 11.0, 6.0, 3.0, 8.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86102294921875e-06, -2.773478627204895e-06, -2.68593430519104e-06, -2.598389983177185e-06, -2.51084566116333e-06, -2.423301339149475e-06, -2.33575701713562e-06, -2.248212695121765e-06, -2.16066837310791e-06, -2.073124051094055e-06, -1.9855797290802e-06, -1.8980354070663452e-06, -1.8104910850524902e-06, -1.7229467630386353e-06, -1.6354024410247803e-06, -1.5478581190109253e-06, -1.4603137969970703e-06, -1.3727694749832153e-06, -1.2852251529693604e-06, -1.1976808309555054e-06, -1.1101365089416504e-06, -1.0225921869277954e-06, -9.350478649139404e-07, -8.475035429000854e-07, -7.599592208862305e-07, -6.724148988723755e-07, -5.848705768585205e-07, -4.973262548446655e-07, -4.0978193283081055e-07, -3.2223761081695557e-07, -2.3469328880310059e-07, -1.471489667892456e-07, -5.960464477539063e-08, 2.7939677238464355e-08, 1.1548399925231934e-07, 2.0302832126617432e-07, 2.905726432800293e-07, 3.781169652938843e-07, 4.6566128730773926e-07, 5.532056093215942e-07, 6.407499313354492e-07, 7.282942533493042e-07, 8.158385753631592e-07, 9.033828973770142e-07, 9.909272193908691e-07, 1.0784715414047241e-06, 1.166015863418579e-06, 1.253560185432434e-06, 1.341104507446289e-06, 1.428648829460144e-06, 1.516193151473999e-06, 1.603737473487854e-06, 1.691281795501709e-06, 1.778826117515564e-06, 1.866370439529419e-06, 1.953914761543274e-06, 2.041459083557129e-06, 2.129003405570984e-06, 2.216547727584839e-06, 2.304092049598694e-06, 2.391636371612549e-06, 2.479180693626404e-06, 2.566725015640259e-06, 2.6542693376541138e-06, 2.7418136596679688e-06]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 11.0, 9.0, 11.0, 16.0, 20.0, 39.0, 74.0, 120.0, 185.0, 169.0, 129.0, 86.0, 28.0, 34.0, 20.0, 22.0, 8.0, 8.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020575930830091238, -0.00019892820273526013, -0.00019209708261769265, -0.0001852659770520404, -0.00017843485693447292, -0.00017160375136882067, -0.00016477264580316842, -0.00015794152568560094, -0.00015111040556803346, -0.0001442793000023812, -0.00013744817988481373, -0.00013061707431916147, -0.000123785954201594, -0.00011695484863594174, -0.00011012373579433188, -0.00010329262295272201, -9.646151738706976e-05, -8.96304045454599e-05, -8.279929170385003e-05, -7.596818613819778e-05, -6.91370660206303e-05, -6.230596045497805e-05, -5.547484761336818e-05, -4.864373477175832e-05, -4.181262193014845e-05, -3.498150908853859e-05, -2.8150398065918125e-05, -2.1319287043297663e-05, -1.4488174201687798e-05, -7.657061360077932e-06, -8.259521564468741e-07, 6.005160685162991e-06, 1.2836288078688085e-05, 1.966740092029795e-05, 2.6498511942918412e-05, 3.3329622965538874e-05, 4.016073580714874e-05, 4.6991848648758605e-05, 5.3822957852389663e-05, 6.065407069399953e-05, 6.74851835356094e-05, 7.431629637721926e-05, 8.114740921882913e-05, 8.797852206043899e-05, 9.480962762609124e-05, 0.00010164074774365872, 0.00010847185330931097, 0.00011530296615092084, 0.0001221340789925307, 0.00012896518455818295, 0.00013579630467575043, 0.00014262741024140269, 0.00014945853035897017, 0.00015628963592462242, 0.00016312074149027467, 0.00016995186160784215, 0.00017678298172540963, 0.00018361408729106188, 0.00019044520740862936, 0.0001972763129742816, 0.0002041074330918491, 0.00021093853865750134, 0.0002177696442231536, 0.00022460076434072107, 0.00023143186990637332]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 10.0, 9.0, 8.0, 19.0, 14.0, 10.0, 27.0, 31.0, 36.0, 34.0, 40.0, 35.0, 45.0, 47.0, 52.0, 57.0, 61.0, 47.0, 57.0, 49.0, 57.0, 27.0, 30.0, 28.0, 29.0, 29.0, 24.0, 19.0, 18.0, 9.0, 7.0, 12.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00013880932237952948, -0.00013524501991923898, -0.0001316807174589485, -0.000128116414998658, -0.0001245521125383675, -0.00012098781007807702, -0.00011742351489374414, -0.00011385921243345365, -0.00011029490997316316, -0.00010673060751287267, -0.00010316630505258217, -9.960200259229168e-05, -9.60377074079588e-05, -9.247340494766831e-05, -8.890910248737782e-05, -8.534480002708733e-05, -8.178049756679684e-05, -7.821619510650635e-05, -7.465189264621586e-05, -7.108759018592536e-05, -6.752328772563487e-05, -6.395898526534438e-05, -6.0394690081011504e-05, -5.683038762072101e-05, -5.326608516043052e-05, -4.970178270014003e-05, -4.613748023984954e-05, -4.257318141753785e-05, -3.900887895724736e-05, -3.544457649695687e-05, -3.1880277674645185e-05, -2.8315975214354694e-05, -2.4751665478106588e-05, -2.1187363017816097e-05, -1.762306237651501e-05, -1.4058760825719219e-05, -1.0494459274923429e-05, -6.930156814632937e-06, -3.3658561733318493e-06, 1.9844446796923876e-07, 3.7627469282597303e-06, 7.32704847905552e-06, 1.089135002985131e-05, 1.44556515806471e-05, 1.801995313144289e-05, 2.158425559173338e-05, 2.514855623303447e-05, 2.8712856874335557e-05, 3.227715933462605e-05, 3.584146179491654e-05, 3.940576425520703e-05, 4.2970063077518716e-05, 4.653436553780921e-05, 5.00986679980997e-05, 5.3662966820411384e-05, 5.7227269280701876e-05, 6.079157174099237e-05, 6.435587420128286e-05, 6.792017666157335e-05, 7.148447912186384e-05, 7.504878158215433e-05, 7.861308404244483e-05, 8.21773792267777e-05, 8.57416816870682e-05, 8.930598414735869e-05]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 8.0, 8.0, 7.0, 6.0, 9.0, 17.0, 21.0, 29.0, 32.0, 63.0, 93.0, 129.0, 198.0, 308.0, 413.0, 756.0, 1172.0, 1913.0, 3373.0, 6315.0, 14059.0, 53751.0, 4045380.0, 41054.0, 12101.0, 5615.0, 2895.0, 1674.0, 1037.0, 647.0, 400.0, 277.0, 163.0, 121.0, 91.0, 45.0, 42.0, 24.0, 13.0, 12.0, 6.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0004799365997314453, -0.00046745315194129944, -0.00045496970415115356, -0.0004424862563610077, -0.0004300028085708618, -0.00041751936078071594, -0.00040503591299057007, -0.0003925524652004242, -0.0003800690174102783, -0.00036758556962013245, -0.00035510212182998657, -0.0003426186740398407, -0.0003301352262496948, -0.00031765177845954895, -0.0003051683306694031, -0.0002926848828792572, -0.00028020143508911133, -0.00026771798729896545, -0.0002552345395088196, -0.0002427510917186737, -0.00023026764392852783, -0.00021778419613838196, -0.00020530074834823608, -0.0001928173005580902, -0.00018033385276794434, -0.00016785040497779846, -0.0001553669571876526, -0.00014288350939750671, -0.00013040006160736084, -0.00011791661381721497, -0.00010543316602706909, -9.294971823692322e-05, -8.046627044677734e-05, -6.798282265663147e-05, -5.5499374866485596e-05, -4.301592707633972e-05, -3.053247928619385e-05, -1.8049031496047974e-05, -5.5655837059021e-06, 6.917864084243774e-06, 1.940131187438965e-05, 3.188475966453552e-05, 4.4368207454681396e-05, 5.685165524482727e-05, 6.933510303497314e-05, 8.181855082511902e-05, 9.430199861526489e-05, 0.00010678544640541077, 0.00011926889419555664, 0.00013175234198570251, 0.0001442357897758484, 0.00015671923756599426, 0.00016920268535614014, 0.000181686133146286, 0.00019416958093643188, 0.00020665302872657776, 0.00021913647651672363, 0.0002316199243068695, 0.00024410337209701538, 0.00025658681988716125, 0.00026907026767730713, 0.000281553715467453, 0.0002940371632575989, 0.00030652061104774475, 0.0003190040588378906]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 5.0, 10.0, 14.0, 15.0, 25.0, 24.0, 28.0, 37.0, 30.0, 33.0, 46.0, 61.0, 56.0, 52.0, 64.0, 50.0, 61.0, 53.0, 50.0, 44.0, 45.0, 31.0, 29.0, 22.0, 23.0, 16.0, 15.0, 12.0, 12.0, 6.0, 8.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.887052536010742e-05, -8.653290569782257e-05, -8.419528603553772e-05, -8.185766637325287e-05, -7.952004671096802e-05, -7.718242704868317e-05, -7.484480738639832e-05, -7.250718772411346e-05, -7.016956806182861e-05, -6.783194839954376e-05, -6.549432873725891e-05, -6.315670907497406e-05, -6.081908941268921e-05, -5.848146975040436e-05, -5.614385008811951e-05, -5.3806230425834656e-05, -5.1468610763549805e-05, -4.9130991101264954e-05, -4.67933714389801e-05, -4.445575177669525e-05, -4.21181321144104e-05, -3.978051245212555e-05, -3.74428927898407e-05, -3.510527312755585e-05, -3.2767653465270996e-05, -3.0430033802986145e-05, -2.8092414140701294e-05, -2.5754794478416443e-05, -2.3417174816131592e-05, -2.107955515384674e-05, -1.874193549156189e-05, -1.640431582927704e-05, -1.4066696166992188e-05, -1.1729076504707336e-05, -9.391456842422485e-06, -7.053837180137634e-06, -4.716217517852783e-06, -2.378597855567932e-06, -4.0978193283081055e-08, 2.29664146900177e-06, 4.634261131286621e-06, 6.971880793571472e-06, 9.309500455856323e-06, 1.1647120118141174e-05, 1.3984739780426025e-05, 1.6322359442710876e-05, 1.8659979104995728e-05, 2.099759876728058e-05, 2.333521842956543e-05, 2.567283809185028e-05, 2.8010457754135132e-05, 3.0348077416419983e-05, 3.2685697078704834e-05, 3.5023316740989685e-05, 3.7360936403274536e-05, 3.969855606555939e-05, 4.203617572784424e-05, 4.437379539012909e-05, 4.671141505241394e-05, 4.904903471469879e-05, 5.138665437698364e-05, 5.3724274039268494e-05, 5.6061893701553345e-05, 5.8399513363838196e-05, 6.073713302612305e-05]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 10.0, 12.0, 18.0, 18.0, 24.0, 53.0, 94.0, 151.0, 291.0, 574.0, 1182.0, 2733.0, 7930.0, 29188.0, 806589.0, 3299741.0, 31802.0, 8413.0, 2941.0, 1230.0, 550.0, 295.0, 152.0, 106.0, 69.0, 36.0, 23.0, 12.0, 15.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.000453948974609375, -0.000440988689661026, -0.000428028404712677, -0.000415068119764328, -0.000402107834815979, -0.00038914754986763, -0.000376187264919281, -0.000363226979970932, -0.000350266695022583, -0.000337306410074234, -0.000324346125125885, -0.000311385840177536, -0.000298425555229187, -0.000285465270280838, -0.000272504985332489, -0.00025954470038414, -0.000246584415435791, -0.00023362413048744202, -0.00022066384553909302, -0.00020770356059074402, -0.00019474327564239502, -0.00018178299069404602, -0.00016882270574569702, -0.00015586242079734802, -0.00014290213584899902, -0.00012994185090065002, -0.00011698156595230103, -0.00010402128100395203, -9.106099605560303e-05, -7.810071110725403e-05, -6.514042615890503e-05, -5.218014121055603e-05, -3.921985626220703e-05, -2.6259571313858032e-05, -1.3299286365509033e-05, -3.390014171600342e-07, 1.2621283531188965e-05, 2.5581568479537964e-05, 3.854185342788696e-05, 5.150213837623596e-05, 6.446242332458496e-05, 7.742270827293396e-05, 9.038299322128296e-05, 0.00010334327816963196, 0.00011630356311798096, 0.00012926384806632996, 0.00014222413301467896, 0.00015518441796302795, 0.00016814470291137695, 0.00018110498785972595, 0.00019406527280807495, 0.00020702555775642395, 0.00021998584270477295, 0.00023294612765312195, 0.00024590641260147095, 0.00025886669754981995, 0.00027182698249816895, 0.00028478726744651794, 0.00029774755239486694, 0.00031070783734321594, 0.00032366812229156494, 0.00033662840723991394, 0.00034958869218826294, 0.00036254897713661194, 0.00037550926208496094]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 1.0, 6.0, 5.0, 4.0, 12.0, 15.0, 17.0, 20.0, 22.0, 31.0, 44.0, 89.0, 308.0, 2784.0, 433.0, 117.0, 43.0, 26.0, 18.0, 16.0, 12.0, 6.0, 6.0, 7.0, 8.0, 4.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.258487701416016e-05, -6.07762485742569e-05, -5.896762013435364e-05, -5.715899169445038e-05, -5.535036325454712e-05, -5.354173481464386e-05, -5.17331063747406e-05, -4.992447793483734e-05, -4.811584949493408e-05, -4.630722105503082e-05, -4.4498592615127563e-05, -4.2689964175224304e-05, -4.0881335735321045e-05, -3.9072707295417786e-05, -3.7264078855514526e-05, -3.545545041561127e-05, -3.364682197570801e-05, -3.183819353580475e-05, -3.002956509590149e-05, -2.822093665599823e-05, -2.641230821609497e-05, -2.460367977619171e-05, -2.2795051336288452e-05, -2.0986422896385193e-05, -1.9177794456481934e-05, -1.7369166016578674e-05, -1.5560537576675415e-05, -1.3751909136772156e-05, -1.1943280696868896e-05, -1.0134652256965637e-05, -8.326023817062378e-06, -6.517395377159119e-06, -4.708766937255859e-06, -2.9001384973526e-06, -1.0915100574493408e-06, 7.171183824539185e-07, 2.5257468223571777e-06, 4.334375262260437e-06, 6.143003702163696e-06, 7.951632142066956e-06, 9.760260581970215e-06, 1.1568889021873474e-05, 1.3377517461776733e-05, 1.5186145901679993e-05, 1.6994774341583252e-05, 1.880340278148651e-05, 2.061203122138977e-05, 2.242065966129303e-05, 2.422928810119629e-05, 2.603791654109955e-05, 2.7846544981002808e-05, 2.9655173420906067e-05, 3.1463801860809326e-05, 3.3272430300712585e-05, 3.5081058740615845e-05, 3.6889687180519104e-05, 3.869831562042236e-05, 4.050694406032562e-05, 4.231557250022888e-05, 4.412420094013214e-05, 4.59328293800354e-05, 4.774145781993866e-05, 4.955008625984192e-05, 5.135871469974518e-05, 5.316734313964844e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 5.0, 9.0, 10.0, 12.0, 25.0, 30.0, 41.0, 61.0, 103.0, 134.0, 160.0, 125.0, 73.0, 50.0, 47.0, 29.0, 20.0, 8.0, 13.0, 11.0, 5.0, 8.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.00013855243742000312, -0.00013483522343449295, -0.00013111799489706755, -0.00012740078091155738, -0.00012368355237413198, -0.00011996633838862181, -0.00011624911712715402, -0.00011253189586568624, -0.00010881467460421845, -0.00010509745334275067, -0.00010138023208128288, -9.76630108198151e-05, -9.394579683430493e-05, -9.022856829687953e-05, -8.651135431136936e-05, -8.279413304990157e-05, -7.907691178843379e-05, -7.5359690526966e-05, -7.164246926549822e-05, -6.792524800403044e-05, -6.420802674256265e-05, -6.0490809119073674e-05, -5.6773591495584697e-05, -5.305637023411691e-05, -4.933914897264913e-05, -4.562192771118134e-05, -4.190470644971356e-05, -3.818748882622458e-05, -3.4470267564756796e-05, -3.075304630328901e-05, -2.703582686081063e-05, -2.331860741833225e-05, -1.960139343282208e-05, -1.5884172171354294e-05, -1.2166952728875913e-05, -8.44973237690283e-06, -4.732512024929747e-06, -1.0152907634619623e-06, 2.7019286790164188e-06, 6.4191481214948e-06, 1.0136369382962584e-05, 1.3853589734935667e-05, 1.757081008690875e-05, 2.128802952938713e-05, 2.5005250790854916e-05, 2.87224720523227e-05, 3.243968967581168e-05, 3.615691093727946e-05, 3.987413219874725e-05, 4.359135346021503e-05, 4.730857472168282e-05, 5.1025792345171794e-05, 5.474301360663958e-05, 5.8460234868107364e-05, 6.217745249159634e-05, 6.589467375306413e-05, 6.961189501453191e-05, 7.33291162759997e-05, 7.704633753746748e-05, 8.076355879893526e-05, 8.448078006040305e-05, 8.819799404591322e-05, 9.1915215307381e-05, 9.563243656884879e-05, 9.934965783031657e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 3.0, 9.0, 10.0, 7.0, 15.0, 13.0, 8.0, 19.0, 20.0, 25.0, 28.0, 35.0, 41.0, 31.0, 34.0, 28.0, 40.0, 50.0, 49.0, 50.0, 56.0, 37.0, 44.0, 39.0, 34.0, 38.0, 34.0, 28.0, 25.0, 19.0, 19.0, 16.0, 13.0, 12.0, 16.0, 18.0, 7.0, 6.0, 5.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0], "bins": [-7.5403084338177e-05, -7.339872536249459e-05, -7.139435911085457e-05, -6.939000013517216e-05, -6.738563388353214e-05, -6.538127490784973e-05, -6.337690865620971e-05, -6.13725496805273e-05, -5.9368187066866085e-05, -5.736382445320487e-05, -5.5359461839543656e-05, -5.335509922588244e-05, -5.135074025020003e-05, -4.934637399856001e-05, -4.7342015022877604e-05, -4.533765240921639e-05, -4.3333289795555174e-05, -4.132892718189396e-05, -3.9324564568232745e-05, -3.732020195457153e-05, -3.5315839340910316e-05, -3.331148036522791e-05, -3.130711775156669e-05, -2.930275513790548e-05, -2.7298392524244264e-05, -2.529402991058305e-05, -2.3289667296921834e-05, -2.1285306502250023e-05, -1.928094388858881e-05, -1.7276581274927594e-05, -1.5272220480255783e-05, -1.3267857866594568e-05, -1.1263495252933353e-05, -9.259132639272138e-06, -7.2547709351056255e-06, -5.250408776191762e-06, -3.246046617277898e-06, -1.2416840036166832e-06, 7.626777005498298e-07, 2.7670394047163427e-06, 4.771402018377557e-06, 6.775764177291421e-06, 8.780126336205285e-06, 1.0784488040371798e-05, 1.2788850654033013e-05, 1.4793213267694227e-05, 1.679757406236604e-05, 1.8801936676027253e-05, 2.0806299289688468e-05, 2.2810661903349683e-05, 2.4815024517010897e-05, 2.681938531168271e-05, 2.8823747925343923e-05, 3.0828108720015734e-05, 3.283247133367695e-05, 3.4836833947338164e-05, 3.684119656099938e-05, 3.884555917466059e-05, 4.084992178832181e-05, 4.285428440198302e-05, 4.485864337766543e-05, 4.686300962930545e-05, 4.886736860498786e-05, 5.0871731218649074e-05, 5.287609383231029e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 8.0, 5.0, 7.0, 20.0, 22.0, 25.0, 56.0, 70.0, 112.0, 171.0, 241.0, 387.0, 610.0, 945.0, 1430.0, 2380.0, 3782.0, 6405.0, 11533.0, 20931.0, 43125.0, 95824.0, 237109.0, 338854.0, 152212.0, 64544.0, 30500.0, 15311.0, 8732.0, 5030.0, 2903.0, 1905.0, 1161.0, 757.0, 487.0, 337.0, 223.0, 133.0, 87.0, 55.0, 43.0, 23.0, 25.0, 13.0, 9.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-8.767843246459961e-05, -8.519180119037628e-05, -8.270516991615295e-05, -8.021853864192963e-05, -7.77319073677063e-05, -7.524527609348297e-05, -7.275864481925964e-05, -7.027201354503632e-05, -6.778538227081299e-05, -6.529875099658966e-05, -6.281211972236633e-05, -6.0325488448143005e-05, -5.783885717391968e-05, -5.535222589969635e-05, -5.286559462547302e-05, -5.0378963351249695e-05, -4.789233207702637e-05, -4.540570080280304e-05, -4.291906952857971e-05, -4.0432438254356384e-05, -3.794580698013306e-05, -3.545917570590973e-05, -3.29725444316864e-05, -3.0485913157463074e-05, -2.7999281883239746e-05, -2.551265060901642e-05, -2.302601933479309e-05, -2.0539388060569763e-05, -1.8052756786346436e-05, -1.5566125512123108e-05, -1.307949423789978e-05, -1.0592862963676453e-05, -8.106231689453125e-06, -5.619600415229797e-06, -3.1329691410064697e-06, -6.463378667831421e-07, 1.8402934074401855e-06, 4.326924681663513e-06, 6.813555955886841e-06, 9.300187230110168e-06, 1.1786818504333496e-05, 1.4273449778556824e-05, 1.676008105278015e-05, 1.924671232700348e-05, 2.1733343601226807e-05, 2.4219974875450134e-05, 2.6706606149673462e-05, 2.919323742389679e-05, 3.167986869812012e-05, 3.4166499972343445e-05, 3.665313124656677e-05, 3.91397625207901e-05, 4.162639379501343e-05, 4.4113025069236755e-05, 4.659965634346008e-05, 4.908628761768341e-05, 5.157291889190674e-05, 5.4059550166130066e-05, 5.6546181440353394e-05, 5.903281271457672e-05, 6.151944398880005e-05, 6.400607526302338e-05, 6.64927065372467e-05, 6.897933781147003e-05, 7.146596908569336e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 10.0, 11.0, 9.0, 8.0, 12.0, 13.0, 16.0, 23.0, 30.0, 28.0, 34.0, 37.0, 40.0, 35.0, 46.0, 38.0, 47.0, 53.0, 42.0, 65.0, 56.0, 37.0, 42.0, 28.0, 42.0, 27.0, 23.0, 23.0, 24.0, 21.0, 13.0, 16.0, 13.0, 10.0, 9.0, 4.0, 6.0, 3.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.891654968261719e-05, -7.678661495447159e-05, -7.465668022632599e-05, -7.252674549818039e-05, -7.039681077003479e-05, -6.826687604188919e-05, -6.613694131374359e-05, -6.400700658559799e-05, -6.187707185745239e-05, -5.974713712930679e-05, -5.7617202401161194e-05, -5.5487267673015594e-05, -5.3357332944869995e-05, -5.1227398216724396e-05, -4.9097463488578796e-05, -4.69675287604332e-05, -4.48375940322876e-05, -4.2707659304142e-05, -4.05777245759964e-05, -3.84477898478508e-05, -3.63178551197052e-05, -3.41879203915596e-05, -3.2057985663414e-05, -2.9928050935268402e-05, -2.7798116207122803e-05, -2.5668181478977203e-05, -2.3538246750831604e-05, -2.1408312022686005e-05, -1.9278377294540405e-05, -1.7148442566394806e-05, -1.5018507838249207e-05, -1.2888573110103607e-05, -1.0758638381958008e-05, -8.628703653812408e-06, -6.498768925666809e-06, -4.36883419752121e-06, -2.2388994693756104e-06, -1.0896474123001099e-07, 2.0209699869155884e-06, 4.150904715061188e-06, 6.280839443206787e-06, 8.410774171352386e-06, 1.0540708899497986e-05, 1.2670643627643585e-05, 1.4800578355789185e-05, 1.6930513083934784e-05, 1.9060447812080383e-05, 2.1190382540225983e-05, 2.3320317268371582e-05, 2.545025199651718e-05, 2.758018672466278e-05, 2.971012145280838e-05, 3.184005618095398e-05, 3.396999090909958e-05, 3.609992563724518e-05, 3.822986036539078e-05, 4.035979509353638e-05, 4.2489729821681976e-05, 4.4619664549827576e-05, 4.6749599277973175e-05, 4.8879534006118774e-05, 5.1009468734264374e-05, 5.313940346240997e-05, 5.526933819055557e-05, 5.739927291870117e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 14.0, 21.0, 31.0, 20.0, 23.0, 40.0, 54.0, 98.0, 127.0, 207.0, 258.0, 358.0, 477.0, 690.0, 1120.0, 1584.0, 2490.0, 3960.0, 6590.0, 12181.0, 25082.0, 66141.0, 281959.0, 486886.0, 90785.0, 31804.0, 14839.0, 7723.0, 4479.0, 2766.0, 1830.0, 1223.0, 803.0, 515.0, 400.0, 289.0, 190.0, 106.0, 106.0, 101.0, 56.0, 33.0, 22.0, 14.0, 15.0, 12.0, 9.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.685754776000977e-05, -9.384378790855408e-05, -9.083002805709839e-05, -8.78162682056427e-05, -8.480250835418701e-05, -8.178874850273132e-05, -7.877498865127563e-05, -7.576122879981995e-05, -7.274746894836426e-05, -6.973370909690857e-05, -6.671994924545288e-05, -6.370618939399719e-05, -6.0692429542541504e-05, -5.7678669691085815e-05, -5.466490983963013e-05, -5.165114998817444e-05, -4.863739013671875e-05, -4.562363028526306e-05, -4.260987043380737e-05, -3.9596110582351685e-05, -3.6582350730895996e-05, -3.356859087944031e-05, -3.055483102798462e-05, -2.754107117652893e-05, -2.4527311325073242e-05, -2.1513551473617554e-05, -1.8499791622161865e-05, -1.5486031770706177e-05, -1.2472271919250488e-05, -9.4585120677948e-06, -6.444752216339111e-06, -3.430992364883423e-06, -4.172325134277344e-07, 2.596527338027954e-06, 5.610287189483643e-06, 8.624047040939331e-06, 1.163780689239502e-05, 1.4651566743850708e-05, 1.7665326595306396e-05, 2.0679086446762085e-05, 2.3692846298217773e-05, 2.6706606149673462e-05, 2.972036600112915e-05, 3.273412585258484e-05, 3.574788570404053e-05, 3.8761645555496216e-05, 4.1775405406951904e-05, 4.478916525840759e-05, 4.780292510986328e-05, 5.081668496131897e-05, 5.383044481277466e-05, 5.684420466423035e-05, 5.9857964515686035e-05, 6.287172436714172e-05, 6.588548421859741e-05, 6.88992440700531e-05, 7.191300392150879e-05, 7.492676377296448e-05, 7.794052362442017e-05, 8.095428347587585e-05, 8.396804332733154e-05, 8.698180317878723e-05, 8.999556303024292e-05, 9.300932288169861e-05, 9.60230827331543e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 7.0, 11.0, 8.0, 10.0, 9.0, 16.0, 12.0, 24.0, 18.0, 19.0, 18.0, 22.0, 26.0, 28.0, 33.0, 22.0, 35.0, 40.0, 49.0, 46.0, 48.0, 32.0, 36.0, 32.0, 33.0, 32.0, 36.0, 36.0, 35.0, 26.0, 19.0, 26.0, 25.0, 18.0, 11.0, 14.0, 12.0, 16.0, 12.0, 9.0, 11.0, 7.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-3.8564205169677734e-05, -3.7408433854579926e-05, -3.625266253948212e-05, -3.509689122438431e-05, -3.39411199092865e-05, -3.278534859418869e-05, -3.162957727909088e-05, -3.0473805963993073e-05, -2.9318034648895264e-05, -2.8162263333797455e-05, -2.7006492018699646e-05, -2.5850720703601837e-05, -2.469494938850403e-05, -2.353917807340622e-05, -2.238340675830841e-05, -2.1227635443210602e-05, -2.0071864128112793e-05, -1.8916092813014984e-05, -1.7760321497917175e-05, -1.6604550182819366e-05, -1.5448778867721558e-05, -1.4293007552623749e-05, -1.313723623752594e-05, -1.1981464922428131e-05, -1.0825693607330322e-05, -9.669922292232513e-06, -8.514150977134705e-06, -7.358379662036896e-06, -6.202608346939087e-06, -5.046837031841278e-06, -3.891065716743469e-06, -2.7352944016456604e-06, -1.5795230865478516e-06, -4.237517714500427e-07, 7.320195436477661e-07, 1.887790858745575e-06, 3.043562173843384e-06, 4.199333488941193e-06, 5.3551048040390015e-06, 6.51087611913681e-06, 7.666647434234619e-06, 8.822418749332428e-06, 9.978190064430237e-06, 1.1133961379528046e-05, 1.2289732694625854e-05, 1.3445504009723663e-05, 1.4601275324821472e-05, 1.575704663991928e-05, 1.691281795501709e-05, 1.80685892701149e-05, 1.9224360585212708e-05, 2.0380131900310516e-05, 2.1535903215408325e-05, 2.2691674530506134e-05, 2.3847445845603943e-05, 2.5003217160701752e-05, 2.615898847579956e-05, 2.731475979089737e-05, 2.8470531105995178e-05, 2.9626302421092987e-05, 3.0782073736190796e-05, 3.1937845051288605e-05, 3.3093616366386414e-05, 3.424938768148422e-05, 3.540515899658203e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 3.0, 4.0, 8.0, 19.0, 14.0, 16.0, 28.0, 41.0, 53.0, 66.0, 116.0, 168.0, 200.0, 315.0, 453.0, 746.0, 1296.0, 2237.0, 3921.0, 8212.0, 16658.0, 48980.0, 666017.0, 227181.0, 41281.0, 14150.0, 7445.0, 3737.0, 1825.0, 1199.0, 742.0, 446.0, 304.0, 191.0, 143.0, 103.0, 65.0, 55.0, 34.0, 25.0, 17.0, 10.0, 6.0, 11.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.473592758178711e-05, -2.3984350264072418e-05, -2.3232772946357727e-05, -2.2481195628643036e-05, -2.1729618310928345e-05, -2.0978040993213654e-05, -2.0226463675498962e-05, -1.947488635778427e-05, -1.872330904006958e-05, -1.797173172235489e-05, -1.7220154404640198e-05, -1.6468577086925507e-05, -1.5716999769210815e-05, -1.4965422451496124e-05, -1.4213845133781433e-05, -1.3462267816066742e-05, -1.271069049835205e-05, -1.195911318063736e-05, -1.1207535862922668e-05, -1.0455958545207977e-05, -9.704381227493286e-06, -8.952803909778595e-06, -8.201226592063904e-06, -7.449649274349213e-06, -6.6980719566345215e-06, -5.94649463891983e-06, -5.194917321205139e-06, -4.443340003490448e-06, -3.691762685775757e-06, -2.9401853680610657e-06, -2.1886080503463745e-06, -1.4370307326316833e-06, -6.854534149169922e-07, 6.612390279769897e-08, 8.177012205123901e-07, 1.5692785382270813e-06, 2.3208558559417725e-06, 3.0724331736564636e-06, 3.824010491371155e-06, 4.575587809085846e-06, 5.327165126800537e-06, 6.078742444515228e-06, 6.8303197622299194e-06, 7.581897079944611e-06, 8.333474397659302e-06, 9.085051715373993e-06, 9.836629033088684e-06, 1.0588206350803375e-05, 1.1339783668518066e-05, 1.2091360986232758e-05, 1.2842938303947449e-05, 1.359451562166214e-05, 1.4346092939376831e-05, 1.5097670257091522e-05, 1.5849247574806213e-05, 1.6600824892520905e-05, 1.7352402210235596e-05, 1.8103979527950287e-05, 1.8855556845664978e-05, 1.960713416337967e-05, 2.035871148109436e-05, 2.111028879880905e-05, 2.1861866116523743e-05, 2.2613443434238434e-05, 2.3365020751953125e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 1.0, 14.0, 2.0, 15.0, 13.0, 12.0, 39.0, 20.0, 24.0, 24.0, 48.0, 125.0, 86.0, 131.0, 96.0, 65.0, 61.0, 92.0, 25.0, 24.0, 16.0, 12.0, 20.0, 10.0, 5.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0265579223632812e-06, -1.955777406692505e-06, -1.8849968910217285e-06, -1.8142163753509521e-06, -1.7434358596801758e-06, -1.6726553440093994e-06, -1.601874828338623e-06, -1.5310943126678467e-06, -1.4603137969970703e-06, -1.389533281326294e-06, -1.3187527656555176e-06, -1.2479722499847412e-06, -1.1771917343139648e-06, -1.1064112186431885e-06, -1.0356307029724121e-06, -9.648501873016357e-07, -8.940696716308594e-07, -8.23289155960083e-07, -7.525086402893066e-07, -6.817281246185303e-07, -6.109476089477539e-07, -5.401670932769775e-07, -4.6938657760620117e-07, -3.986060619354248e-07, -3.2782554626464844e-07, -2.5704503059387207e-07, -1.862645149230957e-07, -1.1548399925231934e-07, -4.470348358154297e-08, 2.60770320892334e-08, 9.685754776000977e-08, 1.6763806343078613e-07, 2.384185791015625e-07, 3.0919909477233887e-07, 3.7997961044311523e-07, 4.507601261138916e-07, 5.21540641784668e-07, 5.923211574554443e-07, 6.631016731262207e-07, 7.338821887969971e-07, 8.046627044677734e-07, 8.754432201385498e-07, 9.462237358093262e-07, 1.0170042514801025e-06, 1.087784767150879e-06, 1.1585652828216553e-06, 1.2293457984924316e-06, 1.300126314163208e-06, 1.3709068298339844e-06, 1.4416873455047607e-06, 1.5124678611755371e-06, 1.5832483768463135e-06, 1.6540288925170898e-06, 1.7248094081878662e-06, 1.7955899238586426e-06, 1.866370439529419e-06, 1.9371509552001953e-06, 2.0079314708709717e-06, 2.078711986541748e-06, 2.1494925022125244e-06, 2.2202730178833008e-06, 2.291053533554077e-06, 2.3618340492248535e-06, 2.43261456489563e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 8.0, 7.0, 8.0, 13.0, 24.0, 38.0, 54.0, 87.0, 120.0, 211.0, 402.0, 877.0, 2000.0, 5144.0, 17782.0, 101157.0, 828290.0, 71257.0, 13259.0, 4452.0, 1652.0, 805.0, 381.0, 216.0, 116.0, 69.0, 42.0, 18.0, 19.0, 9.0, 10.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.756450653076172e-05, -4.605017602443695e-05, -4.453584551811218e-05, -4.3021515011787415e-05, -4.1507184505462646e-05, -3.999285399913788e-05, -3.847852349281311e-05, -3.696419298648834e-05, -3.5449862480163574e-05, -3.3935531973838806e-05, -3.242120146751404e-05, -3.090687096118927e-05, -2.9392540454864502e-05, -2.7878209948539734e-05, -2.6363879442214966e-05, -2.4849548935890198e-05, -2.333521842956543e-05, -2.182088792324066e-05, -2.0306557416915894e-05, -1.8792226910591125e-05, -1.7277896404266357e-05, -1.576356589794159e-05, -1.4249235391616821e-05, -1.2734904885292053e-05, -1.1220574378967285e-05, -9.706243872642517e-06, -8.191913366317749e-06, -6.677582859992981e-06, -5.163252353668213e-06, -3.648921847343445e-06, -2.1345913410186768e-06, -6.202608346939087e-07, 8.940696716308594e-07, 2.4084001779556274e-06, 3.9227306842803955e-06, 5.4370611906051636e-06, 6.951391696929932e-06, 8.4657222032547e-06, 9.980052709579468e-06, 1.1494383215904236e-05, 1.3008713722229004e-05, 1.4523044228553772e-05, 1.603737473487854e-05, 1.7551705241203308e-05, 1.9066035747528076e-05, 2.0580366253852844e-05, 2.2094696760177612e-05, 2.360902726650238e-05, 2.512335777282715e-05, 2.6637688279151917e-05, 2.8152018785476685e-05, 2.9666349291801453e-05, 3.118067979812622e-05, 3.269501030445099e-05, 3.420934081077576e-05, 3.5723671317100525e-05, 3.723800182342529e-05, 3.875233232975006e-05, 4.026666283607483e-05, 4.17809933423996e-05, 4.3295323848724365e-05, 4.480965435504913e-05, 4.63239848613739e-05, 4.783831536769867e-05, 4.935264587402344e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 6.0, 11.0, 2.0, 12.0, 20.0, 27.0, 19.0, 45.0, 65.0, 99.0, 121.0, 180.0, 85.0, 90.0, 54.0, 38.0, 20.0, 29.0, 11.0, 19.0, 8.0, 6.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.318092346191406e-06, -6.109476089477539e-06, -5.900859832763672e-06, -5.692243576049805e-06, -5.4836273193359375e-06, -5.27501106262207e-06, -5.066394805908203e-06, -4.857778549194336e-06, -4.649162292480469e-06, -4.4405460357666016e-06, -4.231929779052734e-06, -4.023313522338867e-06, -3.814697265625e-06, -3.606081008911133e-06, -3.3974647521972656e-06, -3.1888484954833984e-06, -2.9802322387695312e-06, -2.771615982055664e-06, -2.562999725341797e-06, -2.3543834686279297e-06, -2.1457672119140625e-06, -1.9371509552001953e-06, -1.7285346984863281e-06, -1.519918441772461e-06, -1.3113021850585938e-06, -1.1026859283447266e-06, -8.940696716308594e-07, -6.854534149169922e-07, -4.76837158203125e-07, -2.682209014892578e-07, -5.960464477539063e-08, 1.4901161193847656e-07, 3.5762786865234375e-07, 5.662441253662109e-07, 7.748603820800781e-07, 9.834766387939453e-07, 1.1920928955078125e-06, 1.4007091522216797e-06, 1.6093254089355469e-06, 1.817941665649414e-06, 2.0265579223632812e-06, 2.2351741790771484e-06, 2.4437904357910156e-06, 2.652406692504883e-06, 2.86102294921875e-06, 3.069639205932617e-06, 3.2782554626464844e-06, 3.4868717193603516e-06, 3.6954879760742188e-06, 3.904104232788086e-06, 4.112720489501953e-06, 4.32133674621582e-06, 4.5299530029296875e-06, 4.738569259643555e-06, 4.947185516357422e-06, 5.155801773071289e-06, 5.364418029785156e-06, 5.5730342864990234e-06, 5.781650543212891e-06, 5.990266799926758e-06, 6.198883056640625e-06, 6.407499313354492e-06, 6.616115570068359e-06, 6.8247318267822266e-06, 7.033348083496094e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 14.0, 16.0, 15.0, 38.0, 47.0, 57.0, 119.0, 164.0, 167.0, 86.0, 63.0, 49.0, 39.0, 21.0, 27.0, 12.0, 9.0, 13.0, 8.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013186248543206602, -0.00012819450057577342, -0.00012452650116756558, -0.00012085851631127298, -0.00011719053145498037, -0.00011352253932273015, -0.00010985454719047993, -0.00010618656233418733, -0.00010251857020193711, -9.885057806968689e-05, -9.518259321339428e-05, -9.151460108114406e-05, -8.784660894889385e-05, -8.417862409260124e-05, -8.051063196035102e-05, -7.68426398281008e-05, -7.31746549718082e-05, -6.950666283955798e-05, -6.583867798326537e-05, -6.217068585101515e-05, -5.850269735674374e-05, -5.4834708862472326e-05, -5.1166716730222106e-05, -4.7498728235950693e-05, -4.383073974167928e-05, -4.016275124740787e-05, -3.6494762753136456e-05, -3.2826770620886236e-05, -2.9158782126614824e-05, -2.549079363234341e-05, -2.1822803319082595e-05, -1.815481300582178e-05, -1.4486817235592753e-05, -1.0818827831826638e-05, -7.150838428060524e-06, -3.48284902429441e-06, 1.8514037947170436e-07, 3.853128873743117e-06, 7.521119187003933e-06, 1.1189109500264749e-05, 1.4857097994536161e-05, 1.8525086488807574e-05, 2.219307680206839e-05, 2.5861067115329206e-05, 2.952905560960062e-05, 3.319704410387203e-05, 3.686503623612225e-05, 4.053302473039366e-05, 4.4201013224665076e-05, 4.786900171893649e-05, 5.15369902132079e-05, 5.520498234545812e-05, 5.887297083972953e-05, 6.254095933400095e-05, 6.620895146625116e-05, 6.987694359850138e-05, 7.354492845479399e-05, 7.721292058704421e-05, 8.088090544333681e-05, 8.454889757558703e-05, 8.821688243187964e-05, 9.188487456412986e-05, 9.555286669638008e-05, 9.922085155267268e-05, 0.0001028888436849229]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 5.0, 6.0, 14.0, 6.0, 17.0, 11.0, 13.0, 27.0, 22.0, 16.0, 33.0, 37.0, 44.0, 31.0, 35.0, 30.0, 44.0, 51.0, 44.0, 57.0, 42.0, 50.0, 35.0, 36.0, 28.0, 47.0, 31.0, 22.0, 25.0, 17.0, 18.0, 17.0, 12.0, 15.0, 15.0, 9.0, 9.0, 6.0, 4.0, 4.0, 7.0, 3.0, 4.0, 3.0, 1.0], "bins": [-7.107014243956655e-05, -6.920228042872623e-05, -6.733442569384351e-05, -6.546656368300319e-05, -6.359870167216286e-05, -6.173083966132253e-05, -5.986298492643982e-05, -5.7995122915599495e-05, -5.6127264542737976e-05, -5.4259406169876456e-05, -5.239154415903613e-05, -5.052368578617461e-05, -4.865582741331309e-05, -4.6787965402472764e-05, -4.4920107029611245e-05, -4.3052248656749725e-05, -4.11843866459094e-05, -3.931652827304788e-05, -3.744866626220755e-05, -3.558080788934603e-05, -3.371294587850571e-05, -3.184508750564419e-05, -2.9977229132782668e-05, -2.8109368940931745e-05, -2.6241508749080822e-05, -2.43736485572299e-05, -2.2505788365378976e-05, -2.0637929992517456e-05, -1.8770069800666533e-05, -1.690220960881561e-05, -1.503435032645939e-05, -1.3166491044103168e-05, -1.1298634490231052e-05, -9.430774298380129e-06, -7.562915016023908e-06, -5.695055278920336e-06, -3.827195541816764e-06, -1.9593353499658406e-06, -9.147606760961935e-08, 1.7763832147466019e-06, 3.644243406597525e-06, 5.512103143701097e-06, 7.379962880804669e-06, 9.24782216316089e-06, 1.1115682355011813e-05, 1.2983542546862736e-05, 1.4851401829218958e-05, 1.671926111157518e-05, 1.8587121303426102e-05, 2.0454981495277025e-05, 2.2322841687127948e-05, 2.4190700059989467e-05, 2.605856025184039e-05, 2.7926420443691313e-05, 2.9794278816552833e-05, 3.166213718941435e-05, 3.352999920025468e-05, 3.53978575731162e-05, 3.7265719583956525e-05, 3.9133577956818044e-05, 4.100143996765837e-05, 4.286929834051989e-05, 4.473715671338141e-05, 4.6605018724221736e-05, 4.8472877097083256e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 11.0, 6.0, 12.0, 15.0, 28.0, 48.0, 72.0, 89.0, 124.0, 239.0, 344.0, 566.0, 1046.0, 1721.0, 3217.0, 5755.0, 11500.0, 23685.0, 54202.0, 144370.0, 425031.0, 233276.0, 78310.0, 32452.0, 15382.0, 7594.0, 4091.0, 2197.0, 1227.0, 731.0, 445.0, 258.0, 155.0, 90.0, 66.0, 65.0, 42.0, 30.0, 17.0, 13.0, 7.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-0.0003108978271484375, -0.0003024265170097351, -0.0002939552068710327, -0.0002854838967323303, -0.00027701258659362793, -0.00026854127645492554, -0.00026006996631622314, -0.00025159865617752075, -0.00024312734603881836, -0.00023465603590011597, -0.00022618472576141357, -0.00021771341562271118, -0.0002092421054840088, -0.0002007707953453064, -0.000192299485206604, -0.0001838281750679016, -0.00017535686492919922, -0.00016688555479049683, -0.00015841424465179443, -0.00014994293451309204, -0.00014147162437438965, -0.00013300031423568726, -0.00012452900409698486, -0.00011605769395828247, -0.00010758638381958008, -9.911507368087769e-05, -9.064376354217529e-05, -8.21724534034729e-05, -7.370114326477051e-05, -6.522983312606812e-05, -5.675852298736572e-05, -4.828721284866333e-05, -3.981590270996094e-05, -3.1344592571258545e-05, -2.2873282432556152e-05, -1.440197229385376e-05, -5.930662155151367e-06, 2.5406479835510254e-06, 1.1011958122253418e-05, 1.948326826095581e-05, 2.7954578399658203e-05, 3.6425888538360596e-05, 4.489719867706299e-05, 5.336850881576538e-05, 6.183981895446777e-05, 7.031112909317017e-05, 7.878243923187256e-05, 8.725374937057495e-05, 9.572505950927734e-05, 0.00010419636964797974, 0.00011266767978668213, 0.00012113898992538452, 0.00012961030006408691, 0.0001380816102027893, 0.0001465529203414917, 0.0001550242304801941, 0.00016349554061889648, 0.00017196685075759888, 0.00018043816089630127, 0.00018890947103500366, 0.00019738078117370605, 0.00020585209131240845, 0.00021432340145111084, 0.00022279471158981323, 0.00023126602172851562]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 1.0, 4.0, 10.0, 16.0, 6.0, 14.0, 14.0, 13.0, 22.0, 17.0, 46.0, 33.0, 38.0, 35.0, 44.0, 51.0, 46.0, 50.0, 52.0, 46.0, 58.0, 38.0, 41.0, 46.0, 38.0, 37.0, 26.0, 21.0, 22.0, 26.0, 13.0, 10.0, 9.0, 15.0, 14.0, 12.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.869699478149414e-05, -4.73707914352417e-05, -4.604458808898926e-05, -4.4718384742736816e-05, -4.3392181396484375e-05, -4.2065978050231934e-05, -4.073977470397949e-05, -3.941357135772705e-05, -3.808736801147461e-05, -3.676116466522217e-05, -3.5434961318969727e-05, -3.4108757972717285e-05, -3.2782554626464844e-05, -3.14563512802124e-05, -3.013014793395996e-05, -2.880394458770752e-05, -2.7477741241455078e-05, -2.6151537895202637e-05, -2.4825334548950195e-05, -2.3499131202697754e-05, -2.2172927856445312e-05, -2.084672451019287e-05, -1.952052116394043e-05, -1.8194317817687988e-05, -1.6868114471435547e-05, -1.5541911125183105e-05, -1.4215707778930664e-05, -1.2889504432678223e-05, -1.1563301086425781e-05, -1.023709774017334e-05, -8.910894393920898e-06, -7.584691047668457e-06, -6.258487701416016e-06, -4.932284355163574e-06, -3.606081008911133e-06, -2.2798776626586914e-06, -9.5367431640625e-07, 3.725290298461914e-07, 1.6987323760986328e-06, 3.0249357223510742e-06, 4.351139068603516e-06, 5.677342414855957e-06, 7.0035457611083984e-06, 8.32974910736084e-06, 9.655952453613281e-06, 1.0982155799865723e-05, 1.2308359146118164e-05, 1.3634562492370605e-05, 1.4960765838623047e-05, 1.6286969184875488e-05, 1.761317253112793e-05, 1.893937587738037e-05, 2.0265579223632812e-05, 2.1591782569885254e-05, 2.2917985916137695e-05, 2.4244189262390137e-05, 2.5570392608642578e-05, 2.689659595489502e-05, 2.822279930114746e-05, 2.9549002647399902e-05, 3.0875205993652344e-05, 3.2201409339904785e-05, 3.3527612686157227e-05, 3.485381603240967e-05, 3.618001937866211e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 13.0, 8.0, 10.0, 25.0, 29.0, 47.0, 71.0, 96.0, 142.0, 225.0, 267.0, 424.0, 586.0, 945.0, 1349.0, 2029.0, 3004.0, 4385.0, 6858.0, 10806.0, 16433.0, 26386.0, 44707.0, 78183.0, 157950.0, 328795.0, 165984.0, 79207.0, 44662.0, 26867.0, 16567.0, 10694.0, 7028.0, 4473.0, 3081.0, 2050.0, 1290.0, 871.0, 616.0, 446.0, 276.0, 189.0, 170.0, 103.0, 63.0, 41.0, 26.0, 20.0, 15.0, 22.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-9.638071060180664e-05, -9.332224726676941e-05, -9.026378393173218e-05, -8.720532059669495e-05, -8.414685726165771e-05, -8.108839392662048e-05, -7.802993059158325e-05, -7.497146725654602e-05, -7.191300392150879e-05, -6.885454058647156e-05, -6.579607725143433e-05, -6.27376139163971e-05, -5.967915058135986e-05, -5.662068724632263e-05, -5.35622239112854e-05, -5.050376057624817e-05, -4.744529724121094e-05, -4.4386833906173706e-05, -4.1328370571136475e-05, -3.826990723609924e-05, -3.521144390106201e-05, -3.215298056602478e-05, -2.909451723098755e-05, -2.6036053895950317e-05, -2.2977590560913086e-05, -1.9919127225875854e-05, -1.6860663890838623e-05, -1.3802200555801392e-05, -1.074373722076416e-05, -7.685273885726929e-06, -4.626810550689697e-06, -1.5683472156524658e-06, 1.4901161193847656e-06, 4.548579454421997e-06, 7.6070427894592285e-06, 1.066550612449646e-05, 1.3723969459533691e-05, 1.6782432794570923e-05, 1.9840896129608154e-05, 2.2899359464645386e-05, 2.5957822799682617e-05, 2.901628613471985e-05, 3.207474946975708e-05, 3.513321280479431e-05, 3.819167613983154e-05, 4.1250139474868774e-05, 4.4308602809906006e-05, 4.736706614494324e-05, 5.042552947998047e-05, 5.34839928150177e-05, 5.654245615005493e-05, 5.960091948509216e-05, 6.26593828201294e-05, 6.571784615516663e-05, 6.877630949020386e-05, 7.183477282524109e-05, 7.489323616027832e-05, 7.795169949531555e-05, 8.101016283035278e-05, 8.406862616539001e-05, 8.712708950042725e-05, 9.018555283546448e-05, 9.324401617050171e-05, 9.630247950553894e-05, 9.936094284057617e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 7.0, 7.0, 9.0, 8.0, 17.0, 12.0, 10.0, 18.0, 12.0, 14.0, 21.0, 22.0, 22.0, 16.0, 40.0, 36.0, 32.0, 30.0, 41.0, 37.0, 38.0, 41.0, 54.0, 44.0, 33.0, 39.0, 43.0, 45.0, 28.0, 33.0, 27.0, 23.0, 22.0, 21.0, 18.0, 8.0, 13.0, 14.0, 14.0, 10.0, 8.0, 4.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0], "bins": [-3.1113624572753906e-05, -3.0141323804855347e-05, -2.9169023036956787e-05, -2.8196722269058228e-05, -2.7224421501159668e-05, -2.625212073326111e-05, -2.527981996536255e-05, -2.430751919746399e-05, -2.333521842956543e-05, -2.236291766166687e-05, -2.139061689376831e-05, -2.041831612586975e-05, -1.944601535797119e-05, -1.8473714590072632e-05, -1.7501413822174072e-05, -1.6529113054275513e-05, -1.5556812286376953e-05, -1.4584511518478394e-05, -1.3612210750579834e-05, -1.2639909982681274e-05, -1.1667609214782715e-05, -1.0695308446884155e-05, -9.723007678985596e-06, -8.750706911087036e-06, -7.778406143188477e-06, -6.806105375289917e-06, -5.833804607391357e-06, -4.861503839492798e-06, -3.889203071594238e-06, -2.9169023036956787e-06, -1.944601535797119e-06, -9.723007678985596e-07, 0.0, 9.723007678985596e-07, 1.944601535797119e-06, 2.9169023036956787e-06, 3.889203071594238e-06, 4.861503839492798e-06, 5.833804607391357e-06, 6.806105375289917e-06, 7.778406143188477e-06, 8.750706911087036e-06, 9.723007678985596e-06, 1.0695308446884155e-05, 1.1667609214782715e-05, 1.2639909982681274e-05, 1.3612210750579834e-05, 1.4584511518478394e-05, 1.5556812286376953e-05, 1.6529113054275513e-05, 1.7501413822174072e-05, 1.8473714590072632e-05, 1.944601535797119e-05, 2.041831612586975e-05, 2.139061689376831e-05, 2.236291766166687e-05, 2.333521842956543e-05, 2.430751919746399e-05, 2.527981996536255e-05, 2.625212073326111e-05, 2.7224421501159668e-05, 2.8196722269058228e-05, 2.9169023036956787e-05, 3.0141323804855347e-05, 3.1113624572753906e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 3.0, 9.0, 9.0, 22.0, 33.0, 18.0, 37.0, 55.0, 88.0, 119.0, 237.0, 389.0, 616.0, 1130.0, 2229.0, 4475.0, 10504.0, 29866.0, 132705.0, 683334.0, 132707.0, 29752.0, 10505.0, 4589.0, 2261.0, 1196.0, 635.0, 361.0, 237.0, 118.0, 95.0, 65.0, 32.0, 35.0, 26.0, 15.0, 10.0, 13.0, 3.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.887580871582031e-06, -4.708766937255859e-06, -4.5299530029296875e-06, -4.351139068603516e-06, -4.172325134277344e-06, -3.993511199951172e-06, -3.814697265625e-06, -3.635883331298828e-06, -3.4570693969726562e-06, -3.2782554626464844e-06, -3.0994415283203125e-06, -2.9206275939941406e-06, -2.7418136596679688e-06, -2.562999725341797e-06, -2.384185791015625e-06, -2.205371856689453e-06, -2.0265579223632812e-06, -1.8477439880371094e-06, -1.6689300537109375e-06, -1.4901161193847656e-06, -1.3113021850585938e-06, -1.1324882507324219e-06, -9.5367431640625e-07, -7.748603820800781e-07, -5.960464477539062e-07, -4.172325134277344e-07, -2.384185791015625e-07, -5.960464477539063e-08, 1.1920928955078125e-07, 2.980232238769531e-07, 4.76837158203125e-07, 6.556510925292969e-07, 8.344650268554688e-07, 1.0132789611816406e-06, 1.1920928955078125e-06, 1.3709068298339844e-06, 1.5497207641601562e-06, 1.7285346984863281e-06, 1.9073486328125e-06, 2.086162567138672e-06, 2.2649765014648438e-06, 2.4437904357910156e-06, 2.6226043701171875e-06, 2.8014183044433594e-06, 2.9802322387695312e-06, 3.159046173095703e-06, 3.337860107421875e-06, 3.516674041748047e-06, 3.6954879760742188e-06, 3.874301910400391e-06, 4.0531158447265625e-06, 4.231929779052734e-06, 4.410743713378906e-06, 4.589557647705078e-06, 4.76837158203125e-06, 4.947185516357422e-06, 5.125999450683594e-06, 5.304813385009766e-06, 5.4836273193359375e-06, 5.662441253662109e-06, 5.841255187988281e-06, 6.020069122314453e-06, 6.198883056640625e-06, 6.377696990966797e-06, 6.556510925292969e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 8.0, 0.0, 6.0, 0.0, 9.0, 0.0, 13.0, 0.0, 24.0, 0.0, 48.0, 0.0, 103.0, 0.0, 180.0, 0.0, 232.0, 0.0, 159.0, 0.0, 105.0, 0.0, 45.0, 0.0, 28.0, 0.0, 19.0, 0.0, 10.0, 17.0, 0.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.653128027915955e-07, -5.345791578292847e-07, -5.038455128669739e-07, -4.731118679046631e-07, -4.423782229423523e-07, -4.116445779800415e-07, -3.809109330177307e-07, -3.501772880554199e-07, -3.1944364309310913e-07, -2.8870999813079834e-07, -2.5797635316848755e-07, -2.2724270820617676e-07, -1.9650906324386597e-07, -1.6577541828155518e-07, -1.3504177331924438e-07, -1.043081283569336e-07, -7.35744833946228e-08, -4.284083843231201e-08, -1.210719347000122e-08, 1.862645149230957e-08, 4.936009645462036e-08, 8.009374141693115e-08, 1.1082738637924194e-07, 1.4156103134155273e-07, 1.7229467630386353e-07, 2.0302832126617432e-07, 2.337619662284851e-07, 2.644956111907959e-07, 2.952292561531067e-07, 3.259629011154175e-07, 3.5669654607772827e-07, 3.8743019104003906e-07, 4.1816383600234985e-07, 4.4889748096466064e-07, 4.796311259269714e-07, 5.103647708892822e-07, 5.41098415851593e-07, 5.718320608139038e-07, 6.025657057762146e-07, 6.332993507385254e-07, 6.640329957008362e-07, 6.94766640663147e-07, 7.255002856254578e-07, 7.562339305877686e-07, 7.869675755500793e-07, 8.177012205123901e-07, 8.484348654747009e-07, 8.791685104370117e-07, 9.099021553993225e-07, 9.406358003616333e-07, 9.71369445323944e-07, 1.0021030902862549e-06, 1.0328367352485657e-06, 1.0635703802108765e-06, 1.0943040251731873e-06, 1.125037670135498e-06, 1.1557713150978088e-06, 1.1865049600601196e-06, 1.2172386050224304e-06, 1.2479722499847412e-06, 1.278705894947052e-06, 1.3094395399093628e-06, 1.3401731848716736e-06, 1.3709068298339844e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 9.0, 9.0, 14.0, 27.0, 17.0, 35.0, 72.0, 63.0, 100.0, 141.0, 211.0, 243.0, 394.0, 579.0, 957.0, 1459.0, 2607.0, 4756.0, 9710.0, 22516.0, 59224.0, 228672.0, 541757.0, 109464.0, 35509.0, 14319.0, 6681.0, 3464.0, 1943.0, 1197.0, 748.0, 482.0, 338.0, 230.0, 167.0, 116.0, 83.0, 67.0, 34.0, 27.0, 33.0, 23.0, 12.0, 8.0, 8.0, 6.0, 4.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0], "bins": [-3.933906555175781e-06, -3.814697265625e-06, -3.6954879760742188e-06, -3.5762786865234375e-06, -3.4570693969726562e-06, -3.337860107421875e-06, -3.2186508178710938e-06, -3.0994415283203125e-06, -2.9802322387695312e-06, -2.86102294921875e-06, -2.7418136596679688e-06, -2.6226043701171875e-06, -2.5033950805664062e-06, -2.384185791015625e-06, -2.2649765014648438e-06, -2.1457672119140625e-06, -2.0265579223632812e-06, -1.9073486328125e-06, -1.7881393432617188e-06, -1.6689300537109375e-06, -1.5497207641601562e-06, -1.430511474609375e-06, -1.3113021850585938e-06, -1.1920928955078125e-06, -1.0728836059570312e-06, -9.5367431640625e-07, -8.344650268554688e-07, -7.152557373046875e-07, -5.960464477539062e-07, -4.76837158203125e-07, -3.5762786865234375e-07, -2.384185791015625e-07, -1.1920928955078125e-07, 0.0, 1.1920928955078125e-07, 2.384185791015625e-07, 3.5762786865234375e-07, 4.76837158203125e-07, 5.960464477539062e-07, 7.152557373046875e-07, 8.344650268554688e-07, 9.5367431640625e-07, 1.0728836059570312e-06, 1.1920928955078125e-06, 1.3113021850585938e-06, 1.430511474609375e-06, 1.5497207641601562e-06, 1.6689300537109375e-06, 1.7881393432617188e-06, 1.9073486328125e-06, 2.0265579223632812e-06, 2.1457672119140625e-06, 2.2649765014648438e-06, 2.384185791015625e-06, 2.5033950805664062e-06, 2.6226043701171875e-06, 2.7418136596679688e-06, 2.86102294921875e-06, 2.9802322387695312e-06, 3.0994415283203125e-06, 3.2186508178710938e-06, 3.337860107421875e-06, 3.4570693969726562e-06, 3.5762786865234375e-06, 3.6954879760742188e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 5.0, 0.0, 4.0, 16.0, 27.0, 0.0, 40.0, 59.0, 0.0, 101.0, 148.0, 179.0, 0.0, 139.0, 115.0, 62.0, 0.0, 40.0, 28.0, 0.0, 17.0, 7.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4472752809524536e-06, -1.4044344425201416e-06, -1.3615936040878296e-06, -1.3187527656555176e-06, -1.2759119272232056e-06, -1.2330710887908936e-06, -1.1902302503585815e-06, -1.1473894119262695e-06, -1.1045485734939575e-06, -1.0617077350616455e-06, -1.0188668966293335e-06, -9.760260581970215e-07, -9.331852197647095e-07, -8.903443813323975e-07, -8.475035429000854e-07, -8.046627044677734e-07, -7.618218660354614e-07, -7.189810276031494e-07, -6.761401891708374e-07, -6.332993507385254e-07, -5.904585123062134e-07, -5.476176738739014e-07, -5.047768354415894e-07, -4.6193599700927734e-07, -4.1909515857696533e-07, -3.762543201446533e-07, -3.334134817123413e-07, -2.905726432800293e-07, -2.477318048477173e-07, -2.0489096641540527e-07, -1.6205012798309326e-07, -1.1920928955078125e-07, -7.636845111846924e-08, -3.3527612686157227e-08, 9.313225746154785e-09, 5.21540641784668e-08, 9.499490261077881e-08, 1.3783574104309082e-07, 1.8067657947540283e-07, 2.2351741790771484e-07, 2.6635825634002686e-07, 3.0919909477233887e-07, 3.520399332046509e-07, 3.948807716369629e-07, 4.377216100692749e-07, 4.805624485015869e-07, 5.234032869338989e-07, 5.662441253662109e-07, 6.09084963798523e-07, 6.51925802230835e-07, 6.94766640663147e-07, 7.37607479095459e-07, 7.80448317527771e-07, 8.23289155960083e-07, 8.66129994392395e-07, 9.08970832824707e-07, 9.51811671257019e-07, 9.94652509689331e-07, 1.037493348121643e-06, 1.080334186553955e-06, 1.123175024986267e-06, 1.166015863418579e-06, 1.2088567018508911e-06, 1.2516975402832031e-06]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 4.0, 3.0, 7.0, 12.0, 7.0, 8.0, 10.0, 20.0, 22.0, 21.0, 33.0, 44.0, 49.0, 94.0, 124.0, 135.0, 89.0, 58.0, 46.0, 45.0, 30.0, 23.0, 26.0, 12.0, 10.0, 13.0, 7.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0], "bins": [-6.13670126767829e-05, -5.974776649964042e-05, -5.8128520322497934e-05, -5.650927414535545e-05, -5.489002796821296e-05, -5.3270781791070476e-05, -5.165153561392799e-05, -5.003229307476431e-05, -4.841304325964302e-05, -4.679379708250053e-05, -4.5174550905358046e-05, -4.355530472821556e-05, -4.1936058551073074e-05, -4.031681237393059e-05, -3.86975661967881e-05, -3.7078323657624424e-05, -3.545907748048194e-05, -3.383983130333945e-05, -3.2220585126196966e-05, -3.060133894905448e-05, -2.8982092771911994e-05, -2.7362846594769508e-05, -2.5743602236616425e-05, -2.412435605947394e-05, -2.2505109882331453e-05, -2.0885863705188967e-05, -1.926661752804648e-05, -1.76473731698934e-05, -1.6028126992750913e-05, -1.4408879906113725e-05, -1.2789634638465941e-05, -1.1170388461323455e-05, -9.551142284180969e-06, -7.931896107038483e-06, -6.312650384643348e-06, -4.693404662248213e-06, -3.074158485105727e-06, -1.4549123079632409e-06, 1.643329596845433e-07, 1.7835791368270293e-06, 3.4028253139695153e-06, 5.022071491112001e-06, 6.641317213507136e-06, 8.260562935902271e-06, 9.879809113044757e-06, 1.1499055290187243e-05, 1.3118300557835028e-05, 1.4737546734977514e-05, 1.635679291212e-05, 1.7976039089262486e-05, 1.959528526640497e-05, 2.1214531443547457e-05, 2.2833777620689943e-05, 2.445302379783243e-05, 2.6072268155985512e-05, 2.7691514333127998e-05, 2.9310760510270484e-05, 3.0930004868423566e-05, 3.254925104556605e-05, 3.416849722270854e-05, 3.5787743399851024e-05, 3.740698957699351e-05, 3.9026235754135996e-05, 4.064548193127848e-05, 4.226472810842097e-05]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 9.0, 10.0, 17.0, 11.0, 17.0, 22.0, 25.0, 31.0, 29.0, 40.0, 36.0, 38.0, 32.0, 61.0, 57.0, 48.0, 48.0, 59.0, 43.0, 31.0, 42.0, 39.0, 47.0, 28.0, 30.0, 30.0, 24.0, 13.0, 20.0, 15.0, 3.0, 10.0, 9.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.9290239985566586e-05, -4.793240805156529e-05, -4.65745797555428e-05, -4.52167478215415e-05, -4.3858919525519013e-05, -4.250108759151772e-05, -4.114325565751642e-05, -3.978542736149393e-05, -3.842759906547144e-05, -3.7069767131470144e-05, -3.5711938835447654e-05, -3.435410690144636e-05, -3.299627860542387e-05, -3.163844667142257e-05, -3.0280616556410678e-05, -2.8922786441398785e-05, -2.7564954507397488e-05, -2.6207124392385595e-05, -2.48492942773737e-05, -2.3491462343372405e-05, -2.2133634047349915e-05, -2.0775802113348618e-05, -1.9417971998336725e-05, -1.8060141883324832e-05, -1.670231176831294e-05, -1.5344481653301045e-05, -1.3986651538289152e-05, -1.2628820513782557e-05, -1.1270990398770664e-05, -9.91316028375877e-06, -8.555329259252176e-06, -7.1974991442402825e-06, -5.839672667207196e-06, -4.481842552195303e-06, -3.124011982436059e-06, -1.766181412676815e-06, -4.0835129766492173e-07, 9.494788173469715e-07, 2.3073098418535665e-06, 3.6651399568654597e-06, 5.022970071877353e-06, 6.380800186889246e-06, 7.73863030190114e-06, 9.096461326407734e-06, 1.0454291441419628e-05, 1.181212155643152e-05, 1.3169952580938116e-05, 1.4527782695950009e-05, 1.5885612810961902e-05, 1.7243442925973795e-05, 1.860127304098569e-05, 1.9959104974986985e-05, 2.1316933271009475e-05, 2.2674765205010772e-05, 2.4032595320022665e-05, 2.5390425435034558e-05, 2.674825555004645e-05, 2.8106085665058345e-05, 2.9463915780070238e-05, 3.082174589508213e-05, 3.217957782908343e-05, 3.353740612510592e-05, 3.4895238059107214e-05, 3.625306999310851e-05, 3.7610898289131e-05]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 9.0, 12.0, 9.0, 19.0, 24.0, 52.0, 47.0, 84.0, 113.0, 164.0, 234.0, 371.0, 513.0, 825.0, 1353.0, 2054.0, 3380.0, 5382.0, 8856.0, 15222.0, 26883.0, 48917.0, 94166.0, 212166.0, 3057523.0, 433336.0, 130662.0, 64628.0, 34696.0, 19620.0, 11867.0, 7240.0, 4644.0, 2885.0, 1941.0, 1352.0, 879.0, 659.0, 444.0, 312.0, 238.0, 147.0, 98.0, 92.0, 50.0, 33.0, 33.0, 21.0, 11.0, 8.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.8650970458984375e-05, -5.6743621826171875e-05, -5.4836273193359375e-05, -5.2928924560546875e-05, -5.1021575927734375e-05, -4.9114227294921875e-05, -4.7206878662109375e-05, -4.5299530029296875e-05, -4.3392181396484375e-05, -4.1484832763671875e-05, -3.9577484130859375e-05, -3.7670135498046875e-05, -3.5762786865234375e-05, -3.3855438232421875e-05, -3.1948089599609375e-05, -3.0040740966796875e-05, -2.8133392333984375e-05, -2.6226043701171875e-05, -2.4318695068359375e-05, -2.2411346435546875e-05, -2.0503997802734375e-05, -1.8596649169921875e-05, -1.6689300537109375e-05, -1.4781951904296875e-05, -1.2874603271484375e-05, -1.0967254638671875e-05, -9.059906005859375e-06, -7.152557373046875e-06, -5.245208740234375e-06, -3.337860107421875e-06, -1.430511474609375e-06, 4.76837158203125e-07, 2.384185791015625e-06, 4.291534423828125e-06, 6.198883056640625e-06, 8.106231689453125e-06, 1.0013580322265625e-05, 1.1920928955078125e-05, 1.3828277587890625e-05, 1.5735626220703125e-05, 1.7642974853515625e-05, 1.9550323486328125e-05, 2.1457672119140625e-05, 2.3365020751953125e-05, 2.5272369384765625e-05, 2.7179718017578125e-05, 2.9087066650390625e-05, 3.0994415283203125e-05, 3.2901763916015625e-05, 3.4809112548828125e-05, 3.6716461181640625e-05, 3.8623809814453125e-05, 4.0531158447265625e-05, 4.2438507080078125e-05, 4.4345855712890625e-05, 4.6253204345703125e-05, 4.8160552978515625e-05, 5.0067901611328125e-05, 5.1975250244140625e-05, 5.3882598876953125e-05, 5.5789947509765625e-05, 5.7697296142578125e-05, 5.9604644775390625e-05, 6.151199340820312e-05, 6.341934204101562e-05]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 8.0, 16.0, 8.0, 21.0, 13.0, 29.0, 22.0, 32.0, 24.0, 33.0, 24.0, 33.0, 41.0, 46.0, 40.0, 52.0, 29.0, 51.0, 53.0, 54.0, 43.0, 20.0, 33.0, 37.0, 26.0, 34.0, 29.0, 19.0, 30.0, 20.0, 14.0, 8.0, 7.0, 6.0, 7.0, 5.0, 7.0, 4.0, 1.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.125999450683594e-06, -4.957430064678192e-06, -4.7888606786727905e-06, -4.620291292667389e-06, -4.451721906661987e-06, -4.283152520656586e-06, -4.114583134651184e-06, -3.9460137486457825e-06, -3.777444362640381e-06, -3.6088749766349792e-06, -3.4403055906295776e-06, -3.271736204624176e-06, -3.1031668186187744e-06, -2.934597432613373e-06, -2.766028046607971e-06, -2.5974586606025696e-06, -2.428889274597168e-06, -2.2603198885917664e-06, -2.0917505025863647e-06, -1.923181116580963e-06, -1.7546117305755615e-06, -1.58604234457016e-06, -1.4174729585647583e-06, -1.2489035725593567e-06, -1.080334186553955e-06, -9.117648005485535e-07, -7.431954145431519e-07, -5.746260285377502e-07, -4.0605664253234863e-07, -2.3748725652694702e-07, -6.891787052154541e-08, 9.96515154838562e-08, 2.682209014892578e-07, 4.367902874946594e-07, 6.05359673500061e-07, 7.739290595054626e-07, 9.424984455108643e-07, 1.1110678315162659e-06, 1.2796372175216675e-06, 1.448206603527069e-06, 1.6167759895324707e-06, 1.7853453755378723e-06, 1.953914761543274e-06, 2.1224841475486755e-06, 2.291053533554077e-06, 2.4596229195594788e-06, 2.6281923055648804e-06, 2.796761691570282e-06, 2.9653310775756836e-06, 3.133900463581085e-06, 3.302469849586487e-06, 3.4710392355918884e-06, 3.63960862159729e-06, 3.8081780076026917e-06, 3.976747393608093e-06, 4.145316779613495e-06, 4.3138861656188965e-06, 4.482455551624298e-06, 4.6510249376297e-06, 4.819594323635101e-06, 4.988163709640503e-06, 5.1567330956459045e-06, 5.325302481651306e-06, 5.493871867656708e-06, 5.662441253662109e-06]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 0.0, 1.0, 8.0, 7.0, 14.0, 18.0, 19.0, 40.0, 40.0, 74.0, 111.0, 177.0, 332.0, 716.0, 1832.0, 5642.0, 20628.0, 97114.0, 1225766.0, 2691845.0, 116097.0, 23651.0, 6354.0, 2069.0, 774.0, 371.0, 207.0, 117.0, 78.0, 57.0, 42.0, 23.0, 18.0, 17.0, 7.0, 7.0, 3.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-9.262561798095703e-05, -9.025353938341141e-05, -8.788146078586578e-05, -8.550938218832016e-05, -8.313730359077454e-05, -8.076522499322891e-05, -7.839314639568329e-05, -7.602106779813766e-05, -7.364898920059204e-05, -7.127691060304642e-05, -6.89048320055008e-05, -6.653275340795517e-05, -6.416067481040955e-05, -6.178859621286392e-05, -5.94165176153183e-05, -5.7044439017772675e-05, -5.467236042022705e-05, -5.230028182268143e-05, -4.99282032251358e-05, -4.755612462759018e-05, -4.5184046030044556e-05, -4.281196743249893e-05, -4.043988883495331e-05, -3.8067810237407684e-05, -3.569573163986206e-05, -3.332365304231644e-05, -3.095157444477081e-05, -2.857949584722519e-05, -2.6207417249679565e-05, -2.383533865213394e-05, -2.1463260054588318e-05, -1.9091181457042694e-05, -1.671910285949707e-05, -1.4347024261951447e-05, -1.1974945664405823e-05, -9.602867066860199e-06, -7.230788469314575e-06, -4.858709871768951e-06, -2.4866312742233276e-06, -1.1455267667770386e-07, 2.25752592086792e-06, 4.629604518413544e-06, 7.0016831159591675e-06, 9.373761713504791e-06, 1.1745840311050415e-05, 1.4117918908596039e-05, 1.6489997506141663e-05, 1.8862076103687286e-05, 2.123415470123291e-05, 2.3606233298778534e-05, 2.5978311896324158e-05, 2.835039049386978e-05, 3.0722469091415405e-05, 3.309454768896103e-05, 3.546662628650665e-05, 3.7838704884052277e-05, 4.02107834815979e-05, 4.2582862079143524e-05, 4.495494067668915e-05, 4.732701927423477e-05, 4.9699097871780396e-05, 5.207117646932602e-05, 5.444325506687164e-05, 5.681533366441727e-05, 5.918741226196289e-05]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 1.0, 10.0, 3.0, 8.0, 10.0, 13.0, 24.0, 19.0, 37.0, 32.0, 52.0, 47.0, 62.0, 90.0, 81.0, 131.0, 111.0, 216.0, 387.0, 1437.0, 381.0, 233.0, 127.0, 112.0, 93.0, 72.0, 61.0, 51.0, 47.0, 22.0, 32.0, 16.0, 15.0, 13.0, 7.0, 11.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.450580596923828e-06, -7.179565727710724e-06, -6.90855085849762e-06, -6.637535989284515e-06, -6.366521120071411e-06, -6.095506250858307e-06, -5.824491381645203e-06, -5.553476512432098e-06, -5.282461643218994e-06, -5.01144677400589e-06, -4.740431904792786e-06, -4.469417035579681e-06, -4.198402166366577e-06, -3.927387297153473e-06, -3.6563724279403687e-06, -3.3853575587272644e-06, -3.11434268951416e-06, -2.843327820301056e-06, -2.5723129510879517e-06, -2.3012980818748474e-06, -2.030283212661743e-06, -1.759268343448639e-06, -1.4882534742355347e-06, -1.2172386050224304e-06, -9.462237358093262e-07, -6.752088665962219e-07, -4.041939973831177e-07, -1.3317912817001343e-07, 1.3783574104309082e-07, 4.0885061025619507e-07, 6.798654794692993e-07, 9.508803486824036e-07, 1.2218952178955078e-06, 1.492910087108612e-06, 1.7639249563217163e-06, 2.0349398255348206e-06, 2.305954694747925e-06, 2.576969563961029e-06, 2.8479844331741333e-06, 3.1189993023872375e-06, 3.390014171600342e-06, 3.661029040813446e-06, 3.93204391002655e-06, 4.2030587792396545e-06, 4.474073648452759e-06, 4.745088517665863e-06, 5.016103386878967e-06, 5.2871182560920715e-06, 5.558133125305176e-06, 5.82914799451828e-06, 6.100162863731384e-06, 6.3711777329444885e-06, 6.642192602157593e-06, 6.913207471370697e-06, 7.184222340583801e-06, 7.4552372097969055e-06, 7.72625207901001e-06, 7.997266948223114e-06, 8.268281817436218e-06, 8.539296686649323e-06, 8.810311555862427e-06, 9.081326425075531e-06, 9.352341294288635e-06, 9.62335616350174e-06, 9.894371032714844e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 13.0, 13.0, 10.0, 29.0, 47.0, 47.0, 76.0, 120.0, 180.0, 160.0, 103.0, 55.0, 42.0, 23.0, 19.0, 12.0, 15.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3416974727297202e-05, -2.2471531337941997e-05, -2.1526087948586792e-05, -2.0580644559231587e-05, -1.9635201169876382e-05, -1.8689757780521177e-05, -1.7744314391165972e-05, -1.6798869182821363e-05, -1.5853427612455562e-05, -1.4907984223100357e-05, -1.3962540833745152e-05, -1.3017097444389947e-05, -1.2071654055034742e-05, -1.1126210665679537e-05, -1.018076636682963e-05, -9.235322977474425e-06, -8.289878678624518e-06, -7.344435289269313e-06, -6.398991899914108e-06, -5.453548055811552e-06, -4.508104666456347e-06, -3.5626612771011423e-06, -2.6172174329985864e-06, -1.6717740436433814e-06, -7.263306542881764e-07, 2.1911284875386627e-07, 1.164556351795909e-06, 2.1099999685247894e-06, 3.0554433578799944e-06, 4.0008867472351994e-06, 4.946330591337755e-06, 5.89177398069296e-06, 6.837217370048165e-06, 7.78266075940337e-06, 8.728104148758575e-06, 9.67354753811378e-06, 1.0618990927468985e-05, 1.156443431682419e-05, 1.2509878615674097e-05, 1.3455322005029302e-05, 1.4400765394384507e-05, 1.5346209693234414e-05, 1.629165308258962e-05, 1.7237096471944824e-05, 1.818253986130003e-05, 1.9127983250655234e-05, 2.007342664001044e-05, 2.1018870029365644e-05, 2.196431341872085e-05, 2.2909756808076054e-05, 2.385520019743126e-05, 2.4800643586786464e-05, 2.574608697614167e-05, 2.6691530365496874e-05, 2.7636975573841482e-05, 2.8582417144207284e-05, 2.9527862352551892e-05, 3.0473305741907097e-05, 3.14187491312623e-05, 3.236419433960691e-05, 3.330963590997271e-05, 3.425508111831732e-05, 3.520052268868312e-05, 3.614596789702773e-05, 3.709140946739353e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 2.0, 1.0, 8.0, 7.0, 14.0, 16.0, 19.0, 13.0, 14.0, 27.0, 16.0, 14.0, 22.0, 19.0, 32.0, 26.0, 38.0, 31.0, 39.0, 43.0, 37.0, 33.0, 46.0, 42.0, 33.0, 47.0, 31.0, 31.0, 30.0, 30.0, 41.0, 21.0, 20.0, 25.0, 26.0, 14.0, 15.0, 14.0, 15.0, 12.0, 4.0, 8.0, 6.0, 4.0, 3.0, 0.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.3425305041891988e-05, -1.302155214943923e-05, -1.2617800166481175e-05, -1.2214047274028417e-05, -1.1810294381575659e-05, -1.1406542398617603e-05, -1.1002789506164845e-05, -1.0599036613712087e-05, -1.0195284630754031e-05, -9.791531738301273e-06, -9.387779755343217e-06, -8.98402686289046e-06, -8.580274879932404e-06, -8.176521987479646e-06, -7.772769095026888e-06, -7.369016657321481e-06, -6.965264219616074e-06, -6.561511781910667e-06, -6.15775934420526e-06, -5.7540064517525025e-06, -5.3502540140470956e-06, -4.946501576341689e-06, -4.542748683888931e-06, -4.138996246183524e-06, -3.735243808478117e-06, -3.33149137077271e-06, -2.9277387056936277e-06, -2.5239860406145453e-06, -2.1202336029091384e-06, -1.7164811652037315e-06, -1.3127285001246491e-06, -9.089758350455668e-07, -5.052233973401599e-07, -1.0147084594791522e-07, 3.022817054443294e-07, 7.060342568365741e-07, 1.1097868082288187e-06, 1.5135392459342256e-06, 1.917291911013308e-06, 2.3210445760923903e-06, 2.7247970137977973e-06, 3.128549451503204e-06, 3.5323021165822865e-06, 3.936054781661369e-06, 4.339807219366776e-06, 4.743559657072183e-06, 5.1473125495249406e-06, 5.5510649872303475e-06, 5.954817424935754e-06, 6.358569862641161e-06, 6.762322300346568e-06, 7.166075192799326e-06, 7.569827630504733e-06, 7.97358006821014e-06, 8.377332960662898e-06, 8.781085853115655e-06, 9.184837836073712e-06, 9.58859072852647e-06, 9.992342711484525e-06, 1.0396095603937283e-05, 1.079984758689534e-05, 1.1203600479348097e-05, 1.1607353371800855e-05, 1.201110535475891e-05, 1.2414858247211669e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 0.0, 5.0, 9.0, 11.0, 15.0, 47.0, 68.0, 70.0, 115.0, 176.0, 318.0, 477.0, 812.0, 1498.0, 2529.0, 5353.0, 9327.0, 18837.0, 39811.0, 91152.0, 252283.0, 331459.0, 163029.0, 68546.0, 30768.0, 15894.0, 6988.0, 3806.0, 2144.0, 1181.0, 763.0, 382.0, 220.0, 158.0, 90.0, 77.0, 39.0, 29.0, 14.0, 13.0, 13.0, 6.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6629695892333984e-05, -1.6081146895885468e-05, -1.553259789943695e-05, -1.4984048902988434e-05, -1.4435499906539917e-05, -1.38869509100914e-05, -1.3338401913642883e-05, -1.2789852917194366e-05, -1.224130392074585e-05, -1.1692754924297333e-05, -1.1144205927848816e-05, -1.0595656931400299e-05, -1.0047107934951782e-05, -9.498558938503265e-06, -8.950009942054749e-06, -8.401460945606232e-06, -7.852911949157715e-06, -7.304362952709198e-06, -6.755813956260681e-06, -6.207264959812164e-06, -5.6587159633636475e-06, -5.110166966915131e-06, -4.561617970466614e-06, -4.013068974018097e-06, -3.46451997756958e-06, -2.9159709811210632e-06, -2.3674219846725464e-06, -1.8188729882240295e-06, -1.2703239917755127e-06, -7.217749953269958e-07, -1.73225998878479e-07, 3.7532299757003784e-07, 9.238719940185547e-07, 1.4724209904670715e-06, 2.0209699869155884e-06, 2.5695189833641052e-06, 3.118067979812622e-06, 3.666616976261139e-06, 4.215165972709656e-06, 4.763714969158173e-06, 5.3122639656066895e-06, 5.860812962055206e-06, 6.409361958503723e-06, 6.95791095495224e-06, 7.506459951400757e-06, 8.055008947849274e-06, 8.60355794429779e-06, 9.152106940746307e-06, 9.700655937194824e-06, 1.0249204933643341e-05, 1.0797753930091858e-05, 1.1346302926540375e-05, 1.1894851922988892e-05, 1.2443400919437408e-05, 1.2991949915885925e-05, 1.3540498912334442e-05, 1.4089047908782959e-05, 1.4637596905231476e-05, 1.5186145901679993e-05, 1.573469489812851e-05, 1.6283243894577026e-05, 1.6831792891025543e-05, 1.738034188747406e-05, 1.7928890883922577e-05, 1.8477439880371094e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 5.0, 11.0, 7.0, 9.0, 15.0, 21.0, 10.0, 16.0, 20.0, 17.0, 28.0, 19.0, 34.0, 41.0, 34.0, 35.0, 53.0, 34.0, 57.0, 49.0, 39.0, 46.0, 49.0, 35.0, 36.0, 31.0, 40.0, 36.0, 27.0, 16.0, 21.0, 18.0, 20.0, 10.0, 13.0, 13.0, 10.0, 6.0, 6.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5139579772949219e-05, -1.4659017324447632e-05, -1.4178454875946045e-05, -1.3697892427444458e-05, -1.3217329978942871e-05, -1.2736767530441284e-05, -1.2256205081939697e-05, -1.177564263343811e-05, -1.1295080184936523e-05, -1.0814517736434937e-05, -1.033395528793335e-05, -9.853392839431763e-06, -9.372830390930176e-06, -8.892267942428589e-06, -8.411705493927002e-06, -7.931143045425415e-06, -7.450580596923828e-06, -6.970018148422241e-06, -6.489455699920654e-06, -6.008893251419067e-06, -5.5283308029174805e-06, -5.0477683544158936e-06, -4.567205905914307e-06, -4.08664345741272e-06, -3.606081008911133e-06, -3.125518560409546e-06, -2.644956111907959e-06, -2.164393663406372e-06, -1.6838312149047852e-06, -1.2032687664031982e-06, -7.227063179016113e-07, -2.421438694000244e-07, 2.384185791015625e-07, 7.189810276031494e-07, 1.1995434761047363e-06, 1.6801059246063232e-06, 2.16066837310791e-06, 2.641230821609497e-06, 3.121793270111084e-06, 3.602355718612671e-06, 4.082918167114258e-06, 4.563480615615845e-06, 5.044043064117432e-06, 5.5246055126190186e-06, 6.0051679611206055e-06, 6.485730409622192e-06, 6.966292858123779e-06, 7.446855306625366e-06, 7.927417755126953e-06, 8.40798020362854e-06, 8.888542652130127e-06, 9.369105100631714e-06, 9.8496675491333e-06, 1.0330229997634888e-05, 1.0810792446136475e-05, 1.1291354894638062e-05, 1.1771917343139648e-05, 1.2252479791641235e-05, 1.2733042240142822e-05, 1.321360468864441e-05, 1.3694167137145996e-05, 1.4174729585647583e-05, 1.465529203414917e-05, 1.5135854482650757e-05, 1.5616416931152344e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 5.0, 7.0, 6.0, 10.0, 11.0, 23.0, 35.0, 45.0, 56.0, 64.0, 135.0, 160.0, 205.0, 317.0, 458.0, 602.0, 949.0, 1441.0, 2041.0, 3615.0, 5980.0, 9246.0, 19480.0, 35841.0, 101147.0, 379145.0, 306029.0, 101057.0, 38622.0, 16593.0, 9991.0, 5623.0, 3055.0, 2196.0, 1230.0, 990.0, 692.0, 412.0, 313.0, 221.0, 132.0, 120.0, 76.0, 45.0, 35.0, 30.0, 15.0, 23.0, 15.0, 9.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.5437602996826172e-05, -1.4922581613063812e-05, -1.4407560229301453e-05, -1.3892538845539093e-05, -1.3377517461776733e-05, -1.2862496078014374e-05, -1.2347474694252014e-05, -1.1832453310489655e-05, -1.1317431926727295e-05, -1.0802410542964935e-05, -1.0287389159202576e-05, -9.772367775440216e-06, -9.257346391677856e-06, -8.742325007915497e-06, -8.227303624153137e-06, -7.712282240390778e-06, -7.197260856628418e-06, -6.682239472866058e-06, -6.167218089103699e-06, -5.652196705341339e-06, -5.1371753215789795e-06, -4.62215393781662e-06, -4.10713255405426e-06, -3.5921111702919006e-06, -3.077089786529541e-06, -2.5620684027671814e-06, -2.0470470190048218e-06, -1.5320256352424622e-06, -1.0170042514801025e-06, -5.019828677177429e-07, 1.30385160446167e-08, 5.280598998069763e-07, 1.043081283569336e-06, 1.5581026673316956e-06, 2.073124051094055e-06, 2.588145434856415e-06, 3.1031668186187744e-06, 3.618188202381134e-06, 4.133209586143494e-06, 4.648230969905853e-06, 5.163252353668213e-06, 5.6782737374305725e-06, 6.193295121192932e-06, 6.708316504955292e-06, 7.223337888717651e-06, 7.738359272480011e-06, 8.25338065624237e-06, 8.76840204000473e-06, 9.28342342376709e-06, 9.79844480752945e-06, 1.0313466191291809e-05, 1.0828487575054169e-05, 1.1343508958816528e-05, 1.1858530342578888e-05, 1.2373551726341248e-05, 1.2888573110103607e-05, 1.3403594493865967e-05, 1.3918615877628326e-05, 1.4433637261390686e-05, 1.4948658645153046e-05, 1.5463680028915405e-05, 1.5978701412677765e-05, 1.6493722796440125e-05, 1.7008744180202484e-05, 1.7523765563964844e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 6.0, 11.0, 5.0, 7.0, 11.0, 13.0, 16.0, 13.0, 11.0, 17.0, 15.0, 25.0, 30.0, 21.0, 30.0, 25.0, 43.0, 39.0, 34.0, 41.0, 33.0, 44.0, 47.0, 32.0, 48.0, 32.0, 50.0, 37.0, 28.0, 25.0, 21.0, 32.0, 34.0, 26.0, 28.0, 12.0, 10.0, 7.0, 11.0, 11.0, 4.0, 5.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.821487426757812e-06, -8.53557139635086e-06, -8.249655365943909e-06, -7.963739335536957e-06, -7.677823305130005e-06, -7.391907274723053e-06, -7.105991244316101e-06, -6.820075213909149e-06, -6.534159183502197e-06, -6.248243153095245e-06, -5.9623271226882935e-06, -5.6764110922813416e-06, -5.39049506187439e-06, -5.104579031467438e-06, -4.818663001060486e-06, -4.532746970653534e-06, -4.246830940246582e-06, -3.96091490983963e-06, -3.6749988794326782e-06, -3.3890828490257263e-06, -3.1031668186187744e-06, -2.8172507882118225e-06, -2.5313347578048706e-06, -2.2454187273979187e-06, -1.959502696990967e-06, -1.6735866665840149e-06, -1.387670636177063e-06, -1.101754605770111e-06, -8.158385753631592e-07, -5.299225449562073e-07, -2.4400651454925537e-07, 4.190951585769653e-08, 3.2782554626464844e-07, 6.137415766716003e-07, 8.996576070785522e-07, 1.1855736374855042e-06, 1.471489667892456e-06, 1.757405698299408e-06, 2.04332172870636e-06, 2.3292377591133118e-06, 2.6151537895202637e-06, 2.9010698199272156e-06, 3.1869858503341675e-06, 3.4729018807411194e-06, 3.7588179111480713e-06, 4.044733941555023e-06, 4.330649971961975e-06, 4.616566002368927e-06, 4.902482032775879e-06, 5.188398063182831e-06, 5.474314093589783e-06, 5.760230123996735e-06, 6.0461461544036865e-06, 6.3320621848106384e-06, 6.61797821521759e-06, 6.903894245624542e-06, 7.189810276031494e-06, 7.475726306438446e-06, 7.761642336845398e-06, 8.04755836725235e-06, 8.333474397659302e-06, 8.619390428066254e-06, 8.905306458473206e-06, 9.191222488880157e-06, 9.47713851928711e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 3.0, 9.0, 7.0, 18.0, 18.0, 33.0, 25.0, 23.0, 57.0, 95.0, 250.0, 201.0, 307.0, 374.0, 498.0, 804.0, 1165.0, 1725.0, 2454.0, 11377.0, 13968.0, 33183.0, 115154.0, 684809.0, 114971.0, 33186.0, 14083.0, 7584.0, 6782.0, 1708.0, 1089.0, 741.0, 498.0, 372.0, 255.0, 202.0, 138.0, 193.0, 50.0, 36.0, 30.0, 22.0, 19.0, 9.0, 7.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.086162567138672e-06, -2.020038664340973e-06, -1.953914761543274e-06, -1.887790858745575e-06, -1.821666955947876e-06, -1.755543053150177e-06, -1.689419150352478e-06, -1.623295247554779e-06, -1.55717134475708e-06, -1.491047441959381e-06, -1.4249235391616821e-06, -1.3587996363639832e-06, -1.2926757335662842e-06, -1.2265518307685852e-06, -1.1604279279708862e-06, -1.0943040251731873e-06, -1.0281801223754883e-06, -9.620562195777893e-07, -8.959323167800903e-07, -8.298084139823914e-07, -7.636845111846924e-07, -6.975606083869934e-07, -6.314367055892944e-07, -5.653128027915955e-07, -4.991888999938965e-07, -4.330649971961975e-07, -3.6694109439849854e-07, -3.0081719160079956e-07, -2.3469328880310059e-07, -1.685693860054016e-07, -1.0244548320770264e-07, -3.632158041000366e-08, 2.9802322387695312e-08, 9.592622518539429e-08, 1.6205012798309326e-07, 2.2817403078079224e-07, 2.942979335784912e-07, 3.604218363761902e-07, 4.2654573917388916e-07, 4.926696419715881e-07, 5.587935447692871e-07, 6.249174475669861e-07, 6.910413503646851e-07, 7.57165253162384e-07, 8.23289155960083e-07, 8.89413058757782e-07, 9.55536961555481e-07, 1.02166086435318e-06, 1.087784767150879e-06, 1.1539086699485779e-06, 1.2200325727462769e-06, 1.2861564755439758e-06, 1.3522803783416748e-06, 1.4184042811393738e-06, 1.4845281839370728e-06, 1.5506520867347717e-06, 1.6167759895324707e-06, 1.6828998923301697e-06, 1.7490237951278687e-06, 1.8151476979255676e-06, 1.8812716007232666e-06, 1.9473955035209656e-06, 2.0135194063186646e-06, 2.0796433091163635e-06, 2.1457672119140625e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 12.0, 0.0, 16.0, 0.0, 0.0, 20.0, 0.0, 0.0, 55.0, 0.0, 100.0, 0.0, 0.0, 125.0, 0.0, 353.0, 0.0, 0.0, 126.0, 0.0, 87.0, 0.0, 0.0, 55.0, 0.0, 30.0, 0.0, 0.0, 15.0, 0.0, 0.0, 12.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.152557373046875e-07, -6.919726729393005e-07, -6.686896085739136e-07, -6.454065442085266e-07, -6.221234798431396e-07, -5.988404154777527e-07, -5.755573511123657e-07, -5.522742867469788e-07, -5.289912223815918e-07, -5.057081580162048e-07, -4.824250936508179e-07, -4.591420292854309e-07, -4.3585896492004395e-07, -4.12575900554657e-07, -3.8929283618927e-07, -3.6600977182388306e-07, -3.427267074584961e-07, -3.1944364309310913e-07, -2.9616057872772217e-07, -2.728775143623352e-07, -2.4959444999694824e-07, -2.2631138563156128e-07, -2.0302832126617432e-07, -1.7974525690078735e-07, -1.564621925354004e-07, -1.3317912817001343e-07, -1.0989606380462646e-07, -8.66129994392395e-08, -6.332993507385254e-08, -4.0046870708465576e-08, -1.6763806343078613e-08, 6.51925802230835e-09, 2.9802322387695312e-08, 5.3085386753082275e-08, 7.636845111846924e-08, 9.96515154838562e-08, 1.2293457984924316e-07, 1.4621764421463013e-07, 1.695007085800171e-07, 1.9278377294540405e-07, 2.1606683731079102e-07, 2.39349901676178e-07, 2.6263296604156494e-07, 2.859160304069519e-07, 3.0919909477233887e-07, 3.3248215913772583e-07, 3.557652235031128e-07, 3.7904828786849976e-07, 4.023313522338867e-07, 4.256144165992737e-07, 4.4889748096466064e-07, 4.721805453300476e-07, 4.954636096954346e-07, 5.187466740608215e-07, 5.420297384262085e-07, 5.653128027915955e-07, 5.885958671569824e-07, 6.118789315223694e-07, 6.351619958877563e-07, 6.584450602531433e-07, 6.817281246185303e-07, 7.050111889839172e-07, 7.282942533493042e-07, 7.515773177146912e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 12.0, 7.0, 0.0, 12.0, 6.0, 28.0, 23.0, 9.0, 12.0, 57.0, 94.0, 171.0, 487.0, 1207.0, 1146.0, 5321.0, 15093.0, 63236.0, 121966.0, 752605.0, 63271.0, 15129.0, 5428.0, 1145.0, 1177.0, 493.0, 179.0, 88.0, 56.0, 8.0, 8.0, 18.0, 18.0, 0.0, 14.0, 1.0, 2.0, 9.0, 0.0, 4.0, 1.0, 2.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.3974647521972656e-06, -3.291293978691101e-06, -3.1851232051849365e-06, -3.078952431678772e-06, -2.9727816581726074e-06, -2.866610884666443e-06, -2.7604401111602783e-06, -2.6542693376541138e-06, -2.5480985641479492e-06, -2.4419277906417847e-06, -2.33575701713562e-06, -2.2295862436294556e-06, -2.123415470123291e-06, -2.0172446966171265e-06, -1.911073923110962e-06, -1.8049031496047974e-06, -1.6987323760986328e-06, -1.5925616025924683e-06, -1.4863908290863037e-06, -1.3802200555801392e-06, -1.2740492820739746e-06, -1.16787850856781e-06, -1.0617077350616455e-06, -9.55536961555481e-07, -8.493661880493164e-07, -7.431954145431519e-07, -6.370246410369873e-07, -5.308538675308228e-07, -4.246830940246582e-07, -3.1851232051849365e-07, -2.123415470123291e-07, -1.0617077350616455e-07, 0.0, 1.0617077350616455e-07, 2.123415470123291e-07, 3.1851232051849365e-07, 4.246830940246582e-07, 5.308538675308228e-07, 6.370246410369873e-07, 7.431954145431519e-07, 8.493661880493164e-07, 9.55536961555481e-07, 1.0617077350616455e-06, 1.16787850856781e-06, 1.2740492820739746e-06, 1.3802200555801392e-06, 1.4863908290863037e-06, 1.5925616025924683e-06, 1.6987323760986328e-06, 1.8049031496047974e-06, 1.911073923110962e-06, 2.0172446966171265e-06, 2.123415470123291e-06, 2.2295862436294556e-06, 2.33575701713562e-06, 2.4419277906417847e-06, 2.5480985641479492e-06, 2.6542693376541138e-06, 2.7604401111602783e-06, 2.866610884666443e-06, 2.9727816581726074e-06, 3.078952431678772e-06, 3.1851232051849365e-06, 3.291293978691101e-06, 3.3974647521972656e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 29.0, 0.0, 0.0, 0.0, 74.0, 0.0, 0.0, 0.0, 0.0, 163.0, 0.0, 0.0, 0.0, 0.0, 419.0, 0.0, 0.0, 0.0, 185.0, 0.0, 0.0, 0.0, 0.0, 48.0, 0.0, 0.0, 0.0, 45.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 9.0, 10.0, 7.0, 17.0, 20.0, 31.0, 56.0, 61.0, 116.0, 183.0, 171.0, 125.0, 64.0, 31.0, 23.0, 19.0, 10.0, 12.0, 10.0, 0.0, 8.0, 6.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5568253477104008e-05, -2.4585091523476876e-05, -2.360192775086034e-05, -2.261876579723321e-05, -2.1635602024616674e-05, -2.0652440070989542e-05, -1.966927811736241e-05, -1.8686114344745874e-05, -1.7702952391118743e-05, -1.671979043749161e-05, -1.5736626664875075e-05, -1.4753464711247943e-05, -1.377030184812611e-05, -1.2787138985004276e-05, -1.1803977031377144e-05, -1.082081416825531e-05, -9.837651305133477e-06, -8.854488442011643e-06, -7.87132557888981e-06, -6.888163625262678e-06, -5.905000762140844e-06, -4.92183789901901e-06, -3.938675490644528e-06, -2.955513082270045e-06, -1.972350219148211e-06, -9.89187583400053e-07, -6.024947651894763e-09, 9.771376880962634e-07, 1.9603003238444217e-06, 2.9434631869662553e-06, 3.926625595340738e-06, 4.909788003715221e-06, 5.8929508668370545e-06, 6.876113729958888e-06, 7.859276593080722e-06, 8.842438546707854e-06, 9.825601409829687e-06, 1.0808764272951521e-05, 1.1791926226578653e-05, 1.2775089089700487e-05, 1.375825195282232e-05, 1.4741414815944154e-05, 1.5724577679065987e-05, 1.670773963269312e-05, 1.769090158632025e-05, 1.8674065358936787e-05, 1.965722731256392e-05, 2.064038926619105e-05, 2.1623553038807586e-05, 2.2606714992434718e-05, 2.3589878765051253e-05, 2.4573040718678385e-05, 2.555620449129492e-05, 2.6539366444922052e-05, 2.7522528398549184e-05, 2.850569217116572e-05, 2.948885412479285e-05, 3.0472016078419983e-05, 3.145517985103652e-05, 3.2438343623653054e-05, 3.342150375829078e-05, 3.440466753090732e-05, 3.5387831303523853e-05, 3.637099143816158e-05, 3.735415521077812e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 1.0, 4.0, 10.0, 13.0, 13.0, 18.0, 13.0, 17.0, 22.0, 21.0, 12.0, 22.0, 16.0, 28.0, 30.0, 35.0, 34.0, 28.0, 51.0, 34.0, 39.0, 42.0, 39.0, 41.0, 42.0, 33.0, 27.0, 30.0, 40.0, 30.0, 32.0, 23.0, 21.0, 23.0, 20.0, 14.0, 11.0, 13.0, 18.0, 5.0, 7.0, 8.0, 4.0, 1.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.3491824574884959e-05, -1.3089642379782163e-05, -1.2687461094174068e-05, -1.2285279808565974e-05, -1.1883097613463178e-05, -1.1480915418360382e-05, -1.1078734132752288e-05, -1.0676552847144194e-05, -1.0274370652041398e-05, -9.872188456938602e-06, -9.470007171330508e-06, -9.067825885722414e-06, -8.665643690619618e-06, -8.263461495516822e-06, -7.861280209908728e-06, -7.4590984695532825e-06, -7.056916729197837e-06, -6.654734988842392e-06, -6.252553248486947e-06, -5.850371508131502e-06, -5.448189767776057e-06, -5.046008027420612e-06, -4.643826287065167e-06, -4.241644546709722e-06, -3.839462806354277e-06, -3.4372810659988318e-06, -3.0350993256433867e-06, -2.6329175852879416e-06, -2.2307358449324965e-06, -1.8285541045770515e-06, -1.4263723642216064e-06, -1.0241906238661613e-06, -6.22009793005418e-07, -2.1982805264997296e-07, 1.823536877054721e-07, 5.845354280609172e-07, 9.867171684163623e-07, 1.3888989087718073e-06, 1.7910806491272524e-06, 2.1932623894826975e-06, 2.5954441298381425e-06, 2.9976258701935876e-06, 3.3998076105490327e-06, 3.8019893509044778e-06, 4.204171091259923e-06, 4.606352831615368e-06, 5.008534571970813e-06, 5.410716312326258e-06, 5.812898052681703e-06, 6.215079793037148e-06, 6.617261533392593e-06, 7.019443273748038e-06, 7.421625014103483e-06, 7.823806299711578e-06, 8.225988494814374e-06, 8.62817068991717e-06, 9.030351975525264e-06, 9.432533261133358e-06, 9.834715456236154e-06, 1.023689765133895e-05, 1.0639078936947044e-05, 1.1041260222555138e-05, 1.1443442417657934e-05, 1.184562461276073e-05, 1.2247805898368824e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 11.0, 11.0, 24.0, 40.0, 52.0, 77.0, 119.0, 171.0, 230.0, 406.0, 529.0, 905.0, 1365.0, 2353.0, 3531.0, 5849.0, 10107.0, 17672.0, 32061.0, 63458.0, 143085.0, 381566.0, 213296.0, 81387.0, 39185.0, 20874.0, 11956.0, 6936.0, 4193.0, 2574.0, 1530.0, 1012.0, 675.0, 428.0, 302.0, 203.0, 109.0, 90.0, 65.0, 40.0, 24.0, 14.0, 10.0, 6.0, 6.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.042552947998047e-05, -4.8881396651268005e-05, -4.733726382255554e-05, -4.579313099384308e-05, -4.4248998165130615e-05, -4.270486533641815e-05, -4.116073250770569e-05, -3.9616599678993225e-05, -3.807246685028076e-05, -3.65283340215683e-05, -3.4984201192855835e-05, -3.344006836414337e-05, -3.189593553543091e-05, -3.0351802706718445e-05, -2.880766987800598e-05, -2.7263537049293518e-05, -2.5719404220581055e-05, -2.417527139186859e-05, -2.2631138563156128e-05, -2.1087005734443665e-05, -1.95428729057312e-05, -1.7998740077018738e-05, -1.6454607248306274e-05, -1.4910474419593811e-05, -1.3366341590881348e-05, -1.1822208762168884e-05, -1.0278075933456421e-05, -8.733943104743958e-06, -7.189810276031494e-06, -5.645677447319031e-06, -4.101544618606567e-06, -2.557411789894104e-06, -1.0132789611816406e-06, 5.308538675308228e-07, 2.074986696243286e-06, 3.6191195249557495e-06, 5.163252353668213e-06, 6.707385182380676e-06, 8.25151801109314e-06, 9.795650839805603e-06, 1.1339783668518066e-05, 1.288391649723053e-05, 1.4428049325942993e-05, 1.5972182154655457e-05, 1.751631498336792e-05, 1.9060447812080383e-05, 2.0604580640792847e-05, 2.214871346950531e-05, 2.3692846298217773e-05, 2.5236979126930237e-05, 2.67811119556427e-05, 2.8325244784355164e-05, 2.9869377613067627e-05, 3.141351044178009e-05, 3.2957643270492554e-05, 3.450177609920502e-05, 3.604590892791748e-05, 3.7590041756629944e-05, 3.913417458534241e-05, 4.067830741405487e-05, 4.2222440242767334e-05, 4.37665730714798e-05, 4.531070590019226e-05, 4.6854838728904724e-05, 4.839897155761719e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 2.0, 1.0, 3.0, 5.0, 9.0, 12.0, 14.0, 11.0, 12.0, 16.0, 14.0, 18.0, 25.0, 15.0, 21.0, 35.0, 24.0, 37.0, 29.0, 38.0, 41.0, 33.0, 46.0, 45.0, 42.0, 40.0, 29.0, 53.0, 43.0, 29.0, 34.0, 28.0, 23.0, 35.0, 17.0, 20.0, 21.0, 15.0, 9.0, 6.0, 15.0, 13.0, 5.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.033348083496094e-06, -6.818212568759918e-06, -6.603077054023743e-06, -6.387941539287567e-06, -6.172806024551392e-06, -5.957670509815216e-06, -5.7425349950790405e-06, -5.527399480342865e-06, -5.3122639656066895e-06, -5.097128450870514e-06, -4.881992936134338e-06, -4.666857421398163e-06, -4.451721906661987e-06, -4.236586391925812e-06, -4.021450877189636e-06, -3.8063153624534607e-06, -3.591179847717285e-06, -3.3760443329811096e-06, -3.160908818244934e-06, -2.9457733035087585e-06, -2.730637788772583e-06, -2.5155022740364075e-06, -2.300366759300232e-06, -2.0852312445640564e-06, -1.8700957298278809e-06, -1.6549602150917053e-06, -1.4398247003555298e-06, -1.2246891856193542e-06, -1.0095536708831787e-06, -7.944181561470032e-07, -5.792826414108276e-07, -3.641471266746521e-07, -1.4901161193847656e-07, 6.612390279769897e-08, 2.812594175338745e-07, 4.9639493227005e-07, 7.115304470062256e-07, 9.266659617424011e-07, 1.1418014764785767e-06, 1.3569369912147522e-06, 1.5720725059509277e-06, 1.7872080206871033e-06, 2.002343535423279e-06, 2.2174790501594543e-06, 2.43261456489563e-06, 2.6477500796318054e-06, 2.862885594367981e-06, 3.0780211091041565e-06, 3.293156623840332e-06, 3.5082921385765076e-06, 3.723427653312683e-06, 3.938563168048859e-06, 4.153698682785034e-06, 4.36883419752121e-06, 4.583969712257385e-06, 4.799105226993561e-06, 5.014240741729736e-06, 5.229376256465912e-06, 5.444511771202087e-06, 5.659647285938263e-06, 5.8747828006744385e-06, 6.089918315410614e-06, 6.3050538301467896e-06, 6.520189344882965e-06, 6.735324859619141e-06]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 4.0, 6.0, 8.0, 9.0, 20.0, 25.0, 29.0, 45.0, 70.0, 108.0, 176.0, 257.0, 451.0, 730.0, 1245.0, 2162.0, 4264.0, 7481.0, 14358.0, 28479.0, 65349.0, 162027.0, 474215.0, 162524.0, 65068.0, 28018.0, 14120.0, 7715.0, 4208.0, 2121.0, 1297.0, 742.0, 417.0, 271.0, 199.0, 96.0, 84.0, 49.0, 37.0, 27.0, 12.0, 11.0, 8.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.369020462036133e-05, -4.242360591888428e-05, -4.1157007217407227e-05, -3.9890408515930176e-05, -3.8623809814453125e-05, -3.7357211112976074e-05, -3.6090612411499023e-05, -3.482401371002197e-05, -3.355741500854492e-05, -3.229081630706787e-05, -3.102421760559082e-05, -2.975761890411377e-05, -2.849102020263672e-05, -2.7224421501159668e-05, -2.5957822799682617e-05, -2.4691224098205566e-05, -2.3424625396728516e-05, -2.2158026695251465e-05, -2.0891427993774414e-05, -1.9624829292297363e-05, -1.8358230590820312e-05, -1.7091631889343262e-05, -1.582503318786621e-05, -1.455843448638916e-05, -1.329183578491211e-05, -1.2025237083435059e-05, -1.0758638381958008e-05, -9.492039680480957e-06, -8.225440979003906e-06, -6.9588422775268555e-06, -5.692243576049805e-06, -4.425644874572754e-06, -3.159046173095703e-06, -1.8924474716186523e-06, -6.258487701416016e-07, 6.407499313354492e-07, 1.9073486328125e-06, 3.1739473342895508e-06, 4.4405460357666016e-06, 5.707144737243652e-06, 6.973743438720703e-06, 8.240342140197754e-06, 9.506940841674805e-06, 1.0773539543151855e-05, 1.2040138244628906e-05, 1.3306736946105957e-05, 1.4573335647583008e-05, 1.583993434906006e-05, 1.710653305053711e-05, 1.837313175201416e-05, 1.963973045349121e-05, 2.0906329154968262e-05, 2.2172927856445312e-05, 2.3439526557922363e-05, 2.4706125259399414e-05, 2.5972723960876465e-05, 2.7239322662353516e-05, 2.8505921363830566e-05, 2.9772520065307617e-05, 3.103911876678467e-05, 3.230571746826172e-05, 3.357231616973877e-05, 3.483891487121582e-05, 3.610551357269287e-05, 3.737211227416992e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 10.0, 15.0, 17.0, 17.0, 20.0, 16.0, 36.0, 31.0, 41.0, 53.0, 48.0, 48.0, 78.0, 63.0, 58.0, 70.0, 64.0, 50.0, 57.0, 36.0, 40.0, 22.0, 37.0, 27.0, 9.0, 11.0, 5.0, 3.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-05, -1.2148171663284302e-05, -1.1779367923736572e-05, -1.1410564184188843e-05, -1.1041760444641113e-05, -1.0672956705093384e-05, -1.0304152965545654e-05, -9.935349225997925e-06, -9.566545486450195e-06, -9.197741746902466e-06, -8.828938007354736e-06, -8.460134267807007e-06, -8.091330528259277e-06, -7.722526788711548e-06, -7.353723049163818e-06, -6.984919309616089e-06, -6.616115570068359e-06, -6.24731183052063e-06, -5.8785080909729e-06, -5.509704351425171e-06, -5.140900611877441e-06, -4.772096872329712e-06, -4.403293132781982e-06, -4.034489393234253e-06, -3.6656856536865234e-06, -3.296881914138794e-06, -2.9280781745910645e-06, -2.559274435043335e-06, -2.1904706954956055e-06, -1.821666955947876e-06, -1.4528632164001465e-06, -1.084059476852417e-06, -7.152557373046875e-07, -3.46451997756958e-07, 2.2351741790771484e-08, 3.91155481338501e-07, 7.599592208862305e-07, 1.12876296043396e-06, 1.4975666999816895e-06, 1.866370439529419e-06, 2.2351741790771484e-06, 2.603977918624878e-06, 2.9727816581726074e-06, 3.341585397720337e-06, 3.7103891372680664e-06, 4.079192876815796e-06, 4.447996616363525e-06, 4.816800355911255e-06, 5.185604095458984e-06, 5.554407835006714e-06, 5.923211574554443e-06, 6.292015314102173e-06, 6.660819053649902e-06, 7.029622793197632e-06, 7.398426532745361e-06, 7.76723027229309e-06, 8.13603401184082e-06, 8.50483775138855e-06, 8.87364149093628e-06, 9.242445230484009e-06, 9.611248970031738e-06, 9.980052709579468e-06, 1.0348856449127197e-05, 1.0717660188674927e-05, 1.1086463928222656e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 7.0, 0.0, 0.0, 15.0, 0.0, 25.0, 0.0, 28.0, 0.0, 84.0, 0.0, 108.0, 0.0, 0.0, 204.0, 0.0, 306.0, 0.0, 720.0, 0.0, 1322.0, 0.0, 2978.0, 0.0, 0.0, 10405.0, 0.0, 1015793.0, 0.0, 10781.0, 0.0, 2926.0, 0.0, 1376.0, 0.0, 0.0, 749.0, 0.0, 315.0, 0.0, 191.0, 0.0, 115.0, 0.0, 62.0, 0.0, 0.0, 28.0, 0.0, 14.0, 0.0, 9.0, 0.0, 4.0, 0.0, 5.0], "bins": [-9.5367431640625e-07, -9.266659617424011e-07, -8.996576070785522e-07, -8.726492524147034e-07, -8.456408977508545e-07, -8.186325430870056e-07, -7.916241884231567e-07, -7.646158337593079e-07, -7.37607479095459e-07, -7.105991244316101e-07, -6.835907697677612e-07, -6.565824151039124e-07, -6.295740604400635e-07, -6.025657057762146e-07, -5.755573511123657e-07, -5.485489964485168e-07, -5.21540641784668e-07, -4.945322871208191e-07, -4.675239324569702e-07, -4.4051557779312134e-07, -4.1350722312927246e-07, -3.864988684654236e-07, -3.594905138015747e-07, -3.3248215913772583e-07, -3.0547380447387695e-07, -2.784654498100281e-07, -2.514570951461792e-07, -2.2444874048233032e-07, -1.9744038581848145e-07, -1.7043203115463257e-07, -1.434236764907837e-07, -1.1641532182693481e-07, -8.940696716308594e-08, -6.239861249923706e-08, -3.5390257835388184e-08, -8.381903171539307e-09, 1.862645149230957e-08, 4.563480615615845e-08, 7.264316082000732e-08, 9.96515154838562e-08, 1.2665987014770508e-07, 1.5366822481155396e-07, 1.8067657947540283e-07, 2.076849341392517e-07, 2.3469328880310059e-07, 2.6170164346694946e-07, 2.8870999813079834e-07, 3.157183527946472e-07, 3.427267074584961e-07, 3.6973506212234497e-07, 3.9674341678619385e-07, 4.237517714500427e-07, 4.507601261138916e-07, 4.777684807777405e-07, 5.047768354415894e-07, 5.317851901054382e-07, 5.587935447692871e-07, 5.85801899433136e-07, 6.128102540969849e-07, 6.398186087608337e-07, 6.668269634246826e-07, 6.938353180885315e-07, 7.208436727523804e-07, 7.478520274162292e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [276.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3596.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15101.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1010546.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15234.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3554.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 269.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 954.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 14.0, 12.0, 24.0, 30.0, 37.0, 40.0, 70.0, 102.0, 181.0, 178.0, 69.0, 52.0, 43.0, 29.0, 20.0, 14.0, 13.0, 15.0, 8.0, 8.0, 9.0, 2.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1247977454331703e-05, -1.075767522706883e-05, -1.0267372999805957e-05, -9.777070772543084e-06, -9.28676854528021e-06, -8.796466318017337e-06, -8.306164090754464e-06, -7.815862772986293e-06, -7.325560090976069e-06, -6.8352578637131955e-06, -6.344955636450322e-06, -5.8546538639348e-06, -5.364351636671927e-06, -4.874049409409054e-06, -4.38374718214618e-06, -3.893444954883307e-06, -3.403142727620434e-06, -2.912840500357561e-06, -2.4225382730946876e-06, -1.93223627320549e-06, -1.4419340459426166e-06, -9.516318186797434e-07, -4.613298187905457e-07, 2.8972408472327515e-08, 5.192746357352007e-07, 1.009576862998074e-06, 1.4998789765741094e-06, 1.990181090150145e-06, 2.480483317413018e-06, 2.9707855446758913e-06, 3.461087544565089e-06, 3.951389771827962e-06, 4.4416919990908355e-06, 4.931994226353709e-06, 5.422296453616582e-06, 5.912598680879455e-06, 6.402900908142328e-06, 6.8932031354052015e-06, 7.383504907920724e-06, 7.873806680436246e-06, 8.364109817193821e-06, 8.854412044456694e-06, 9.344714271719567e-06, 9.83501649898244e-06, 1.0325318726245314e-05, 1.0815620953508187e-05, 1.130592318077106e-05, 1.1796224498539232e-05, 1.2286526725802105e-05, 1.2776828953064978e-05, 1.3267131180327851e-05, 1.3757433407590725e-05, 1.4247735634853598e-05, 1.4738037862116471e-05, 1.5228339179884642e-05, 1.5718642316642217e-05, 1.620894363441039e-05, 1.669924495217856e-05, 1.7189548088936135e-05, 1.7679849406704307e-05, 1.817015254346188e-05, 1.8660453861230053e-05, 1.9150756997987628e-05, 1.96410583157558e-05, 2.0131361452513374e-05]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 7.0, 9.0, 5.0, 6.0, 17.0, 10.0, 12.0, 13.0, 24.0, 24.0, 18.0, 22.0, 23.0, 32.0, 28.0, 32.0, 40.0, 45.0, 33.0, 41.0, 42.0, 45.0, 46.0, 31.0, 50.0, 38.0, 32.0, 33.0, 28.0, 21.0, 22.0, 25.0, 24.0, 28.0, 15.0, 13.0, 19.0, 11.0, 9.0, 5.0, 4.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.646144695172552e-06, -7.392462975985836e-06, -7.1387812567991205e-06, -6.885099537612405e-06, -6.631417818425689e-06, -6.377736099238973e-06, -6.124054834799608e-06, -5.8703731156128924e-06, -5.616691396426177e-06, -5.363009677239461e-06, -5.109327958052745e-06, -4.855646238866029e-06, -4.601964974426664e-06, -4.348283255239949e-06, -4.094601536053233e-06, -3.840919816866517e-06, -3.5872380976798013e-06, -3.3335563784930855e-06, -3.0798746593063697e-06, -2.8261931674933294e-06, -2.5725114483066136e-06, -2.318829729119898e-06, -2.0651482373068575e-06, -1.8114665181201417e-06, -1.557784798933426e-06, -1.3041030797467101e-06, -1.050421474246832e-06, -7.967398119035352e-07, -5.430581495602382e-07, -2.8937643037352245e-07, -3.569482487364439e-08, 2.1798678062623367e-07, 4.7166849981294945e-07, 7.253501621562464e-07, 9.790318244995433e-07, 1.2327134299994214e-06, 1.4863951491861371e-06, 1.740076868372853e-06, 1.9937583601858933e-06, 2.247440079372609e-06, 2.501121798559325e-06, 2.7548035177460406e-06, 3.0084852369327564e-06, 3.2621667287457967e-06, 3.5158484479325125e-06, 3.7695301671192283e-06, 4.023211658932269e-06, 4.276893378118984e-06, 4.5305750973057e-06, 4.784256816492416e-06, 5.037938535679132e-06, 5.2916202548658475e-06, 5.545301974052563e-06, 5.798983693239279e-06, 6.052664957678644e-06, 6.30634667686536e-06, 6.5600283960520755e-06, 6.813710115238791e-06, 7.067391834425507e-06, 7.321073553612223e-06, 7.574754818051588e-06, 7.828436537238304e-06, 8.08211825642502e-06, 8.335799975611735e-06, 8.589481694798451e-06]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 3.0, 6.0, 30.0, 57.0, 57.0, 150.0, 216.0, 321.0, 577.0, 823.0, 1799.0, 2034.0, 3282.0, 4699.0, 7206.0, 10246.0, 16632.0, 34603.0, 43471.0, 68148.0, 109005.0, 173090.0, 298832.0, 492874.0, 1853004.0, 420142.0, 241283.0, 141664.0, 91988.0, 58728.0, 38404.0, 31981.0, 15380.0, 10042.0, 7245.0, 4813.0, 3398.0, 2347.0, 2100.0, 988.0, 712.0, 524.0, 374.0, 305.0, 190.0, 183.0, 101.0, 58.0, 57.0, 33.0, 27.0, 24.0, 17.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.304813385009766e-06, -5.1176175475120544e-06, -4.930421710014343e-06, -4.743225872516632e-06, -4.556030035018921e-06, -4.36883419752121e-06, -4.1816383600234985e-06, -3.994442522525787e-06, -3.807246685028076e-06, -3.620050847530365e-06, -3.432855010032654e-06, -3.2456591725349426e-06, -3.0584633350372314e-06, -2.8712674975395203e-06, -2.684071660041809e-06, -2.496875822544098e-06, -2.3096799850463867e-06, -2.1224841475486755e-06, -1.9352883100509644e-06, -1.7480924725532532e-06, -1.560896635055542e-06, -1.3737007975578308e-06, -1.1865049600601196e-06, -9.993091225624084e-07, -8.121132850646973e-07, -6.249174475669861e-07, -4.377216100692749e-07, -2.505257725715637e-07, -6.332993507385254e-08, 1.2386590242385864e-07, 3.110617399215698e-07, 4.98257577419281e-07, 6.854534149169922e-07, 8.726492524147034e-07, 1.0598450899124146e-06, 1.2470409274101257e-06, 1.434236764907837e-06, 1.621432602405548e-06, 1.8086284399032593e-06, 1.9958242774009705e-06, 2.1830201148986816e-06, 2.370215952396393e-06, 2.557411789894104e-06, 2.744607627391815e-06, 2.9318034648895264e-06, 3.1189993023872375e-06, 3.3061951398849487e-06, 3.49339097738266e-06, 3.680586814880371e-06, 3.867782652378082e-06, 4.0549784898757935e-06, 4.242174327373505e-06, 4.429370164871216e-06, 4.616566002368927e-06, 4.803761839866638e-06, 4.990957677364349e-06, 5.1781535148620605e-06, 5.365349352359772e-06, 5.552545189857483e-06, 5.739741027355194e-06, 5.926936864852905e-06, 6.1141327023506165e-06, 6.301328539848328e-06, 6.488524377346039e-06, 6.67572021484375e-06]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 73.0, 0.0, 0.0, 0.0, 129.0, 0.0, 0.0, 142.0, 0.0, 0.0, 0.0, 162.0, 0.0, 0.0, 0.0, 146.0, 0.0, 0.0, 117.0, 0.0, 0.0, 0.0, 70.0, 0.0, 0.0, 47.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.76837158203125e-07, -4.600733518600464e-07, -4.4330954551696777e-07, -4.2654573917388916e-07, -4.0978193283081055e-07, -3.9301812648773193e-07, -3.762543201446533e-07, -3.594905138015747e-07, -3.427267074584961e-07, -3.259629011154175e-07, -3.0919909477233887e-07, -2.9243528842926025e-07, -2.7567148208618164e-07, -2.5890767574310303e-07, -2.421438694000244e-07, -2.253800630569458e-07, -2.086162567138672e-07, -1.9185245037078857e-07, -1.7508864402770996e-07, -1.5832483768463135e-07, -1.4156103134155273e-07, -1.2479722499847412e-07, -1.0803341865539551e-07, -9.12696123123169e-08, -7.450580596923828e-08, -5.774199962615967e-08, -4.0978193283081055e-08, -2.421438694000244e-08, -7.450580596923828e-09, 9.313225746154785e-09, 2.60770320892334e-08, 4.284083843231201e-08, 5.960464477539063e-08, 7.636845111846924e-08, 9.313225746154785e-08, 1.0989606380462646e-07, 1.2665987014770508e-07, 1.434236764907837e-07, 1.601874828338623e-07, 1.7695128917694092e-07, 1.9371509552001953e-07, 2.1047890186309814e-07, 2.2724270820617676e-07, 2.4400651454925537e-07, 2.60770320892334e-07, 2.775341272354126e-07, 2.942979335784912e-07, 3.110617399215698e-07, 3.2782554626464844e-07, 3.4458935260772705e-07, 3.6135315895080566e-07, 3.781169652938843e-07, 3.948807716369629e-07, 4.116445779800415e-07, 4.284083843231201e-07, 4.4517219066619873e-07, 4.6193599700927734e-07, 4.78699803352356e-07, 4.954636096954346e-07, 5.122274160385132e-07, 5.289912223815918e-07, 5.457550287246704e-07, 5.62518835067749e-07, 5.792826414108276e-07, 5.960464477539062e-07]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 10.0, 18.0, 39.0, 72.0, 176.0, 314.0, 823.0, 1719.0, 3948.0, 9304.0, 77986.0, 3756641.0, 320253.0, 15515.0, 3830.0, 1753.0, 906.0, 424.0, 215.0, 121.0, 55.0, 35.0, 21.0, 10.0, 8.0, 6.0, 2.0, 9.0, 6.0, 5.0, 7.0, 10.0, 4.0, 10.0, 5.0, 1.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2934207916259766e-05, -1.2275762856006622e-05, -1.1617317795753479e-05, -1.0958872735500336e-05, -1.0300427675247192e-05, -9.641982614994049e-06, -8.983537554740906e-06, -8.325092494487762e-06, -7.666647434234619e-06, -7.008202373981476e-06, -6.3497573137283325e-06, -5.691312253475189e-06, -5.032867193222046e-06, -4.374422132968903e-06, -3.7159770727157593e-06, -3.057532012462616e-06, -2.3990869522094727e-06, -1.7406418919563293e-06, -1.082196831703186e-06, -4.237517714500427e-07, 2.3469328880310059e-07, 8.931383490562439e-07, 1.5515834093093872e-06, 2.2100284695625305e-06, 2.868473529815674e-06, 3.526918590068817e-06, 4.1853636503219604e-06, 4.843808710575104e-06, 5.502253770828247e-06, 6.16069883108139e-06, 6.819143891334534e-06, 7.477588951587677e-06, 8.13603401184082e-06, 8.794479072093964e-06, 9.452924132347107e-06, 1.011136919260025e-05, 1.0769814252853394e-05, 1.1428259313106537e-05, 1.208670437335968e-05, 1.2745149433612823e-05, 1.3403594493865967e-05, 1.406203955411911e-05, 1.4720484614372253e-05, 1.5378929674625397e-05, 1.603737473487854e-05, 1.6695819795131683e-05, 1.7354264855384827e-05, 1.801270991563797e-05, 1.8671154975891113e-05, 1.9329600036144257e-05, 1.99880450963974e-05, 2.0646490156650543e-05, 2.1304935216903687e-05, 2.196338027715683e-05, 2.2621825337409973e-05, 2.3280270397663116e-05, 2.393871545791626e-05, 2.4597160518169403e-05, 2.5255605578422546e-05, 2.591405063867569e-05, 2.6572495698928833e-05, 2.7230940759181976e-05, 2.788938581943512e-05, 2.8547830879688263e-05, 2.9206275939941406e-05]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 9.0, 9.0, 12.0, 21.0, 27.0, 58.0, 116.0, 148.0, 231.0, 311.0, 417.0, 792.0, 543.0, 387.0, 332.0, 231.0, 166.0, 95.0, 61.0, 27.0, 20.0, 8.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.682209014892578e-06, -2.621673047542572e-06, -2.561137080192566e-06, -2.50060111284256e-06, -2.4400651454925537e-06, -2.3795291781425476e-06, -2.3189932107925415e-06, -2.2584572434425354e-06, -2.1979212760925293e-06, -2.137385308742523e-06, -2.076849341392517e-06, -2.016313374042511e-06, -1.955777406692505e-06, -1.8952414393424988e-06, -1.8347054719924927e-06, -1.7741695046424866e-06, -1.7136335372924805e-06, -1.6530975699424744e-06, -1.5925616025924683e-06, -1.5320256352424622e-06, -1.471489667892456e-06, -1.41095370054245e-06, -1.3504177331924438e-06, -1.2898817658424377e-06, -1.2293457984924316e-06, -1.1688098311424255e-06, -1.1082738637924194e-06, -1.0477378964424133e-06, -9.872019290924072e-07, -9.266659617424011e-07, -8.66129994392395e-07, -8.055940270423889e-07, -7.450580596923828e-07, -6.845220923423767e-07, -6.239861249923706e-07, -5.634501576423645e-07, -5.029141902923584e-07, -4.423782229423523e-07, -3.818422555923462e-07, -3.213062882423401e-07, -2.60770320892334e-07, -2.0023435354232788e-07, -1.3969838619232178e-07, -7.916241884231567e-08, -1.862645149230957e-08, 4.190951585769653e-08, 1.0244548320770264e-07, 1.6298145055770874e-07, 2.2351741790771484e-07, 2.8405338525772095e-07, 3.4458935260772705e-07, 4.0512531995773315e-07, 4.6566128730773926e-07, 5.261972546577454e-07, 5.867332220077515e-07, 6.472691893577576e-07, 7.078051567077637e-07, 7.683411240577698e-07, 8.288770914077759e-07, 8.89413058757782e-07, 9.499490261077881e-07, 1.0104849934577942e-06, 1.0710209608078003e-06, 1.1315569281578064e-06, 1.1920928955078125e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 8.0, 5.0, 14.0, 20.0, 40.0, 50.0, 81.0, 165.0, 230.0, 142.0, 83.0, 56.0, 38.0, 20.0, 13.0, 6.0, 6.0, 5.0, 3.0, 4.0, 7.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.492740572459297e-06, -4.2837941691686865e-06, -4.074848220625427e-06, -3.865901817334816e-06, -3.656955414044205e-06, -3.4480090107535943e-06, -3.239062834836659e-06, -3.0301166589197237e-06, -2.821170255629113e-06, -2.612223852338502e-06, -2.403277676421567e-06, -2.1943315005046315e-06, -1.985385097214021e-06, -1.7764388076102477e-06, -1.5674925180064747e-06, -1.3585462284027017e-06, -1.1495999387989286e-06, -9.406536491951556e-07, -7.317073595913826e-07, -5.227610699876095e-07, -3.138147803838365e-07, -1.0486849078006344e-07, 1.040777988237096e-07, 3.1302408842748264e-07, 5.219703780312557e-07, 7.309166676350287e-07, 9.398629572388018e-07, 1.1488092468425748e-06, 1.3577555364463478e-06, 1.5667018260501209e-06, 1.775648115653894e-06, 1.9845942915708292e-06, 2.193540240114089e-06, 2.4024866434047e-06, 2.611432819321635e-06, 2.8203789952385705e-06, 3.0293253985291813e-06, 3.238271801819792e-06, 3.4472179777367273e-06, 3.6561641536536627e-06, 3.865110556944273e-06, 4.074056960234884e-06, 4.283003363525495e-06, 4.491949312068755e-06, 4.7008957153593656e-06, 4.909842118649976e-06, 5.118788067193236e-06, 5.327734470483847e-06, 5.536680873774458e-06, 5.7456272770650685e-06, 5.954573680355679e-06, 6.163519628898939e-06, 6.37246603218955e-06, 6.581412435480161e-06, 6.7903583840234205e-06, 6.999304787314031e-06, 7.208251190604642e-06, 7.417197593895253e-06, 7.6261439971858636e-06, 7.835090400476474e-06, 8.044036803767085e-06, 8.252982297562994e-06, 8.461928700853605e-06, 8.670875104144216e-06, 8.879821507434826e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 11.0, 3.0, 8.0, 15.0, 10.0, 17.0, 15.0, 20.0, 27.0, 28.0, 19.0, 29.0, 48.0, 41.0, 49.0, 34.0, 35.0, 46.0, 43.0, 45.0, 42.0, 55.0, 42.0, 40.0, 43.0, 53.0, 37.0, 14.0, 34.0, 14.0, 16.0, 21.0, 11.0, 14.0, 8.0, 6.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6994071049557533e-06, -2.6072709715663223e-06, -2.515134838176891e-06, -2.42299870478746e-06, -2.330862571398029e-06, -2.238726438008598e-06, -2.146590304619167e-06, -2.0544543986034114e-06, -1.962318037840305e-06, -1.8701819044508738e-06, -1.7780457710614428e-06, -1.6859096376720117e-06, -1.5937735042825807e-06, -1.5016373708931496e-06, -1.4095013511905563e-06, -1.3173652178011253e-06, -1.225229198098532e-06, -1.1330930647091009e-06, -1.0409569313196698e-06, -9.488208547736576e-07, -8.566847213842266e-07, -7.645485879947955e-07, -6.724125114487833e-07, -5.802763780593523e-07, -4.881402446699212e-07, -3.960041112804902e-07, -3.0386800631276856e-07, -2.1173190134504694e-07, -1.1959576795561588e-07, -2.7459634566184832e-08, 6.467644197982736e-08, 1.568125753692584e-07, 2.4894870875868946e-07, 3.410848421481205e-07, 4.3322094711584214e-07, 5.253570520835638e-07, 6.174931854729948e-07, 7.096293188624259e-07, 8.017653954084381e-07, 8.939015287978691e-07, 9.860376621873002e-07, 1.0781737955767312e-06, 1.1703099289661623e-06, 1.2624459486687556e-06, 1.3545820820581866e-06, 1.4467182154476177e-06, 1.5388543488370487e-06, 1.6309904822264798e-06, 1.7231266156159109e-06, 1.815262749005342e-06, 1.907398882394773e-06, 1.999535015784204e-06, 2.091671149173635e-06, 2.183807282563066e-06, 2.2759431885788217e-06, 2.3680795493419282e-06, 2.460215455357684e-06, 2.552351588747115e-06, 2.644487722136546e-06, 2.736623855525977e-06, 2.828759988915408e-06, 2.920896122304839e-06, 3.01303225569427e-06, 3.1051681617100257e-06, 3.1973045224731322e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 13.0, 10.0, 26.0, 19.0, 52.0, 39.0, 117.0, 101.0, 282.0, 208.0, 669.0, 591.0, 1958.0, 1579.0, 5515.0, 4965.0, 18813.0, 17830.0, 80913.0, 91581.0, 426453.0, 171229.0, 143041.0, 29407.0, 29372.0, 7495.0, 8373.0, 2313.0, 2708.0, 784.0, 960.0, 324.0, 362.0, 112.0, 154.0, 38.0, 56.0, 22.0, 30.0, 7.0, 10.0, 5.0, 8.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.9206275939941406e-06, -2.8312206268310547e-06, -2.7418136596679688e-06, -2.652406692504883e-06, -2.562999725341797e-06, -2.473592758178711e-06, -2.384185791015625e-06, -2.294778823852539e-06, -2.205371856689453e-06, -2.115964889526367e-06, -2.0265579223632812e-06, -1.9371509552001953e-06, -1.8477439880371094e-06, -1.7583370208740234e-06, -1.6689300537109375e-06, -1.5795230865478516e-06, -1.4901161193847656e-06, -1.4007091522216797e-06, -1.3113021850585938e-06, -1.2218952178955078e-06, -1.1324882507324219e-06, -1.043081283569336e-06, -9.5367431640625e-07, -8.642673492431641e-07, -7.748603820800781e-07, -6.854534149169922e-07, -5.960464477539062e-07, -5.066394805908203e-07, -4.172325134277344e-07, -3.2782554626464844e-07, -2.384185791015625e-07, -1.4901161193847656e-07, -5.960464477539063e-08, 2.9802322387695312e-08, 1.1920928955078125e-07, 2.086162567138672e-07, 2.980232238769531e-07, 3.8743019104003906e-07, 4.76837158203125e-07, 5.662441253662109e-07, 6.556510925292969e-07, 7.450580596923828e-07, 8.344650268554688e-07, 9.238719940185547e-07, 1.0132789611816406e-06, 1.1026859283447266e-06, 1.1920928955078125e-06, 1.2814998626708984e-06, 1.3709068298339844e-06, 1.4603137969970703e-06, 1.5497207641601562e-06, 1.6391277313232422e-06, 1.7285346984863281e-06, 1.817941665649414e-06, 1.9073486328125e-06, 1.996755599975586e-06, 2.086162567138672e-06, 2.175569534301758e-06, 2.2649765014648438e-06, 2.3543834686279297e-06, 2.4437904357910156e-06, 2.5331974029541016e-06, 2.6226043701171875e-06, 2.7120113372802734e-06, 2.8014183044433594e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 6.0, 5.0, 3.0, 10.0, 12.0, 5.0, 17.0, 27.0, 13.0, 25.0, 35.0, 18.0, 36.0, 64.0, 29.0, 62.0, 53.0, 53.0, 36.0, 59.0, 52.0, 30.0, 58.0, 58.0, 25.0, 50.0, 40.0, 14.0, 27.0, 22.0, 8.0, 18.0, 11.0, 9.0, 3.0, 6.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-06, -3.475695848464966e-06, -3.375113010406494e-06, -3.2745301723480225e-06, -3.1739473342895508e-06, -3.073364496231079e-06, -2.9727816581726074e-06, -2.8721988201141357e-06, -2.771615982055664e-06, -2.6710331439971924e-06, -2.5704503059387207e-06, -2.469867467880249e-06, -2.3692846298217773e-06, -2.2687017917633057e-06, -2.168118953704834e-06, -2.0675361156463623e-06, -1.9669532775878906e-06, -1.866370439529419e-06, -1.7657876014709473e-06, -1.6652047634124756e-06, -1.564621925354004e-06, -1.4640390872955322e-06, -1.3634562492370605e-06, -1.2628734111785889e-06, -1.1622905731201172e-06, -1.0617077350616455e-06, -9.611248970031738e-07, -8.605420589447021e-07, -7.599592208862305e-07, -6.593763828277588e-07, -5.587935447692871e-07, -4.5821070671081543e-07, -3.5762786865234375e-07, -2.5704503059387207e-07, -1.564621925354004e-07, -5.587935447692871e-08, 4.470348358154297e-08, 1.4528632164001465e-07, 2.4586915969848633e-07, 3.46451997756958e-07, 4.470348358154297e-07, 5.476176738739014e-07, 6.48200511932373e-07, 7.487833499908447e-07, 8.493661880493164e-07, 9.499490261077881e-07, 1.0505318641662598e-06, 1.1511147022247314e-06, 1.2516975402832031e-06, 1.3522803783416748e-06, 1.4528632164001465e-06, 1.5534460544586182e-06, 1.6540288925170898e-06, 1.7546117305755615e-06, 1.8551945686340332e-06, 1.955777406692505e-06, 2.0563602447509766e-06, 2.1569430828094482e-06, 2.25752592086792e-06, 2.3581087589263916e-06, 2.4586915969848633e-06, 2.559274435043335e-06, 2.6598572731018066e-06, 2.7604401111602783e-06, 2.86102294921875e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 8.0, 1.0, 4.0, 7.0, 8.0, 15.0, 15.0, 20.0, 18.0, 58.0, 47.0, 54.0, 90.0, 95.0, 282.0, 229.0, 290.0, 414.0, 1323.0, 1089.0, 1440.0, 2218.0, 3342.0, 14647.0, 17370.0, 37586.0, 104746.0, 677552.0, 142502.0, 17233.0, 9301.0, 5366.0, 5603.0, 1529.0, 1067.0, 755.0, 576.0, 697.0, 219.0, 166.0, 124.0, 171.0, 75.0, 45.0, 32.0, 27.0, 42.0, 15.0, 11.0, 14.0, 12.0, 7.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.1923333406448364e-06, -2.119690179824829e-06, -2.0470470190048218e-06, -1.9744038581848145e-06, -1.9017606973648071e-06, -1.8291175365447998e-06, -1.7564743757247925e-06, -1.6838312149047852e-06, -1.6111880540847778e-06, -1.5385448932647705e-06, -1.4659017324447632e-06, -1.3932585716247559e-06, -1.3206154108047485e-06, -1.2479722499847412e-06, -1.1753290891647339e-06, -1.1026859283447266e-06, -1.0300427675247192e-06, -9.57399606704712e-07, -8.847564458847046e-07, -8.121132850646973e-07, -7.394701242446899e-07, -6.668269634246826e-07, -5.941838026046753e-07, -5.21540641784668e-07, -4.4889748096466064e-07, -3.762543201446533e-07, -3.03611159324646e-07, -2.3096799850463867e-07, -1.5832483768463135e-07, -8.568167686462402e-08, -1.30385160446167e-08, 5.960464477539063e-08, 1.3224780559539795e-07, 2.0489096641540527e-07, 2.775341272354126e-07, 3.501772880554199e-07, 4.2282044887542725e-07, 4.954636096954346e-07, 5.681067705154419e-07, 6.407499313354492e-07, 7.133930921554565e-07, 7.860362529754639e-07, 8.586794137954712e-07, 9.313225746154785e-07, 1.0039657354354858e-06, 1.0766088962554932e-06, 1.1492520570755005e-06, 1.2218952178955078e-06, 1.2945383787155151e-06, 1.3671815395355225e-06, 1.4398247003555298e-06, 1.5124678611755371e-06, 1.5851110219955444e-06, 1.6577541828155518e-06, 1.730397343635559e-06, 1.8030405044555664e-06, 1.8756836652755737e-06, 1.948326826095581e-06, 2.0209699869155884e-06, 2.0936131477355957e-06, 2.166256308555603e-06, 2.2388994693756104e-06, 2.3115426301956177e-06, 2.384185791015625e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 8.0, 5.0, 0.0, 7.0, 8.0, 0.0, 10.0, 18.0, 0.0, 18.0, 17.0, 0.0, 27.0, 38.0, 0.0, 33.0, 55.0, 0.0, 50.0, 0.0, 401.0, 48.0, 0.0, 62.0, 45.0, 0.0, 32.0, 29.0, 0.0, 18.0, 14.0, 0.0, 16.0, 16.0, 0.0, 8.0, 8.0, 0.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2516975402832031e-06, -1.212581992149353e-06, -1.173466444015503e-06, -1.1343508958816528e-06, -1.0952353477478027e-06, -1.0561197996139526e-06, -1.0170042514801025e-06, -9.778887033462524e-07, -9.387731552124023e-07, -8.996576070785522e-07, -8.605420589447021e-07, -8.21426510810852e-07, -7.82310962677002e-07, -7.431954145431519e-07, -7.040798664093018e-07, -6.649643182754517e-07, -6.258487701416016e-07, -5.867332220077515e-07, -5.476176738739014e-07, -5.085021257400513e-07, -4.6938657760620117e-07, -4.302710294723511e-07, -3.91155481338501e-07, -3.520399332046509e-07, -3.129243850708008e-07, -2.738088369369507e-07, -2.3469328880310059e-07, -1.955777406692505e-07, -1.564621925354004e-07, -1.1734664440155029e-07, -7.82310962677002e-08, -3.91155481338501e-08, 0.0, 3.91155481338501e-08, 7.82310962677002e-08, 1.1734664440155029e-07, 1.564621925354004e-07, 1.955777406692505e-07, 2.3469328880310059e-07, 2.738088369369507e-07, 3.129243850708008e-07, 3.520399332046509e-07, 3.91155481338501e-07, 4.302710294723511e-07, 4.6938657760620117e-07, 5.085021257400513e-07, 5.476176738739014e-07, 5.867332220077515e-07, 6.258487701416016e-07, 6.649643182754517e-07, 7.040798664093018e-07, 7.431954145431519e-07, 7.82310962677002e-07, 8.21426510810852e-07, 8.605420589447021e-07, 8.996576070785522e-07, 9.387731552124023e-07, 9.778887033462524e-07, 1.0170042514801025e-06, 1.0561197996139526e-06, 1.0952353477478027e-06, 1.1343508958816528e-06, 1.173466444015503e-06, 1.212581992149353e-06, 1.2516975402832031e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 7.0, 5.0, 1.0, 4.0, 5.0, 7.0, 13.0, 13.0, 16.0, 19.0, 28.0, 35.0, 60.0, 68.0, 104.0, 166.0, 130.0, 86.0, 50.0, 50.0, 30.0, 30.0, 18.0, 10.0, 8.0, 7.0, 8.0, 2.0, 1.0, 7.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.668039309763117e-06, -4.534388153842883e-06, -4.40073699792265e-06, -4.267085842002416e-06, -4.1334346860821825e-06, -3.999783530161949e-06, -3.866132374241715e-06, -3.7324809909478063e-06, -3.5988298350275727e-06, -3.465178679107339e-06, -3.3315275231871055e-06, -3.197876367266872e-06, -3.064224983972963e-06, -2.9305738280527294e-06, -2.796922672132496e-06, -2.6632715162122622e-06, -2.5296203602920286e-06, -2.395969204371795e-06, -2.2623180484515615e-06, -2.128666892531328e-06, -1.9950157366110943e-06, -1.861364467004023e-06, -1.7277131973969517e-06, -1.5940620414767182e-06, -1.4604108855564846e-06, -1.326759729636251e-06, -1.1931085737160174e-06, -1.0594573041089461e-06, -9.258061481887125e-07, -7.92154992268479e-07, -6.585037795048265e-07, -5.248525667411741e-07, -3.912009560735896e-07, -2.575497717316466e-07, -1.238985873897036e-07, 9.7525969522394e-09, 1.434037812941824e-07, 2.77054937214416e-07, 4.107061499780684e-07, 5.443573627417209e-07, 6.780085186619544e-07, 8.11659674582188e-07, 9.453108873458405e-07, 1.078962100109493e-06, 1.2126132560297265e-06, 1.34626441194996e-06, 1.4799156815570313e-06, 1.613566837477265e-06, 1.7472179933974985e-06, 1.880869149317732e-06, 2.0145203052379657e-06, 2.1481714611581992e-06, 2.281822617078433e-06, 2.4154737729986664e-06, 2.5491251562925754e-06, 2.682776312212809e-06, 2.8164274681330426e-06, 2.950078624053276e-06, 3.0837297799735097e-06, 3.2173809358937433e-06, 3.3510323191876523e-06, 3.484683475107886e-06, 3.6183346310281195e-06, 3.751985786948353e-06, 3.885636942868587e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 5.0, 8.0, 8.0, 15.0, 11.0, 18.0, 21.0, 27.0, 23.0, 22.0, 36.0, 36.0, 42.0, 45.0, 39.0, 37.0, 41.0, 48.0, 43.0, 50.0, 45.0, 46.0, 42.0, 43.0, 52.0, 38.0, 18.0, 33.0, 20.0, 13.0, 20.0, 10.0, 14.0, 11.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6794045879796613e-06, -2.5894087229971774e-06, -2.499412630641018e-06, -2.409416765658534e-06, -2.3194206733023748e-06, -2.229424808319891e-06, -2.139428943337407e-06, -2.049433078354923e-06, -1.9594369859987637e-06, -1.869441007329442e-06, -1.7794450286601204e-06, -1.6894491636776365e-06, -1.599453185008315e-06, -1.5094572063389933e-06, -1.4194613413565094e-06, -1.3294653626871877e-06, -1.239469384017866e-06, -1.1494734053485445e-06, -1.0594774266792228e-06, -9.69481561696739e-07, -8.794855830274173e-07, -7.894896043580957e-07, -6.994936825321929e-07, -6.094977607062901e-07, -5.195017820369685e-07, -4.295058317893563e-07, -3.395098815417441e-07, -2.495139312941319e-07, -1.595179810465197e-07, -6.952203079890751e-08, 2.047391944870469e-08, 1.1046984127460746e-07, 2.0046559257025365e-07, 2.9046154281786585e-07, 3.8045749306547805e-07, 4.7045344331309025e-07, 5.604493935607024e-07, 6.504453722300241e-07, 7.404412940559268e-07, 8.304372158818296e-07, 9.204331945511512e-07, 1.0104291732204729e-06, 1.1004251518897945e-06, 1.1904210168722784e-06, 1.2804169955416e-06, 1.3704129742109217e-06, 1.4604088391934056e-06, 1.5504048178627272e-06, 1.6404007965320488e-06, 1.7303967752013705e-06, 1.820392753870692e-06, 1.910388618853176e-06, 2.00038448383566e-06, 2.0903805761918193e-06, 2.180376441174303e-06, 2.2703725335304625e-06, 2.3603683985129464e-06, 2.4503642634954304e-06, 2.5403603558515897e-06, 2.6303562208340736e-06, 2.720352313190233e-06, 2.810348178172717e-06, 2.9003440431552008e-06, 2.9903399081376847e-06, 3.080336000493844e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 8.0, 3.0, 12.0, 19.0, 20.0, 26.0, 35.0, 64.0, 110.0, 159.0, 237.0, 296.0, 567.0, 905.0, 1530.0, 2724.0, 5276.0, 11710.0, 28441.0, 80488.0, 328217.0, 429401.0, 97996.0, 33278.0, 13510.0, 6139.0, 3092.0, 1662.0, 936.0, 553.0, 314.0, 282.0, 157.0, 130.0, 71.0, 58.0, 36.0, 25.0, 19.0, 16.0, 10.0, 5.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1444091796875e-05, -1.1086463928222656e-05, -1.0728836059570312e-05, -1.0371208190917969e-05, -1.0013580322265625e-05, -9.655952453613281e-06, -9.298324584960938e-06, -8.940696716308594e-06, -8.58306884765625e-06, -8.225440979003906e-06, -7.867813110351562e-06, -7.510185241699219e-06, -7.152557373046875e-06, -6.794929504394531e-06, -6.4373016357421875e-06, -6.079673767089844e-06, -5.7220458984375e-06, -5.364418029785156e-06, -5.0067901611328125e-06, -4.649162292480469e-06, -4.291534423828125e-06, -3.933906555175781e-06, -3.5762786865234375e-06, -3.2186508178710938e-06, -2.86102294921875e-06, -2.5033950805664062e-06, -2.1457672119140625e-06, -1.7881393432617188e-06, -1.430511474609375e-06, -1.0728836059570312e-06, -7.152557373046875e-07, -3.5762786865234375e-07, 0.0, 3.5762786865234375e-07, 7.152557373046875e-07, 1.0728836059570312e-06, 1.430511474609375e-06, 1.7881393432617188e-06, 2.1457672119140625e-06, 2.5033950805664062e-06, 2.86102294921875e-06, 3.2186508178710938e-06, 3.5762786865234375e-06, 3.933906555175781e-06, 4.291534423828125e-06, 4.649162292480469e-06, 5.0067901611328125e-06, 5.364418029785156e-06, 5.7220458984375e-06, 6.079673767089844e-06, 6.4373016357421875e-06, 6.794929504394531e-06, 7.152557373046875e-06, 7.510185241699219e-06, 7.867813110351562e-06, 8.225440979003906e-06, 8.58306884765625e-06, 8.940696716308594e-06, 9.298324584960938e-06, 9.655952453613281e-06, 1.0013580322265625e-05, 1.0371208190917969e-05, 1.0728836059570312e-05, 1.1086463928222656e-05, 1.1444091796875e-05]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 5.0, 5.0, 4.0, 0.0, 14.0, 16.0, 0.0, 16.0, 27.0, 0.0, 34.0, 34.0, 0.0, 51.0, 57.0, 0.0, 59.0, 55.0, 66.0, 0.0, 68.0, 64.0, 0.0, 85.0, 70.0, 0.0, 83.0, 51.0, 0.0, 28.0, 28.0, 0.0, 22.0, 21.0, 22.0, 0.0, 11.0, 6.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4491379261016846e-06, -1.4081597328186035e-06, -1.3671815395355225e-06, -1.3262033462524414e-06, -1.2852251529693604e-06, -1.2442469596862793e-06, -1.2032687664031982e-06, -1.1622905731201172e-06, -1.1213123798370361e-06, -1.080334186553955e-06, -1.039355993270874e-06, -9.98377799987793e-07, -9.57399606704712e-07, -9.164214134216309e-07, -8.754432201385498e-07, -8.344650268554688e-07, -7.934868335723877e-07, -7.525086402893066e-07, -7.115304470062256e-07, -6.705522537231445e-07, -6.295740604400635e-07, -5.885958671569824e-07, -5.476176738739014e-07, -5.066394805908203e-07, -4.6566128730773926e-07, -4.246830940246582e-07, -3.8370490074157715e-07, -3.427267074584961e-07, -3.0174851417541504e-07, -2.60770320892334e-07, -2.1979212760925293e-07, -1.7881393432617188e-07, -1.3783574104309082e-07, -9.685754776000977e-08, -5.587935447692871e-08, -1.4901161193847656e-08, 2.60770320892334e-08, 6.705522537231445e-08, 1.0803341865539551e-07, 1.4901161193847656e-07, 1.8998980522155762e-07, 2.3096799850463867e-07, 2.7194619178771973e-07, 3.129243850708008e-07, 3.5390257835388184e-07, 3.948807716369629e-07, 4.3585896492004395e-07, 4.76837158203125e-07, 5.178153514862061e-07, 5.587935447692871e-07, 5.997717380523682e-07, 6.407499313354492e-07, 6.817281246185303e-07, 7.227063179016113e-07, 7.636845111846924e-07, 8.046627044677734e-07, 8.456408977508545e-07, 8.866190910339355e-07, 9.275972843170166e-07, 9.685754776000977e-07, 1.0095536708831787e-06, 1.0505318641662598e-06, 1.0915100574493408e-06, 1.1324882507324219e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 7.0, 9.0, 11.0, 12.0, 28.0, 39.0, 68.0, 53.0, 146.0, 214.0, 341.0, 662.0, 666.0, 1586.0, 2997.0, 5435.0, 6370.0, 17104.0, 36337.0, 85269.0, 261684.0, 341880.0, 167725.0, 63426.0, 27895.0, 10122.0, 8591.0, 4405.0, 2366.0, 1333.0, 505.0, 460.0, 298.0, 187.0, 102.0, 44.0, 48.0, 37.0, 29.0, 14.0, 17.0, 10.0, 6.0, 4.0, 4.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5299530029296875e-06, -4.364177584648132e-06, -4.198402166366577e-06, -4.032626748085022e-06, -3.866851329803467e-06, -3.7010759115219116e-06, -3.5353004932403564e-06, -3.3695250749588013e-06, -3.203749656677246e-06, -3.037974238395691e-06, -2.8721988201141357e-06, -2.7064234018325806e-06, -2.5406479835510254e-06, -2.3748725652694702e-06, -2.209097146987915e-06, -2.04332172870636e-06, -1.8775463104248047e-06, -1.7117708921432495e-06, -1.5459954738616943e-06, -1.3802200555801392e-06, -1.214444637298584e-06, -1.0486692190170288e-06, -8.828938007354736e-07, -7.171183824539185e-07, -5.513429641723633e-07, -3.855675458908081e-07, -2.1979212760925293e-07, -5.4016709327697754e-08, 1.1175870895385742e-07, 2.775341272354126e-07, 4.4330954551696777e-07, 6.09084963798523e-07, 7.748603820800781e-07, 9.406358003616333e-07, 1.1064112186431885e-06, 1.2721866369247437e-06, 1.4379620552062988e-06, 1.603737473487854e-06, 1.7695128917694092e-06, 1.9352883100509644e-06, 2.1010637283325195e-06, 2.2668391466140747e-06, 2.43261456489563e-06, 2.598389983177185e-06, 2.7641654014587402e-06, 2.9299408197402954e-06, 3.0957162380218506e-06, 3.2614916563034058e-06, 3.427267074584961e-06, 3.593042492866516e-06, 3.7588179111480713e-06, 3.9245933294296265e-06, 4.090368747711182e-06, 4.256144165992737e-06, 4.421919584274292e-06, 4.587695002555847e-06, 4.753470420837402e-06, 4.9192458391189575e-06, 5.085021257400513e-06, 5.250796675682068e-06, 5.416572093963623e-06, 5.582347512245178e-06, 5.748122930526733e-06, 5.9138983488082886e-06, 6.079673767089844e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 9.0, 5.0, 10.0, 0.0, 13.0, 21.0, 21.0, 0.0, 21.0, 43.0, 54.0, 0.0, 62.0, 74.0, 66.0, 0.0, 87.0, 79.0, 78.0, 0.0, 79.0, 60.0, 48.0, 0.0, 50.0, 28.0, 36.0, 0.0, 23.0, 11.0, 14.0, 0.0, 4.0, 4.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1324882507324219e-06, -1.087784767150879e-06, -1.043081283569336e-06, -9.98377799987793e-07, -9.5367431640625e-07, -9.08970832824707e-07, -8.642673492431641e-07, -8.195638656616211e-07, -7.748603820800781e-07, -7.301568984985352e-07, -6.854534149169922e-07, -6.407499313354492e-07, -5.960464477539062e-07, -5.513429641723633e-07, -5.066394805908203e-07, -4.6193599700927734e-07, -4.172325134277344e-07, -3.725290298461914e-07, -3.2782554626464844e-07, -2.8312206268310547e-07, -2.384185791015625e-07, -1.9371509552001953e-07, -1.4901161193847656e-07, -1.043081283569336e-07, -5.960464477539063e-08, -1.4901161193847656e-08, 2.9802322387695312e-08, 7.450580596923828e-08, 1.1920928955078125e-07, 1.6391277313232422e-07, 2.086162567138672e-07, 2.5331974029541016e-07, 2.980232238769531e-07, 3.427267074584961e-07, 3.8743019104003906e-07, 4.3213367462158203e-07, 4.76837158203125e-07, 5.21540641784668e-07, 5.662441253662109e-07, 6.109476089477539e-07, 6.556510925292969e-07, 7.003545761108398e-07, 7.450580596923828e-07, 7.897615432739258e-07, 8.344650268554688e-07, 8.791685104370117e-07, 9.238719940185547e-07, 9.685754776000977e-07, 1.0132789611816406e-06, 1.0579824447631836e-06, 1.1026859283447266e-06, 1.1473894119262695e-06, 1.1920928955078125e-06, 1.2367963790893555e-06, 1.2814998626708984e-06, 1.3262033462524414e-06, 1.3709068298339844e-06, 1.4156103134155273e-06, 1.4603137969970703e-06, 1.5050172805786133e-06, 1.5497207641601562e-06, 1.5944242477416992e-06, 1.6391277313232422e-06, 1.6838312149047852e-06, 1.7285346984863281e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 9.0, 8.0, 17.0, 17.0, 35.0, 48.0, 55.0, 111.0, 175.0, 204.0, 102.0, 55.0, 40.0, 28.0, 18.0, 17.0, 9.0, 8.0, 9.0, 7.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.019874268124113e-06, -3.92413858207874e-06, -3.828402896033367e-06, -3.732666982614319e-06, -3.6369310691952705e-06, -3.5411953831498977e-06, -3.445459697104525e-06, -3.3497237836854765e-06, -3.2539880976401037e-06, -3.158252411594731e-06, -3.0625164981756825e-06, -2.9667808121303096e-06, -2.8710448987112613e-06, -2.7753092126658885e-06, -2.67957329924684e-06, -2.5838376132014673e-06, -2.4881019271560945e-06, -2.3923662411107216e-06, -2.2966303276916733e-06, -2.2008946416463004e-06, -2.105158728227252e-06, -2.0094230421818793e-06, -1.9136873561365064e-06, -1.8179514427174581e-06, -1.7222155292984098e-06, -1.6264797295661992e-06, -1.5307439298339887e-06, -1.4350082437886158e-06, -1.3392724440564052e-06, -1.2435366443241946e-06, -1.147800844591984e-06, -1.0520650448597735e-06, -9.563293588144006e-07, -8.6059355908219e-07, -7.648578161933983e-07, -6.691220164611877e-07, -5.73386273572396e-07, -4.776504738401854e-07, -3.8191467410797486e-07, -2.8617893121918314e-07, -1.9044313148697256e-07, -9.470735307104405e-08, 1.0284253448844538e-09, 9.676421086624032e-08, 1.9249998217674147e-07, 2.882357534872426e-07, 3.839715532194532e-07, 4.797072961082449e-07, 5.754430958404555e-07, 6.711788955726661e-07, 7.669146384614578e-07, 8.626504381936684e-07, 9.5838618108246e-07, 1.0541219808146707e-06, 1.1498577805468813e-06, 1.2455934665922541e-06, 1.3413293800113024e-06, 1.437065179743513e-06, 1.5328009794757236e-06, 1.6285366655210964e-06, 1.724272465253307e-06, 1.8200082649855176e-06, 1.915744178404566e-06, 2.0114798644499388e-06, 2.1072155504953116e-06]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 2.0, 5.0, 9.0, 8.0, 8.0, 7.0, 14.0, 14.0, 14.0, 27.0, 19.0, 33.0, 21.0, 29.0, 28.0, 38.0, 58.0, 54.0, 38.0, 48.0, 42.0, 47.0, 39.0, 49.0, 35.0, 40.0, 38.0, 26.0, 28.0, 25.0, 24.0, 22.0, 27.0, 12.0, 15.0, 13.0, 4.0, 13.0, 9.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3553559483625577e-06, -1.3104601066515897e-06, -1.265564151253784e-06, -1.2206683095428161e-06, -1.1757723541450105e-06, -1.1308765124340425e-06, -1.0859805570362369e-06, -1.041084715325269e-06, -9.96188873614301e-07, -9.512929750599142e-07, -9.063970765055274e-07, -8.615012347945594e-07, -8.166052793967538e-07, -7.717094376857858e-07, -7.26813539131399e-07, -6.819176405770122e-07, -6.370216851792065e-07, -5.921257866248197e-07, -5.472298880704329e-07, -5.02334046359465e-07, -4.5743811938336876e-07, -4.1254222082898195e-07, -3.676463506963046e-07, -3.227504521419178e-07, -2.7785455358753097e-07, -2.3295865503314417e-07, -1.8806277068961208e-07, -1.4316688634608e-07, -9.827098779169319e-08, -5.3375089237306383e-08, -8.47921910462901e-09, 3.6416679449757794e-08, 8.131246431730688e-08, 1.2620836287169368e-07, 1.7110424721522577e-07, 2.1600013155875786e-07, 2.6089603011314466e-07, 3.0579192866753147e-07, 3.5068779880020884e-07, 3.9558369735459564e-07, 4.4047959590898245e-07, 4.853754944633693e-07, 5.302713930177561e-07, 5.751672915721429e-07, 6.200631332831108e-07, 6.649590886809165e-07, 7.098549303918844e-07, 7.547508289462712e-07, 7.99646727500658e-07, 8.445426260550448e-07, 8.894385246094316e-07, 9.343343663203996e-07, 9.792303217182052e-07, 1.0241261634291732e-06, 1.0690221188269788e-06, 1.1139179605379468e-06, 1.1588138022489147e-06, 1.2037096439598827e-06, 1.2486055993576883e-06, 1.2935014410686563e-06, 1.338397396466462e-06, 1.3832932381774299e-06, 1.4281890798883978e-06, 1.4730850352862035e-06, 1.5179809906840092e-06]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 24.0, 0.0, 60.0, 0.0, 116.0, 0.0, 266.0, 0.0, 468.0, 790.0, 0.0, 1897.0, 0.0, 6505.0, 0.0, 20396.0, 0.0, 46701.0, 0.0, 69237.0, 0.0, 65587.0, 0.0, 54640.0, 0.0, 3687914.0, 48632.0, 0.0, 59345.0, 0.0, 62076.0, 0.0, 42126.0, 0.0, 18285.0, 0.0, 5809.0, 0.0, 1654.0, 0.0, 783.0, 454.0, 0.0, 275.0, 0.0, 139.0, 0.0, 71.0, 0.0, 29.0, 0.0, 9.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-1.0132789611816406e-06, -9.816139936447144e-07, -9.499490261077881e-07, -9.182840585708618e-07, -8.866190910339355e-07, -8.549541234970093e-07, -8.23289155960083e-07, -7.916241884231567e-07, -7.599592208862305e-07, -7.282942533493042e-07, -6.966292858123779e-07, -6.649643182754517e-07, -6.332993507385254e-07, -6.016343832015991e-07, -5.699694156646729e-07, -5.383044481277466e-07, -5.066394805908203e-07, -4.7497451305389404e-07, -4.4330954551696777e-07, -4.116445779800415e-07, -3.7997961044311523e-07, -3.4831464290618896e-07, -3.166496753692627e-07, -2.849847078323364e-07, -2.5331974029541016e-07, -2.2165477275848389e-07, -1.8998980522155762e-07, -1.5832483768463135e-07, -1.2665987014770508e-07, -9.499490261077881e-08, -6.332993507385254e-08, -3.166496753692627e-08, 0.0, 3.166496753692627e-08, 6.332993507385254e-08, 9.499490261077881e-08, 1.2665987014770508e-07, 1.5832483768463135e-07, 1.8998980522155762e-07, 2.2165477275848389e-07, 2.5331974029541016e-07, 2.849847078323364e-07, 3.166496753692627e-07, 3.4831464290618896e-07, 3.7997961044311523e-07, 4.116445779800415e-07, 4.4330954551696777e-07, 4.7497451305389404e-07, 5.066394805908203e-07, 5.383044481277466e-07, 5.699694156646729e-07, 6.016343832015991e-07, 6.332993507385254e-07, 6.649643182754517e-07, 6.966292858123779e-07, 7.282942533493042e-07, 7.599592208862305e-07, 7.916241884231567e-07, 8.23289155960083e-07, 8.549541234970093e-07, 8.866190910339355e-07, 9.182840585708618e-07, 9.499490261077881e-07, 9.816139936447144e-07, 1.0132789611816406e-06]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 891.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 252.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 28.0, 9.0, 29.0, 86.0, 476.0, 2875.0, 21611.0, 129870.0, 4013882.0, 21495.0, 2814.0, 435.0, 90.0, 32.0, 9.0, 26.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 121.0, 125.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0], "bins": [-2.2649765014648438e-06, -2.1941959857940674e-06, -2.123415470123291e-06, -2.0526349544525146e-06, -1.9818544387817383e-06, -1.911073923110962e-06, -1.8402934074401855e-06, -1.7695128917694092e-06, -1.6987323760986328e-06, -1.6279518604278564e-06, -1.55717134475708e-06, -1.4863908290863037e-06, -1.4156103134155273e-06, -1.344829797744751e-06, -1.2740492820739746e-06, -1.2032687664031982e-06, -1.1324882507324219e-06, -1.0617077350616455e-06, -9.909272193908691e-07, -9.201467037200928e-07, -8.493661880493164e-07, -7.7858567237854e-07, -7.078051567077637e-07, -6.370246410369873e-07, -5.662441253662109e-07, -4.954636096954346e-07, -4.246830940246582e-07, -3.5390257835388184e-07, -2.8312206268310547e-07, -2.123415470123291e-07, -1.4156103134155273e-07, -7.078051567077637e-08, 0.0, 7.078051567077637e-08, 1.4156103134155273e-07, 2.123415470123291e-07, 2.8312206268310547e-07, 3.5390257835388184e-07, 4.246830940246582e-07, 4.954636096954346e-07, 5.662441253662109e-07, 6.370246410369873e-07, 7.078051567077637e-07, 7.7858567237854e-07, 8.493661880493164e-07, 9.201467037200928e-07, 9.909272193908691e-07, 1.0617077350616455e-06, 1.1324882507324219e-06, 1.2032687664031982e-06, 1.2740492820739746e-06, 1.344829797744751e-06, 1.4156103134155273e-06, 1.4863908290863037e-06, 1.55717134475708e-06, 1.6279518604278564e-06, 1.6987323760986328e-06, 1.7695128917694092e-06, 1.8402934074401855e-06, 1.911073923110962e-06, 1.9818544387817383e-06, 2.0526349544525146e-06, 2.123415470123291e-06, 2.1941959857940674e-06, 2.2649765014648438e-06]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 281.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3518.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 280.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 5.0, 6.0, 7.0, 8.0, 10.0, 22.0, 24.0, 31.0, 58.0, 85.0, 143.0, 204.0, 138.0, 96.0, 42.0, 37.0, 13.0, 17.0, 9.0, 8.0, 8.0, 7.0, 11.0, 5.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0888630558602017e-07, -2.018031466377579e-07, -1.9472000190035033e-07, -1.8763684295208805e-07, -1.8055368400382577e-07, -1.734705392664182e-07, -1.6638738031815592e-07, -1.5930422136989364e-07, -1.5222107663248607e-07, -1.451379176842238e-07, -1.3805477294681623e-07, -1.3097161399855395e-07, -1.2388846926114638e-07, -1.168053103128841e-07, -1.0972215136462182e-07, -1.026389995217869e-07, -9.555584767895198e-08, -8.847269583611705e-08, -8.138954399328213e-08, -7.430638504501985e-08, -6.722323320218493e-08, -6.014008135935e-08, -5.3056925963801405e-08, -4.59737705682528e-08, -3.889061872541788e-08, -3.180746688258296e-08, -2.4724311487034356e-08, -1.7641157867842594e-08, -1.0558004248650832e-08, -3.474852405815909e-09, 3.6083029897326924e-09, 1.0691458385281294e-08, 1.77745960172615e-08, 2.4857749636453264e-08, 3.1940903255645026e-08, 3.902405865119363e-08, 4.610721049402855e-08, 5.319036233686347e-08, 6.027352128512575e-08, 6.735667312796068e-08, 7.44398249707956e-08, 8.152297681363052e-08, 8.860612865646544e-08, 9.568928760472772e-08, 1.0277243944756265e-07, 1.0985559129039757e-07, 1.1693875023865985e-07, 1.2402190918692213e-07, 1.311050539243297e-07, 1.3818821287259198e-07, 1.4527135760999954e-07, 1.5235451655826182e-07, 1.5943766129566939e-07, 1.6652082024393167e-07, 1.7360397919219395e-07, 1.806871239296015e-07, 1.877702828778638e-07, 1.9485344182612607e-07, 2.0193658656353364e-07, 2.0901974551179592e-07, 2.161029044600582e-07, 2.2318604919746576e-07, 2.3026920814572804e-07, 2.3735236709399032e-07, 2.444355118313979e-07]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 3.0, 4.0, 4.0, 8.0, 6.0, 8.0, 12.0, 16.0, 14.0, 17.0, 26.0, 23.0, 33.0, 37.0, 36.0, 40.0, 61.0, 57.0, 56.0, 56.0, 56.0, 54.0, 47.0, 46.0, 46.0, 35.0, 27.0, 28.0, 30.0, 18.0, 18.0, 18.0, 19.0, 13.0, 8.0, 4.0, 7.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6387070900236722e-07, -1.591510709886279e-07, -1.544314329748886e-07, -1.4971179496114928e-07, -1.4499215694740997e-07, -1.4027250472281594e-07, -1.3555286670907662e-07, -1.308332286953373e-07, -1.26113590681598e-07, -1.2139395266785868e-07, -1.1667431465411937e-07, -1.119546695349527e-07, -1.0723503152121339e-07, -1.0251539350747407e-07, -9.77957483883074e-08, -9.307611037456809e-08, -8.835647236082877e-08, -8.363683434708946e-08, -7.891719633335015e-08, -7.419755121418348e-08, -6.947791320044416e-08, -6.475827518670485e-08, -6.003863006753818e-08, -5.5318992053798866e-08, -5.059935404005955e-08, -4.587971602632024e-08, -4.1160074459867246e-08, -3.6440432893414254e-08, -3.172079487967494e-08, -2.7001155089578788e-08, -2.2281515299482635e-08, -1.7561873733029643e-08, -1.2842235719290329e-08, -8.122595929194176e-09, -3.4029561390980234e-09, 1.3166836509981295e-09, 6.036323441094282e-09, 1.0755963231190435e-08, 1.5475603021286588e-08, 2.019524458773958e-08, 2.4914882601478894e-08, 2.9634522391575047e-08, 3.43541621816712e-08, 3.907380374812419e-08, 4.3793441761863505e-08, 4.851307977560282e-08, 5.323272134205581e-08, 5.79523629085088e-08, 6.267200092224812e-08, 6.739163893598743e-08, 7.211127694972674e-08, 7.683092206889341e-08, 8.155056008263273e-08, 8.627019809637204e-08, 9.098984321553871e-08, 9.570948122927803e-08, 1.0042911924301734e-07, 1.0514875725675665e-07, 1.0986839527049597e-07, 1.1458804038966264e-07, 1.193076855088293e-07, 1.2402732352256862e-07, 1.2874696153630794e-07, 1.3346659955004725e-07, 1.3818623756378656e-07]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3974.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1040613.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3892.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 832.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 9.0, 10.0, 18.0, 23.0, 32.0, 51.0, 82.0, 125.0, 225.0, 146.0, 91.0, 47.0, 32.0, 20.0, 13.0, 11.0, 11.0, 7.0, 7.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.868954058181771e-07, -1.7987474620895227e-07, -1.7285408659972745e-07, -1.6583342699050263e-07, -1.588127673812778e-07, -1.5179210777205299e-07, -1.4477146237368288e-07, -1.3775078855360334e-07, -1.3073014315523324e-07, -1.2370948354600841e-07, -1.1668882393678359e-07, -1.0966816432755877e-07, -1.0264750471833395e-07, -9.562684510910913e-08, -8.860619260531166e-08, -8.158553299608684e-08, -7.456486628143466e-08, -6.754420667220984e-08, -6.052354706298502e-08, -5.3502891006473874e-08, -4.648223139724905e-08, -3.946157178802423e-08, -3.244091573151309e-08, -2.5420256122288265e-08, -1.8399596513063443e-08, -1.1378937792017041e-08, -4.358279070970639e-09, 2.6623787618973438e-09, 9.683038371122166e-09, 1.6703697980346988e-08, 2.372435403685813e-08, 3.074501364608295e-08, 3.776565904445306e-08, 4.478631865367788e-08, 5.18069782629027e-08, 5.8827634319413846e-08, 6.584829748135235e-08, 7.286895709057717e-08, 7.988960959437463e-08, 8.691026920359946e-08, 9.393092881282428e-08, 1.009515884220491e-07, 1.0797224803127392e-07, 1.1499290053507139e-07, 1.220135601442962e-07, 1.2903421975352103e-07, 1.3605487936274585e-07, 1.4307553897197067e-07, 1.500961985811955e-07, 1.5711685819042032e-07, 1.6413751779964514e-07, 1.7115817740886996e-07, 1.7817883701809478e-07, 1.851994966273196e-07, 1.922201420256897e-07, 1.9924081584576925e-07, 2.0626146124413935e-07, 2.1328212085336418e-07, 2.20302780462589e-07, 2.2732344007181382e-07, 2.3434409968103864e-07, 2.4136474507940875e-07, 2.483854188994883e-07, 2.554060642978584e-07, 2.6242673811793793e-07]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 1.0, 4.0, 3.0, 7.0, 6.0, 5.0, 9.0, 12.0, 19.0, 15.0, 24.0, 25.0, 29.0, 38.0, 30.0, 41.0, 55.0, 69.0, 54.0, 55.0, 57.0, 60.0, 46.0, 49.0, 50.0, 36.0, 35.0, 22.0, 25.0, 23.0, 21.0, 22.0, 14.0, 11.0, 10.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.4673135240172996e-07, -1.4253325275603856e-07, -1.3833515311034716e-07, -1.3413703925380105e-07, -1.2993893960810965e-07, -1.2574083996241825e-07, -1.2154274031672685e-07, -1.1734463356560809e-07, -1.1314652681448933e-07, -1.0894842716879793e-07, -1.0475032041767918e-07, -1.0055222077198778e-07, -9.635411402086902e-08, -9.215601437517762e-08, -8.795791472948622e-08, -8.375980797836746e-08, -7.956170833267606e-08, -7.536360868698466e-08, -7.11655019358659e-08, -6.69674022901745e-08, -6.276929553905575e-08, -5.857119589336435e-08, -5.437309269495927e-08, -5.017498949655419e-08, -4.597688629814911e-08, -4.177878309974403e-08, -3.7580679901338954e-08, -3.3382576702933875e-08, -2.9184475280885636e-08, -2.4986372082480557e-08, -2.0788270660432318e-08, -1.659016746202724e-08, -1.239206426362216e-08, -8.193961065217081e-09, -3.995858754990422e-09, 2.0224355523623672e-10, 4.4003467536413154e-09, 8.598449952046394e-09, 1.2796551374094634e-08, 1.6994654572499712e-08, 2.119275777090479e-08, 2.539086096930987e-08, 2.958896416771495e-08, 3.378706736612003e-08, 3.798516701181143e-08, 4.2183273762930185e-08, 4.6381373408621585e-08, 5.057947660702666e-08, 5.477757980543174e-08, 5.897568300383682e-08, 6.31737862022419e-08, 6.73718858479333e-08, 7.156999259905206e-08, 7.576809224474346e-08, 7.996619899586221e-08, 8.416429864155361e-08, 8.836239828724501e-08, 9.256049793293641e-08, 9.675860468405517e-08, 1.0095670432974657e-07, 1.0515481108086533e-07, 1.0935291072655673e-07, 1.1355101037224813e-07, 1.1774911712336689e-07, 1.2194722387448564e-07]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [7.0, 0.0, 0.0, 0.0, 29.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.0, 0.0, 0.0, 0.0, 0.0, 697.0, 0.0, 0.0, 0.0, 4275.0, 0.0, 0.0, 0.0, 0.0, 17418.0, 0.0, 0.0, 0.0, 0.0, 1003506.0, 0.0, 0.0, 0.0, 17440.0, 0.0, 0.0, 0.0, 0.0, 4303.0, 0.0, 0.0, 0.0, 695.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 13.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [36.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 951.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 7.0, 6.0, 12.0, 13.0, 35.0, 52.0, 89.0, 135.0, 261.0, 195.0, 86.0, 31.0, 19.0, 19.0, 15.0, 9.0, 7.0, 4.0, 0.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.717465505014843e-08, -8.16058332020475e-08, -7.603701845937394e-08, -7.046819661127302e-08, -6.489938186859945e-08, -5.9330560020498524e-08, -5.37617381723976e-08, -4.8192919877010354e-08, -4.262410158162311e-08, -3.705528328623586e-08, -3.148646499084862e-08, -2.5917643142747693e-08, -2.0348824847360447e-08, -1.4780006551973202e-08, -9.211184703872277e-09, -3.6423664084850316e-09, 1.926451886902214e-09, 7.49527107046788e-09, 1.3064090254033545e-08, 1.863291032577763e-08, 2.4201728621164875e-08, 2.977054691655212e-08, 3.5339368764653045e-08, 4.090818706004029e-08, 4.6477005355427536e-08, 5.204582365081478e-08, 5.761464194620203e-08, 6.318346379430295e-08, 6.875228564240388e-08, 7.432110038507744e-08, 7.988992223317837e-08, 8.545873697585193e-08, 9.102754461309814e-08, 9.659636646119907e-08, 1.0216518120387263e-07, 1.0773400305197356e-07, 1.1330281779464713e-07, 1.1887163964274805e-07, 1.2444046149084897e-07, 1.300092833389499e-07, 1.355780909761961e-07, 1.4114691282429703e-07, 1.4671573467239796e-07, 1.5228454230964417e-07, 1.578533641577451e-07, 1.6342218600584602e-07, 1.6899100785394694e-07, 1.7455982970204786e-07, 1.801286515501488e-07, 1.856974733982497e-07, 1.9126629524635064e-07, 1.9683511709445156e-07, 2.0240392473169777e-07, 2.079727465797987e-07, 2.1354156842789962e-07, 2.1911039027600054e-07, 2.2467921212410147e-07, 2.302480339722024e-07, 2.3581685582030332e-07, 2.413856634575495e-07, 2.4695449951650517e-07, 2.525233071537514e-07, 2.58092143212707e-07, 2.636609508499532e-07, 2.6922975848719943e-07]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 6.0, 7.0, 9.0, 11.0, 13.0, 15.0, 23.0, 26.0, 26.0, 38.0, 40.0, 37.0, 56.0, 69.0, 53.0, 61.0, 54.0, 66.0, 44.0, 52.0, 48.0, 36.0, 36.0, 22.0, 22.0, 26.0, 24.0, 19.0, 11.0, 12.0, 9.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.595493028451529e-08, -8.356214209470636e-08, -8.116936101032479e-08, -7.877657282051587e-08, -7.638378463070694e-08, -7.399099644089802e-08, -7.159820825108909e-08, -6.920542716670752e-08, -6.68126389768986e-08, -6.441985078708967e-08, -6.20270697027081e-08, -5.963428151289918e-08, -5.7241493323090253e-08, -5.484870513328133e-08, -5.245592049618608e-08, -5.0063135859090835e-08, -4.767034766928191e-08, -4.5277559479472984e-08, -4.288477484237774e-08, -4.049199020528249e-08, -3.8099202015473566e-08, -3.570641382566464e-08, -3.3313629188569394e-08, -3.092084455147415e-08, -2.852805636166522e-08, -2.6135269948213136e-08, -2.374248353476105e-08, -2.1349697121308964e-08, -1.8956910707856878e-08, -1.6564124294404792e-08, -1.4171337880952706e-08, -1.177855146750062e-08, -9.385765054048534e-09, -6.992978640596448e-09, -4.600192227144362e-09, -2.207405813692276e-09, 1.8538059975981014e-10, 2.578167013211896e-09, 4.970953426663982e-09, 7.363739840116068e-09, 9.756526253568154e-09, 1.214931266702024e-08, 1.4542099080472326e-08, 1.6934885493924412e-08, 1.9327671907376498e-08, 2.1720458320828584e-08, 2.411324473428067e-08, 2.6506031147732756e-08, 2.8898817561184842e-08, 3.129160575099377e-08, 3.3684390388089014e-08, 3.607717502518426e-08, 3.8469963214993186e-08, 4.086275140480211e-08, 4.325553604189736e-08, 4.5648320678992604e-08, 4.804110886880153e-08, 5.0433897058610455e-08, 5.28266816957057e-08, 5.521946633280095e-08, 5.7612254522609874e-08, 6.00050427124188e-08, 6.239783090222772e-08, 6.479061198660929e-08, 6.718340017641822e-08]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 51.0, 0.0, 0.0, 0.0, 104.0, 0.0, 0.0, 0.0, 4193788.0, 0.0, 0.0, 180.0, 0.0, 0.0, 0.0, 85.0, 0.0, 0.0, 45.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-5.364418029785156e-07, -5.19677996635437e-07, -5.029141902923584e-07, -4.861503839492798e-07, -4.6938657760620117e-07, -4.5262277126312256e-07, -4.3585896492004395e-07, -4.1909515857696533e-07, -4.023313522338867e-07, -3.855675458908081e-07, -3.688037395477295e-07, -3.520399332046509e-07, -3.3527612686157227e-07, -3.1851232051849365e-07, -3.0174851417541504e-07, -2.849847078323364e-07, -2.682209014892578e-07, -2.514570951461792e-07, -2.3469328880310059e-07, -2.1792948246002197e-07, -2.0116567611694336e-07, -1.8440186977386475e-07, -1.6763806343078613e-07, -1.5087425708770752e-07, -1.341104507446289e-07, -1.1734664440155029e-07, -1.0058283805847168e-07, -8.381903171539307e-08, -6.705522537231445e-08, -5.029141902923584e-08, -3.3527612686157227e-08, -1.6763806343078613e-08, 0.0, 1.6763806343078613e-08, 3.3527612686157227e-08, 5.029141902923584e-08, 6.705522537231445e-08, 8.381903171539307e-08, 1.0058283805847168e-07, 1.1734664440155029e-07, 1.341104507446289e-07, 1.5087425708770752e-07, 1.6763806343078613e-07, 1.8440186977386475e-07, 2.0116567611694336e-07, 2.1792948246002197e-07, 2.3469328880310059e-07, 2.514570951461792e-07, 2.682209014892578e-07, 2.849847078323364e-07, 3.0174851417541504e-07, 3.1851232051849365e-07, 3.3527612686157227e-07, 3.520399332046509e-07, 3.688037395477295e-07, 3.855675458908081e-07, 4.023313522338867e-07, 4.1909515857696533e-07, 4.3585896492004395e-07, 4.5262277126312256e-07, 4.6938657760620117e-07, 4.861503839492798e-07, 5.029141902923584e-07, 5.19677996635437e-07, 5.364418029785156e-07]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1016.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4096.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 8.0, 2.0, 17.0, 40.0, 47.0, 136.0, 242.0, 225.0, 133.0, 47.0, 43.0, 16.0, 15.0, 8.0, 5.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.313705659342304e-08, -3.9811492769104007e-08, -3.648592894478497e-08, -3.316036156775226e-08, -2.9834801296146907e-08, -2.6509235695471034e-08, -2.318367009479516e-08, -1.9858106270476128e-08, -1.6532542446157095e-08, -1.3206978621838061e-08, -9.881413909340608e-09, -6.555849196843155e-09, -3.230285372524122e-09, 9.527845179491123e-11, 3.420844052470784e-09, 6.746407876789817e-09, 1.007197170110885e-08, 1.3397535525427884e-08, 1.6723099349746917e-08, 2.004866495042279e-08, 2.3374228774741823e-08, 2.6699792599060856e-08, 3.002535819973673e-08, 3.335092202405576e-08, 3.6676485848374796e-08, 4.000204967269383e-08, 4.332761349701286e-08, 4.6653177321331896e-08, 4.997874469836461e-08, 5.330430496996996e-08, 5.6629872347002674e-08, 5.995543972403539e-08, 6.328099289021338e-08, 6.66065602672461e-08, 6.993212053885145e-08, 7.325768791588416e-08, 7.658324818748952e-08, 7.990881556452223e-08, 8.323438294155494e-08, 8.65599432131603e-08, 8.988550348476565e-08, 9.321107086179836e-08, 9.653663113340372e-08, 9.986219851043643e-08, 1.0318775878204178e-07, 1.065133261590745e-07, 1.0983889353610721e-07, 1.1316445380771256e-07, 1.1649002118474527e-07, 1.1981558145635063e-07, 1.2314114883338334e-07, 1.2646671621041605e-07, 1.2979228358744876e-07, 1.3311783675362676e-07, 1.3644340413065947e-07, 1.3976897150769219e-07, 1.430945388847249e-07, 1.464201062617576e-07, 1.4974567363879032e-07, 1.5307122680496832e-07, 1.5639679418200103e-07, 1.5972236155903374e-07, 1.6304792893606646e-07, 1.6637349631309917e-07, 1.6969904947927716e-07]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 2.0, 10.0, 5.0, 8.0, 6.0, 13.0, 16.0, 19.0, 25.0, 20.0, 40.0, 30.0, 41.0, 45.0, 56.0, 70.0, 46.0, 62.0, 54.0, 62.0, 37.0, 65.0, 35.0, 41.0, 31.0, 30.0, 23.0, 25.0, 16.0, 20.0, 11.0, 12.0, 7.0, 5.0, 1.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.8219097098799466e-08, -5.663417113055402e-08, -5.504924871502226e-08, -5.3464322746776816e-08, -5.187939677853137e-08, -5.029447436299961e-08, -4.8709548394754165e-08, -4.712462242650872e-08, -4.553970001097696e-08, -4.3954774042731515e-08, -4.236985162719975e-08, -4.078492565895431e-08, -3.920000324342254e-08, -3.76150772751771e-08, -3.603015130693166e-08, -3.444522889139989e-08, -3.286030292315445e-08, -3.1275376954909007e-08, -2.9690454539377242e-08, -2.81055285711318e-08, -2.6520604379243196e-08, -2.4935680187354592e-08, -2.335075421910915e-08, -2.1765830027220545e-08, -2.018090583533194e-08, -1.8595981643443338e-08, -1.7011057451554734e-08, -1.542613148330929e-08, -1.3841207291420687e-08, -1.2256283099532084e-08, -1.067135801946506e-08, -9.086432939398037e-09, -7.501505194795755e-09, -5.916580558817941e-09, -4.3316559228401275e-09, -2.746731286862314e-09, -1.1618066508845004e-09, 4.2311754100410326e-10, 2.0080426210711266e-09, 3.59296770113815e-09, 5.177891893026754e-09, 6.762816529004567e-09, 8.34774116498238e-09, 9.932666245049404e-09, 1.1517590436938008e-08, 1.3102514628826611e-08, 1.4687439708893635e-08, 1.6272364788960658e-08, 1.7857288980849262e-08, 1.9442213172737866e-08, 2.102713736462647e-08, 2.2612063332871912e-08, 2.4196987524760516e-08, 2.578191171664912e-08, 2.7366837684894563e-08, 2.8951761876783166e-08, 3.053668606867177e-08, 3.212161203691721e-08, 3.370653445244898e-08, 3.529146042069442e-08, 3.6876386388939864e-08, 3.846130880447163e-08, 4.004623477271707e-08, 4.1631160740962514e-08, 4.321608315649428e-08]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048563.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1023.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 9.313225746154785e-10, 1.862645149230957e-09, 2.7939677238464355e-09, 3.725290298461914e-09, 4.6566128730773926e-09, 5.587935447692871e-09, 6.51925802230835e-09, 7.450580596923828e-09, 8.381903171539307e-09, 9.313225746154785e-09, 1.0244548320770264e-08, 1.1175870895385742e-08, 1.210719347000122e-08, 1.30385160446167e-08, 1.3969838619232178e-08, 1.4901161193847656e-08, 1.5832483768463135e-08, 1.6763806343078613e-08, 1.7695128917694092e-08, 1.862645149230957e-08, 1.955777406692505e-08, 2.0489096641540527e-08, 2.1420419216156006e-08, 2.2351741790771484e-08, 2.3283064365386963e-08, 2.421438694000244e-08, 2.514570951461792e-08, 2.60770320892334e-08, 2.7008354663848877e-08, 2.7939677238464355e-08, 2.8870999813079834e-08, 2.9802322387695312e-08, 3.073364496231079e-08, 3.166496753692627e-08, 3.259629011154175e-08, 3.3527612686157227e-08, 3.4458935260772705e-08, 3.5390257835388184e-08, 3.632158041000366e-08, 3.725290298461914e-08, 3.818422555923462e-08, 3.91155481338501e-08, 4.0046870708465576e-08, 4.0978193283081055e-08, 4.190951585769653e-08, 4.284083843231201e-08, 4.377216100692749e-08, 4.470348358154297e-08, 4.563480615615845e-08, 4.6566128730773926e-08, 4.7497451305389404e-08, 4.842877388000488e-08, 4.936009645462036e-08, 5.029141902923584e-08, 5.122274160385132e-08, 5.21540641784668e-08, 5.3085386753082275e-08, 5.4016709327697754e-08, 5.494803190231323e-08, 5.587935447692871e-08, 5.681067705154419e-08, 5.774199962615967e-08, 5.8673322200775146e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 6.0, 11.0, 14.0, 34.0, 44.0, 69.0, 116.0, 189.0, 195.0, 131.0, 53.0, 42.0, 26.0, 19.0, 12.0, 5.0, 9.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.494883729781577e-08, -8.265588036238114e-08, -8.036292342694651e-08, -7.806996649151188e-08, -7.577700955607725e-08, -7.348405972606997e-08, -7.119110279063534e-08, -6.889814585520071e-08, -6.660518891976608e-08, -6.431223198433145e-08, -6.201927504889682e-08, -5.972631811346218e-08, -5.743336473074123e-08, -5.51404077953066e-08, -5.284745441258565e-08, -5.055449747715102e-08, -4.8261540541716386e-08, -4.5968583606281754e-08, -4.367562667084712e-08, -4.138267328812617e-08, -3.908971635269154e-08, -3.679675941725691e-08, -3.4503806034535955e-08, -3.2210849099101324e-08, -2.991789216366669e-08, -2.762493522823206e-08, -2.533198006915427e-08, -2.3039024910076478e-08, -2.0746067974641846e-08, -1.8453111039207215e-08, -1.6160155880129423e-08, -1.3867200721051631e-08, -1.1574236680189642e-08, -9.28128063293343e-09, -6.988324585677219e-09, -4.6953685384210075e-09, -2.402412491164796e-09, -1.0945644390858433e-10, 2.1834996033476273e-09, 4.476454762425419e-09, 6.7694116978600505e-09, 9.062367745116262e-09, 1.1355323792372474e-08, 1.3648279839628685e-08, 1.5941235886884897e-08, 1.8234192822319528e-08, 2.052714798139732e-08, 2.2820103140475112e-08, 2.5113060075909743e-08, 2.7406017011344375e-08, 2.9698972170422167e-08, 3.199192732949996e-08, 3.428488426493459e-08, 3.657784120036922e-08, 3.8870794583090174e-08, 4.1163751518524805e-08, 4.3456708453959436e-08, 4.574966538939407e-08, 4.80426223248287e-08, 5.033557570754965e-08, 5.262853264298428e-08, 5.4921489578418914e-08, 5.7214442961139866e-08, 5.95073998965745e-08, 6.180035683200913e-08]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 5.0, 7.0, 9.0, 11.0, 5.0, 19.0, 10.0, 16.0, 26.0, 21.0, 38.0, 37.0, 41.0, 47.0, 56.0, 62.0, 53.0, 57.0, 60.0, 53.0, 53.0, 56.0, 34.0, 32.0, 33.0, 26.0, 24.0, 25.0, 23.0, 15.0, 12.0, 15.0, 4.0, 3.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.243281281901545e-08, -4.1272834039318695e-08, -4.011285525962194e-08, -3.895287647992518e-08, -3.779289770022842e-08, -3.6632918920531665e-08, -3.5472943693548586e-08, -3.431296491385183e-08, -3.315298613415507e-08, -3.1993007354458314e-08, -3.0833028574761556e-08, -2.96730497950648e-08, -2.851307279172488e-08, -2.7353094012028123e-08, -2.6193115232331365e-08, -2.5033138228991447e-08, -2.387315767293785e-08, -2.2713178893241093e-08, -2.1553200113544335e-08, -2.0393223110204417e-08, -1.923324433050766e-08, -1.8073265550810902e-08, -1.6913286771114144e-08, -1.5753307991417387e-08, -1.4593330099899049e-08, -1.3433351320202291e-08, -1.2273373428683954e-08, -1.1113394648987196e-08, -9.953415869290438e-09, -8.7934379777721e-09, -7.633459198075343e-09, -6.473481306557005e-09, -5.313502526860248e-09, -4.1535241912527e-09, -2.9935456336005473e-09, -1.8335670759483946e-09, -6.735887403408469e-10, 4.863895952667008e-10, 1.6463683749634583e-09, 2.806346266481796e-09, 3.966325046178554e-09, 5.1263033817861015e-09, 6.286281717393649e-09, 7.446260497090407e-09, 8.606239276787164e-09, 9.766217168305502e-09, 1.092619594800226e-08, 1.2086173839520598e-08, 1.3246152619217355e-08, 1.4406131398914113e-08, 1.556611017861087e-08, 1.672608718195079e-08, 1.7886065961647546e-08, 1.9046044741344303e-08, 2.020602352104106e-08, 2.136600230073782e-08, 2.2525981080434576e-08, 2.3685959860131334e-08, 2.484593863982809e-08, 2.600591741952485e-08, 2.7165894422864767e-08, 2.8325873202561525e-08, 2.9485851982258282e-08, 3.06458289855982e-08, 3.180580776529496e-08]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 6.0, 7.0, 19.0, 53.0, 148.0, 511.0, 172.0, 54.0, 28.0, 11.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.185570480151e-07, -2.145515054507996e-07, -2.1054594867564447e-07, -2.0654039190048934e-07, -2.0253484933618893e-07, -1.9852930677188851e-07, -1.9452374999673339e-07, -1.9051819322157826e-07, -1.8651265065727785e-07, -1.8250710809297743e-07, -1.785015513178223e-07, -1.7449599454266718e-07, -1.7049045197836676e-07, -1.6648490941406635e-07, -1.6247935263891122e-07, -1.584737958637561e-07, -1.5446825329945568e-07, -1.5046271073515527e-07, -1.4645715396000014e-07, -1.4245159718484501e-07, -1.384460546205446e-07, -1.344405120562442e-07, -1.3043495528108906e-07, -1.2642939850593393e-07, -1.2242385594163352e-07, -1.1841830627190575e-07, -1.1441275660217798e-07, -1.1040720693245021e-07, -1.0640165726272244e-07, -1.0239610759299467e-07, -9.83905579232669e-08, -9.438500825353913e-08, -9.037944437295664e-08, -8.637389470322887e-08, -8.23683450335011e-08, -7.836279536377333e-08, -7.435724569404556e-08, -7.035169602431779e-08, -6.634614635459002e-08, -6.234059668486225e-08, -5.833505056784816e-08, -5.4329500898120386e-08, -5.0323951228392616e-08, -4.6318401558664846e-08, -4.2312851888937075e-08, -3.8307302219209305e-08, -3.4301752549481535e-08, -3.0296202879753764e-08, -2.6290653210025994e-08, -2.2285103540298223e-08, -1.8279553870570453e-08, -1.4274004200842683e-08, -1.0268454531114912e-08, -6.262904861387142e-09, -2.2573551916593715e-09, 1.7481944780683989e-09, 5.753744147796169e-09, 9.75929381752394e-09, 1.376484348725171e-08, 1.777039315697948e-08, 2.177594282670725e-08, 2.578149249643502e-08, 2.978704216616279e-08, 3.379259183589056e-08, 3.779814150561833e-08]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 5.0, 5.0, 8.0, 8.0, 10.0, 8.0, 18.0, 13.0, 22.0, 22.0, 31.0, 36.0, 41.0, 47.0, 53.0, 60.0, 53.0, 55.0, 65.0, 54.0, 52.0, 51.0, 46.0, 38.0, 31.0, 30.0, 22.0, 28.0, 26.0, 11.0, 17.0, 14.0, 4.0, 5.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-3.1608589523557384e-08, -3.075257026807776e-08, -2.989655101259814e-08, -2.9040533533475354e-08, -2.818451605435257e-08, -2.7328496798872948e-08, -2.6472479319750164e-08, -2.561646006427054e-08, -2.4760442585147757e-08, -2.3904423329668134e-08, -2.304840585054535e-08, -2.2192386595065727e-08, -2.1336369115942944e-08, -2.048034986046332e-08, -1.9624332381340537e-08, -1.8768313125860914e-08, -1.791229564673813e-08, -1.7056276391258507e-08, -1.6200258912135723e-08, -1.53442396566561e-08, -1.4488222177533316e-08, -1.3632202922053693e-08, -1.277618544293091e-08, -1.1920166187451287e-08, -1.1064146931971663e-08, -1.020812856467046e-08, -9.352110197369257e-09, -8.496091830068053e-09, -7.64007346276685e-09, -6.784054651376437e-09, -5.928036284075233e-09, -5.07201791677403e-09, -4.215999993562036e-09, -3.359981626260833e-09, -2.5039632589596295e-09, -1.6479446696138211e-09, -7.919263023126177e-10, 6.409228703319059e-11, 9.20110654334394e-10, 1.7761290216355974e-09, 2.6321473889368008e-09, 3.488165756238004e-09, 4.3441841235392076e-09, 5.200202934929621e-09, 6.056221302230824e-09, 6.912239669532028e-09, 7.768258036833231e-09, 8.624276404134434e-09, 9.480294771435638e-09, 1.0336313138736841e-08, 1.1192331506038045e-08, 1.2048349873339248e-08, 1.2904368240640451e-08, 1.3760386607941655e-08, 1.4616405863421278e-08, 1.547242334254406e-08, 1.6328442598023685e-08, 1.7184461853503308e-08, 1.804047933262609e-08, 1.8896498588105715e-08, 1.9752516067228498e-08, 2.060853532270812e-08, 2.1464552801830905e-08, 2.2320572057310528e-08, 2.3176589536433312e-08]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4096.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 6.0, 11.0, 49.0, 358.0, 491.0, 79.0, 22.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.558432298296111e-09, -3.665031611532754e-09, -2.771630924769397e-09, -1.878230460050645e-09, -9.84829773287288e-10, -9.142908652393089e-11, 8.019713781948212e-10, 1.6953722870027832e-09, 2.5887727517215353e-09, 3.4821734384848924e-09, 4.375574125248249e-09, 5.2689745899670015e-09, 6.1623754987749635e-09, 7.055775963493716e-09, 7.949176428212468e-09, 8.84257733702043e-09, 9.735977357649972e-09, 1.0629378266457934e-08, 1.1522778287087476e-08, 1.2416179195895438e-08, 1.33095801047034e-08, 1.4202980125332942e-08, 1.5096381034140904e-08, 1.5989781942948866e-08, 1.6883182851756828e-08, 1.777658376056479e-08, 1.8669984669372752e-08, 1.9563383801823875e-08, 2.0456784710631837e-08, 2.13501856194398e-08, 2.224358652824776e-08, 2.3136987437055723e-08, 2.4030386569506845e-08, 2.4923787478314807e-08, 2.581718838712277e-08, 2.6710587519573892e-08, 2.7603988428381854e-08, 2.8497389337189816e-08, 2.9390790245997778e-08, 3.028419115480574e-08, 3.11775920636137e-08, 3.2070992972421664e-08, 3.2964393881229626e-08, 3.385779479003759e-08, 3.475119569884555e-08, 3.564459660765351e-08, 3.6537997516461473e-08, 3.7431398425269435e-08, 3.832479578136372e-08, 3.921819669017168e-08, 4.011159759897964e-08, 4.1004998507787604e-08, 4.1898399416595566e-08, 4.279180032540353e-08, 4.368519768149781e-08, 4.4578598590305774e-08, 4.5472003051827414e-08, 4.6365403960635376e-08, 4.725880486944334e-08, 4.81522057782513e-08, 4.904560668705926e-08, 4.9939007595867224e-08, 5.083240495196151e-08, 5.172580586076947e-08, 5.261920676957743e-08]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 10.0, 5.0, 7.0, 19.0, 18.0, 18.0, 19.0, 25.0, 24.0, 31.0, 32.0, 47.0, 50.0, 50.0, 58.0, 53.0, 40.0, 54.0, 63.0, 41.0, 42.0, 43.0, 49.0, 34.0, 27.0, 19.0, 22.0, 21.0, 15.0, 20.0, 8.0, 6.0, 6.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-8.091109116037387e-09, -7.87557041803666e-09, -7.660032608214351e-09, -7.444493910213623e-09, -7.228955656302105e-09, -7.013417402390587e-09, -6.797879148479069e-09, -6.582340894567551e-09, -6.366802196566823e-09, -6.151263942655305e-09, -5.935725688743787e-09, -5.720186990743059e-09, -5.504648736831541e-09, -5.289110482920023e-09, -5.073572229008505e-09, -4.858033975096987e-09, -4.642495721185469e-09, -4.426957467273951e-09, -4.211419213362433e-09, -3.995880959450915e-09, -3.780342261450187e-09, -3.564804007538669e-09, -3.349265753627151e-09, -3.133727499715633e-09, -2.91818902375951e-09, -2.702650769847992e-09, -2.487112293891869e-09, -2.2715740399803508e-09, -2.0560357860688327e-09, -1.8404973101127098e-09, -1.6249590562011917e-09, -1.4094206912673712e-09, -1.1938827704227606e-09, -9.7834440548894e-10, -7.628060960662708e-10, -5.472677866436015e-10, -3.3172942170978104e-10, -1.1619105677596053e-10, 9.934719713555751e-11, 3.14885562069378e-10, 5.304239270031985e-10, 7.45962291937019e-10, 9.615006568708395e-10, 1.1770389107823576e-09, 1.392577275716178e-09, 1.6081156406499986e-09, 1.8236538945615166e-09, 2.0391923705176396e-09, 2.2547306244291576e-09, 2.4702688783406757e-09, 2.6858073542967986e-09, 2.9013456082083167e-09, 3.1168840841644396e-09, 3.3324223380759577e-09, 3.5479605919874757e-09, 3.763498845898994e-09, 3.979037543899722e-09, 4.19457579781124e-09, 4.410114051722758e-09, 4.625652749723486e-09, 4.841191003635004e-09, 5.056729257546522e-09, 5.27226751145804e-09, 5.487805765369558e-09, 5.703344019281076e-09]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 10.0, 10.0, 16.0, 14.0, 33.0, 42.0, 52.0, 81.0, 89.0, 118.0, 126.0, 112.0, 69.0, 60.0, 33.0, 18.0, 27.0, 11.0, 6.0, 15.0, 8.0, 7.0, 8.0, 6.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.085501714712336e-09, -3.9620902114734236e-09, -3.838678708234511e-09, -3.715267204995598e-09, -3.5918557017566854e-09, -3.4684441985177727e-09, -3.345032917323465e-09, -3.2216214140845523e-09, -3.0982099108456396e-09, -2.974798407606727e-09, -2.851386904367814e-09, -2.7279754011289015e-09, -2.6045641199345937e-09, -2.481152616695681e-09, -2.3577411134567683e-09, -2.2343296102178556e-09, -2.110918106978943e-09, -1.98750660374003e-09, -1.8640951005011175e-09, -1.7406837082845072e-09, -1.6172722050455945e-09, -1.4938607018066818e-09, -1.3704493095900716e-09, -1.247037806351159e-09, -1.1236263031122462e-09, -1.0002147998733335e-09, -8.76803352145572e-10, -7.533919044178106e-10, -6.299804011788979e-10, -5.065688979399852e-10, -3.831574502122237e-10, -2.597460024844622e-10, -1.3633405515633967e-10, -1.2922579673002588e-11, 1.104888958103345e-10, 2.339003712936716e-10, 3.5731184677700867e-10, 4.807233500159214e-10, 6.041347977436828e-10, 7.275462454714443e-10, 8.50957748710357e-10, 9.743692519492697e-10, 1.0977807551881824e-09, 1.2211921474047926e-09, 1.3446036506437054e-09, 1.468015153882618e-09, 1.5914265460992283e-09, 1.714838049338141e-09, 1.8382495525770537e-09, 1.9616610558159664e-09, 2.085072559054879e-09, 2.208484062293792e-09, 2.3318955655327045e-09, 2.455307068771617e-09, 2.578718349965925e-09, 2.7021298532048377e-09, 2.8255413564437504e-09, 2.948952859682663e-09, 3.0723643629215758e-09, 3.1957758661604885e-09, 3.3191871473547963e-09, 3.442598650593709e-09, 3.5660101538326217e-09, 3.6894216570715344e-09, 3.812833160310447e-09]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 3.0, 7.0, 4.0, 6.0, 5.0, 10.0, 13.0, 16.0, 18.0, 16.0, 23.0, 27.0, 26.0, 37.0, 38.0, 49.0, 51.0, 48.0, 48.0, 43.0, 58.0, 51.0, 48.0, 51.0, 31.0, 50.0, 39.0, 38.0, 21.0, 20.0, 20.0, 17.0, 21.0, 12.0, 8.0, 6.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0], "bins": [-4.0576479953813305e-09, -3.948050775193224e-09, -3.838453999094327e-09, -3.72885677890622e-09, -3.619259780762718e-09, -3.509662782619216e-09, -3.4000655624311094e-09, -3.2904685642876075e-09, -3.1808715661441056e-09, -3.0712745680006037e-09, -2.961677347812497e-09, -2.852080349668995e-09, -2.742483351525493e-09, -2.6328863533819913e-09, -2.5232891331938845e-09, -2.4136921350503826e-09, -2.304094914862276e-09, -2.194497916718774e-09, -2.084900696530667e-09, -1.9753036983871652e-09, -1.8657067002436634e-09, -1.756109591077859e-09, -1.6465124819120547e-09, -1.5369154837685528e-09, -1.4273183746027485e-09, -1.3177212654369441e-09, -1.2081242672934422e-09, -1.098527158127638e-09, -9.889300489618336e-10, -8.793330508183317e-10, -7.697359416525273e-10, -6.601388879978742e-10, -5.505418343432211e-10, -4.40944780688568e-10, -3.313476992783393e-10, -2.2175061786811057e-10, -1.1215356421345746e-10, -2.556510558804348e-12, 1.0704059860699999e-10, 2.166376522616531e-10, 3.262347059163062e-10, 4.358317595709593e-10, 5.454288132256124e-10, 6.550259223914168e-10, 7.646229760460699e-10, 8.74220029700723e-10, 9.838171388665273e-10, 1.0934142480323317e-09, 1.2030112461758335e-09, 1.3126083553416379e-09, 1.4222053534851398e-09, 1.5318024626509441e-09, 1.641399460794446e-09, 1.7509965699602503e-09, 1.8605936791260547e-09, 1.9701906772695565e-09, 2.0797878974576633e-09, 2.1893848956011652e-09, 2.298982115789272e-09, 2.408579113932774e-09, 2.5181761120762758e-09, 2.6277731102197777e-09, 2.7373703304078845e-09, 2.8469673285513863e-09, 2.9565643266948882e-09]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 11.0, 13.0, 28.0, 79.0, 158.0, 287.0, 239.0, 95.0, 48.0, 31.0, 10.0, 10.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7359845500285473e-09, -2.5041311246809528e-09, -2.2722776993333582e-09, -2.0404242739857636e-09, -1.808570848638169e-09, -1.5767174232905745e-09, -1.34486399794298e-09, -1.1130105725953854e-09, -8.811571472477908e-10, -6.493037219001963e-10, -4.174502965526017e-10, -1.8559687120500712e-10, 4.625655414258745e-11, 2.78109979490182e-10, 5.099634048377766e-10, 7.418168301853711e-10, 9.736702555329657e-10, 1.2055236808805603e-09, 1.4373771062281548e-09, 1.6692305315757494e-09, 1.901083956923344e-09, 2.1329373822709385e-09, 2.364790807618533e-09, 2.5966442329661277e-09, 2.8284976583137222e-09, 3.060351083661317e-09, 3.2922045090089114e-09, 3.524057934356506e-09, 3.7559111376594956e-09, 3.987764785051695e-09, 4.2196184324438946e-09, 4.451471635746884e-09, 4.683324839049874e-09, 4.915178486442073e-09, 5.147031689745063e-09, 5.378884893048053e-09, 5.610738540440252e-09, 5.842592187832452e-09, 6.074445391135441e-09, 6.306298594438431e-09, 6.53815224183063e-09, 6.77000588922283e-09, 7.0018590925258195e-09, 7.233712295828809e-09, 7.465565943221009e-09, 7.697419590613208e-09, 7.929273238005408e-09, 8.161125997219187e-09, 8.392979644611387e-09, 8.624833292003586e-09, 8.856686051217366e-09, 9.088539698609566e-09, 9.320393346001765e-09, 9.552246993393965e-09, 9.784100640786164e-09, 1.0015953399999944e-08, 1.0247807047392143e-08, 1.0479660694784343e-08, 1.0711513453998123e-08, 1.0943367101390322e-08, 1.1175220748782522e-08, 1.1407074396174721e-08, 1.163892804356692e-08, 1.18707808027807e-08, 1.21026344501729e-08]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 7.0, 7.0, 7.0, 7.0, 11.0, 16.0, 15.0, 16.0, 21.0, 35.0, 28.0, 34.0, 46.0, 58.0, 39.0, 51.0, 45.0, 56.0, 53.0, 59.0, 55.0, 41.0, 50.0, 32.0, 39.0, 30.0, 27.0, 22.0, 18.0, 21.0, 11.0, 10.0, 8.0, 6.0, 9.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.6534232588915074e-09, -2.5771995648682378e-09, -2.500975870844968e-09, -2.4247521768216984e-09, -2.3485284827984287e-09, -2.272304566730554e-09, -2.1960808727072845e-09, -2.119857178684015e-09, -2.043633484660745e-09, -1.9674097906374755e-09, -1.8911860966142058e-09, -1.8149622915686336e-09, -1.738738597545364e-09, -1.6625149035220943e-09, -1.5862910984765222e-09, -1.5100674044532525e-09, -1.4338437104299828e-09, -1.3576200164067131e-09, -1.2813963223834435e-09, -1.2051725173378713e-09, -1.1289488233146017e-09, -1.052725129291332e-09, -9.765013242457599e-10, -9.002776302224902e-10, -8.240539361992205e-10, -7.478302421759508e-10, -6.716064926415299e-10, -5.95382743107109e-10, -5.191590490838394e-10, -4.429353273049941e-10, -3.667116055261488e-10, -2.904878559917279e-10, -2.1426438401306314e-10, -1.3804066223421785e-10, -6.181694045537256e-11, 1.4406781323472728e-11, 9.063050310231802e-11, 1.668542248811633e-10, 2.430779466600086e-10, 3.193016961944295e-10, 3.9552539021769917e-10, 4.717490842409688e-10, 5.479728337753897e-10, 6.241965833098106e-10, 7.004202773330803e-10, 7.7664397135635e-10, 8.528677208907709e-10, 9.290914704251918e-10, 1.0053151644484615e-09, 1.0815388584717311e-09, 1.1577625524950008e-09, 1.233986357540573e-09, 1.3102100515638426e-09, 1.3864337455871123e-09, 1.4626575506326844e-09, 1.5388812446559541e-09, 1.6151049386792238e-09, 1.6913286327024935e-09, 1.7675523267257631e-09, 1.8437761317713353e-09, 1.9199997147723025e-09, 1.996223630840177e-09, 2.0724473248634467e-09, 2.1486710188867164e-09, 2.224894712909986e-09]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4096.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 2.0, 8.0, 7.0, 28.0, 30.0, 53.0, 78.0, 137.0, 193.0, 199.0, 102.0, 64.0, 49.0, 23.0, 14.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.275247236928408e-10, -8.68899063810602e-10, -8.102734594395145e-10, -7.516478550684269e-10, -6.930221951861881e-10, -6.343965353039493e-10, -5.757709309328618e-10, -5.171453265617743e-10, -4.585196666795355e-10, -3.998940345528723e-10, -3.4126840242620915e-10, -2.82642770299546e-10, -2.2401713817288282e-10, -1.6539150604621966e-10, -1.067658739195565e-10, -4.8140241792893335e-11, 1.0485390333769828e-11, 6.911102246043299e-11, 1.2773665458709615e-10, 1.8636228671375932e-10, 2.449879188404225e-10, 3.0361355096708564e-10, 3.622391830937488e-10, 4.2086481522041197e-10, 4.794904473470751e-10, 5.381161072293139e-10, 5.967417116004015e-10, 6.55367315971489e-10, 7.139929758537278e-10, 7.726186357359666e-10, 8.312442401070541e-10, 8.898698444781417e-10, 9.484955043603804e-10, 1.0071211642426192e-09, 1.065746824124858e-09, 1.1243723729847943e-09, 1.182998032867033e-09, 1.2416236927492719e-09, 1.3002492416092082e-09, 1.358874901491447e-09, 1.4175005613736857e-09, 1.4761262212559245e-09, 1.5347518811381633e-09, 1.5933774299980996e-09, 1.6520030898803384e-09, 1.7106287497625772e-09, 1.7692542986225135e-09, 1.8278799585047523e-09, 1.886505618386991e-09, 1.9451311672469274e-09, 2.0037569381514686e-09, 2.062382487011405e-09, 2.121008257915946e-09, 2.1796338067758825e-09, 2.2382593556358188e-09, 2.29688512654036e-09, 2.3555106754002963e-09, 2.4141362242602327e-09, 2.472761995164774e-09, 2.5313875440247102e-09, 2.5900130928846465e-09, 2.6486388637891878e-09, 2.707264412649124e-09, 2.7658901835536653e-09, 2.8245157324136017e-09]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 1.0, 5.0, 10.0, 7.0, 7.0, 18.0, 14.0, 21.0, 13.0, 25.0, 32.0, 23.0, 23.0, 38.0, 35.0, 54.0, 44.0, 55.0, 56.0, 60.0, 52.0, 39.0, 43.0, 43.0, 34.0, 29.0, 31.0, 24.0, 25.0, 23.0, 19.0, 21.0, 19.0, 15.0, 11.0, 4.0, 2.0, 4.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.090763059520611e-10, -7.830818216092439e-10, -7.570872817552754e-10, -7.310927974124581e-10, -7.050982575584896e-10, -6.791037732156724e-10, -6.531092333617039e-10, -6.271147490188866e-10, -6.011202091649182e-10, -5.751257248221009e-10, -5.491311849681324e-10, -5.231367006253151e-10, -4.971421607713467e-10, -4.711476764285294e-10, -4.451531365745609e-10, -4.1915865223174364e-10, -3.9316414013335077e-10, -3.671696280349579e-10, -3.41175115936565e-10, -3.1518060383817215e-10, -2.8918609173977927e-10, -2.631915796413864e-10, -2.3719709529856914e-10, -2.1120256932238846e-10, -1.8520805722399558e-10, -1.592135451256027e-10, -1.3321903302720983e-10, -1.0722452786771086e-10, -8.123001576931799e-11, -5.5235510609819016e-11, -2.924099851142614e-11, -3.246486413033267e-12, 2.2748025685359607e-11, 4.874253778375248e-11, 7.473704988214536e-11, 1.0073155504164433e-10, 1.267260740789311e-10, 1.5272057229953617e-10, 1.7871508439792905e-10, 2.0470959649632192e-10, 2.307041085947148e-10, 2.5669860681531986e-10, 2.8269311891371274e-10, 3.086876310121056e-10, 3.346821431104985e-10, 3.6067665520889136e-10, 3.8667116730728424e-10, 4.126656794056771e-10, 4.3866019150407e-10, 4.6465470360246286e-10, 4.906491879452801e-10, 5.166437277992486e-10, 5.426382121420659e-10, 5.686327519960344e-10, 5.946272363388516e-10, 6.206217761928201e-10, 6.466162605356374e-10, 6.726107448784546e-10, 6.986052847324231e-10, 7.245997690752404e-10, 7.505943089292089e-10, 7.765887932720261e-10, 8.025833331259946e-10, 8.285778174688119e-10, 8.545723573227804e-10]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 2.0, 4.0, 11.0, 13.0, 19.0, 22.0, 43.0, 46.0, 63.0, 90.0, 112.0, 126.0, 132.0, 81.0, 59.0, 50.0, 42.0, 19.0, 16.0, 9.0, 15.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.771507964411285e-10, -8.425705688708263e-10, -8.079903968116753e-10, -7.734102247525243e-10, -7.388299971822221e-10, -7.042497696119199e-10, -6.696695975527689e-10, -6.350894254936179e-10, -6.005091979233157e-10, -5.659289703530135e-10, -5.313487982938625e-10, -4.967686262347115e-10, -4.621883986644093e-10, -4.276081988496827e-10, -3.930279990349561e-10, -3.584477992202295e-10, -3.238675994055029e-10, -2.892873995907763e-10, -2.547071997760497e-10, -2.2012699996132312e-10, -1.8554680014659652e-10, -1.5096660033186993e-10, -1.1638640051714333e-10, -8.180620070241673e-11, -4.7226000887690134e-11, -1.2645801072963536e-11, 2.193439874176306e-11, 5.651459855648966e-11, 9.109479837121626e-11, 1.2567499818594285e-10, 1.6025519800066945e-10, 1.9483539781539605e-10, 2.294157086524251e-10, 2.639959084671517e-10, 2.985761082818783e-10, 3.331563080966049e-10, 3.677365079113315e-10, 4.023167077260581e-10, 4.368969075407847e-10, 4.714770795999357e-10, 5.060573071702379e-10, 5.406375347405401e-10, 5.752177067996911e-10, 6.097978788588421e-10, 6.443781064291443e-10, 6.789583339994465e-10, 7.135385060585975e-10, 7.481186781177485e-10, 7.826989056880507e-10, 8.172791332583529e-10, 8.518593053175039e-10, 8.864394773766548e-10, 9.210197049469571e-10, 9.555999325172593e-10, 9.901801600875615e-10, 1.0247602766355612e-09, 1.0593405042058635e-09, 1.0939207317761657e-09, 1.1285008483241654e-09, 1.1630810758944676e-09, 1.1976613034647698e-09, 1.232241531035072e-09, 1.2668217586053743e-09, 1.301401875153374e-09, 1.3359821027236762e-09]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 0.0, 4.0, 5.0, 0.0, 5.0, 5.0, 12.0, 4.0, 10.0, 14.0, 19.0, 15.0, 16.0, 15.0, 39.0, 31.0, 29.0, 38.0, 36.0, 46.0, 53.0, 52.0, 56.0, 62.0, 49.0, 47.0, 50.0, 31.0, 32.0, 34.0, 23.0, 29.0, 28.0, 23.0, 17.0, 15.0, 20.0, 11.0, 8.0, 3.0, 4.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.317131262534303e-10, -6.105670413703024e-10, -5.894210119983256e-10, -5.682749271151977e-10, -5.471288977432209e-10, -5.25982812860093e-10, -5.04836727976965e-10, -4.83690643093837e-10, -4.625446137218603e-10, -4.4139855659430793e-10, -4.202524994667556e-10, -3.991064145836276e-10, -3.7796035745607526e-10, -3.568143003285229e-10, -3.3566821544539494e-10, -3.145221583178426e-10, -2.9337610119029023e-10, -2.722300440627379e-10, -2.510839869351855e-10, -2.2993790205205755e-10, -2.087918449245052e-10, -1.8764578779695285e-10, -1.6649971679161268e-10, -1.4535364578627252e-10, -1.2420758865872017e-10, -1.0306152459227391e-10, -8.191546052582765e-11, -6.07693964593814e-11, -3.962333239293514e-11, -1.8477268326488883e-11, 2.6687957399573747e-12, 2.3814866745297536e-11, 4.496086836169866e-11, 6.610693242814492e-11, 8.725299649459117e-11, 1.0839906056103743e-10, 1.295451246274837e-10, 1.5069118175503604e-10, 1.718372527603762e-10, 1.9298332376571636e-10, 2.1412938089326872e-10, 2.3527543802082107e-10, 2.564214951483734e-10, 2.775675800315014e-10, 2.9871363715905375e-10, 3.198596942866061e-10, 3.4100577916973407e-10, 3.621518362972864e-10, 3.832978934248388e-10, 4.0444395055239113e-10, 4.255900076799435e-10, 4.4673609256307145e-10, 4.678821774461994e-10, 4.890282068181762e-10, 5.101742917013041e-10, 5.313203210732809e-10, 5.524664059564088e-10, 5.736124908395368e-10, 5.947585202115135e-10, 6.159046050946415e-10, 6.370506344666182e-10, 6.581967193497462e-10, 6.793428042328742e-10, 7.004888891160022e-10, 7.216349184879789e-10]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 7.0, 16.0, 12.0, 52.0, 108.0, 228.0, 290.0, 151.0, 92.0, 26.0, 22.0, 6.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.304039122997153e-10, -7.411964375592106e-10, -6.519889073075547e-10, -5.627813770558987e-10, -4.73573902315394e-10, -3.8436639981931364e-10, -2.951588973232333e-10, -2.0595142258272858e-10, -1.1674389233107263e-10, -2.7536389834992292e-11, 6.167111266108805e-11, 1.5087861515716838e-10, 2.400861176532487e-10, 3.2929362014932906e-10, 4.185011226454094e-10, 5.077085973859141e-10, 5.969161276375701e-10, 6.861236023780748e-10, 7.753311326297307e-10, 8.645386628813867e-10, 9.537461931330427e-10, 1.0429536123623961e-09, 1.132161142614052e-09, 1.2213685618434056e-09, 1.3105760920950615e-09, 1.3997836223467175e-09, 1.4889911525983734e-09, 1.578198571827727e-09, 1.6674061020793829e-09, 1.7566136323310388e-09, 1.8458210515603923e-09, 1.9350285818120483e-09, 2.024236334108309e-09, 2.113443864359965e-09, 2.202651394611621e-09, 2.291858924863277e-09, 2.381066455114933e-09, 2.470273763321984e-09, 2.55948129357364e-09, 2.648688823825296e-09, 2.737896354076952e-09, 2.827103884328608e-09, 2.9163114145802638e-09, 3.0055189448319197e-09, 3.0947262530389708e-09, 3.1839337832906267e-09, 3.2731413135422827e-09, 3.3623488437939386e-09, 3.4515563740455946e-09, 3.5407639042972505e-09, 3.6299714345489065e-09, 3.7191789648005624e-09, 3.808386495052218e-09, 3.897593803259269e-09, 3.98680155555553e-09, 4.076008863762581e-09, 4.165216616058842e-09, 4.254423924265893e-09, 4.343631676562154e-09, 4.432838984769205e-09, 4.522046737065466e-09, 4.611254045272517e-09, 4.700461797568778e-09, 4.789669105775829e-09, 4.87887641398288e-09]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 9.0, 2.0, 5.0, 11.0, 10.0, 9.0, 16.0, 20.0, 18.0, 32.0, 24.0, 22.0, 50.0, 46.0, 37.0, 61.0, 58.0, 75.0, 62.0, 60.0, 56.0, 53.0, 34.0, 41.0, 29.0, 29.0, 22.0, 23.0, 22.0, 16.0, 17.0, 8.0, 6.0, 1.0, 6.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0517692272671297e-09, -1.0126870453319725e-09, -9.736049744191178e-10, -9.345227924839605e-10, -8.954406105488033e-10, -8.563584841247973e-10, -8.172763577007913e-10, -7.781941757656341e-10, -7.391120493416281e-10, -7.000299229176221e-10, -6.609477409824649e-10, -6.218656145584589e-10, -5.827834881344529e-10, -5.437013061992957e-10, -5.046191797752897e-10, -4.655370255957081e-10, -4.264548714161265e-10, -3.8737271723654487e-10, -3.4829056305696326e-10, -3.0920843663295727e-10, -2.7012628245337567e-10, -2.3104412827379406e-10, -1.9196200184978807e-10, -1.5287984767020646e-10, -1.1379769349062485e-10, -7.471554624993715e-11, -3.5633399009249445e-11, 3.448741292544355e-12, 4.253089547212596e-11, 8.161304965170757e-11, 1.2069517607571356e-10, 1.5977733025529517e-10, 1.9885937341257431e-10, 2.379415275921559e-10, 2.7702368177173753e-10, 3.161058081957435e-10, 3.5518796237532513e-10, 3.9427011655490674e-10, 4.3335224297891273e-10, 4.7243442491407e-10, 5.115165513380759e-10, 5.505986777620819e-10, 5.896808596972392e-10, 6.287629861212451e-10, 6.678451125452511e-10, 7.069272944804084e-10, 7.460094209044144e-10, 7.850915473284203e-10, 8.241737292635776e-10, 8.632558556875836e-10, 9.023380376227408e-10, 9.414201640467468e-10, 9.80502345981904e-10, 1.0195844168947588e-09, 1.058666598829916e-09, 1.0977487807650732e-09, 1.136830851677928e-09, 1.1759130336130852e-09, 1.21499510452594e-09, 1.2540772864610972e-09, 1.2931594683962544e-09, 1.3322416503314116e-09, 1.3713237212442664e-09, 1.4104059031794236e-09, 1.4494880851145808e-09]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 13.0, 15.0, 13.0, 15.0, 24.0, 31.0, 40.0, 53.0, 84.0, 129.0, 216.0, 465.0, 1137.0, 517847.0, 2375.0, 880.0, 336.0, 184.0, 101.0, 68.0, 62.0, 38.0, 27.0, 23.0, 8.0, 9.0, 16.0, 13.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4253824787147096e-08, -1.3791398245643904e-08, -1.3328971704140713e-08, -1.2866545162637522e-08, -1.240411862113433e-08, -1.1941692079631139e-08, -1.1479265538127947e-08, -1.1016838996624756e-08, -1.0554412455121565e-08, -1.0091985913618373e-08, -9.629559372115182e-09, -9.16713283061199e-09, -8.704706289108799e-09, -8.242279747605608e-09, -7.779853206102416e-09, -7.317426664599225e-09, -6.855000123096033e-09, -6.392573581592842e-09, -5.9301470400896505e-09, -5.467720498586459e-09, -5.005293957083268e-09, -4.542867415580076e-09, -4.080440874076885e-09, -3.6180143325736935e-09, -3.155587791070502e-09, -2.6931612495673107e-09, -2.2307347080641193e-09, -1.768308166560928e-09, -1.3058816250577365e-09, -8.434550835545451e-10, -3.810285420513537e-10, 8.139799945183768e-11, 5.438245409550291e-10, 1.0062510824582205e-09, 1.4686776239614119e-09, 1.9311041654646033e-09, 2.3935307069677947e-09, 2.855957248470986e-09, 3.3183837899741775e-09, 3.780810331477369e-09, 4.24323687298056e-09, 4.705663414483752e-09, 5.168089955986943e-09, 5.6305164974901345e-09, 6.092943038993326e-09, 6.555369580496517e-09, 7.017796121999709e-09, 7.4802226635029e-09, 7.942649205006092e-09, 8.405075746509283e-09, 8.867502288012474e-09, 9.329928829515666e-09, 9.792355371018857e-09, 1.0254781912522049e-08, 1.071720845402524e-08, 1.1179634995528431e-08, 1.1642061537031623e-08, 1.2104488078534814e-08, 1.2566914620038006e-08, 1.3029341161541197e-08, 1.3491767703044388e-08, 1.395419424454758e-08, 1.4416620786050771e-08, 1.4879047327553963e-08, 1.5341473869057154e-08]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 7.0, 11.0, 18.0, 19.0, 18.0, 25.0, 22.0, 23.0, 35.0, 37.0, 36.0, 37.0, 45.0, 56.0, 1109.0, 66.0, 60.0, 49.0, 51.0, 40.0, 35.0, 30.0, 22.0, 25.0, 23.0, 16.0, 25.0, 10.0, 11.0, 7.0, 8.0, 7.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5647270146246228e-08, -1.512314362628331e-08, -1.4599017106320389e-08, -1.4074891474535889e-08, -1.3550764954572969e-08, -1.302663843461005e-08, -1.250251280282555e-08, -1.197838628286263e-08, -1.145425976289971e-08, -1.093013324293679e-08, -1.040600672297387e-08, -9.88188109118937e-09, -9.357754571226451e-09, -8.833628051263531e-09, -8.309502419479031e-09, -7.785375899516112e-09, -7.261249379553192e-09, -6.737122859590272e-09, -6.212996783716562e-09, -5.6888707078428524e-09, -5.164744187879933e-09, -4.640617667917013e-09, -4.116491592043303e-09, -3.5923652941249884e-09, -3.0682389962066736e-09, -2.544112698288359e-09, -2.019986400370044e-09, -1.4958601024517293e-09, -9.717338045334145e-10, -4.4760750661509974e-10, 7.651879130321504e-11, 6.006450892215298e-10, 1.124773163496684e-09, 1.6488994614149988e-09, 2.1730257593333135e-09, 2.6971520572516283e-09, 3.221278355169943e-09, 3.745404875132863e-09, 4.269530951006573e-09, 4.7936570268802825e-09, 5.317783546843202e-09, 5.841910066806122e-09, 6.366036142679832e-09, 6.890162218553542e-09, 7.414288738516461e-09, 7.938415258479381e-09, 8.462540890263881e-09, 8.9866674102268e-09, 9.51079393018972e-09, 1.003492045015264e-08, 1.055904697011556e-08, 1.108317260190006e-08, 1.160729912186298e-08, 1.21314256418259e-08, 1.26555512736104e-08, 1.3179677793573319e-08, 1.3703804313536239e-08, 1.4227930833499158e-08, 1.4752057353462078e-08, 1.5276183873424998e-08, 1.5800310393387917e-08, 1.6324435136993998e-08, 1.6848561656956917e-08, 1.7372688176919837e-08, 1.7896814696882757e-08]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 7.0, 7.0, 12.0, 13.0, 11.0, 15.0, 22.0, 35.0, 52.0, 70.0, 109.0, 147.0, 282.0, 508.0, 1167.0, 3281.0, 9071.0, 24439.0, 31181160.0, 20891.0, 9771.0, 2248.0, 476.0, 225.0, 141.0, 72.0, 72.0, 56.0, 47.0, 32.0, 25.0, 12.0, 12.0, 3.0, 10.0], "bins": [-474.75, -464.740234375, -454.73046875, -444.720703125, -434.7109375, -424.701171875, -414.69140625, -404.681640625, -394.671875, -384.662109375, -374.65234375, -364.642578125, -354.6328125, -344.623046875, -334.61328125, -324.603515625, -314.59375, -304.583984375, -294.57421875, -284.564453125, -274.5546875, -264.544921875, -254.53515625, -244.525390625, -234.515625, -224.505859375, -214.49609375, -204.486328125, -194.4765625, -184.466796875, -174.45703125, -164.447265625, -154.4375, -144.427734375, -134.41796875, -124.408203125, -114.3984375, -104.388671875, -94.37890625, -84.369140625, -74.359375, -64.349609375, -54.33984375, -44.330078125, -34.3203125, -24.310546875, -14.30078125, -4.291015625, 5.71875, 15.728515625, 25.73828125, 35.748046875, 45.7578125, 55.767578125, 65.77734375, 75.787109375, 85.796875, 95.806640625, 105.81640625, 115.826171875, 125.8359375, 135.845703125, 145.85546875, 155.865234375, 165.875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 4.0, 12.0, 9.0, 13.0, 11.0, 39.0, 32.0, 45.0, 55.0, 97.0, 131.0, 188.0, 246.0, 406.0, 598.0, 995.0, 1616.0, 2689.0, 4804.0, 9100.0, 18615.0, 41634.0, 101077.0, 289104.0, 1429453.0, 3697977.0, 445018.0, 141308.0, 55560.0, 24123.0, 11658.0, 6082.0, 3324.0, 1934.0, 1180.0, 727.0, 466.0, 328.0, 237.0, 173.0, 99.0, 75.0, 53.0, 39.0, 29.0, 32.0, 16.0, 15.0, 5.0, 2.0, 5.0, 2.0, 5.0], "bins": [-4.21484375, -4.098297119140625, -3.98175048828125, -3.865203857421875, -3.7486572265625, -3.632110595703125, -3.51556396484375, -3.399017333984375, -3.282470703125, -3.165924072265625, -3.04937744140625, -2.932830810546875, -2.8162841796875, -2.699737548828125, -2.58319091796875, -2.466644287109375, -2.35009765625, -2.233551025390625, -2.11700439453125, -2.000457763671875, -1.8839111328125, -1.767364501953125, -1.65081787109375, -1.534271240234375, -1.417724609375, -1.301177978515625, -1.18463134765625, -1.068084716796875, -0.9515380859375, -0.834991455078125, -0.71844482421875, -0.601898193359375, -0.4853515625, -0.368804931640625, -0.25225830078125, -0.135711669921875, -0.0191650390625, 0.097381591796875, 0.21392822265625, 0.330474853515625, 0.447021484375, 0.563568115234375, 0.68011474609375, 0.796661376953125, 0.9132080078125, 1.029754638671875, 1.14630126953125, 1.262847900390625, 1.37939453125, 1.495941162109375, 1.61248779296875, 1.729034423828125, 1.8455810546875, 1.962127685546875, 2.07867431640625, 2.195220947265625, 2.311767578125, 2.428314208984375, 2.54486083984375, 2.661407470703125, 2.7779541015625, 2.894500732421875, 3.01104736328125, 3.127593994140625, 3.244140625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 3.0, 8.0, 7.0, 13.0, 10.0, 19.0, 11.0, 17.0, 26.0, 22.0, 30.0, 34.0, 48.0, 57.0, 81.0, 111.0, 152.0, 249.0, 356.0, 200.0, 107.0, 82.0, 58.0, 53.0, 42.0, 39.0, 28.0, 29.0, 23.0, 19.0, 17.0, 7.0, 10.0, 10.0, 13.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 4.0, 5.0, 1.0, 0.0, 3.0], "bins": [-3.544921875, -3.447723388671875, -3.35052490234375, -3.253326416015625, -3.1561279296875, -3.058929443359375, -2.96173095703125, -2.864532470703125, -2.767333984375, -2.670135498046875, -2.57293701171875, -2.475738525390625, -2.3785400390625, -2.281341552734375, -2.18414306640625, -2.086944580078125, -1.98974609375, -1.892547607421875, -1.79534912109375, -1.698150634765625, -1.6009521484375, -1.503753662109375, -1.40655517578125, -1.309356689453125, -1.212158203125, -1.114959716796875, -1.01776123046875, -0.920562744140625, -0.8233642578125, -0.726165771484375, -0.62896728515625, -0.531768798828125, -0.4345703125, -0.337371826171875, -0.24017333984375, -0.142974853515625, -0.0457763671875, 0.051422119140625, 0.14862060546875, 0.245819091796875, 0.343017578125, 0.440216064453125, 0.53741455078125, 0.634613037109375, 0.7318115234375, 0.829010009765625, 0.92620849609375, 1.023406982421875, 1.12060546875, 1.217803955078125, 1.31500244140625, 1.412200927734375, 1.5093994140625, 1.606597900390625, 1.70379638671875, 1.800994873046875, 1.898193359375, 1.995391845703125, 2.09259033203125, 2.189788818359375, 2.2869873046875, 2.384185791015625, 2.48138427734375, 2.578582763671875, 2.67578125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 13.0, 8.0, 13.0, 19.0, 25.0, 41.0, 54.0, 71.0, 93.0, 137.0, 215.0, 326.0, 461.0, 680.0, 995.0, 1387.0, 2113.0, 3137.0, 4975.0, 7908.0, 12808.0, 22257.0, 40444.0, 79951.0, 178634.0, 501359.0, 3584658.0, 1271692.0, 315056.0, 125371.0, 59132.0, 30992.0, 17463.0, 10211.0, 6383.0, 4086.0, 2723.0, 1822.0, 1236.0, 827.0, 526.0, 323.0, 240.0, 165.0, 120.0, 88.0, 56.0, 44.0, 25.0, 29.0, 16.0, 14.0, 12.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.12109375, -2.049896240234375, -1.97869873046875, -1.907501220703125, -1.8363037109375, -1.765106201171875, -1.69390869140625, -1.622711181640625, -1.551513671875, -1.480316162109375, -1.40911865234375, -1.337921142578125, -1.2667236328125, -1.195526123046875, -1.12432861328125, -1.053131103515625, -0.98193359375, -0.910736083984375, -0.83953857421875, -0.768341064453125, -0.6971435546875, -0.625946044921875, -0.55474853515625, -0.483551025390625, -0.412353515625, -0.341156005859375, -0.26995849609375, -0.198760986328125, -0.1275634765625, -0.056365966796875, 0.01483154296875, 0.086029052734375, 0.1572265625, 0.228424072265625, 0.29962158203125, 0.370819091796875, 0.4420166015625, 0.513214111328125, 0.58441162109375, 0.655609130859375, 0.726806640625, 0.798004150390625, 0.86920166015625, 0.940399169921875, 1.0115966796875, 1.082794189453125, 1.15399169921875, 1.225189208984375, 1.29638671875, 1.367584228515625, 1.43878173828125, 1.509979248046875, 1.5811767578125, 1.652374267578125, 1.72357177734375, 1.794769287109375, 1.865966796875, 1.937164306640625, 2.00836181640625, 2.079559326171875, 2.1507568359375, 2.221954345703125, 2.29315185546875, 2.364349365234375, 2.435546875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 5.0, 12.0, 14.0, 13.0, 12.0, 24.0, 26.0, 51.0, 39.0, 68.0, 78.0, 95.0, 142.0, 213.0, 366.0, 234.0, 131.0, 100.0, 75.0, 54.0, 49.0, 31.0, 28.0, 20.0, 25.0, 20.0, 21.0, 8.0, 10.0, 11.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6015625, -2.511627197265625, -2.42169189453125, -2.331756591796875, -2.2418212890625, -2.151885986328125, -2.06195068359375, -1.972015380859375, -1.882080078125, -1.792144775390625, -1.70220947265625, -1.612274169921875, -1.5223388671875, -1.432403564453125, -1.34246826171875, -1.252532958984375, -1.16259765625, -1.072662353515625, -0.98272705078125, -0.892791748046875, -0.8028564453125, -0.712921142578125, -0.62298583984375, -0.533050537109375, -0.443115234375, -0.353179931640625, -0.26324462890625, -0.173309326171875, -0.0833740234375, 0.006561279296875, 0.09649658203125, 0.186431884765625, 0.2763671875, 0.366302490234375, 0.45623779296875, 0.546173095703125, 0.6361083984375, 0.726043701171875, 0.81597900390625, 0.905914306640625, 0.995849609375, 1.085784912109375, 1.17572021484375, 1.265655517578125, 1.3555908203125, 1.445526123046875, 1.53546142578125, 1.625396728515625, 1.71533203125, 1.805267333984375, 1.89520263671875, 1.985137939453125, 2.0750732421875, 2.165008544921875, 2.25494384765625, 2.344879150390625, 2.434814453125, 2.524749755859375, 2.61468505859375, 2.704620361328125, 2.7945556640625, 2.884490966796875, 2.97442626953125, 3.064361572265625, 3.154296875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 4.0, 7.0, 7.0, 19.0, 22.0, 18.0, 28.0, 35.0, 39.0, 63.0, 82.0, 102.0, 141.0, 191.0, 258.0, 354.0, 465.0, 773.0, 1459.0, 3041.0, 6643.0, 17175.0, 71614.0, 6026832.0, 121824.0, 23731.0, 8205.0, 3592.0, 1714.0, 983.0, 587.0, 397.0, 235.0, 176.0, 134.0, 116.0, 73.0, 69.0, 54.0, 48.0, 42.0, 20.0, 10.0, 14.0, 9.0, 4.0, 10.0, 5.0, 6.0, 1.0, 5.0, 3.0], "bins": [-16.140625, -15.6876220703125, -15.234619140625, -14.7816162109375, -14.32861328125, -13.8756103515625, -13.422607421875, -12.9696044921875, -12.5166015625, -12.0635986328125, -11.610595703125, -11.1575927734375, -10.70458984375, -10.2515869140625, -9.798583984375, -9.3455810546875, -8.892578125, -8.4395751953125, -7.986572265625, -7.5335693359375, -7.08056640625, -6.6275634765625, -6.174560546875, -5.7215576171875, -5.2685546875, -4.8155517578125, -4.362548828125, -3.9095458984375, -3.45654296875, -3.0035400390625, -2.550537109375, -2.0975341796875, -1.64453125, -1.1915283203125, -0.738525390625, -0.2855224609375, 0.16748046875, 0.6204833984375, 1.073486328125, 1.5264892578125, 1.9794921875, 2.4324951171875, 2.885498046875, 3.3385009765625, 3.79150390625, 4.2445068359375, 4.697509765625, 5.1505126953125, 5.603515625, 6.0565185546875, 6.509521484375, 6.9625244140625, 7.41552734375, 7.8685302734375, 8.321533203125, 8.7745361328125, 9.2275390625, 9.6805419921875, 10.133544921875, 10.5865478515625, 11.03955078125, 11.4925537109375, 11.945556640625, 12.3985595703125, 12.8515625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 9.0, 12.0, 14.0, 13.0, 17.0, 26.0, 25.0, 48.0, 56.0, 99.0, 104.0, 147.0, 208.0, 345.0, 377.0, 121.0, 72.0, 57.0, 41.0, 40.0, 34.0, 21.0, 28.0, 18.0, 10.0, 18.0, 6.0, 8.0, 6.0, 4.0, 5.0, 0.0, 3.0, 3.0, 3.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.015625, -2.915863037109375, -2.81610107421875, -2.716339111328125, -2.6165771484375, -2.516815185546875, -2.41705322265625, -2.317291259765625, -2.217529296875, -2.117767333984375, -2.01800537109375, -1.918243408203125, -1.8184814453125, -1.718719482421875, -1.61895751953125, -1.519195556640625, -1.41943359375, -1.319671630859375, -1.21990966796875, -1.120147705078125, -1.0203857421875, -0.920623779296875, -0.82086181640625, -0.721099853515625, -0.621337890625, -0.521575927734375, -0.42181396484375, -0.322052001953125, -0.2222900390625, -0.122528076171875, -0.02276611328125, 0.076995849609375, 0.1767578125, 0.276519775390625, 0.37628173828125, 0.476043701171875, 0.5758056640625, 0.675567626953125, 0.77532958984375, 0.875091552734375, 0.974853515625, 1.074615478515625, 1.17437744140625, 1.274139404296875, 1.3739013671875, 1.473663330078125, 1.57342529296875, 1.673187255859375, 1.77294921875, 1.872711181640625, 1.97247314453125, 2.072235107421875, 2.1719970703125, 2.271759033203125, 2.37152099609375, 2.471282958984375, 2.571044921875, 2.670806884765625, 2.77056884765625, 2.870330810546875, 2.9700927734375, 3.069854736328125, 3.16961669921875, 3.269378662109375, 3.369140625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 13.0, 28.0, 139.0, 816.0, 8.0, 4.0, 0.0, 2.0], "bins": [-335.026611328125, -329.36187744140625, -323.6971435546875, -318.0324401855469, -312.3677062988281, -306.7029724121094, -301.0382385253906, -295.3735046386719, -289.70880126953125, -284.0440673828125, -278.37933349609375, -272.7146301269531, -267.0498962402344, -261.3851623535156, -255.72042846679688, -250.05569458007812, -244.39096069335938, -238.72622680664062, -233.06150817871094, -227.3967742919922, -221.7320556640625, -216.06732177734375, -210.402587890625, -204.73785400390625, -199.07313537597656, -193.4084014892578, -187.74368286132812, -182.07894897460938, -176.41421508789062, -170.74949645996094, -165.0847625732422, -159.4200439453125, -153.75531005859375, -148.090576171875, -142.4258575439453, -136.76112365722656, -131.09640502929688, -125.43167114257812, -119.76693725585938, -114.10221099853516, -108.43748474121094, -102.77275848388672, -97.1080322265625, -91.44329833984375, -85.77857208251953, -80.11384582519531, -74.44911193847656, -68.78438568115234, -63.11966323852539, -57.454933166503906, -51.79020690917969, -46.12548065185547, -40.460750579833984, -34.7960205078125, -29.13129425048828, -23.466564178466797, -17.801837921142578, -12.137109756469727, -6.472381591796875, -0.8076534271240234, 4.857074737548828, 10.52180290222168, 16.18653106689453, 21.851261138916016, 27.515987396240234]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 11.0, 26.0, 55.0, 576.0, 272.0, 33.0, 14.0, 9.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-77.13157653808594, -75.51822662353516, -73.90487670898438, -72.2915267944336, -70.67817687988281, -69.06482696533203, -67.45147705078125, -65.83812713623047, -64.22477722167969, -62.611427307128906, -60.998077392578125, -59.384727478027344, -57.77137756347656, -56.15802764892578, -54.544677734375, -52.93132781982422, -51.31797790527344, -49.704627990722656, -48.091278076171875, -46.477928161621094, -44.86457824707031, -43.25122833251953, -41.63787841796875, -40.02452850341797, -38.41117477416992, -36.79782485961914, -35.18447494506836, -33.57112503051758, -31.957775115966797, -30.344425201416016, -28.731075286865234, -27.117725372314453, -25.504375457763672, -23.89102554321289, -22.27767562866211, -20.664325714111328, -19.050975799560547, -17.437625885009766, -15.824275016784668, -14.210925102233887, -12.597575187683105, -10.984225273132324, -9.370875358581543, -7.7575249671936035, -6.144175052642822, -4.530824661254883, -2.9174747467041016, -1.3041248321533203, 0.30922508239746094, 1.9225751161575317, 3.5359251499176025, 5.149275302886963, 6.762625217437744, 8.375975608825684, 9.989325523376465, 11.602675437927246, 13.216025352478027, 14.829375267028809, 16.442726135253906, 18.056076049804688, 19.66942596435547, 21.28277587890625, 22.89612579345703, 24.509475708007812, 26.122825622558594]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 10.0, 11.0, 31.0, 38.0, 66.0, 126.0, 177.0, 310.0, 508.0, 869.0, 1518.0, 2924.0, 6327.0, 17531.0, 84827.0, 3616448.0, 399894.0, 39293.0, 12642.0, 5246.0, 2431.0, 1114.0, 621.0, 308.0, 199.0, 162.0, 110.0, 78.0, 72.0, 59.0, 65.0, 43.0, 44.0, 30.0, 28.0, 32.0, 26.0, 18.0, 9.0, 5.0, 8.0, 8.0, 8.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19189453125, -0.18308639526367188, -0.17427825927734375, -0.16547012329101562, -0.1566619873046875, -0.14785385131835938, -0.13904571533203125, -0.13023757934570312, -0.121429443359375, -0.11262130737304688, -0.10381317138671875, -0.09500503540039062, -0.0861968994140625, -0.07738876342773438, -0.06858062744140625, -0.059772491455078125, -0.05096435546875, -0.042156219482421875, -0.03334808349609375, -0.024539947509765625, -0.0157318115234375, -0.006923675537109375, 0.00188446044921875, 0.010692596435546875, 0.019500732421875, 0.028308868408203125, 0.03711700439453125, 0.045925140380859375, 0.0547332763671875, 0.06354141235351562, 0.07234954833984375, 0.08115768432617188, 0.0899658203125, 0.09877395629882812, 0.10758209228515625, 0.11639022827148438, 0.1251983642578125, 0.13400650024414062, 0.14281463623046875, 0.15162277221679688, 0.160430908203125, 0.16923904418945312, 0.17804718017578125, 0.18685531616210938, 0.1956634521484375, 0.20447158813476562, 0.21327972412109375, 0.22208786010742188, 0.23089599609375, 0.23970413208007812, 0.24851226806640625, 0.2573204040527344, 0.2661285400390625, 0.2749366760253906, 0.28374481201171875, 0.2925529479980469, 0.301361083984375, 0.3101692199707031, 0.31897735595703125, 0.3277854919433594, 0.3365936279296875, 0.3454017639160156, 0.35420989990234375, 0.3630180358886719, 0.371826171875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 6.0, 8.0, 11.0, 18.0, 30.0, 79.0, 180.0, 215.0, 213.0, 119.0, 54.0, 21.0, 12.0, 10.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00897216796875, -0.008541345596313477, -0.008110523223876953, -0.00767970085144043, -0.007248878479003906, -0.006818056106567383, -0.006387233734130859, -0.005956411361694336, -0.0055255889892578125, -0.005094766616821289, -0.004663944244384766, -0.004233121871948242, -0.0038022994995117188, -0.0033714771270751953, -0.002940654754638672, -0.0025098323822021484, -0.002079010009765625, -0.0016481876373291016, -0.0012173652648925781, -0.0007865428924560547, -0.00035572052001953125, 7.510185241699219e-05, 0.0005059242248535156, 0.0009367465972900391, 0.0013675689697265625, 0.001798391342163086, 0.0022292137145996094, 0.002660036087036133, 0.0030908584594726562, 0.0035216808319091797, 0.003952503204345703, 0.0043833255767822266, 0.00481414794921875, 0.0052449703216552734, 0.005675792694091797, 0.00610661506652832, 0.006537437438964844, 0.006968259811401367, 0.007399082183837891, 0.007829904556274414, 0.008260726928710938, 0.008691549301147461, 0.009122371673583984, 0.009553194046020508, 0.009984016418457031, 0.010414838790893555, 0.010845661163330078, 0.011276483535766602, 0.011707305908203125, 0.012138128280639648, 0.012568950653076172, 0.012999773025512695, 0.013430595397949219, 0.013861417770385742, 0.014292240142822266, 0.014723062515258789, 0.015153884887695312, 0.015584707260131836, 0.01601552963256836, 0.016446352005004883, 0.016877174377441406, 0.01730799674987793, 0.017738819122314453, 0.018169641494750977, 0.0186004638671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 10.0, 13.0, 27.0, 32.0, 36.0, 54.0, 83.0, 118.0, 166.0, 232.0, 368.0, 561.0, 929.0, 1704.0, 3595.0, 8870.0, 29747.0, 170079.0, 3466554.0, 439535.0, 50142.0, 12292.0, 4280.0, 1993.0, 1021.0, 623.0, 356.0, 261.0, 174.0, 126.0, 78.0, 65.0, 45.0, 28.0, 31.0, 11.0, 14.0, 9.0, 10.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.160888671875, -0.1548614501953125, -0.148834228515625, -0.1428070068359375, -0.13677978515625, -0.1307525634765625, -0.124725341796875, -0.1186981201171875, -0.1126708984375, -0.1066436767578125, -0.100616455078125, -0.0945892333984375, -0.08856201171875, -0.0825347900390625, -0.076507568359375, -0.0704803466796875, -0.064453125, -0.0584259033203125, -0.052398681640625, -0.0463714599609375, -0.04034423828125, -0.0343170166015625, -0.028289794921875, -0.0222625732421875, -0.0162353515625, -0.0102081298828125, -0.004180908203125, 0.0018463134765625, 0.00787353515625, 0.0139007568359375, 0.019927978515625, 0.0259552001953125, 0.031982421875, 0.0380096435546875, 0.044036865234375, 0.0500640869140625, 0.05609130859375, 0.0621185302734375, 0.068145751953125, 0.0741729736328125, 0.0802001953125, 0.0862274169921875, 0.092254638671875, 0.0982818603515625, 0.10430908203125, 0.1103363037109375, 0.116363525390625, 0.1223907470703125, 0.12841796875, 0.1344451904296875, 0.140472412109375, 0.1464996337890625, 0.15252685546875, 0.1585540771484375, 0.164581298828125, 0.1706085205078125, 0.1766357421875, 0.1826629638671875, 0.188690185546875, 0.1947174072265625, 0.20074462890625, 0.2067718505859375, 0.212799072265625, 0.2188262939453125, 0.224853515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 14.0, 9.0, 6.0, 13.0, 12.0, 14.0, 23.0, 32.0, 32.0, 41.0, 39.0, 43.0, 66.0, 73.0, 87.0, 111.0, 135.0, 164.0, 260.0, 366.0, 618.0, 687.0, 285.0, 190.0, 126.0, 124.0, 100.0, 85.0, 68.0, 54.0, 27.0, 31.0, 20.0, 22.0, 21.0, 14.0, 5.0, 12.0, 7.0, 7.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0222930908203125, -0.021657705307006836, -0.021022319793701172, -0.020386934280395508, -0.019751548767089844, -0.01911616325378418, -0.018480777740478516, -0.01784539222717285, -0.017210006713867188, -0.016574621200561523, -0.01593923568725586, -0.015303850173950195, -0.014668464660644531, -0.014033079147338867, -0.013397693634033203, -0.012762308120727539, -0.012126922607421875, -0.011491537094116211, -0.010856151580810547, -0.010220766067504883, -0.009585380554199219, -0.008949995040893555, -0.00831460952758789, -0.0076792240142822266, -0.0070438385009765625, -0.0064084529876708984, -0.005773067474365234, -0.00513768196105957, -0.004502296447753906, -0.003866910934448242, -0.003231525421142578, -0.002596139907836914, -0.00196075439453125, -0.001325368881225586, -0.0006899833679199219, -5.459785461425781e-05, 0.0005807876586914062, 0.0012161731719970703, 0.0018515586853027344, 0.0024869441986083984, 0.0031223297119140625, 0.0037577152252197266, 0.004393100738525391, 0.005028486251831055, 0.005663871765136719, 0.006299257278442383, 0.006934642791748047, 0.007570028305053711, 0.008205413818359375, 0.008840799331665039, 0.009476184844970703, 0.010111570358276367, 0.010746955871582031, 0.011382341384887695, 0.01201772689819336, 0.012653112411499023, 0.013288497924804688, 0.013923883438110352, 0.014559268951416016, 0.01519465446472168, 0.015830039978027344, 0.016465425491333008, 0.017100811004638672, 0.017736196517944336, 0.01837158203125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 5.0, 5.0, 12.0, 44.0, 147.0, 486.0, 270.0, 29.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7916419506073, -2.741672992706299, -2.691704034805298, -2.6417348384857178, -2.591765880584717, -2.541796922683716, -2.491827964782715, -2.4418587684631348, -2.391889810562134, -2.341920852661133, -2.291951894760132, -2.2419826984405518, -2.192013740539551, -2.14204478263855, -2.092075824737549, -2.0421066284179688, -1.9921377897262573, -1.9421688318252563, -1.8921997547149658, -1.8422307968139648, -1.7922617197036743, -1.7422927618026733, -1.6923236846923828, -1.6423547267913818, -1.5923857688903809, -1.5424168109893799, -1.4924477338790894, -1.4424787759780884, -1.3925096988677979, -1.3425407409667969, -1.292571783065796, -1.2426027059555054, -1.1926336288452148, -1.1426646709442139, -1.0926955938339233, -1.0427266359329224, -0.9927575588226318, -0.9427886009216309, -0.8928195834159851, -0.8428505659103394, -0.7928816080093384, -0.7429125905036926, -0.6929435729980469, -0.6429746150970459, -0.5930055379867554, -0.5430365800857544, -0.49306756258010864, -0.4430985450744629, -0.39312952756881714, -0.3431605100631714, -0.29319149255752563, -0.24322250485420227, -0.19325348734855652, -0.14328446984291077, -0.0933154821395874, -0.04334646463394165, 0.0066225528717041016, 0.05659156292676926, 0.10656057298183441, 0.15652957558631897, 0.20649859309196472, 0.2564676105976105, 0.30643659830093384, 0.3564056158065796, 0.40637463331222534]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 12.0, 9.0, 13.0, 18.0, 27.0, 42.0, 49.0, 51.0, 61.0, 68.0, 71.0, 92.0, 63.0, 61.0, 79.0, 65.0, 56.0, 35.0, 27.0, 26.0, 17.0, 20.0, 9.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.313027024269104, -0.3027944564819336, -0.2925618588924408, -0.2823292911052704, -0.2720966935157776, -0.2618641257286072, -0.25163155794143677, -0.24139896035194397, -0.23116639256477356, -0.22093380987644196, -0.21070122718811035, -0.20046865940093994, -0.19023607671260834, -0.18000349402427673, -0.16977091133594513, -0.15953832864761353, -0.14930574595928192, -0.13907316327095032, -0.1288405805826187, -0.1186080053448677, -0.1083754301071167, -0.0981428474187851, -0.08791026473045349, -0.07767768949270248, -0.06744510680437088, -0.057212527841329575, -0.04697994887828827, -0.036747366189956665, -0.02651478722691536, -0.016282208263874054, -0.00604962557554245, 0.004182949662208557, 0.014415532350540161, 0.024648111313581467, 0.03488069027662277, 0.045113272964954376, 0.05534585192799568, 0.06557843089103699, 0.07581101357936859, 0.0860435888171196, 0.0962761715054512, 0.1065087541937828, 0.11674132943153381, 0.12697391211986542, 0.13720649480819702, 0.14743906259536743, 0.15767166018486023, 0.16790422797203064, 0.17813681066036224, 0.18836939334869385, 0.19860197603702545, 0.20883455872535706, 0.21906712651252747, 0.22929970920085907, 0.23953229188919067, 0.24976485967636108, 0.2599974572658539, 0.2702300250530243, 0.2804626226425171, 0.2906951904296875, 0.3009277880191803, 0.3111603558063507, 0.3213929533958435, 0.3316255211830139, 0.3418580889701843]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 5.0, 4.0, 13.0, 16.0, 23.0, 31.0, 56.0, 69.0, 112.0, 149.0, 249.0, 392.0, 682.0, 1179.0, 2329.0, 5014.0, 13705.0, 57161.0, 555060.0, 347709.0, 43880.0, 11457.0, 4453.0, 2096.0, 1048.0, 595.0, 377.0, 215.0, 148.0, 98.0, 59.0, 53.0, 28.0, 22.0, 20.0, 10.0, 6.0, 8.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1419677734375, -0.13765525817871094, -0.13334274291992188, -0.1290302276611328, -0.12471771240234375, -0.12040519714355469, -0.11609268188476562, -0.11178016662597656, -0.1074676513671875, -0.10315513610839844, -0.09884262084960938, -0.09453010559082031, -0.09021759033203125, -0.08590507507324219, -0.08159255981445312, -0.07728004455566406, -0.072967529296875, -0.06865501403808594, -0.06434249877929688, -0.06002998352050781, -0.05571746826171875, -0.05140495300292969, -0.047092437744140625, -0.04277992248535156, -0.0384674072265625, -0.03415489196777344, -0.029842376708984375, -0.025529861450195312, -0.02121734619140625, -0.016904830932617188, -0.012592315673828125, -0.008279800415039062, -0.00396728515625, 0.0003452301025390625, 0.004657745361328125, 0.008970260620117188, 0.01328277587890625, 0.017595291137695312, 0.021907806396484375, 0.026220321655273438, 0.0305328369140625, 0.03484535217285156, 0.039157867431640625, 0.04347038269042969, 0.04778289794921875, 0.05209541320800781, 0.056407928466796875, 0.06072044372558594, 0.065032958984375, 0.06934547424316406, 0.07365798950195312, 0.07797050476074219, 0.08228302001953125, 0.08659553527832031, 0.09090805053710938, 0.09522056579589844, 0.0995330810546875, 0.10384559631347656, 0.10815811157226562, 0.11247062683105469, 0.11678314208984375, 0.12109565734863281, 0.12540817260742188, 0.12972068786621094, 0.134033203125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 2.0, 4.0, 4.0, 10.0, 16.0, 23.0, 35.0, 49.0, 68.0, 92.0, 75.0, 99.0, 119.0, 85.0, 91.0, 66.0, 46.0, 37.0, 24.0, 13.0, 9.0, 13.0, 1.0, 3.0, 8.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00927734375, -0.008988142013549805, -0.00869894027709961, -0.008409738540649414, -0.008120536804199219, -0.007831335067749023, -0.007542133331298828, -0.007252931594848633, -0.0069637298583984375, -0.006674528121948242, -0.006385326385498047, -0.0060961246490478516, -0.005806922912597656, -0.005517721176147461, -0.005228519439697266, -0.00493931770324707, -0.004650115966796875, -0.00436091423034668, -0.004071712493896484, -0.003782510757446289, -0.0034933090209960938, -0.0032041072845458984, -0.002914905548095703, -0.002625703811645508, -0.0023365020751953125, -0.002047300338745117, -0.0017580986022949219, -0.0014688968658447266, -0.0011796951293945312, -0.0008904933929443359, -0.0006012916564941406, -0.0003120899200439453, -2.288818359375e-05, 0.0002663135528564453, 0.0005555152893066406, 0.0008447170257568359, 0.0011339187622070312, 0.0014231204986572266, 0.0017123222351074219, 0.002001523971557617, 0.0022907257080078125, 0.002579927444458008, 0.002869129180908203, 0.0031583309173583984, 0.0034475326538085938, 0.003736734390258789, 0.004025936126708984, 0.00431513786315918, 0.004604339599609375, 0.00489354133605957, 0.005182743072509766, 0.005471944808959961, 0.005761146545410156, 0.0060503482818603516, 0.006339550018310547, 0.006628751754760742, 0.0069179534912109375, 0.007207155227661133, 0.007496356964111328, 0.0077855587005615234, 0.008074760437011719, 0.008363962173461914, 0.00865316390991211, 0.008942365646362305, 0.0092315673828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 5.0, 6.0, 6.0, 12.0, 9.0, 17.0, 25.0, 42.0, 94.0, 114.0, 186.0, 296.0, 611.0, 1195.0, 2386.0, 4878.0, 12800.0, 53503.0, 550534.0, 359885.0, 41989.0, 11116.0, 4323.0, 2118.0, 1121.0, 563.0, 284.0, 167.0, 88.0, 63.0, 32.0, 27.0, 16.0, 14.0, 15.0, 6.0, 1.0, 6.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1375732421875, -0.13297653198242188, -0.12837982177734375, -0.12378311157226562, -0.1191864013671875, -0.11458969116210938, -0.10999298095703125, -0.10539627075195312, -0.100799560546875, -0.09620285034179688, -0.09160614013671875, -0.08700942993164062, -0.0824127197265625, -0.07781600952148438, -0.07321929931640625, -0.06862258911132812, -0.06402587890625, -0.059429168701171875, -0.05483245849609375, -0.050235748291015625, -0.0456390380859375, -0.041042327880859375, -0.03644561767578125, -0.031848907470703125, -0.027252197265625, -0.022655487060546875, -0.01805877685546875, -0.013462066650390625, -0.0088653564453125, -0.004268646240234375, 0.00032806396484375, 0.004924774169921875, 0.009521484375, 0.014118194580078125, 0.01871490478515625, 0.023311614990234375, 0.0279083251953125, 0.032505035400390625, 0.03710174560546875, 0.041698455810546875, 0.046295166015625, 0.050891876220703125, 0.05548858642578125, 0.060085296630859375, 0.0646820068359375, 0.06927871704101562, 0.07387542724609375, 0.07847213745117188, 0.08306884765625, 0.08766555786132812, 0.09226226806640625, 0.09685897827148438, 0.1014556884765625, 0.10605239868164062, 0.11064910888671875, 0.11524581909179688, 0.119842529296875, 0.12443923950195312, 0.12903594970703125, 0.13363265991210938, 0.1382293701171875, 0.14282608032226562, 0.14742279052734375, 0.15201950073242188, 0.1566162109375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 10.0, 11.0, 11.0, 14.0, 14.0, 15.0, 20.0, 23.0, 23.0, 36.0, 29.0, 21.0, 24.0, 39.0, 40.0, 38.0, 33.0, 37.0, 49.0, 42.0, 33.0, 39.0, 39.0, 35.0, 37.0, 29.0, 33.0, 29.0, 17.0, 26.0, 25.0, 20.0, 14.0, 22.0, 10.0, 18.0, 16.0, 7.0, 2.0, 7.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.03997802734375, -0.03886890411376953, -0.03775978088378906, -0.036650657653808594, -0.035541534423828125, -0.034432411193847656, -0.03332328796386719, -0.03221416473388672, -0.03110504150390625, -0.02999591827392578, -0.028886795043945312, -0.027777671813964844, -0.026668548583984375, -0.025559425354003906, -0.024450302124023438, -0.02334117889404297, -0.0222320556640625, -0.02112293243408203, -0.020013809204101562, -0.018904685974121094, -0.017795562744140625, -0.016686439514160156, -0.015577316284179688, -0.014468193054199219, -0.01335906982421875, -0.012249946594238281, -0.011140823364257812, -0.010031700134277344, -0.008922576904296875, -0.007813453674316406, -0.0067043304443359375, -0.005595207214355469, -0.004486083984375, -0.0033769607543945312, -0.0022678375244140625, -0.0011587142944335938, -4.9591064453125e-05, 0.0010595321655273438, 0.0021686553955078125, 0.0032777786254882812, 0.00438690185546875, 0.005496025085449219, 0.0066051483154296875, 0.007714271545410156, 0.008823394775390625, 0.009932518005371094, 0.011041641235351562, 0.012150764465332031, 0.0132598876953125, 0.014369010925292969, 0.015478134155273438, 0.016587257385253906, 0.017696380615234375, 0.018805503845214844, 0.019914627075195312, 0.02102375030517578, 0.02213287353515625, 0.02324199676513672, 0.024351119995117188, 0.025460243225097656, 0.026569366455078125, 0.027678489685058594, 0.028787612915039062, 0.02989673614501953, 0.031005859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 5.0, 9.0, 13.0, 19.0, 22.0, 42.0, 58.0, 103.0, 170.0, 386.0, 1100.0, 4665.0, 59860.0, 956996.0, 20939.0, 2676.0, 783.0, 319.0, 154.0, 83.0, 39.0, 30.0, 23.0, 13.0, 8.0, 12.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.266357421875, -0.2575798034667969, -0.24880218505859375, -0.24002456665039062, -0.2312469482421875, -0.22246932983398438, -0.21369171142578125, -0.20491409301757812, -0.196136474609375, -0.18735885620117188, -0.17858123779296875, -0.16980361938476562, -0.1610260009765625, -0.15224838256835938, -0.14347076416015625, -0.13469314575195312, -0.12591552734375, -0.11713790893554688, -0.10836029052734375, -0.09958267211914062, -0.0908050537109375, -0.08202743530273438, -0.07324981689453125, -0.06447219848632812, -0.055694580078125, -0.046916961669921875, -0.03813934326171875, -0.029361724853515625, -0.0205841064453125, -0.011806488037109375, -0.00302886962890625, 0.005748748779296875, 0.0145263671875, 0.023303985595703125, 0.03208160400390625, 0.040859222412109375, 0.0496368408203125, 0.058414459228515625, 0.06719207763671875, 0.07596969604492188, 0.084747314453125, 0.09352493286132812, 0.10230255126953125, 0.11108016967773438, 0.1198577880859375, 0.12863540649414062, 0.13741302490234375, 0.14619064331054688, 0.15496826171875, 0.16374588012695312, 0.17252349853515625, 0.18130111694335938, 0.1900787353515625, 0.19885635375976562, 0.20763397216796875, 0.21641159057617188, 0.225189208984375, 0.23396682739257812, 0.24274444580078125, 0.2515220642089844, 0.2602996826171875, 0.2690773010253906, 0.27785491943359375, 0.2866325378417969, 0.29541015625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 9.0, 7.0, 12.0, 22.0, 19.0, 35.0, 88.0, 295.0, 308.0, 83.0, 31.0, 28.0, 12.0, 13.0, 6.0, 7.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016450881958007812, -0.00015981122851371765, -0.00015511363744735718, -0.0001504160463809967, -0.00014571845531463623, -0.00014102086424827576, -0.00013632327318191528, -0.0001316256821155548, -0.00012692809104919434, -0.00012223049998283386, -0.00011753290891647339, -0.00011283531785011292, -0.00010813772678375244, -0.00010344013571739197, -9.87425446510315e-05, -9.404495358467102e-05, -8.934736251831055e-05, -8.464977145195007e-05, -7.99521803855896e-05, -7.525458931922913e-05, -7.055699825286865e-05, -6.585940718650818e-05, -6.11618161201477e-05, -5.646422505378723e-05, -5.176663398742676e-05, -4.7069042921066284e-05, -4.237145185470581e-05, -3.767386078834534e-05, -3.297626972198486e-05, -2.827867865562439e-05, -2.3581087589263916e-05, -1.8883496522903442e-05, -1.4185905456542969e-05, -9.488314390182495e-06, -4.7907233238220215e-06, -9.313225746154785e-08, 4.604458808898926e-06, 9.3020498752594e-06, 1.3999640941619873e-05, 1.8697232007980347e-05, 2.339482307434082e-05, 2.8092414140701294e-05, 3.279000520706177e-05, 3.748759627342224e-05, 4.2185187339782715e-05, 4.688277840614319e-05, 5.158036947250366e-05, 5.6277960538864136e-05, 6.097555160522461e-05, 6.567314267158508e-05, 7.037073373794556e-05, 7.506832480430603e-05, 7.97659158706665e-05, 8.446350693702698e-05, 8.916109800338745e-05, 9.385868906974792e-05, 9.85562801361084e-05, 0.00010325387120246887, 0.00010795146226882935, 0.00011264905333518982, 0.00011734664440155029, 0.00012204423546791077, 0.00012674182653427124, 0.00013143941760063171, 0.0001361370086669922]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 4.0, 3.0, 6.0, 4.0, 14.0, 13.0, 11.0, 27.0, 16.0, 48.0, 51.0, 68.0, 99.0, 138.0, 176.0, 287.0, 451.0, 744.0, 1346.0, 2850.0, 7285.0, 29949.0, 735772.0, 238975.0, 19312.0, 5464.0, 2407.0, 1121.0, 665.0, 405.0, 226.0, 172.0, 111.0, 79.0, 54.0, 52.0, 36.0, 32.0, 27.0, 14.0, 8.0, 7.0, 8.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.171142578125, -0.16623497009277344, -0.16132736206054688, -0.1564197540283203, -0.15151214599609375, -0.1466045379638672, -0.14169692993164062, -0.13678932189941406, -0.1318817138671875, -0.12697410583496094, -0.12206649780273438, -0.11715888977050781, -0.11225128173828125, -0.10734367370605469, -0.10243606567382812, -0.09752845764160156, -0.092620849609375, -0.08771324157714844, -0.08280563354492188, -0.07789802551269531, -0.07299041748046875, -0.06808280944824219, -0.06317520141601562, -0.05826759338378906, -0.0533599853515625, -0.04845237731933594, -0.043544769287109375, -0.03863716125488281, -0.03372955322265625, -0.028821945190429688, -0.023914337158203125, -0.019006729125976562, -0.01409912109375, -0.009191513061523438, -0.004283905029296875, 0.0006237030029296875, 0.00553131103515625, 0.010438919067382812, 0.015346527099609375, 0.020254135131835938, 0.0251617431640625, 0.030069351196289062, 0.034976959228515625, 0.03988456726074219, 0.04479217529296875, 0.04969978332519531, 0.054607391357421875, 0.05951499938964844, 0.064422607421875, 0.06933021545410156, 0.07423782348632812, 0.07914543151855469, 0.08405303955078125, 0.08896064758300781, 0.09386825561523438, 0.09877586364746094, 0.1036834716796875, 0.10859107971191406, 0.11349868774414062, 0.11840629577636719, 0.12331390380859375, 0.1282215118408203, 0.13312911987304688, 0.13803672790527344, 0.1429443359375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 10.0, 13.0, 23.0, 31.0, 45.0, 66.0, 94.0, 151.0, 179.0, 143.0, 93.0, 52.0, 31.0, 22.0, 12.0, 7.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09307861328125, -0.0906534194946289, -0.08822822570800781, -0.08580303192138672, -0.08337783813476562, -0.08095264434814453, -0.07852745056152344, -0.07610225677490234, -0.07367706298828125, -0.07125186920166016, -0.06882667541503906, -0.06640148162841797, -0.06397628784179688, -0.06155109405517578, -0.05912590026855469, -0.056700706481933594, -0.0542755126953125, -0.051850318908691406, -0.04942512512207031, -0.04699993133544922, -0.044574737548828125, -0.04214954376220703, -0.03972434997558594, -0.037299156188964844, -0.03487396240234375, -0.032448768615722656, -0.030023574829101562, -0.02759838104248047, -0.025173187255859375, -0.02274799346923828, -0.020322799682617188, -0.017897605895996094, -0.015472412109375, -0.013047218322753906, -0.010622024536132812, -0.008196830749511719, -0.005771636962890625, -0.0033464431762695312, -0.0009212493896484375, 0.0015039443969726562, 0.00392913818359375, 0.006354331970214844, 0.008779525756835938, 0.011204719543457031, 0.013629913330078125, 0.01605510711669922, 0.018480300903320312, 0.020905494689941406, 0.0233306884765625, 0.025755882263183594, 0.028181076049804688, 0.03060626983642578, 0.033031463623046875, 0.03545665740966797, 0.03788185119628906, 0.040307044982910156, 0.04273223876953125, 0.045157432556152344, 0.04758262634277344, 0.05000782012939453, 0.052433013916015625, 0.05485820770263672, 0.05728340148925781, 0.059708595275878906, 0.0621337890625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 11.0, 16.0, 24.0, 56.0, 163.0, 426.0, 205.0, 53.0, 16.0, 13.0, 5.0, 5.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.006993055343628, -2.9411299228668213, -2.8752670288085938, -2.809403896331787, -2.7435407638549805, -2.677677631378174, -2.611814498901367, -2.5459516048431396, -2.480088472366333, -2.4142253398895264, -2.348362445831299, -2.282499313354492, -2.2166361808776855, -2.150773048400879, -2.0849099159240723, -2.0190470218658447, -1.953183889389038, -1.8873207569122314, -1.8214577436447144, -1.7555947303771973, -1.6897315979003906, -1.623868465423584, -1.558005452156067, -1.4921424388885498, -1.4262793064117432, -1.3604161739349365, -1.2945531606674194, -1.2286901473999023, -1.1628270149230957, -1.096963882446289, -1.031100869178772, -0.9652377963066101, -0.8993748426437378, -0.8335117697715759, -0.7676486968994141, -0.7017856240272522, -0.6359225511550903, -0.5700594782829285, -0.5041964054107666, -0.43833333253860474, -0.37247025966644287, -0.306607186794281, -0.24074411392211914, -0.17488104104995728, -0.10901796817779541, -0.043154895305633545, 0.02270817756652832, 0.08857125043869019, 0.15443432331085205, 0.22029739618301392, 0.2861604690551758, 0.35202354192733765, 0.4178866147994995, 0.4837496876716614, 0.5496127605438232, 0.6154758334159851, 0.681338906288147, 0.7472019791603088, 0.8130650520324707, 0.8789281249046326, 0.9447911977767944, 1.0106542110443115, 1.0765173435211182, 1.1423804759979248, 1.208243489265442]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 10.0, 13.0, 17.0, 15.0, 34.0, 48.0, 57.0, 80.0, 84.0, 93.0, 92.0, 101.0, 75.0, 84.0, 57.0, 36.0, 38.0, 14.0, 10.0, 10.0, 5.0, 3.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7356605529785156, -0.7103829383850098, -0.6851052641868591, -0.6598275899887085, -0.6345499753952026, -0.6092723608016968, -0.5839946866035461, -0.5587170124053955, -0.5334393978118896, -0.5081617832183838, -0.48288410902023315, -0.4576064646244049, -0.43232882022857666, -0.4070511758327484, -0.38177353143692017, -0.3564958870410919, -0.33121824264526367, -0.3059405982494354, -0.2806629538536072, -0.25538530945777893, -0.23010766506195068, -0.20483002066612244, -0.1795523762702942, -0.15427473187446594, -0.1289970874786377, -0.10371944308280945, -0.0784417986869812, -0.053164154291152954, -0.027886509895324707, -0.00260886549949646, 0.022668778896331787, 0.047946423292160034, 0.07322412729263306, 0.0985017716884613, 0.12377941608428955, 0.1490570604801178, 0.17433470487594604, 0.1996123492717743, 0.22488999366760254, 0.2501676380634308, 0.27544528245925903, 0.3007229268550873, 0.3260005712509155, 0.3512782156467438, 0.376555860042572, 0.40183350443840027, 0.4271111488342285, 0.45238879323005676, 0.477666437625885, 0.5029441118240356, 0.5282217264175415, 0.5534993410110474, 0.578777015209198, 0.6040546894073486, 0.6293323040008545, 0.6546099185943604, 0.679887592792511, 0.7051652669906616, 0.7304428815841675, 0.7557204961776733, 0.780998170375824, 0.8062758445739746, 0.8315534591674805, 0.8568310737609863, 0.882108747959137]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 1.0, 3.0, 7.0, 6.0, 6.0, 12.0, 15.0, 17.0, 28.0, 55.0, 140.0, 908.0, 41460.0, 4149420.0, 1851.0, 168.0, 53.0, 38.0, 29.0, 13.0, 11.0, 9.0, 6.0, 12.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.08203125, -3.985321044921875, -3.88861083984375, -3.791900634765625, -3.6951904296875, -3.598480224609375, -3.50177001953125, -3.405059814453125, -3.308349609375, -3.211639404296875, -3.11492919921875, -3.018218994140625, -2.9215087890625, -2.824798583984375, -2.72808837890625, -2.631378173828125, -2.53466796875, -2.437957763671875, -2.34124755859375, -2.244537353515625, -2.1478271484375, -2.051116943359375, -1.95440673828125, -1.857696533203125, -1.760986328125, -1.664276123046875, -1.56756591796875, -1.470855712890625, -1.3741455078125, -1.277435302734375, -1.18072509765625, -1.084014892578125, -0.9873046875, -0.890594482421875, -0.79388427734375, -0.697174072265625, -0.6004638671875, -0.503753662109375, -0.40704345703125, -0.310333251953125, -0.213623046875, -0.116912841796875, -0.02020263671875, 0.076507568359375, 0.1732177734375, 0.269927978515625, 0.36663818359375, 0.463348388671875, 0.56005859375, 0.656768798828125, 0.75347900390625, 0.850189208984375, 0.9468994140625, 1.043609619140625, 1.14031982421875, 1.237030029296875, 1.333740234375, 1.430450439453125, 1.52716064453125, 1.623870849609375, 1.7205810546875, 1.817291259765625, 1.91400146484375, 2.010711669921875, 2.107421875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 8.0, 5.0, 10.0, 18.0, 28.0, 20.0, 41.0, 34.0, 60.0, 47.0, 83.0, 82.0, 91.0, 83.0, 84.0, 69.0, 72.0, 39.0, 38.0, 24.0, 14.0, 19.0, 9.0, 6.0, 3.0, 3.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00881195068359375, -0.008541703224182129, -0.008271455764770508, -0.008001208305358887, -0.007730960845947266, -0.0074607133865356445, -0.0071904659271240234, -0.006920218467712402, -0.006649971008300781, -0.00637972354888916, -0.006109476089477539, -0.005839228630065918, -0.005568981170654297, -0.005298733711242676, -0.005028486251831055, -0.004758238792419434, -0.0044879913330078125, -0.004217743873596191, -0.00394749641418457, -0.0036772489547729492, -0.003407001495361328, -0.003136754035949707, -0.002866506576538086, -0.002596259117126465, -0.0023260116577148438, -0.0020557641983032227, -0.0017855167388916016, -0.0015152692794799805, -0.0012450218200683594, -0.0009747743606567383, -0.0007045269012451172, -0.0004342794418334961, -0.000164031982421875, 0.0001062154769897461, 0.0003764629364013672, 0.0006467103958129883, 0.0009169578552246094, 0.0011872053146362305, 0.0014574527740478516, 0.0017277002334594727, 0.0019979476928710938, 0.002268195152282715, 0.002538442611694336, 0.002808690071105957, 0.003078937530517578, 0.0033491849899291992, 0.0036194324493408203, 0.0038896799087524414, 0.0041599273681640625, 0.004430174827575684, 0.004700422286987305, 0.004970669746398926, 0.005240917205810547, 0.005511164665222168, 0.005781412124633789, 0.00605165958404541, 0.006321907043457031, 0.006592154502868652, 0.0068624019622802734, 0.0071326494216918945, 0.007402896881103516, 0.007673144340515137, 0.007943391799926758, 0.008213639259338379, 0.00848388671875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 9.0, 22.0, 73.0, 812.0, 4188260.0, 4350.0, 450.0, 197.0, 70.0, 29.0, 9.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0078125, -0.89105224609375, -0.7742919921875, -0.65753173828125, -0.540771484375, -0.42401123046875, -0.3072509765625, -0.19049072265625, -0.07373046875, 0.04302978515625, 0.1597900390625, 0.27655029296875, 0.393310546875, 0.51007080078125, 0.6268310546875, 0.74359130859375, 0.8603515625, 0.97711181640625, 1.0938720703125, 1.21063232421875, 1.327392578125, 1.44415283203125, 1.5609130859375, 1.67767333984375, 1.79443359375, 1.91119384765625, 2.0279541015625, 2.14471435546875, 2.261474609375, 2.37823486328125, 2.4949951171875, 2.61175537109375, 2.728515625, 2.84527587890625, 2.9620361328125, 3.07879638671875, 3.195556640625, 3.31231689453125, 3.4290771484375, 3.54583740234375, 3.66259765625, 3.77935791015625, 3.8961181640625, 4.01287841796875, 4.129638671875, 4.24639892578125, 4.3631591796875, 4.47991943359375, 4.5966796875, 4.71343994140625, 4.8302001953125, 4.94696044921875, 5.063720703125, 5.18048095703125, 5.2972412109375, 5.41400146484375, 5.53076171875, 5.64752197265625, 5.7642822265625, 5.88104248046875, 5.997802734375, 6.11456298828125, 6.2313232421875, 6.34808349609375, 6.46484375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 8.0, 8.0, 9.0, 13.0, 24.0, 43.0, 47.0, 73.0, 106.0, 262.0, 1668.0, 1055.0, 449.0, 161.0, 68.0, 37.0, 21.0, 4.0, 10.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0345458984375, -0.03321075439453125, -0.0318756103515625, -0.03054046630859375, -0.029205322265625, -0.02787017822265625, -0.0265350341796875, -0.02519989013671875, -0.02386474609375, -0.02252960205078125, -0.0211944580078125, -0.01985931396484375, -0.018524169921875, -0.01718902587890625, -0.0158538818359375, -0.01451873779296875, -0.01318359375, -0.01184844970703125, -0.0105133056640625, -0.00917816162109375, -0.007843017578125, -0.00650787353515625, -0.0051727294921875, -0.00383758544921875, -0.00250244140625, -0.00116729736328125, 0.0001678466796875, 0.00150299072265625, 0.002838134765625, 0.00417327880859375, 0.0055084228515625, 0.00684356689453125, 0.0081787109375, 0.00951385498046875, 0.0108489990234375, 0.01218414306640625, 0.013519287109375, 0.01485443115234375, 0.0161895751953125, 0.01752471923828125, 0.01885986328125, 0.02019500732421875, 0.0215301513671875, 0.02286529541015625, 0.024200439453125, 0.02553558349609375, 0.0268707275390625, 0.02820587158203125, 0.029541015625, 0.03087615966796875, 0.0322113037109375, 0.03354644775390625, 0.034881591796875, 0.03621673583984375, 0.0375518798828125, 0.03888702392578125, 0.04022216796875, 0.04155731201171875, 0.0428924560546875, 0.04422760009765625, 0.045562744140625, 0.04689788818359375, 0.0482330322265625, 0.04956817626953125, 0.0509033203125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 24.0, 967.0, 27.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.859286904335022, -0.47533461451530457, -0.09138232469558716, 0.29256999492645264, 0.6765222549438477, 1.0604745149612427, 1.4444268941879272, 1.8283790349960327, 2.2123312950134277, 2.5962836742401123, 2.9802358150482178, 3.3641881942749023, 3.748140335083008, 4.132092475891113, 4.516045093536377, 4.899997234344482, 5.283949851989746, 5.667901992797852, 6.051854610443115, 6.435806751251221, 6.819758892059326, 7.20371150970459, 7.587663650512695, 7.971615791320801, 8.355567932128906, 8.739520072937012, 9.123472213745117, 9.507425308227539, 9.891377449035645, 10.27532958984375, 10.659281730651855, 11.043233871459961, 11.427186012268066, 11.811138153076172, 12.195090293884277, 12.579042434692383, 12.962995529174805, 13.34694766998291, 13.730899810791016, 14.114851951599121, 14.498804092407227, 14.882756233215332, 15.266708374023438, 15.65066146850586, 16.03461265563965, 16.41856575012207, 16.80251693725586, 17.18647003173828, 17.570423126220703, 17.954376220703125, 18.338327407836914, 18.722280502319336, 19.106231689453125, 19.490184783935547, 19.87413787841797, 20.258089065551758, 20.642040252685547, 21.02599334716797, 21.409944534301758, 21.79389762878418, 22.17784881591797, 22.56180191040039, 22.945755004882812, 23.3297061920166, 23.713659286499023]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 5.0, 12.0, 23.0, 49.0, 76.0, 144.0, 210.0, 201.0, 144.0, 79.0, 39.0, 17.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21184486150741577, -0.18568839132785797, -0.15953192114830017, -0.13337543606758118, -0.10721896588802338, -0.08106249570846558, -0.05490601062774658, -0.028749540448188782, -0.0025930702686309814, 0.023563403636217117, 0.049719877541065216, 0.07587635517120361, 0.10203282535076141, 0.1281892955303192, 0.1543457806110382, 0.180502250790596, 0.2066587209701538, 0.2328151911497116, 0.2589716613292694, 0.2851281464099884, 0.311284601688385, 0.337441086769104, 0.363597571849823, 0.389754056930542, 0.4159105122089386, 0.4420669972896576, 0.4682234525680542, 0.4943799376487732, 0.5205364227294922, 0.5466928482055664, 0.5728493928909302, 0.5990058183670044, 0.6251622438430786, 0.6513187289237976, 0.6774752140045166, 0.7036316394805908, 0.7297881245613098, 0.7559446096420288, 0.7821010947227478, 0.8082575798034668, 0.834414005279541, 0.86057049036026, 0.886726975440979, 0.9128834009170532, 0.9390398859977722, 0.9651963710784912, 0.9913528561592102, 1.0175093412399292, 1.043665885925293, 1.0698223114013672, 1.095978856086731, 1.1221352815628052, 1.148291826248169, 1.1744482517242432, 1.2006046772003174, 1.2267612218856812, 1.2529176473617554, 1.2790740728378296, 1.3052306175231934, 1.3313870429992676, 1.3575435876846313, 1.3837000131607056, 1.4098565578460693, 1.4360129833221436, 1.4621694087982178]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 12.0, 19.0, 17.0, 33.0, 36.0, 53.0, 70.0, 151.0, 207.0, 353.0, 567.0, 1022.0, 1903.0, 3501.0, 7635.0, 17968.0, 53614.0, 234560.0, 564199.0, 108582.0, 30903.0, 11962.0, 5193.0, 2527.0, 1430.0, 781.0, 439.0, 269.0, 179.0, 111.0, 62.0, 52.0, 37.0, 18.0, 19.0, 11.0, 14.0, 6.0, 8.0, 3.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.201171875, -0.19452476501464844, -0.18787765502929688, -0.1812305450439453, -0.17458343505859375, -0.1679363250732422, -0.16128921508789062, -0.15464210510253906, -0.1479949951171875, -0.14134788513183594, -0.13470077514648438, -0.1280536651611328, -0.12140655517578125, -0.11475944519042969, -0.10811233520507812, -0.10146522521972656, -0.094818115234375, -0.08817100524902344, -0.08152389526367188, -0.07487678527832031, -0.06822967529296875, -0.06158256530761719, -0.054935455322265625, -0.04828834533691406, -0.0416412353515625, -0.03499412536621094, -0.028347015380859375, -0.021699905395507812, -0.01505279541015625, -0.008405685424804688, -0.001758575439453125, 0.0048885345458984375, 0.01153564453125, 0.018182754516601562, 0.024829864501953125, 0.03147697448730469, 0.03812408447265625, 0.04477119445800781, 0.051418304443359375, 0.05806541442871094, 0.0647125244140625, 0.07135963439941406, 0.07800674438476562, 0.08465385437011719, 0.09130096435546875, 0.09794807434082031, 0.10459518432617188, 0.11124229431152344, 0.117889404296875, 0.12453651428222656, 0.13118362426757812, 0.1378307342529297, 0.14447784423828125, 0.1511249542236328, 0.15777206420898438, 0.16441917419433594, 0.1710662841796875, 0.17771339416503906, 0.18436050415039062, 0.1910076141357422, 0.19765472412109375, 0.2043018341064453, 0.21094894409179688, 0.21759605407714844, 0.2242431640625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 11.0, 4.0, 8.0, 9.0, 19.0, 23.0, 43.0, 53.0, 37.0, 68.0, 85.0, 83.0, 77.0, 87.0, 86.0, 77.0, 54.0, 43.0, 34.0, 27.0, 22.0, 6.0, 14.0, 15.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01204681396484375, -0.011665105819702148, -0.011283397674560547, -0.010901689529418945, -0.010519981384277344, -0.010138273239135742, -0.00975656509399414, -0.009374856948852539, -0.008993148803710938, -0.008611440658569336, -0.008229732513427734, -0.007848024368286133, -0.007466316223144531, -0.00708460807800293, -0.006702899932861328, -0.0063211917877197266, -0.005939483642578125, -0.0055577754974365234, -0.005176067352294922, -0.00479435920715332, -0.004412651062011719, -0.004030942916870117, -0.0036492347717285156, -0.003267526626586914, -0.0028858184814453125, -0.002504110336303711, -0.0021224021911621094, -0.0017406940460205078, -0.0013589859008789062, -0.0009772777557373047, -0.0005955696105957031, -0.00021386146545410156, 0.0001678466796875, 0.0005495548248291016, 0.0009312629699707031, 0.0013129711151123047, 0.0016946792602539062, 0.002076387405395508, 0.0024580955505371094, 0.002839803695678711, 0.0032215118408203125, 0.003603219985961914, 0.003984928131103516, 0.004366636276245117, 0.004748344421386719, 0.00513005256652832, 0.005511760711669922, 0.0058934688568115234, 0.006275177001953125, 0.0066568851470947266, 0.007038593292236328, 0.00742030143737793, 0.007802009582519531, 0.008183717727661133, 0.008565425872802734, 0.008947134017944336, 0.009328842163085938, 0.009710550308227539, 0.01009225845336914, 0.010473966598510742, 0.010855674743652344, 0.011237382888793945, 0.011619091033935547, 0.012000799179077148, 0.01238250732421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 1.0, 8.0, 5.0, 12.0, 8.0, 18.0, 9.0, 16.0, 15.0, 26.0, 25.0, 50.0, 123.0, 776.0, 12020.0, 980673.0, 52610.0, 1689.0, 228.0, 71.0, 33.0, 18.0, 26.0, 10.0, 9.0, 13.0, 8.0, 9.0, 10.0, 6.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54345703125, -0.5238189697265625, -0.504180908203125, -0.4845428466796875, -0.46490478515625, -0.4452667236328125, -0.425628662109375, -0.4059906005859375, -0.3863525390625, -0.3667144775390625, -0.347076416015625, -0.3274383544921875, -0.30780029296875, -0.2881622314453125, -0.268524169921875, -0.2488861083984375, -0.229248046875, -0.2096099853515625, -0.189971923828125, -0.1703338623046875, -0.15069580078125, -0.1310577392578125, -0.111419677734375, -0.0917816162109375, -0.0721435546875, -0.0525054931640625, -0.032867431640625, -0.0132293701171875, 0.00640869140625, 0.0260467529296875, 0.045684814453125, 0.0653228759765625, 0.0849609375, 0.1045989990234375, 0.124237060546875, 0.1438751220703125, 0.16351318359375, 0.1831512451171875, 0.202789306640625, 0.2224273681640625, 0.2420654296875, 0.2617034912109375, 0.281341552734375, 0.3009796142578125, 0.32061767578125, 0.3402557373046875, 0.359893798828125, 0.3795318603515625, 0.399169921875, 0.4188079833984375, 0.438446044921875, 0.4580841064453125, 0.47772216796875, 0.4973602294921875, 0.516998291015625, 0.5366363525390625, 0.5562744140625, 0.5759124755859375, 0.595550537109375, 0.6151885986328125, 0.63482666015625, 0.6544647216796875, 0.674102783203125, 0.6937408447265625, 0.71337890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 4.0, 7.0, 4.0, 10.0, 4.0, 14.0, 9.0, 14.0, 23.0, 20.0, 21.0, 35.0, 28.0, 39.0, 40.0, 37.0, 40.0, 44.0, 47.0, 46.0, 59.0, 49.0, 62.0, 53.0, 40.0, 42.0, 25.0, 25.0, 40.0, 18.0, 16.0, 13.0, 15.0, 19.0, 8.0, 10.0, 9.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.04669189453125, -0.045372962951660156, -0.04405403137207031, -0.04273509979248047, -0.041416168212890625, -0.04009723663330078, -0.03877830505371094, -0.037459373474121094, -0.03614044189453125, -0.034821510314941406, -0.03350257873535156, -0.03218364715576172, -0.030864715576171875, -0.02954578399658203, -0.028226852416992188, -0.026907920837402344, -0.0255889892578125, -0.024270057678222656, -0.022951126098632812, -0.02163219451904297, -0.020313262939453125, -0.01899433135986328, -0.017675399780273438, -0.016356468200683594, -0.01503753662109375, -0.013718605041503906, -0.012399673461914062, -0.011080741882324219, -0.009761810302734375, -0.008442878723144531, -0.0071239471435546875, -0.005805015563964844, -0.004486083984375, -0.0031671524047851562, -0.0018482208251953125, -0.0005292892456054688, 0.000789642333984375, 0.0021085739135742188, 0.0034275054931640625, 0.004746437072753906, 0.00606536865234375, 0.007384300231933594, 0.008703231811523438, 0.010022163391113281, 0.011341094970703125, 0.012660026550292969, 0.013978958129882812, 0.015297889709472656, 0.0166168212890625, 0.017935752868652344, 0.019254684448242188, 0.02057361602783203, 0.021892547607421875, 0.02321147918701172, 0.024530410766601562, 0.025849342346191406, 0.02716827392578125, 0.028487205505371094, 0.029806137084960938, 0.03112506866455078, 0.032444000244140625, 0.03376293182373047, 0.03508186340332031, 0.036400794982910156, 0.0377197265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 8.0, 5.0, 25.0, 34.0, 102.0, 697.0, 753028.0, 293807.0, 659.0, 112.0, 35.0, 14.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5703125, -5.41973876953125, -5.2691650390625, -5.11859130859375, -4.968017578125, -4.81744384765625, -4.6668701171875, -4.51629638671875, -4.36572265625, -4.21514892578125, -4.0645751953125, -3.91400146484375, -3.763427734375, -3.61285400390625, -3.4622802734375, -3.31170654296875, -3.1611328125, -3.01055908203125, -2.8599853515625, -2.70941162109375, -2.558837890625, -2.40826416015625, -2.2576904296875, -2.10711669921875, -1.95654296875, -1.80596923828125, -1.6553955078125, -1.50482177734375, -1.354248046875, -1.20367431640625, -1.0531005859375, -0.90252685546875, -0.751953125, -0.60137939453125, -0.4508056640625, -0.30023193359375, -0.149658203125, 0.00091552734375, 0.1514892578125, 0.30206298828125, 0.45263671875, 0.60321044921875, 0.7537841796875, 0.90435791015625, 1.054931640625, 1.20550537109375, 1.3560791015625, 1.50665283203125, 1.6572265625, 1.80780029296875, 1.9583740234375, 2.10894775390625, 2.259521484375, 2.41009521484375, 2.5606689453125, 2.71124267578125, 2.86181640625, 3.01239013671875, 3.1629638671875, 3.31353759765625, 3.464111328125, 3.61468505859375, 3.7652587890625, 3.91583251953125, 4.06640625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 7.0, 9.0, 7.0, 9.0, 17.0, 17.0, 24.0, 65.0, 311.0, 361.0, 52.0, 45.0, 28.0, 18.0, 6.0, 3.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007448196411132812, -0.0007229223847389221, -0.000701025128364563, -0.0006791278719902039, -0.0006572306156158447, -0.0006353333592414856, -0.0006134361028671265, -0.0005915388464927673, -0.0005696415901184082, -0.0005477443337440491, -0.0005258470773696899, -0.0005039498209953308, -0.0004820525646209717, -0.00046015530824661255, -0.0004382580518722534, -0.0004163607954978943, -0.00039446353912353516, -0.000372566282749176, -0.0003506690263748169, -0.00032877177000045776, -0.00030687451362609863, -0.0002849772572517395, -0.00026308000087738037, -0.00024118274450302124, -0.0002192854881286621, -0.00019738823175430298, -0.00017549097537994385, -0.00015359371900558472, -0.00013169646263122559, -0.00010979920625686646, -8.790194988250732e-05, -6.60046935081482e-05, -4.410743713378906e-05, -2.221018075942993e-05, -3.129243850708008e-07, 2.158433198928833e-05, 4.348158836364746e-05, 6.537884473800659e-05, 8.727610111236572e-05, 0.00010917335748672485, 0.00013107061386108398, 0.00015296787023544312, 0.00017486512660980225, 0.00019676238298416138, 0.0002186596393585205, 0.00024055689573287964, 0.00026245415210723877, 0.0002843514084815979, 0.00030624866485595703, 0.00032814592123031616, 0.0003500431776046753, 0.0003719404339790344, 0.00039383769035339355, 0.0004157349467277527, 0.0004376322031021118, 0.00045952945947647095, 0.0004814267158508301, 0.0005033239722251892, 0.0005252212285995483, 0.0005471184849739075, 0.0005690157413482666, 0.0005909129977226257, 0.0006128102540969849, 0.000634707510471344, 0.0006566047668457031]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 10.0, 10.0, 15.0, 21.0, 18.0, 34.0, 70.0, 100.0, 143.0, 256.0, 576.0, 1355.0, 3809.0, 21632.0, 1001142.0, 14162.0, 2974.0, 1070.0, 468.0, 253.0, 146.0, 100.0, 52.0, 51.0, 32.0, 18.0, 11.0, 11.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.03387451171875, -1.9622802734375, -1.89068603515625, -1.819091796875, -1.74749755859375, -1.6759033203125, -1.60430908203125, -1.53271484375, -1.46112060546875, -1.3895263671875, -1.31793212890625, -1.246337890625, -1.17474365234375, -1.1031494140625, -1.03155517578125, -0.9599609375, -0.88836669921875, -0.8167724609375, -0.74517822265625, -0.673583984375, -0.60198974609375, -0.5303955078125, -0.45880126953125, -0.38720703125, -0.31561279296875, -0.2440185546875, -0.17242431640625, -0.100830078125, -0.02923583984375, 0.0423583984375, 0.11395263671875, 0.185546875, 0.25714111328125, 0.3287353515625, 0.40032958984375, 0.471923828125, 0.54351806640625, 0.6151123046875, 0.68670654296875, 0.75830078125, 0.82989501953125, 0.9014892578125, 0.97308349609375, 1.044677734375, 1.11627197265625, 1.1878662109375, 1.25946044921875, 1.3310546875, 1.40264892578125, 1.4742431640625, 1.54583740234375, 1.617431640625, 1.68902587890625, 1.7606201171875, 1.83221435546875, 1.90380859375, 1.97540283203125, 2.0469970703125, 2.11859130859375, 2.190185546875, 2.26177978515625, 2.3333740234375, 2.40496826171875, 2.4765625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 11.0, 10.0, 16.0, 63.0, 773.0, 65.0, 20.0, 12.0, 8.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.96435546875, -0.9364471435546875, -0.908538818359375, -0.8806304931640625, -0.85272216796875, -0.8248138427734375, -0.796905517578125, -0.7689971923828125, -0.7410888671875, -0.7131805419921875, -0.685272216796875, -0.6573638916015625, -0.62945556640625, -0.6015472412109375, -0.573638916015625, -0.5457305908203125, -0.517822265625, -0.4899139404296875, -0.462005615234375, -0.4340972900390625, -0.40618896484375, -0.3782806396484375, -0.350372314453125, -0.3224639892578125, -0.2945556640625, -0.2666473388671875, -0.238739013671875, -0.2108306884765625, -0.18292236328125, -0.1550140380859375, -0.127105712890625, -0.0991973876953125, -0.0712890625, -0.0433807373046875, -0.015472412109375, 0.0124359130859375, 0.04034423828125, 0.0682525634765625, 0.096160888671875, 0.1240692138671875, 0.1519775390625, 0.1798858642578125, 0.207794189453125, 0.2357025146484375, 0.26361083984375, 0.2915191650390625, 0.319427490234375, 0.3473358154296875, 0.375244140625, 0.4031524658203125, 0.431060791015625, 0.4589691162109375, 0.48687744140625, 0.5147857666015625, 0.542694091796875, 0.5706024169921875, 0.5985107421875, 0.6264190673828125, 0.654327392578125, 0.6822357177734375, 0.71014404296875, 0.7380523681640625, 0.765960693359375, 0.7938690185546875, 0.82177734375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 12.0, 11.0, 13.0, 18.0, 50.0, 84.0, 106.0, 165.0, 172.0, 112.0, 78.0, 53.0, 30.0, 24.0, 10.0, 17.0, 13.0, 10.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2528212070465088, -1.2148464918136597, -1.176871657371521, -1.1388969421386719, -1.1009221076965332, -1.062947392463684, -1.024972677230835, -0.9869978427886963, -0.9490231275558472, -0.9110483527183533, -0.8730735778808594, -0.8350988626480103, -0.7971240878105164, -0.7591493129730225, -0.7211745381355286, -0.6831997632980347, -0.6452249884605408, -0.6072502136230469, -0.569275438785553, -0.5313006639480591, -0.49332594871520996, -0.45535117387771606, -0.41737639904022217, -0.37940165400505066, -0.34142687916755676, -0.30345210433006287, -0.26547735929489136, -0.22750258445739746, -0.18952782452106476, -0.15155306458473206, -0.11357828974723816, -0.07560354471206665, -0.037628769874572754, 0.0003459937870502472, 0.03832075744867325, 0.07629552483558655, 0.11427028477191925, 0.15224504470825195, 0.19021981954574585, 0.22819456458091736, 0.26616933941841125, 0.30414411425590515, 0.34211885929107666, 0.38009363412857056, 0.41806840896606445, 0.45604315400123596, 0.49401792883872986, 0.5319926738739014, 0.5699674487113953, 0.6079422235488892, 0.6459169983863831, 0.683891773223877, 0.7218664884567261, 0.75984126329422, 0.7978160381317139, 0.835790753364563, 0.8737655878067017, 0.9117403626441956, 0.9497151374816895, 0.9876898527145386, 1.0256646871566772, 1.0636394023895264, 1.101614236831665, 1.1395889520645142, 1.1775636672973633]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 0.0, 13.0, 7.0, 21.0, 8.0, 12.0, 23.0, 35.0, 26.0, 41.0, 41.0, 42.0, 52.0, 51.0, 63.0, 62.0, 65.0, 48.0, 51.0, 58.0, 40.0, 50.0, 44.0, 22.0, 37.0, 18.0, 16.0, 15.0, 8.0, 8.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7098373770713806, -0.6912980675697327, -0.6727586984634399, -0.654219388961792, -0.635680079460144, -0.6171407699584961, -0.5986014604568481, -0.5800620913505554, -0.5615227818489075, -0.5429834723472595, -0.5244441032409668, -0.5059047937393188, -0.4873654842376709, -0.46882617473602295, -0.4502868354320526, -0.4317474961280823, -0.4132081866264343, -0.3946688771247864, -0.37612953782081604, -0.3575901985168457, -0.33905088901519775, -0.3205115795135498, -0.30197224020957947, -0.28343290090560913, -0.2648935914039612, -0.24635426700115204, -0.2278149425983429, -0.20927561819553375, -0.1907362937927246, -0.17219696938991547, -0.15365764498710632, -0.13511832058429718, -0.11657905578613281, -0.09803973138332367, -0.07950040698051453, -0.06096108257770538, -0.04242175817489624, -0.023882433772087097, -0.005343109369277954, 0.013196215033531189, 0.03173553943634033, 0.050274863839149475, 0.06881418824195862, 0.08735351264476776, 0.1058928370475769, 0.12443216145038605, 0.1429714858531952, 0.16151081025600433, 0.18005013465881348, 0.19858945906162262, 0.21712878346443176, 0.2356681078672409, 0.25420743227005005, 0.272746741771698, 0.29128608107566833, 0.30982542037963867, 0.3283647298812866, 0.34690403938293457, 0.3654433786869049, 0.38398271799087524, 0.4025220274925232, 0.42106133699417114, 0.4396006762981415, 0.4581400156021118, 0.47667932510375977]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 0.0, 6.0, 0.0, 10.0, 8.0, 8.0, 2.0, 4.0, 10.0, 10.0, 8.0, 12.0, 14.0, 18.0, 28.0, 63.0, 104.0, 816.0, 4173456.0, 19256.0, 245.0, 46.0, 30.0, 18.0, 10.0, 10.0, 10.0, 12.0, 10.0, 8.0, 12.0, 10.0, 4.0, 2.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-4.87109375, -4.72247314453125, -4.5738525390625, -4.42523193359375, -4.276611328125, -4.12799072265625, -3.9793701171875, -3.83074951171875, -3.68212890625, -3.53350830078125, -3.3848876953125, -3.23626708984375, -3.087646484375, -2.93902587890625, -2.7904052734375, -2.64178466796875, -2.4931640625, -2.34454345703125, -2.1959228515625, -2.04730224609375, -1.898681640625, -1.75006103515625, -1.6014404296875, -1.45281982421875, -1.30419921875, -1.15557861328125, -1.0069580078125, -0.85833740234375, -0.709716796875, -0.56109619140625, -0.4124755859375, -0.26385498046875, -0.115234375, 0.03338623046875, 0.1820068359375, 0.33062744140625, 0.479248046875, 0.62786865234375, 0.7764892578125, 0.92510986328125, 1.07373046875, 1.22235107421875, 1.3709716796875, 1.51959228515625, 1.668212890625, 1.81683349609375, 1.9654541015625, 2.11407470703125, 2.2626953125, 2.41131591796875, 2.5599365234375, 2.70855712890625, 2.857177734375, 3.00579833984375, 3.1544189453125, 3.30303955078125, 3.45166015625, 3.60028076171875, 3.7489013671875, 3.89752197265625, 4.046142578125, 4.19476318359375, 4.3433837890625, 4.49200439453125, 4.640625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 12.0, 9.0, 21.0, 14.0, 41.0, 42.0, 56.0, 61.0, 82.0, 83.0, 92.0, 95.0, 76.0, 81.0, 65.0, 50.0, 40.0, 27.0, 14.0, 15.0, 11.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.025634765625, -0.025048017501831055, -0.02446126937866211, -0.023874521255493164, -0.02328777313232422, -0.022701025009155273, -0.022114276885986328, -0.021527528762817383, -0.020940780639648438, -0.020354032516479492, -0.019767284393310547, -0.0191805362701416, -0.018593788146972656, -0.01800704002380371, -0.017420291900634766, -0.01683354377746582, -0.016246795654296875, -0.01566004753112793, -0.015073299407958984, -0.014486551284790039, -0.013899803161621094, -0.013313055038452148, -0.012726306915283203, -0.012139558792114258, -0.011552810668945312, -0.010966062545776367, -0.010379314422607422, -0.009792566299438477, -0.009205818176269531, -0.008619070053100586, -0.00803232192993164, -0.007445573806762695, -0.00685882568359375, -0.006272077560424805, -0.005685329437255859, -0.005098581314086914, -0.004511833190917969, -0.0039250850677490234, -0.003338336944580078, -0.002751588821411133, -0.0021648406982421875, -0.0015780925750732422, -0.0009913444519042969, -0.00040459632873535156, 0.00018215179443359375, 0.0007688999176025391, 0.0013556480407714844, 0.0019423961639404297, 0.002529144287109375, 0.0031158924102783203, 0.0037026405334472656, 0.004289388656616211, 0.004876136779785156, 0.0054628849029541016, 0.006049633026123047, 0.006636381149291992, 0.0072231292724609375, 0.007809877395629883, 0.008396625518798828, 0.008983373641967773, 0.009570121765136719, 0.010156869888305664, 0.01074361801147461, 0.011330366134643555, 0.0119171142578125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 5.0, 11.0, 7.0, 11.0, 12.0, 14.0, 22.0, 28.0, 17.0, 35.0, 40.0, 61.0, 68.0, 87.0, 179.0, 406.0, 1433.0, 4189201.0, 2392.0, 165.0, 50.0, 18.0, 10.0, 6.0], "bins": [-11.28125, -11.085281372070312, -10.889312744140625, -10.693344116210938, -10.49737548828125, -10.301406860351562, -10.105438232421875, -9.909469604492188, -9.7135009765625, -9.517532348632812, -9.321563720703125, -9.125595092773438, -8.92962646484375, -8.733657836914062, -8.537689208984375, -8.341720581054688, -8.145751953125, -7.9497833251953125, -7.753814697265625, -7.5578460693359375, -7.36187744140625, -7.1659088134765625, -6.969940185546875, -6.7739715576171875, -6.5780029296875, -6.3820343017578125, -6.186065673828125, -5.9900970458984375, -5.79412841796875, -5.5981597900390625, -5.402191162109375, -5.2062225341796875, -5.01025390625, -4.8142852783203125, -4.618316650390625, -4.4223480224609375, -4.22637939453125, -4.0304107666015625, -3.834442138671875, -3.6384735107421875, -3.4425048828125, -3.2465362548828125, -3.050567626953125, -2.8545989990234375, -2.65863037109375, -2.4626617431640625, -2.266693115234375, -2.0707244873046875, -1.874755859375, -1.6787872314453125, -1.482818603515625, -1.2868499755859375, -1.09088134765625, -0.8949127197265625, -0.698944091796875, -0.5029754638671875, -0.3070068359375, -0.1110382080078125, 0.084930419921875, 0.2808990478515625, 0.47686767578125, 0.6728363037109375, 0.868804931640625, 1.0647735595703125, 1.2607421875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 5.0, 15.0, 10.0, 36.0, 44.0, 63.0, 97.0, 157.0, 289.0, 819.0, 1927.0, 299.0, 105.0, 65.0, 44.0, 26.0, 16.0, 15.0, 9.0, 10.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04351806640625, -0.041152000427246094, -0.03878593444824219, -0.03641986846923828, -0.034053802490234375, -0.03168773651123047, -0.029321670532226562, -0.026955604553222656, -0.02458953857421875, -0.022223472595214844, -0.019857406616210938, -0.01749134063720703, -0.015125274658203125, -0.012759208679199219, -0.010393142700195312, -0.008027076721191406, -0.0056610107421875, -0.0032949447631835938, -0.0009288787841796875, 0.0014371871948242188, 0.003803253173828125, 0.006169319152832031, 0.008535385131835938, 0.010901451110839844, 0.01326751708984375, 0.015633583068847656, 0.017999649047851562, 0.02036571502685547, 0.022731781005859375, 0.02509784698486328, 0.027463912963867188, 0.029829978942871094, 0.032196044921875, 0.034562110900878906, 0.03692817687988281, 0.03929424285888672, 0.041660308837890625, 0.04402637481689453, 0.04639244079589844, 0.048758506774902344, 0.05112457275390625, 0.053490638732910156, 0.05585670471191406, 0.05822277069091797, 0.060588836669921875, 0.06295490264892578, 0.06532096862792969, 0.0676870346069336, 0.0700531005859375, 0.0724191665649414, 0.07478523254394531, 0.07715129852294922, 0.07951736450195312, 0.08188343048095703, 0.08424949645996094, 0.08661556243896484, 0.08898162841796875, 0.09134769439697266, 0.09371376037597656, 0.09607982635498047, 0.09844589233398438, 0.10081195831298828, 0.10317802429199219, 0.1055440902709961, 0.10791015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 15.0, 985.0, 22.0], "bins": [-30.616111755371094, -30.127099990844727, -29.63808822631836, -29.149076461791992, -28.660064697265625, -28.171052932739258, -27.68204116821289, -27.193029403686523, -26.704017639160156, -26.21500587463379, -25.725994110107422, -25.236982345581055, -24.747970581054688, -24.25895881652832, -23.769947052001953, -23.280935287475586, -22.79192543029785, -22.302913665771484, -21.813901901245117, -21.32489013671875, -20.835878372192383, -20.346866607666016, -19.85785484313965, -19.36884307861328, -18.879831314086914, -18.390819549560547, -17.90180778503418, -17.412796020507812, -16.923784255981445, -16.434772491455078, -15.945760726928711, -15.45674991607666, -14.96773910522461, -14.478727340698242, -13.989715576171875, -13.500703811645508, -13.01169204711914, -12.522680282592773, -12.033668518066406, -11.544657707214355, -11.055644989013672, -10.566633224487305, -10.077621459960938, -9.58860969543457, -9.099597930908203, -8.610586166381836, -8.121574401855469, -7.632563591003418, -7.143551826477051, -6.654540061950684, -6.165528297424316, -5.676516532897949, -5.18750524520874, -4.698493480682373, -4.209481716156006, -3.7204701900482178, -3.2314586639404297, -2.7424468994140625, -2.2534353733062744, -1.7644236087799072, -1.2754119634628296, -0.786400318145752, -0.29738855361938477, 0.19162297248840332, 0.6806348562240601]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 4.0, 8.0, 6.0, 5.0, 8.0, 9.0, 20.0, 14.0, 20.0, 24.0, 23.0, 27.0, 36.0, 41.0, 37.0, 40.0, 29.0, 48.0, 34.0, 49.0, 64.0, 37.0, 47.0, 36.0, 34.0, 31.0, 29.0, 28.0, 31.0, 30.0, 22.0, 24.0, 21.0, 20.0, 12.0, 10.0, 9.0, 12.0, 6.0, 2.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49897390604019165, -0.48195475339889526, -0.4649355709552765, -0.4479164183139801, -0.43089723587036133, -0.41387808322906494, -0.39685893058776855, -0.3798397481441498, -0.362820565700531, -0.3458014130592346, -0.32878223061561584, -0.31176307797431946, -0.2947438955307007, -0.2777247428894043, -0.2607055902481079, -0.24368640780448914, -0.22666725516319275, -0.20964808762073517, -0.1926289200782776, -0.1756097674369812, -0.15859058499336243, -0.14157143235206604, -0.12455226480960846, -0.10753309726715088, -0.0905139297246933, -0.07349476218223572, -0.056475598365068436, -0.039456434547901154, -0.022437267005443573, -0.005418099462985992, 0.011601060628890991, 0.028620228171348572, 0.04563939571380615, 0.06265856325626373, 0.07967773079872131, 0.0966968908905983, 0.11371605843305588, 0.13073521852493286, 0.14775438606739044, 0.16477355360984802, 0.1817927211523056, 0.19881188869476318, 0.21583105623722076, 0.23285022377967834, 0.24986937642097473, 0.2668885588645935, 0.2839077115058899, 0.3009268641471863, 0.31794604659080505, 0.33496519923210144, 0.3519843816757202, 0.3690035343170166, 0.3860227167606354, 0.40304186940193176, 0.42006105184555054, 0.4370802044868469, 0.4540993571281433, 0.4711185097694397, 0.48813769221305847, 0.5051568746566772, 0.5221760272979736, 0.53919517993927, 0.5562143325805664, 0.5732334852218628, 0.590252697467804]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 9.0, 4.0, 7.0, 5.0, 8.0, 10.0, 22.0, 8.0, 17.0, 18.0, 29.0, 23.0, 35.0, 25.0, 34.0, 48.0, 66.0, 80.0, 245.0, 14471.0, 1008131.0, 24479.0, 285.0, 107.0, 63.0, 40.0, 37.0, 29.0, 43.0, 26.0, 27.0, 15.0, 18.0, 17.0, 12.0, 10.0, 9.0, 11.0, 5.0, 6.0, 6.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.287109375, -2.216827392578125, -2.14654541015625, -2.076263427734375, -2.0059814453125, -1.935699462890625, -1.86541748046875, -1.795135498046875, -1.724853515625, -1.654571533203125, -1.58428955078125, -1.514007568359375, -1.4437255859375, -1.373443603515625, -1.30316162109375, -1.232879638671875, -1.16259765625, -1.092315673828125, -1.02203369140625, -0.951751708984375, -0.8814697265625, -0.811187744140625, -0.74090576171875, -0.670623779296875, -0.600341796875, -0.530059814453125, -0.45977783203125, -0.389495849609375, -0.3192138671875, -0.248931884765625, -0.17864990234375, -0.108367919921875, -0.0380859375, 0.032196044921875, 0.10247802734375, 0.172760009765625, 0.2430419921875, 0.313323974609375, 0.38360595703125, 0.453887939453125, 0.524169921875, 0.594451904296875, 0.66473388671875, 0.735015869140625, 0.8052978515625, 0.875579833984375, 0.94586181640625, 1.016143798828125, 1.08642578125, 1.156707763671875, 1.22698974609375, 1.297271728515625, 1.3675537109375, 1.437835693359375, 1.50811767578125, 1.578399658203125, 1.648681640625, 1.718963623046875, 1.78924560546875, 1.859527587890625, 1.9298095703125, 2.000091552734375, 2.07037353515625, 2.140655517578125, 2.2109375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 9.0, 19.0, 51.0, 83.0, 133.0, 185.0, 186.0, 164.0, 87.0, 60.0, 33.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02960205078125, -0.02598094940185547, -0.022359848022460938, -0.018738746643066406, -0.015117645263671875, -0.011496543884277344, -0.007875442504882812, -0.004254341125488281, -0.00063323974609375, 0.0029878616333007812, 0.0066089630126953125, 0.010230064392089844, 0.013851165771484375, 0.017472267150878906, 0.021093368530273438, 0.02471446990966797, 0.0283355712890625, 0.03195667266845703, 0.03557777404785156, 0.039198875427246094, 0.042819976806640625, 0.046441078186035156, 0.05006217956542969, 0.05368328094482422, 0.05730438232421875, 0.06092548370361328, 0.06454658508300781, 0.06816768646240234, 0.07178878784179688, 0.0754098892211914, 0.07903099060058594, 0.08265209197998047, 0.086273193359375, 0.08989429473876953, 0.09351539611816406, 0.0971364974975586, 0.10075759887695312, 0.10437870025634766, 0.10799980163574219, 0.11162090301513672, 0.11524200439453125, 0.11886310577392578, 0.12248420715332031, 0.12610530853271484, 0.12972640991210938, 0.1333475112915039, 0.13696861267089844, 0.14058971405029297, 0.1442108154296875, 0.14783191680908203, 0.15145301818847656, 0.1550741195678711, 0.15869522094726562, 0.16231632232666016, 0.1659374237060547, 0.16955852508544922, 0.17317962646484375, 0.17680072784423828, 0.1804218292236328, 0.18404293060302734, 0.18766403198242188, 0.1912851333618164, 0.19490623474121094, 0.19852733612060547, 0.2021484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 6.0, 6.0, 24.0, 17.0, 24.0, 59.0, 68.0, 183.0, 541.0, 2587.0, 21084.0, 400971.0, 587581.0, 30834.0, 3429.0, 671.0, 221.0, 96.0, 42.0, 39.0, 17.0, 15.0, 14.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5244140625, -1.473724365234375, -1.42303466796875, -1.372344970703125, -1.3216552734375, -1.270965576171875, -1.22027587890625, -1.169586181640625, -1.118896484375, -1.068206787109375, -1.01751708984375, -0.966827392578125, -0.9161376953125, -0.865447998046875, -0.81475830078125, -0.764068603515625, -0.71337890625, -0.662689208984375, -0.61199951171875, -0.561309814453125, -0.5106201171875, -0.459930419921875, -0.40924072265625, -0.358551025390625, -0.307861328125, -0.257171630859375, -0.20648193359375, -0.155792236328125, -0.1051025390625, -0.054412841796875, -0.00372314453125, 0.046966552734375, 0.09765625, 0.148345947265625, 0.19903564453125, 0.249725341796875, 0.3004150390625, 0.351104736328125, 0.40179443359375, 0.452484130859375, 0.503173828125, 0.553863525390625, 0.60455322265625, 0.655242919921875, 0.7059326171875, 0.756622314453125, 0.80731201171875, 0.858001708984375, 0.90869140625, 0.959381103515625, 1.01007080078125, 1.060760498046875, 1.1114501953125, 1.162139892578125, 1.21282958984375, 1.263519287109375, 1.314208984375, 1.364898681640625, 1.41558837890625, 1.466278076171875, 1.5169677734375, 1.567657470703125, 1.61834716796875, 1.669036865234375, 1.7197265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 3.0, 10.0, 20.0, 21.0, 39.0, 52.0, 46.0, 62.0, 91.0, 86.0, 105.0, 102.0, 85.0, 83.0, 55.0, 48.0, 37.0, 17.0, 11.0, 12.0, 9.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.378662109375, -0.3649711608886719, -0.35128021240234375, -0.3375892639160156, -0.3238983154296875, -0.3102073669433594, -0.29651641845703125, -0.2828254699707031, -0.269134521484375, -0.2554435729980469, -0.24175262451171875, -0.22806167602539062, -0.2143707275390625, -0.20067977905273438, -0.18698883056640625, -0.17329788208007812, -0.15960693359375, -0.14591598510742188, -0.13222503662109375, -0.11853408813476562, -0.1048431396484375, -0.09115219116210938, -0.07746124267578125, -0.06377029418945312, -0.050079345703125, -0.036388397216796875, -0.02269744873046875, -0.009006500244140625, 0.0046844482421875, 0.018375396728515625, 0.03206634521484375, 0.045757293701171875, 0.0594482421875, 0.07313919067382812, 0.08683013916015625, 0.10052108764648438, 0.1142120361328125, 0.12790298461914062, 0.14159393310546875, 0.15528488159179688, 0.168975830078125, 0.18266677856445312, 0.19635772705078125, 0.21004867553710938, 0.2237396240234375, 0.23743057250976562, 0.25112152099609375, 0.2648124694824219, 0.27850341796875, 0.2921943664550781, 0.30588531494140625, 0.3195762634277344, 0.3332672119140625, 0.3469581604003906, 0.36064910888671875, 0.3743400573730469, 0.388031005859375, 0.4017219543457031, 0.41541290283203125, 0.4291038513183594, 0.4427947998046875, 0.4564857482910156, 0.47017669677734375, 0.4838676452636719, 0.49755859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 7.0, 11.0, 15.0, 32.0, 44.0, 61.0, 110.0, 183.0, 327.0, 617.0, 1322.0, 2960.0, 8422.0, 37487.0, 449729.0, 492033.0, 40450.0, 8950.0, 3045.0, 1344.0, 587.0, 336.0, 182.0, 106.0, 67.0, 35.0, 27.0, 18.0, 10.0, 8.0, 7.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8662109375, -0.835296630859375, -0.80438232421875, -0.773468017578125, -0.7425537109375, -0.711639404296875, -0.68072509765625, -0.649810791015625, -0.618896484375, -0.587982177734375, -0.55706787109375, -0.526153564453125, -0.4952392578125, -0.464324951171875, -0.43341064453125, -0.402496337890625, -0.37158203125, -0.340667724609375, -0.30975341796875, -0.278839111328125, -0.2479248046875, -0.217010498046875, -0.18609619140625, -0.155181884765625, -0.124267578125, -0.093353271484375, -0.06243896484375, -0.031524658203125, -0.0006103515625, 0.030303955078125, 0.06121826171875, 0.092132568359375, 0.123046875, 0.153961181640625, 0.18487548828125, 0.215789794921875, 0.2467041015625, 0.277618408203125, 0.30853271484375, 0.339447021484375, 0.370361328125, 0.401275634765625, 0.43218994140625, 0.463104248046875, 0.4940185546875, 0.524932861328125, 0.55584716796875, 0.586761474609375, 0.61767578125, 0.648590087890625, 0.67950439453125, 0.710418701171875, 0.7413330078125, 0.772247314453125, 0.80316162109375, 0.834075927734375, 0.864990234375, 0.895904541015625, 0.92681884765625, 0.957733154296875, 0.9886474609375, 1.019561767578125, 1.05047607421875, 1.081390380859375, 1.1123046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 5.0, 3.0, 12.0, 23.0, 31.0, 43.0, 62.0, 101.0, 115.0, 117.0, 139.0, 121.0, 72.0, 55.0, 43.0, 23.0, 13.0, 7.0, 5.0, 8.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.398294448852539e-05, -8.132122457027435e-05, -7.865950465202332e-05, -7.599778473377228e-05, -7.333606481552124e-05, -7.06743448972702e-05, -6.801262497901917e-05, -6.535090506076813e-05, -6.268918514251709e-05, -6.002746522426605e-05, -5.7365745306015015e-05, -5.470402538776398e-05, -5.204230546951294e-05, -4.93805855512619e-05, -4.6718865633010864e-05, -4.405714571475983e-05, -4.139542579650879e-05, -3.873370587825775e-05, -3.6071985960006714e-05, -3.3410266041755676e-05, -3.074854612350464e-05, -2.80868262052536e-05, -2.5425106287002563e-05, -2.2763386368751526e-05, -2.0101666450500488e-05, -1.743994653224945e-05, -1.4778226613998413e-05, -1.2116506695747375e-05, -9.454786777496338e-06, -6.7930668592453e-06, -4.131346940994263e-06, -1.469627022743225e-06, 1.1920928955078125e-06, 3.85381281375885e-06, 6.515532732009888e-06, 9.177252650260925e-06, 1.1838972568511963e-05, 1.4500692486763e-05, 1.7162412405014038e-05, 1.9824132323265076e-05, 2.2485852241516113e-05, 2.514757215976715e-05, 2.780929207801819e-05, 3.0471011996269226e-05, 3.3132731914520264e-05, 3.57944518327713e-05, 3.845617175102234e-05, 4.1117891669273376e-05, 4.3779611587524414e-05, 4.644133150577545e-05, 4.910305142402649e-05, 5.176477134227753e-05, 5.4426491260528564e-05, 5.70882111787796e-05, 5.974993109703064e-05, 6.241165101528168e-05, 6.507337093353271e-05, 6.773509085178375e-05, 7.039681077003479e-05, 7.305853068828583e-05, 7.572025060653687e-05, 7.83819705247879e-05, 8.104369044303894e-05, 8.370541036128998e-05, 8.636713027954102e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 7.0, 20.0, 18.0, 31.0, 79.0, 181.0, 439.0, 1513.0, 7755.0, 198338.0, 817316.0, 18962.0, 2617.0, 768.0, 254.0, 120.0, 55.0, 29.0, 17.0, 9.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.73046875, -2.6700439453125, -2.609619140625, -2.5491943359375, -2.48876953125, -2.4283447265625, -2.367919921875, -2.3074951171875, -2.2470703125, -2.1866455078125, -2.126220703125, -2.0657958984375, -2.00537109375, -1.9449462890625, -1.884521484375, -1.8240966796875, -1.763671875, -1.7032470703125, -1.642822265625, -1.5823974609375, -1.52197265625, -1.4615478515625, -1.401123046875, -1.3406982421875, -1.2802734375, -1.2198486328125, -1.159423828125, -1.0989990234375, -1.03857421875, -0.9781494140625, -0.917724609375, -0.8572998046875, -0.796875, -0.7364501953125, -0.676025390625, -0.6156005859375, -0.55517578125, -0.4947509765625, -0.434326171875, -0.3739013671875, -0.3134765625, -0.2530517578125, -0.192626953125, -0.1322021484375, -0.07177734375, -0.0113525390625, 0.049072265625, 0.1094970703125, 0.169921875, 0.2303466796875, 0.290771484375, 0.3511962890625, 0.41162109375, 0.4720458984375, 0.532470703125, 0.5928955078125, 0.6533203125, 0.7137451171875, 0.774169921875, 0.8345947265625, 0.89501953125, 0.9554443359375, 1.015869140625, 1.0762939453125, 1.13671875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 5.0, 3.0, 4.0, 8.0, 11.0, 16.0, 18.0, 18.0, 39.0, 59.0, 97.0, 113.0, 123.0, 131.0, 101.0, 78.0, 47.0, 49.0, 23.0, 14.0, 14.0, 7.0, 12.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.497314453125, -0.48348236083984375, -0.4696502685546875, -0.45581817626953125, -0.441986083984375, -0.42815399169921875, -0.4143218994140625, -0.40048980712890625, -0.38665771484375, -0.37282562255859375, -0.3589935302734375, -0.34516143798828125, -0.331329345703125, -0.31749725341796875, -0.3036651611328125, -0.28983306884765625, -0.2760009765625, -0.26216888427734375, -0.2483367919921875, -0.23450469970703125, -0.220672607421875, -0.20684051513671875, -0.1930084228515625, -0.17917633056640625, -0.16534423828125, -0.15151214599609375, -0.1376800537109375, -0.12384796142578125, -0.110015869140625, -0.09618377685546875, -0.0823516845703125, -0.06851959228515625, -0.0546875, -0.04085540771484375, -0.0270233154296875, -0.01319122314453125, 0.000640869140625, 0.01447296142578125, 0.0283050537109375, 0.04213714599609375, 0.05596923828125, 0.06980133056640625, 0.0836334228515625, 0.09746551513671875, 0.111297607421875, 0.12512969970703125, 0.1389617919921875, 0.15279388427734375, 0.1666259765625, 0.18045806884765625, 0.1942901611328125, 0.20812225341796875, 0.221954345703125, 0.23578643798828125, 0.2496185302734375, 0.26345062255859375, 0.27728271484375, 0.29111480712890625, 0.3049468994140625, 0.31877899169921875, 0.332611083984375, 0.34644317626953125, 0.3602752685546875, 0.37410736083984375, 0.387939453125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 251.0, 753.0, 12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.399930953979492, -4.868659496307373, -3.337388038635254, -1.8061165809631348, -0.2748451232910156, 1.2564263343811035, 2.7876977920532227, 4.3189697265625, 5.850240707397461, 7.38151216506958, 8.9127836227417, 10.444055557250977, 11.975326538085938, 13.506597518920898, 15.037869453430176, 16.569141387939453, 18.100412368774414, 19.631683349609375, 21.16295623779297, 22.69422721862793, 24.22549819946289, 25.75676918029785, 27.288040161132812, 28.819313049316406, 30.350584030151367, 31.881855010986328, 33.41312789916992, 34.94439697265625, 36.475669860839844, 38.00694274902344, 39.538211822509766, 41.06948471069336, 42.60075378417969, 44.13202667236328, 45.66329574584961, 47.1945686340332, 48.72583770751953, 50.257110595703125, 51.78838348388672, 53.31965637207031, 54.85092544555664, 56.382198333740234, 57.91346740722656, 59.444740295410156, 60.97601318359375, 62.50728225708008, 64.0385513305664, 65.56982421875, 67.1010971069336, 68.63236999511719, 70.16364288330078, 71.69490814208984, 73.22618103027344, 74.75745391845703, 76.28872680664062, 77.81999969482422, 79.35127258300781, 80.8825454711914, 82.413818359375, 83.94508361816406, 85.47635650634766, 87.00762939453125, 88.53890228271484, 90.07017517089844, 91.6014404296875]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 12.0, 18.0, 25.0, 32.0, 32.0, 40.0, 48.0, 59.0, 73.0, 73.0, 80.0, 58.0, 80.0, 70.0, 75.0, 49.0, 44.0, 29.0, 23.0, 16.0, 18.0, 12.0, 9.0, 10.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.240800380706787, -2.149399995803833, -2.0579993724823, -1.9665989875793457, -1.875198483467102, -1.7837979793548584, -1.6923975944519043, -1.6009970903396606, -1.509596586227417, -1.4181960821151733, -1.3267955780029297, -1.2353951930999756, -1.143994688987732, -1.0525941848754883, -0.9611937403678894, -0.8697932958602905, -0.7783927917480469, -0.6869922876358032, -0.5955918431282043, -0.5041913986206055, -0.4127908945083618, -0.32139042019844055, -0.2299899458885193, -0.1385895013809204, -0.04718899726867676, 0.04421147704124451, 0.13561195135116577, 0.22701242566108704, 0.3184128999710083, 0.40981337428092957, 0.5012138485908508, 0.5926142930984497, 0.6840145587921143, 0.7754150629043579, 0.8668155074119568, 0.9582159519195557, 1.0496164560317993, 1.141016960144043, 1.232417345046997, 1.3238178491592407, 1.4152183532714844, 1.506618857383728, 1.5980193614959717, 1.6894197463989258, 1.7808202505111694, 1.872220754623413, 1.9636211395263672, 2.0550217628479004, 2.1464221477508545, 2.2378225326538086, 2.329223155975342, 2.420623540878296, 2.51202392578125, 2.603424549102783, 2.6948249340057373, 2.7862253189086914, 2.8776259422302246, 2.9690263271331787, 3.060426950454712, 3.151827335357666, 3.243227958679199, 3.3346283435821533, 3.4260287284851074, 3.5174293518066406, 3.6088297367095947]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 19.0, 16.0, 51.0, 159.0, 365.0, 1282.0, 4157978.0, 33155.0, 696.0, 291.0, 124.0, 61.0, 27.0, 15.0, 19.0, 10.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.86260986328125, -5.6353759765625, -5.40814208984375, -5.180908203125, -4.95367431640625, -4.7264404296875, -4.49920654296875, -4.27197265625, -4.04473876953125, -3.8175048828125, -3.59027099609375, -3.363037109375, -3.13580322265625, -2.9085693359375, -2.68133544921875, -2.4541015625, -2.22686767578125, -1.9996337890625, -1.77239990234375, -1.545166015625, -1.31793212890625, -1.0906982421875, -0.86346435546875, -0.63623046875, -0.40899658203125, -0.1817626953125, 0.04547119140625, 0.272705078125, 0.49993896484375, 0.7271728515625, 0.95440673828125, 1.181640625, 1.40887451171875, 1.6361083984375, 1.86334228515625, 2.090576171875, 2.31781005859375, 2.5450439453125, 2.77227783203125, 2.99951171875, 3.22674560546875, 3.4539794921875, 3.68121337890625, 3.908447265625, 4.13568115234375, 4.3629150390625, 4.59014892578125, 4.8173828125, 5.04461669921875, 5.2718505859375, 5.49908447265625, 5.726318359375, 5.95355224609375, 6.1807861328125, 6.40802001953125, 6.63525390625, 6.86248779296875, 7.0897216796875, 7.31695556640625, 7.544189453125, 7.77142333984375, 7.9986572265625, 8.22589111328125, 8.453125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 18.0, 24.0, 48.0, 99.0, 136.0, 164.0, 159.0, 159.0, 90.0, 57.0, 28.0, 18.0, 9.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0445556640625, -0.04055595397949219, -0.036556243896484375, -0.03255653381347656, -0.02855682373046875, -0.024557113647460938, -0.020557403564453125, -0.016557693481445312, -0.0125579833984375, -0.008558273315429688, -0.004558563232421875, -0.0005588531494140625, 0.00344085693359375, 0.0074405670166015625, 0.011440277099609375, 0.015439987182617188, 0.019439697265625, 0.023439407348632812, 0.027439117431640625, 0.03143882751464844, 0.03543853759765625, 0.03943824768066406, 0.043437957763671875, 0.04743766784667969, 0.0514373779296875, 0.05543708801269531, 0.059436798095703125, 0.06343650817871094, 0.06743621826171875, 0.07143592834472656, 0.07543563842773438, 0.07943534851074219, 0.08343505859375, 0.08743476867675781, 0.09143447875976562, 0.09543418884277344, 0.09943389892578125, 0.10343360900878906, 0.10743331909179688, 0.11143302917480469, 0.1154327392578125, 0.11943244934082031, 0.12343215942382812, 0.12743186950683594, 0.13143157958984375, 0.13543128967285156, 0.13943099975585938, 0.1434307098388672, 0.147430419921875, 0.1514301300048828, 0.15542984008789062, 0.15942955017089844, 0.16342926025390625, 0.16742897033691406, 0.17142868041992188, 0.1754283905029297, 0.1794281005859375, 0.1834278106689453, 0.18742752075195312, 0.19142723083496094, 0.19542694091796875, 0.19942665100097656, 0.20342636108398438, 0.2074260711669922, 0.21142578125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 10.0, 15.0, 26.0, 65.0, 112.0, 164.0, 311.0, 1541.0, 4183392.0, 7867.0, 349.0, 199.0, 94.0, 65.0, 36.0, 21.0, 11.0, 5.0, 2.0, 3.0, 3.0], "bins": [-21.078125, -20.67010498046875, -20.2620849609375, -19.85406494140625, -19.446044921875, -19.03802490234375, -18.6300048828125, -18.22198486328125, -17.81396484375, -17.40594482421875, -16.9979248046875, -16.58990478515625, -16.181884765625, -15.77386474609375, -15.3658447265625, -14.95782470703125, -14.5498046875, -14.14178466796875, -13.7337646484375, -13.32574462890625, -12.917724609375, -12.50970458984375, -12.1016845703125, -11.69366455078125, -11.28564453125, -10.87762451171875, -10.4696044921875, -10.06158447265625, -9.653564453125, -9.24554443359375, -8.8375244140625, -8.42950439453125, -8.021484375, -7.61346435546875, -7.2054443359375, -6.79742431640625, -6.389404296875, -5.98138427734375, -5.5733642578125, -5.16534423828125, -4.75732421875, -4.34930419921875, -3.9412841796875, -3.53326416015625, -3.125244140625, -2.71722412109375, -2.3092041015625, -1.90118408203125, -1.4931640625, -1.08514404296875, -0.6771240234375, -0.26910400390625, 0.138916015625, 0.54693603515625, 0.9549560546875, 1.36297607421875, 1.77099609375, 2.17901611328125, 2.5870361328125, 2.99505615234375, 3.403076171875, 3.81109619140625, 4.2191162109375, 4.62713623046875, 5.03515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 17.0, 46.0, 62.0, 268.0, 2633.0, 846.0, 126.0, 46.0, 18.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.892578125, -0.8739128112792969, -0.8552474975585938, -0.8365821838378906, -0.8179168701171875, -0.7992515563964844, -0.7805862426757812, -0.7619209289550781, -0.743255615234375, -0.7245903015136719, -0.7059249877929688, -0.6872596740722656, -0.6685943603515625, -0.6499290466308594, -0.6312637329101562, -0.6125984191894531, -0.59393310546875, -0.5752677917480469, -0.5566024780273438, -0.5379371643066406, -0.5192718505859375, -0.5006065368652344, -0.48194122314453125, -0.4632759094238281, -0.444610595703125, -0.4259452819824219, -0.40727996826171875, -0.3886146545410156, -0.3699493408203125, -0.3512840270996094, -0.33261871337890625, -0.3139533996582031, -0.2952880859375, -0.2766227722167969, -0.25795745849609375, -0.23929214477539062, -0.2206268310546875, -0.20196151733398438, -0.18329620361328125, -0.16463088989257812, -0.145965576171875, -0.12730026245117188, -0.10863494873046875, -0.08996963500976562, -0.0713043212890625, -0.052639007568359375, -0.03397369384765625, -0.015308380126953125, 0.00335693359375, 0.022022247314453125, 0.04068756103515625, 0.059352874755859375, 0.0780181884765625, 0.09668350219726562, 0.11534881591796875, 0.13401412963867188, 0.152679443359375, 0.17134475708007812, 0.19001007080078125, 0.20867538452148438, 0.2273406982421875, 0.24600601196289062, 0.26467132568359375, 0.2833366394042969, 0.302001953125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 45.0, 532.0, 396.0, 26.0, 8.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.080528259277344, -25.61474609375, -25.148963928222656, -24.683181762695312, -24.217397689819336, -23.751615524291992, -23.28583335876465, -22.820051193237305, -22.35426902770996, -21.888486862182617, -21.422704696655273, -20.956920623779297, -20.491138458251953, -20.02535629272461, -19.559574127197266, -19.093791961669922, -18.628007888793945, -18.1622257232666, -17.696443557739258, -17.23065948486328, -16.764877319335938, -16.299095153808594, -15.83331298828125, -15.367530822753906, -14.901748657226562, -14.435966491699219, -13.970183372497559, -13.504401206970215, -13.038619041442871, -12.572835922241211, -12.107053756713867, -11.641271591186523, -11.175487518310547, -10.709705352783203, -10.243922233581543, -9.7781400680542, -9.312357902526855, -8.846574783325195, -8.380792617797852, -7.91500997543335, -7.449227809906006, -6.983445167541504, -6.51766300201416, -6.051880359649658, -5.586097717285156, -5.1203155517578125, -4.6545329093933105, -4.188750267028809, -3.7229678630828857, -3.257185459136963, -2.791402816772461, -2.325620412826538, -1.8598378896713257, -1.3940553665161133, -0.9282729625701904, -0.4624903202056885, 0.003292083740234375, 0.4690745770931244, 0.9348570704460144, 1.400639533996582, 1.8664220571517944, 2.332204580307007, 2.7979869842529297, 3.2637696266174316, 3.7295520305633545]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 6.0, 6.0, 5.0, 16.0, 19.0, 23.0, 33.0, 30.0, 45.0, 44.0, 40.0, 62.0, 63.0, 63.0, 73.0, 60.0, 49.0, 86.0, 46.0, 37.0, 39.0, 31.0, 27.0, 34.0, 19.0, 7.0, 12.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9045146107673645, -0.8718976378440857, -0.8392806649208069, -0.8066636919975281, -0.774046778678894, -0.7414298057556152, -0.7088128328323364, -0.6761958599090576, -0.6435788869857788, -0.6109619140625, -0.5783449411392212, -0.5457279682159424, -0.5131109952926636, -0.48049405217170715, -0.44787710905075073, -0.4152601361274719, -0.3826431632041931, -0.3500261902809143, -0.3174092173576355, -0.2847922742366791, -0.25217530131340027, -0.21955832839012146, -0.18694137036800385, -0.15432441234588623, -0.12170743942260742, -0.08909047394990921, -0.056473508477211, -0.023856543004512787, 0.008760422468185425, 0.04137739539146423, 0.07399435341358185, 0.10661131143569946, 0.13922834396362305, 0.17184531688690186, 0.20446227490901947, 0.23707923293113708, 0.2696962058544159, 0.3023131787776947, 0.3349301218986511, 0.36754709482192993, 0.40016406774520874, 0.43278104066848755, 0.46539801359176636, 0.4980149567127228, 0.5306318998336792, 0.563248872756958, 0.5958658456802368, 0.6284828186035156, 0.6610997915267944, 0.6937167644500732, 0.726333737373352, 0.7589507102966309, 0.7915676832199097, 0.8241846561431885, 0.8568015694618225, 0.8894185423851013, 0.9220355153083801, 0.9546524882316589, 0.9872694611549377, 1.0198863744735718, 1.0525033473968506, 1.0851203203201294, 1.1177372932434082, 1.150354266166687, 1.1829712390899658]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 2.0, 6.0, 8.0, 11.0, 15.0, 14.0, 19.0, 21.0, 24.0, 26.0, 26.0, 49.0, 75.0, 132.0, 338.0, 828.0, 3241.0, 36076.0, 721478.0, 271256.0, 12029.0, 1703.0, 554.0, 221.0, 105.0, 69.0, 44.0, 26.0, 31.0, 20.0, 22.0, 15.0, 13.0, 13.0, 13.0, 7.0, 6.0, 1.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.373046875, -2.2906494140625, -2.208251953125, -2.1258544921875, -2.04345703125, -1.9610595703125, -1.878662109375, -1.7962646484375, -1.7138671875, -1.6314697265625, -1.549072265625, -1.4666748046875, -1.38427734375, -1.3018798828125, -1.219482421875, -1.1370849609375, -1.0546875, -0.9722900390625, -0.889892578125, -0.8074951171875, -0.72509765625, -0.6427001953125, -0.560302734375, -0.4779052734375, -0.3955078125, -0.3131103515625, -0.230712890625, -0.1483154296875, -0.06591796875, 0.0164794921875, 0.098876953125, 0.1812744140625, 0.263671875, 0.3460693359375, 0.428466796875, 0.5108642578125, 0.59326171875, 0.6756591796875, 0.758056640625, 0.8404541015625, 0.9228515625, 1.0052490234375, 1.087646484375, 1.1700439453125, 1.25244140625, 1.3348388671875, 1.417236328125, 1.4996337890625, 1.58203125, 1.6644287109375, 1.746826171875, 1.8292236328125, 1.91162109375, 1.9940185546875, 2.076416015625, 2.1588134765625, 2.2412109375, 2.3236083984375, 2.406005859375, 2.4884033203125, 2.57080078125, 2.6531982421875, 2.735595703125, 2.8179931640625, 2.900390625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 14.0, 19.0, 23.0, 50.0, 61.0, 138.0, 145.0, 139.0, 130.0, 88.0, 95.0, 48.0, 27.0, 19.0, 9.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044525146484375, -0.04028177261352539, -0.03603839874267578, -0.03179502487182617, -0.027551651000976562, -0.023308277130126953, -0.019064903259277344, -0.014821529388427734, -0.010578155517578125, -0.006334781646728516, -0.0020914077758789062, 0.002151966094970703, 0.0063953399658203125, 0.010638713836669922, 0.014882087707519531, 0.01912546157836914, 0.02336883544921875, 0.02761220932006836, 0.03185558319091797, 0.03609895706176758, 0.04034233093261719, 0.0445857048034668, 0.048829078674316406, 0.053072452545166016, 0.057315826416015625, 0.061559200286865234, 0.06580257415771484, 0.07004594802856445, 0.07428932189941406, 0.07853269577026367, 0.08277606964111328, 0.08701944351196289, 0.0912628173828125, 0.09550619125366211, 0.09974956512451172, 0.10399293899536133, 0.10823631286621094, 0.11247968673706055, 0.11672306060791016, 0.12096643447875977, 0.12520980834960938, 0.12945318222045898, 0.1336965560913086, 0.1379399299621582, 0.1421833038330078, 0.14642667770385742, 0.15067005157470703, 0.15491342544555664, 0.15915679931640625, 0.16340017318725586, 0.16764354705810547, 0.17188692092895508, 0.1761302947998047, 0.1803736686706543, 0.1846170425415039, 0.18886041641235352, 0.19310379028320312, 0.19734716415405273, 0.20159053802490234, 0.20583391189575195, 0.21007728576660156, 0.21432065963745117, 0.21856403350830078, 0.2228074073791504, 0.22705078125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 9.0, 10.0, 14.0, 6.0, 15.0, 14.0, 11.0, 23.0, 33.0, 32.0, 44.0, 76.0, 104.0, 205.0, 330.0, 735.0, 1589.0, 4286.0, 13113.0, 48333.0, 194569.0, 457667.0, 241994.0, 60899.0, 15914.0, 5008.0, 1783.0, 757.0, 379.0, 201.0, 134.0, 63.0, 42.0, 36.0, 34.0, 20.0, 16.0, 17.0, 14.0, 4.0, 8.0, 4.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0625, -1.0317764282226562, -1.0010528564453125, -0.9703292846679688, -0.939605712890625, -0.9088821411132812, -0.8781585693359375, -0.8474349975585938, -0.81671142578125, -0.7859878540039062, -0.7552642822265625, -0.7245407104492188, -0.693817138671875, -0.6630935668945312, -0.6323699951171875, -0.6016464233398438, -0.5709228515625, -0.5401992797851562, -0.5094757080078125, -0.47875213623046875, -0.448028564453125, -0.41730499267578125, -0.3865814208984375, -0.35585784912109375, -0.32513427734375, -0.29441070556640625, -0.2636871337890625, -0.23296356201171875, -0.202239990234375, -0.17151641845703125, -0.1407928466796875, -0.11006927490234375, -0.079345703125, -0.04862213134765625, -0.0178985595703125, 0.01282501220703125, 0.043548583984375, 0.07427215576171875, 0.1049957275390625, 0.13571929931640625, 0.16644287109375, 0.19716644287109375, 0.2278900146484375, 0.25861358642578125, 0.289337158203125, 0.32006072998046875, 0.3507843017578125, 0.38150787353515625, 0.4122314453125, 0.44295501708984375, 0.4736785888671875, 0.5044021606445312, 0.535125732421875, 0.5658493041992188, 0.5965728759765625, 0.6272964477539062, 0.65802001953125, 0.6887435913085938, 0.7194671630859375, 0.7501907348632812, 0.780914306640625, 0.8116378784179688, 0.8423614501953125, 0.8730850219726562, 0.90380859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 6.0, 6.0, 5.0, 12.0, 11.0, 11.0, 10.0, 16.0, 17.0, 30.0, 20.0, 34.0, 28.0, 23.0, 27.0, 32.0, 42.0, 37.0, 35.0, 42.0, 33.0, 33.0, 46.0, 41.0, 39.0, 46.0, 31.0, 39.0, 32.0, 29.0, 22.0, 21.0, 23.0, 24.0, 13.0, 15.0, 14.0, 12.0, 7.0, 6.0, 4.0, 5.0, 4.0, 3.0, 7.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2509765625, -0.24266815185546875, -0.2343597412109375, -0.22605133056640625, -0.217742919921875, -0.20943450927734375, -0.2011260986328125, -0.19281768798828125, -0.18450927734375, -0.17620086669921875, -0.1678924560546875, -0.15958404541015625, -0.151275634765625, -0.14296722412109375, -0.1346588134765625, -0.12635040283203125, -0.1180419921875, -0.10973358154296875, -0.1014251708984375, -0.09311676025390625, -0.084808349609375, -0.07649993896484375, -0.0681915283203125, -0.05988311767578125, -0.05157470703125, -0.04326629638671875, -0.0349578857421875, -0.02664947509765625, -0.018341064453125, -0.01003265380859375, -0.0017242431640625, 0.00658416748046875, 0.014892578125, 0.02320098876953125, 0.0315093994140625, 0.03981781005859375, 0.048126220703125, 0.05643463134765625, 0.0647430419921875, 0.07305145263671875, 0.08135986328125, 0.08966827392578125, 0.0979766845703125, 0.10628509521484375, 0.114593505859375, 0.12290191650390625, 0.1312103271484375, 0.13951873779296875, 0.1478271484375, 0.15613555908203125, 0.1644439697265625, 0.17275238037109375, 0.181060791015625, 0.18936920166015625, 0.1976776123046875, 0.20598602294921875, 0.21429443359375, 0.22260284423828125, 0.2309112548828125, 0.23921966552734375, 0.247528076171875, 0.25583648681640625, 0.2641448974609375, 0.27245330810546875, 0.28076171875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 11.0, 12.0, 7.0, 17.0, 24.0, 26.0, 45.0, 62.0, 94.0, 144.0, 229.0, 476.0, 821.0, 1877.0, 4372.0, 12234.0, 45544.0, 293718.0, 557721.0, 98255.0, 20666.0, 6752.0, 2731.0, 1209.0, 610.0, 330.0, 206.0, 118.0, 71.0, 45.0, 39.0, 25.0, 13.0, 21.0, 7.0, 6.0, 9.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9248046875, -0.893157958984375, -0.86151123046875, -0.829864501953125, -0.7982177734375, -0.766571044921875, -0.73492431640625, -0.703277587890625, -0.671630859375, -0.639984130859375, -0.60833740234375, -0.576690673828125, -0.5450439453125, -0.513397216796875, -0.48175048828125, -0.450103759765625, -0.41845703125, -0.386810302734375, -0.35516357421875, -0.323516845703125, -0.2918701171875, -0.260223388671875, -0.22857666015625, -0.196929931640625, -0.165283203125, -0.133636474609375, -0.10198974609375, -0.070343017578125, -0.0386962890625, -0.007049560546875, 0.02459716796875, 0.056243896484375, 0.087890625, 0.119537353515625, 0.15118408203125, 0.182830810546875, 0.2144775390625, 0.246124267578125, 0.27777099609375, 0.309417724609375, 0.341064453125, 0.372711181640625, 0.40435791015625, 0.436004638671875, 0.4676513671875, 0.499298095703125, 0.53094482421875, 0.562591552734375, 0.59423828125, 0.625885009765625, 0.65753173828125, 0.689178466796875, 0.7208251953125, 0.752471923828125, 0.78411865234375, 0.815765380859375, 0.847412109375, 0.879058837890625, 0.91070556640625, 0.942352294921875, 0.9739990234375, 1.005645751953125, 1.03729248046875, 1.068939208984375, 1.1005859375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 8.0, 11.0, 18.0, 20.0, 37.0, 31.0, 61.0, 61.0, 76.0, 101.0, 105.0, 104.0, 84.0, 73.0, 62.0, 41.0, 30.0, 21.0, 15.0, 9.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.715557098388672e-05, -9.409431368112564e-05, -9.103305637836456e-05, -8.797179907560349e-05, -8.491054177284241e-05, -8.184928447008133e-05, -7.878802716732025e-05, -7.572676986455917e-05, -7.26655125617981e-05, -6.960425525903702e-05, -6.654299795627594e-05, -6.348174065351486e-05, -6.0420483350753784e-05, -5.7359226047992706e-05, -5.429796874523163e-05, -5.123671144247055e-05, -4.817545413970947e-05, -4.5114196836948395e-05, -4.205293953418732e-05, -3.899168223142624e-05, -3.593042492866516e-05, -3.286916762590408e-05, -2.9807910323143005e-05, -2.6746653020381927e-05, -2.368539571762085e-05, -2.0624138414859772e-05, -1.7562881112098694e-05, -1.4501623809337616e-05, -1.1440366506576538e-05, -8.37910920381546e-06, -5.317851901054382e-06, -2.2565945982933044e-06, 8.046627044677734e-07, 3.865920007228851e-06, 6.927177309989929e-06, 9.988434612751007e-06, 1.3049691915512085e-05, 1.6110949218273163e-05, 1.917220652103424e-05, 2.223346382379532e-05, 2.5294721126556396e-05, 2.8355978429317474e-05, 3.141723573207855e-05, 3.447849303483963e-05, 3.753975033760071e-05, 4.0601007640361786e-05, 4.3662264943122864e-05, 4.672352224588394e-05, 4.978477954864502e-05, 5.28460368514061e-05, 5.5907294154167175e-05, 5.896855145692825e-05, 6.202980875968933e-05, 6.509106606245041e-05, 6.815232336521149e-05, 7.121358066797256e-05, 7.427483797073364e-05, 7.733609527349472e-05, 8.03973525762558e-05, 8.345860987901688e-05, 8.651986718177795e-05, 8.958112448453903e-05, 9.264238178730011e-05, 9.570363909006119e-05, 9.876489639282227e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 11.0, 7.0, 22.0, 62.0, 77.0, 200.0, 930.0, 8271.0, 806118.0, 227701.0, 4242.0, 620.0, 149.0, 78.0, 36.0, 10.0, 7.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-5.0859375, -4.970001220703125, -4.85406494140625, -4.738128662109375, -4.6221923828125, -4.506256103515625, -4.39031982421875, -4.274383544921875, -4.158447265625, -4.042510986328125, -3.92657470703125, -3.810638427734375, -3.6947021484375, -3.578765869140625, -3.46282958984375, -3.346893310546875, -3.23095703125, -3.115020751953125, -2.99908447265625, -2.883148193359375, -2.7672119140625, -2.651275634765625, -2.53533935546875, -2.419403076171875, -2.303466796875, -2.187530517578125, -2.07159423828125, -1.955657958984375, -1.8397216796875, -1.723785400390625, -1.60784912109375, -1.491912841796875, -1.3759765625, -1.260040283203125, -1.14410400390625, -1.028167724609375, -0.9122314453125, -0.796295166015625, -0.68035888671875, -0.564422607421875, -0.448486328125, -0.332550048828125, -0.21661376953125, -0.100677490234375, 0.0152587890625, 0.131195068359375, 0.24713134765625, 0.363067626953125, 0.47900390625, 0.594940185546875, 0.71087646484375, 0.826812744140625, 0.9427490234375, 1.058685302734375, 1.17462158203125, 1.290557861328125, 1.406494140625, 1.522430419921875, 1.63836669921875, 1.754302978515625, 1.8702392578125, 1.986175537109375, 2.10211181640625, 2.218048095703125, 2.333984375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 6.0, 11.0, 15.0, 33.0, 43.0, 75.0, 85.0, 134.0, 165.0, 144.0, 103.0, 80.0, 29.0, 24.0, 23.0, 12.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.09375, -1.0668182373046875, -1.039886474609375, -1.0129547119140625, -0.98602294921875, -0.9590911865234375, -0.932159423828125, -0.9052276611328125, -0.8782958984375, -0.8513641357421875, -0.824432373046875, -0.7975006103515625, -0.77056884765625, -0.7436370849609375, -0.716705322265625, -0.6897735595703125, -0.662841796875, -0.6359100341796875, -0.608978271484375, -0.5820465087890625, -0.55511474609375, -0.5281829833984375, -0.501251220703125, -0.4743194580078125, -0.4473876953125, -0.4204559326171875, -0.393524169921875, -0.3665924072265625, -0.33966064453125, -0.3127288818359375, -0.285797119140625, -0.2588653564453125, -0.23193359375, -0.2050018310546875, -0.178070068359375, -0.1511383056640625, -0.12420654296875, -0.0972747802734375, -0.070343017578125, -0.0434112548828125, -0.0164794921875, 0.0104522705078125, 0.037384033203125, 0.0643157958984375, 0.09124755859375, 0.1181793212890625, 0.145111083984375, 0.1720428466796875, 0.198974609375, 0.2259063720703125, 0.252838134765625, 0.2797698974609375, 0.30670166015625, 0.3336334228515625, 0.360565185546875, 0.3874969482421875, 0.4144287109375, 0.4413604736328125, 0.468292236328125, 0.4952239990234375, 0.52215576171875, 0.5490875244140625, 0.576019287109375, 0.6029510498046875, 0.6298828125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 53.0, 613.0, 334.0, 11.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.101140975952148, -12.805658340454102, -11.510175704956055, -10.214692115783691, -8.919209480285645, -7.623726844787598, -6.328243732452393, -5.0327606201171875, -3.7372779846191406, -2.4417951107025146, -1.1463122367858887, 0.1491706371307373, 1.4446535110473633, 2.74013614654541, 4.035619258880615, 5.33110237121582, 6.626585006713867, 7.922067642211914, 9.217550277709961, 10.513033866882324, 11.808516502380371, 13.103999137878418, 14.399482727050781, 15.694965362548828, 16.990447998046875, 18.285930633544922, 19.58141326904297, 20.876895904541016, 22.172378540039062, 23.46786117553711, 24.76334571838379, 26.058828353881836, 27.35430908203125, 28.649791717529297, 29.945274353027344, 31.24075698852539, 32.53623962402344, 33.831722259521484, 35.12720489501953, 36.422691345214844, 37.718170166015625, 39.01365280151367, 40.30913543701172, 41.604618072509766, 42.90010070800781, 44.19558334350586, 45.491065979003906, 46.78655242919922, 48.082035064697266, 49.37751770019531, 50.67300033569336, 51.968482971191406, 53.26396560668945, 54.5594482421875, 55.85493087768555, 57.150413513183594, 58.445899963378906, 59.74138259887695, 61.036865234375, 62.33234786987305, 63.627830505371094, 64.9233169555664, 66.21879577636719, 67.5142822265625, 68.80976104736328]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 9.0, 4.0, 8.0, 10.0, 8.0, 19.0, 12.0, 30.0, 21.0, 25.0, 25.0, 40.0, 26.0, 42.0, 34.0, 45.0, 42.0, 52.0, 57.0, 54.0, 44.0, 47.0, 50.0, 48.0, 30.0, 44.0, 25.0, 24.0, 22.0, 19.0, 9.0, 16.0, 13.0, 9.0, 7.0, 6.0, 4.0, 2.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-2.8459291458129883, -2.767394542694092, -2.6888599395751953, -2.6103250980377197, -2.5317904949188232, -2.4532558917999268, -2.3747212886810303, -2.296186685562134, -2.217651844024658, -2.1391172409057617, -2.0605826377868652, -1.9820479154586792, -1.9035131931304932, -1.8249785900115967, -1.7464439868927002, -1.6679093837738037, -1.5893747806549072, -1.5108401775360107, -1.4323054552078247, -1.3537708520889282, -1.2752361297607422, -1.1967015266418457, -1.1181669235229492, -1.0396323204040527, -0.9610975980758667, -0.8825629353523254, -0.8040282726287842, -0.7254936695098877, -0.6469590067863464, -0.5684243440628052, -0.4898897111415863, -0.41135507822036743, -0.33282017707824707, -0.2542855143547058, -0.17575088143348694, -0.09721623361110687, -0.018681585788726807, 0.05985307693481445, 0.13838770985603333, 0.2169223427772522, 0.29545700550079346, 0.3739916682243347, 0.4525263011455536, 0.5310609340667725, 0.6095955967903137, 0.688130259513855, 0.7666648626327515, 0.8451995253562927, 0.923734188079834, 1.0022687911987305, 1.0808035135269165, 1.159338116645813, 1.237872838973999, 1.3164074420928955, 1.394942045211792, 1.4734766483306885, 1.5520113706588745, 1.630545973777771, 1.709080696105957, 1.7876152992248535, 1.86614990234375, 1.944684624671936, 2.023219347000122, 2.1017539501190186, 2.180288553237915]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 8.0, 12.0, 18.0, 32.0, 48.0, 81.0, 132.0, 290.0, 816.0, 2834.0, 18584.0, 717035.0, 3421582.0, 27661.0, 3478.0, 861.0, 322.0, 146.0, 92.0, 61.0, 39.0, 23.0, 22.0, 21.0, 19.0, 12.0, 16.0, 8.0, 3.0, 6.0, 8.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8701171875, -1.7814483642578125, -1.692779541015625, -1.6041107177734375, -1.51544189453125, -1.4267730712890625, -1.338104248046875, -1.2494354248046875, -1.1607666015625, -1.0720977783203125, -0.983428955078125, -0.8947601318359375, -0.80609130859375, -0.7174224853515625, -0.628753662109375, -0.5400848388671875, -0.451416015625, -0.3627471923828125, -0.274078369140625, -0.1854095458984375, -0.09674072265625, -0.0080718994140625, 0.080596923828125, 0.1692657470703125, 0.2579345703125, 0.3466033935546875, 0.435272216796875, 0.5239410400390625, 0.61260986328125, 0.7012786865234375, 0.789947509765625, 0.8786163330078125, 0.96728515625, 1.0559539794921875, 1.144622802734375, 1.2332916259765625, 1.32196044921875, 1.4106292724609375, 1.499298095703125, 1.5879669189453125, 1.6766357421875, 1.7653045654296875, 1.853973388671875, 1.9426422119140625, 2.03131103515625, 2.1199798583984375, 2.208648681640625, 2.2973175048828125, 2.385986328125, 2.4746551513671875, 2.563323974609375, 2.6519927978515625, 2.74066162109375, 2.8293304443359375, 2.917999267578125, 3.0066680908203125, 3.0953369140625, 3.1840057373046875, 3.272674560546875, 3.3613433837890625, 3.45001220703125, 3.5386810302734375, 3.627349853515625, 3.7160186767578125, 3.8046875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 7.0, 4.0, 3.0, 6.0, 16.0, 20.0, 39.0, 55.0, 70.0, 95.0, 117.0, 97.0, 106.0, 113.0, 89.0, 64.0, 38.0, 32.0, 19.0, 8.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06976318359375, -0.06502819061279297, -0.06029319763183594, -0.055558204650878906, -0.050823211669921875, -0.046088218688964844, -0.04135322570800781, -0.03661823272705078, -0.03188323974609375, -0.02714824676513672, -0.022413253784179688, -0.017678260803222656, -0.012943267822265625, -0.008208274841308594, -0.0034732818603515625, 0.0012617111206054688, 0.0059967041015625, 0.010731697082519531, 0.015466690063476562, 0.020201683044433594, 0.024936676025390625, 0.029671669006347656, 0.03440666198730469, 0.03914165496826172, 0.04387664794921875, 0.04861164093017578, 0.05334663391113281, 0.058081626892089844, 0.06281661987304688, 0.0675516128540039, 0.07228660583496094, 0.07702159881591797, 0.081756591796875, 0.08649158477783203, 0.09122657775878906, 0.0959615707397461, 0.10069656372070312, 0.10543155670166016, 0.11016654968261719, 0.11490154266357422, 0.11963653564453125, 0.12437152862548828, 0.1291065216064453, 0.13384151458740234, 0.13857650756835938, 0.1433115005493164, 0.14804649353027344, 0.15278148651123047, 0.1575164794921875, 0.16225147247314453, 0.16698646545410156, 0.1717214584350586, 0.17645645141601562, 0.18119144439697266, 0.1859264373779297, 0.19066143035888672, 0.19539642333984375, 0.20013141632080078, 0.2048664093017578, 0.20960140228271484, 0.21433639526367188, 0.2190713882446289, 0.22380638122558594, 0.22854137420654297, 0.2332763671875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 7.0, 10.0, 16.0, 27.0, 17.0, 42.0, 65.0, 108.0, 204.0, 506.0, 2037.0, 41852.0, 4131373.0, 15267.0, 1640.0, 531.0, 235.0, 88.0, 72.0, 52.0, 38.0, 32.0, 19.0, 13.0, 12.0, 8.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.78515625, -7.57122802734375, -7.3572998046875, -7.14337158203125, -6.929443359375, -6.71551513671875, -6.5015869140625, -6.28765869140625, -6.07373046875, -5.85980224609375, -5.6458740234375, -5.43194580078125, -5.218017578125, -5.00408935546875, -4.7901611328125, -4.57623291015625, -4.3623046875, -4.14837646484375, -3.9344482421875, -3.72052001953125, -3.506591796875, -3.29266357421875, -3.0787353515625, -2.86480712890625, -2.65087890625, -2.43695068359375, -2.2230224609375, -2.00909423828125, -1.795166015625, -1.58123779296875, -1.3673095703125, -1.15338134765625, -0.939453125, -0.72552490234375, -0.5115966796875, -0.29766845703125, -0.083740234375, 0.13018798828125, 0.3441162109375, 0.55804443359375, 0.77197265625, 0.98590087890625, 1.1998291015625, 1.41375732421875, 1.627685546875, 1.84161376953125, 2.0555419921875, 2.26947021484375, 2.4833984375, 2.69732666015625, 2.9112548828125, 3.12518310546875, 3.339111328125, 3.55303955078125, 3.7669677734375, 3.98089599609375, 4.19482421875, 4.40875244140625, 4.6226806640625, 4.83660888671875, 5.050537109375, 5.26446533203125, 5.4783935546875, 5.69232177734375, 5.90625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 11.0, 18.0, 30.0, 42.0, 95.0, 211.0, 708.0, 1989.0, 553.0, 223.0, 96.0, 47.0, 21.0, 14.0, 5.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.285400390625, -0.2679786682128906, -0.25055694580078125, -0.23313522338867188, -0.2157135009765625, -0.19829177856445312, -0.18087005615234375, -0.16344833374023438, -0.146026611328125, -0.12860488891601562, -0.11118316650390625, -0.09376144409179688, -0.0763397216796875, -0.058917999267578125, -0.04149627685546875, -0.024074554443359375, -0.00665283203125, 0.010768890380859375, 0.02819061279296875, 0.045612335205078125, 0.0630340576171875, 0.08045578002929688, 0.09787750244140625, 0.11529922485351562, 0.132720947265625, 0.15014266967773438, 0.16756439208984375, 0.18498611450195312, 0.2024078369140625, 0.21982955932617188, 0.23725128173828125, 0.2546730041503906, 0.2720947265625, 0.2895164489746094, 0.30693817138671875, 0.3243598937988281, 0.3417816162109375, 0.3592033386230469, 0.37662506103515625, 0.3940467834472656, 0.411468505859375, 0.4288902282714844, 0.44631195068359375, 0.4637336730957031, 0.4811553955078125, 0.4985771179199219, 0.5159988403320312, 0.5334205627441406, 0.55084228515625, 0.5682640075683594, 0.5856857299804688, 0.6031074523925781, 0.6205291748046875, 0.6379508972167969, 0.6553726196289062, 0.6727943420410156, 0.690216064453125, 0.7076377868652344, 0.7250595092773438, 0.7424812316894531, 0.7599029541015625, 0.7773246765136719, 0.7947463989257812, 0.8121681213378906, 0.82958984375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 19.0, 143.0, 484.0, 283.0, 48.0, 15.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.860128879547119, -5.459834098815918, -5.059539794921875, -4.659245014190674, -4.258950233459473, -3.8586556911468506, -3.4583611488342285, -3.0580663681030273, -2.6577718257904053, -2.257477283477783, -1.857182502746582, -1.45688796043396, -1.0565932989120483, -0.6562986373901367, -0.25600409507751465, 0.14429068565368652, 0.5445852279663086, 0.9448798894882202, 1.3451745510101318, 1.745469093322754, 2.145763874053955, 2.546058416366577, 2.946352958679199, 3.3466477394104004, 3.7469422817230225, 4.1472368240356445, 4.547531604766846, 4.947826385498047, 5.34812068939209, 5.748415470123291, 6.148710250854492, 6.549004554748535, 6.9492998123168945, 7.349594593048096, 7.749888896942139, 8.15018367767334, 8.550477981567383, 8.950773239135742, 9.351067543029785, 9.751361846923828, 10.151657104492188, 10.55195140838623, 10.95224666595459, 11.352540969848633, 11.752835273742676, 12.153130531311035, 12.553424835205078, 12.953720092773438, 13.354013442993164, 13.754307746887207, 14.154603004455566, 14.55489730834961, 14.955191612243652, 15.355486869812012, 15.755781173706055, 16.156076431274414, 16.556371688842773, 16.956666946411133, 17.35696029663086, 17.75725555419922, 18.157550811767578, 18.557844161987305, 18.958139419555664, 19.358434677124023, 19.75872802734375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 10.0, 9.0, 14.0, 21.0, 30.0, 37.0, 32.0, 50.0, 64.0, 76.0, 81.0, 72.0, 80.0, 64.0, 66.0, 54.0, 48.0, 46.0, 34.0, 29.0, 26.0, 12.0, 15.0, 11.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2902965545654297, -2.2196991443634033, -2.149101734161377, -2.0785043239593506, -2.007906913757324, -1.9373093843460083, -1.8667118549346924, -1.796114444732666, -1.7255170345306396, -1.6549196243286133, -1.584322214126587, -1.513724684715271, -1.4431272745132446, -1.3725298643112183, -1.3019323348999023, -1.231334924697876, -1.1607375144958496, -1.0901401042938232, -1.0195426940917969, -0.948945164680481, -0.8783477544784546, -0.8077503442764282, -0.7371528744697571, -0.6665554046630859, -0.5959579944610596, -0.5253605842590332, -0.45476311445236206, -0.3841656744480133, -0.31356823444366455, -0.2429707944393158, -0.17237335443496704, -0.10177591443061829, -0.03117823600769043, 0.039419203996658325, 0.11001664400100708, 0.18061408400535583, 0.2512115240097046, 0.32180896401405334, 0.3924064040184021, 0.46300384402275085, 0.5336012840270996, 0.604198694229126, 0.6747961640357971, 0.7453936338424683, 0.8159910440444946, 0.886588454246521, 0.9571859240531921, 1.0277833938598633, 1.0983808040618896, 1.168978214263916, 1.2395756244659424, 1.3101731538772583, 1.3807705640792847, 1.451367974281311, 1.521965503692627, 1.5925629138946533, 1.6631603240966797, 1.733757734298706, 1.8043551445007324, 1.8749526739120483, 1.9455500841140747, 2.0161476135253906, 2.086745023727417, 2.1573424339294434, 2.2279398441314697]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 6.0, 4.0, 7.0, 9.0, 9.0, 9.0, 11.0, 10.0, 24.0, 23.0, 34.0, 49.0, 65.0, 76.0, 134.0, 195.0, 305.0, 644.0, 1758.0, 5701.0, 24477.0, 135329.0, 524965.0, 287414.0, 51794.0, 10435.0, 2871.0, 969.0, 446.0, 260.0, 127.0, 96.0, 70.0, 58.0, 42.0, 19.0, 22.0, 14.0, 18.0, 11.0, 9.0, 6.0, 12.0, 2.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-1.9912109375, -1.9354705810546875, -1.879730224609375, -1.8239898681640625, -1.76824951171875, -1.7125091552734375, -1.656768798828125, -1.6010284423828125, -1.5452880859375, -1.4895477294921875, -1.433807373046875, -1.3780670166015625, -1.32232666015625, -1.2665863037109375, -1.210845947265625, -1.1551055908203125, -1.099365234375, -1.0436248779296875, -0.987884521484375, -0.9321441650390625, -0.87640380859375, -0.8206634521484375, -0.764923095703125, -0.7091827392578125, -0.6534423828125, -0.5977020263671875, -0.541961669921875, -0.4862213134765625, -0.43048095703125, -0.3747406005859375, -0.319000244140625, -0.2632598876953125, -0.20751953125, -0.1517791748046875, -0.096038818359375, -0.0402984619140625, 0.01544189453125, 0.0711822509765625, 0.126922607421875, 0.1826629638671875, 0.2384033203125, 0.2941436767578125, 0.349884033203125, 0.4056243896484375, 0.46136474609375, 0.5171051025390625, 0.572845458984375, 0.6285858154296875, 0.684326171875, 0.7400665283203125, 0.795806884765625, 0.8515472412109375, 0.90728759765625, 0.9630279541015625, 1.018768310546875, 1.0745086669921875, 1.1302490234375, 1.1859893798828125, 1.241729736328125, 1.2974700927734375, 1.35321044921875, 1.4089508056640625, 1.464691162109375, 1.5204315185546875, 1.576171875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 7.0, 11.0, 15.0, 31.0, 26.0, 36.0, 51.0, 80.0, 81.0, 90.0, 94.0, 74.0, 82.0, 73.0, 56.0, 46.0, 40.0, 32.0, 24.0, 18.0, 14.0, 10.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10546875, -0.10042953491210938, -0.09539031982421875, -0.09035110473632812, -0.0853118896484375, -0.08027267456054688, -0.07523345947265625, -0.07019424438476562, -0.065155029296875, -0.060115814208984375, -0.05507659912109375, -0.050037384033203125, -0.0449981689453125, -0.039958953857421875, -0.03491973876953125, -0.029880523681640625, -0.02484130859375, -0.019802093505859375, -0.01476287841796875, -0.009723663330078125, -0.0046844482421875, 0.000354766845703125, 0.00539398193359375, 0.010433197021484375, 0.015472412109375, 0.020511627197265625, 0.02555084228515625, 0.030590057373046875, 0.0356292724609375, 0.040668487548828125, 0.04570770263671875, 0.050746917724609375, 0.0557861328125, 0.060825347900390625, 0.06586456298828125, 0.07090377807617188, 0.0759429931640625, 0.08098220825195312, 0.08602142333984375, 0.09106063842773438, 0.096099853515625, 0.10113906860351562, 0.10617828369140625, 0.11121749877929688, 0.1162567138671875, 0.12129592895507812, 0.12633514404296875, 0.13137435913085938, 0.13641357421875, 0.14145278930664062, 0.14649200439453125, 0.15153121948242188, 0.1565704345703125, 0.16160964965820312, 0.16664886474609375, 0.17168807983398438, 0.176727294921875, 0.18176651000976562, 0.18680572509765625, 0.19184494018554688, 0.1968841552734375, 0.20192337036132812, 0.20696258544921875, 0.21200180053710938, 0.217041015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 12.0, 8.0, 11.0, 21.0, 25.0, 36.0, 59.0, 79.0, 121.0, 149.0, 310.0, 447.0, 853.0, 1624.0, 3104.0, 6779.0, 16666.0, 43305.0, 114814.0, 255123.0, 311795.0, 177371.0, 69735.0, 26289.0, 10381.0, 4465.0, 2153.0, 1147.0, 607.0, 416.0, 221.0, 135.0, 81.0, 52.0, 43.0, 29.0, 23.0, 21.0, 15.0, 9.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.763671875, -0.7375564575195312, -0.7114410400390625, -0.6853256225585938, -0.659210205078125, -0.6330947875976562, -0.6069793701171875, -0.5808639526367188, -0.55474853515625, -0.5286331176757812, -0.5025177001953125, -0.47640228271484375, -0.450286865234375, -0.42417144775390625, -0.3980560302734375, -0.37194061279296875, -0.3458251953125, -0.31970977783203125, -0.2935943603515625, -0.26747894287109375, -0.241363525390625, -0.21524810791015625, -0.1891326904296875, -0.16301727294921875, -0.13690185546875, -0.11078643798828125, -0.0846710205078125, -0.05855560302734375, -0.032440185546875, -0.00632476806640625, 0.0197906494140625, 0.04590606689453125, 0.072021484375, 0.09813690185546875, 0.1242523193359375, 0.15036773681640625, 0.176483154296875, 0.20259857177734375, 0.2287139892578125, 0.25482940673828125, 0.28094482421875, 0.30706024169921875, 0.3331756591796875, 0.35929107666015625, 0.385406494140625, 0.41152191162109375, 0.4376373291015625, 0.46375274658203125, 0.4898681640625, 0.5159835815429688, 0.5420989990234375, 0.5682144165039062, 0.594329833984375, 0.6204452514648438, 0.6465606689453125, 0.6726760864257812, 0.69879150390625, 0.7249069213867188, 0.7510223388671875, 0.7771377563476562, 0.803253173828125, 0.8293685913085938, 0.8554840087890625, 0.8815994262695312, 0.90771484375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 6.0, 9.0, 5.0, 7.0, 11.0, 15.0, 16.0, 19.0, 15.0, 16.0, 25.0, 28.0, 35.0, 35.0, 47.0, 50.0, 52.0, 46.0, 46.0, 50.0, 49.0, 56.0, 40.0, 36.0, 47.0, 27.0, 32.0, 28.0, 28.0, 23.0, 20.0, 27.0, 8.0, 12.0, 11.0, 6.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.5634765625, -0.5468368530273438, -0.5301971435546875, -0.5135574340820312, -0.496917724609375, -0.48027801513671875, -0.4636383056640625, -0.44699859619140625, -0.43035888671875, -0.41371917724609375, -0.3970794677734375, -0.38043975830078125, -0.363800048828125, -0.34716033935546875, -0.3305206298828125, -0.31388092041015625, -0.2972412109375, -0.28060150146484375, -0.2639617919921875, -0.24732208251953125, -0.230682373046875, -0.21404266357421875, -0.1974029541015625, -0.18076324462890625, -0.16412353515625, -0.14748382568359375, -0.1308441162109375, -0.11420440673828125, -0.097564697265625, -0.08092498779296875, -0.0642852783203125, -0.04764556884765625, -0.031005859375, -0.01436614990234375, 0.0022735595703125, 0.01891326904296875, 0.035552978515625, 0.05219268798828125, 0.0688323974609375, 0.08547210693359375, 0.10211181640625, 0.11875152587890625, 0.1353912353515625, 0.15203094482421875, 0.168670654296875, 0.18531036376953125, 0.2019500732421875, 0.21858978271484375, 0.2352294921875, 0.25186920166015625, 0.2685089111328125, 0.28514862060546875, 0.301788330078125, 0.31842803955078125, 0.3350677490234375, 0.35170745849609375, 0.36834716796875, 0.38498687744140625, 0.4016265869140625, 0.41826629638671875, 0.434906005859375, 0.45154571533203125, 0.4681854248046875, 0.48482513427734375, 0.50146484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 5.0, 6.0, 9.0, 9.0, 17.0, 21.0, 45.0, 42.0, 63.0, 95.0, 170.0, 264.0, 367.0, 560.0, 949.0, 1664.0, 2876.0, 5083.0, 10489.0, 23613.0, 63485.0, 205729.0, 411587.0, 210381.0, 64381.0, 23557.0, 10572.0, 5308.0, 2787.0, 1617.0, 1017.0, 589.0, 410.0, 255.0, 176.0, 98.0, 76.0, 61.0, 32.0, 17.0, 21.0, 11.0, 11.0, 11.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7216796875, -0.7001419067382812, -0.6786041259765625, -0.6570663452148438, -0.635528564453125, -0.6139907836914062, -0.5924530029296875, -0.5709152221679688, -0.54937744140625, -0.5278396606445312, -0.5063018798828125, -0.48476409912109375, -0.463226318359375, -0.44168853759765625, -0.4201507568359375, -0.39861297607421875, -0.3770751953125, -0.35553741455078125, -0.3339996337890625, -0.31246185302734375, -0.290924072265625, -0.26938629150390625, -0.2478485107421875, -0.22631072998046875, -0.20477294921875, -0.18323516845703125, -0.1616973876953125, -0.14015960693359375, -0.118621826171875, -0.09708404541015625, -0.0755462646484375, -0.05400848388671875, -0.032470703125, -0.01093292236328125, 0.0106048583984375, 0.03214263916015625, 0.053680419921875, 0.07521820068359375, 0.0967559814453125, 0.11829376220703125, 0.13983154296875, 0.16136932373046875, 0.1829071044921875, 0.20444488525390625, 0.225982666015625, 0.24752044677734375, 0.2690582275390625, 0.29059600830078125, 0.3121337890625, 0.33367156982421875, 0.3552093505859375, 0.37674713134765625, 0.398284912109375, 0.41982269287109375, 0.4413604736328125, 0.46289825439453125, 0.48443603515625, 0.5059738159179688, 0.5275115966796875, 0.5490493774414062, 0.570587158203125, 0.5921249389648438, 0.6136627197265625, 0.6352005004882812, 0.65673828125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 4.0, 10.0, 12.0, 9.0, 15.0, 13.0, 15.0, 30.0, 28.0, 31.0, 51.0, 52.0, 54.0, 82.0, 69.0, 69.0, 71.0, 83.0, 65.0, 54.0, 41.0, 26.0, 25.0, 29.0, 17.0, 11.0, 10.0, 8.0, 7.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.614229202270508e-05, -9.332504123449326e-05, -9.050779044628143e-05, -8.769053965806961e-05, -8.487328886985779e-05, -8.205603808164597e-05, -7.923878729343414e-05, -7.642153650522232e-05, -7.36042857170105e-05, -7.078703492879868e-05, -6.796978414058685e-05, -6.515253335237503e-05, -6.233528256416321e-05, -5.9518031775951385e-05, -5.670078098773956e-05, -5.388353019952774e-05, -5.106627941131592e-05, -4.8249028623104095e-05, -4.543177783489227e-05, -4.261452704668045e-05, -3.979727625846863e-05, -3.6980025470256805e-05, -3.416277468204498e-05, -3.134552389383316e-05, -2.8528273105621338e-05, -2.5711022317409515e-05, -2.2893771529197693e-05, -2.007652074098587e-05, -1.7259269952774048e-05, -1.4442019164562225e-05, -1.1624768376350403e-05, -8.80751758813858e-06, -5.990266799926758e-06, -3.1730160117149353e-06, -3.557652235031128e-07, 2.4614855647087097e-06, 5.278736352920532e-06, 8.095987141132355e-06, 1.0913237929344177e-05, 1.3730488717556e-05, 1.6547739505767822e-05, 1.9364990293979645e-05, 2.2182241082191467e-05, 2.499949187040329e-05, 2.7816742658615112e-05, 3.0633993446826935e-05, 3.345124423503876e-05, 3.626849502325058e-05, 3.90857458114624e-05, 4.1902996599674225e-05, 4.472024738788605e-05, 4.753749817609787e-05, 5.035474896430969e-05, 5.3171999752521515e-05, 5.598925054073334e-05, 5.880650132894516e-05, 6.162375211715698e-05, 6.44410029053688e-05, 6.725825369358063e-05, 7.007550448179245e-05, 7.289275527000427e-05, 7.57100060582161e-05, 7.852725684642792e-05, 8.134450763463974e-05, 8.416175842285156e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 6.0, 5.0, 4.0, 3.0, 11.0, 13.0, 29.0, 30.0, 37.0, 96.0, 140.0, 293.0, 645.0, 1316.0, 3092.0, 9046.0, 39377.0, 391584.0, 532531.0, 52786.0, 10885.0, 3766.0, 1485.0, 682.0, 297.0, 159.0, 87.0, 62.0, 28.0, 22.0, 13.0, 11.0, 9.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3095703125, -1.2593536376953125, -1.209136962890625, -1.1589202880859375, -1.10870361328125, -1.0584869384765625, -1.008270263671875, -0.9580535888671875, -0.9078369140625, -0.8576202392578125, -0.807403564453125, -0.7571868896484375, -0.70697021484375, -0.6567535400390625, -0.606536865234375, -0.5563201904296875, -0.506103515625, -0.4558868408203125, -0.405670166015625, -0.3554534912109375, -0.30523681640625, -0.2550201416015625, -0.204803466796875, -0.1545867919921875, -0.1043701171875, -0.0541534423828125, -0.003936767578125, 0.0462799072265625, 0.09649658203125, 0.1467132568359375, 0.196929931640625, 0.2471466064453125, 0.29736328125, 0.3475799560546875, 0.397796630859375, 0.4480133056640625, 0.49822998046875, 0.5484466552734375, 0.598663330078125, 0.6488800048828125, 0.6990966796875, 0.7493133544921875, 0.799530029296875, 0.8497467041015625, 0.89996337890625, 0.9501800537109375, 1.000396728515625, 1.0506134033203125, 1.100830078125, 1.1510467529296875, 1.201263427734375, 1.2514801025390625, 1.30169677734375, 1.3519134521484375, 1.402130126953125, 1.4523468017578125, 1.5025634765625, 1.5527801513671875, 1.602996826171875, 1.6532135009765625, 1.70343017578125, 1.7536468505859375, 1.803863525390625, 1.8540802001953125, 1.904296875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 1.0, 5.0, 5.0, 6.0, 9.0, 7.0, 10.0, 11.0, 14.0, 27.0, 29.0, 62.0, 72.0, 97.0, 132.0, 115.0, 91.0, 95.0, 59.0, 44.0, 23.0, 12.0, 18.0, 13.0, 7.0, 9.0, 6.0, 4.0, 6.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6572265625, -0.63116455078125, -0.6051025390625, -0.57904052734375, -0.552978515625, -0.52691650390625, -0.5008544921875, -0.47479248046875, -0.44873046875, -0.42266845703125, -0.3966064453125, -0.37054443359375, -0.344482421875, -0.31842041015625, -0.2923583984375, -0.26629638671875, -0.240234375, -0.21417236328125, -0.1881103515625, -0.16204833984375, -0.135986328125, -0.10992431640625, -0.0838623046875, -0.05780029296875, -0.03173828125, -0.00567626953125, 0.0203857421875, 0.04644775390625, 0.072509765625, 0.09857177734375, 0.1246337890625, 0.15069580078125, 0.1767578125, 0.20281982421875, 0.2288818359375, 0.25494384765625, 0.281005859375, 0.30706787109375, 0.3331298828125, 0.35919189453125, 0.38525390625, 0.41131591796875, 0.4373779296875, 0.46343994140625, 0.489501953125, 0.51556396484375, 0.5416259765625, 0.56768798828125, 0.59375, 0.61981201171875, 0.6458740234375, 0.67193603515625, 0.697998046875, 0.72406005859375, 0.7501220703125, 0.77618408203125, 0.80224609375, 0.82830810546875, 0.8543701171875, 0.88043212890625, 0.906494140625, 0.93255615234375, 0.9586181640625, 0.98468017578125, 1.0107421875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 10.0, 32.0, 112.0, 192.0, 256.0, 212.0, 105.0, 48.0, 22.0, 10.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.913578033447266, -13.390656471252441, -12.867734909057617, -12.344812393188477, -11.821890830993652, -11.298969268798828, -10.776046752929688, -10.253125190734863, -9.730203628540039, -9.207282066345215, -8.68436050415039, -8.16143798828125, -7.638516426086426, -7.115594863891602, -6.592672824859619, -6.069750785827637, -5.5468292236328125, -5.023907661437988, -4.500985622406006, -3.9780638217926025, -3.455142021179199, -2.932220220565796, -2.4092984199523926, -1.8863766193389893, -1.363454818725586, -0.8405330181121826, -0.3176112174987793, 0.20531058311462402, 0.7282323837280273, 1.2511541843414307, 1.774075984954834, 2.2969977855682373, 2.8199214935302734, 3.3428432941436768, 3.86576509475708, 4.3886871337890625, 4.911608695983887, 5.434530258178711, 5.957452297210693, 6.480374336242676, 7.0032958984375, 7.526217460632324, 8.049139022827148, 8.572061538696289, 9.094983100891113, 9.617904663085938, 10.140827178955078, 10.663748741149902, 11.186670303344727, 11.70959186553955, 12.232513427734375, 12.755435943603516, 13.27835750579834, 13.801279067993164, 14.324201583862305, 14.847123146057129, 15.370044708251953, 15.892966270446777, 16.4158878326416, 16.938810348510742, 17.46173095703125, 17.98465347290039, 18.50757598876953, 19.03049659729004, 19.55341911315918]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 5.0, 2.0, 5.0, 13.0, 15.0, 19.0, 14.0, 27.0, 35.0, 29.0, 34.0, 44.0, 52.0, 48.0, 59.0, 56.0, 41.0, 48.0, 65.0, 60.0, 64.0, 40.0, 33.0, 45.0, 24.0, 19.0, 22.0, 9.0, 14.0, 13.0, 12.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.012479782104492, -3.881399393081665, -3.750318765640259, -3.6192383766174316, -3.4881577491760254, -3.3570773601531982, -3.225996971130371, -3.094916343688965, -2.9638357162475586, -2.8327553272247314, -2.701674699783325, -2.570594310760498, -2.439513683319092, -2.3084332942962646, -2.1773529052734375, -2.0462722778320312, -1.915191888809204, -1.7841113805770874, -1.6530308723449707, -1.5219504833221436, -1.3908698558807373, -1.2597894668579102, -1.1287089586257935, -0.9976284503936768, -0.8665479421615601, -0.7354674339294434, -0.6043869256973267, -0.47330647706985474, -0.34222596883773804, -0.21114546060562134, -0.08006501197814941, 0.051015496253967285, 0.18209600448608398, 0.3131765127182007, 0.444256991147995, 0.5753374695777893, 0.706417977809906, 0.8374984860420227, 0.9685789346694946, 1.0996594429016113, 1.230739951133728, 1.3618204593658447, 1.4929009675979614, 1.6239814758300781, 1.7550618648529053, 1.8861424922943115, 2.0172228813171387, 2.148303508758545, 2.279383897781372, 2.410464286804199, 2.5415449142456055, 2.6726253032684326, 2.803705930709839, 2.934786319732666, 3.0658669471740723, 3.1969473361968994, 3.3280277252197266, 3.4591081142425537, 3.59018874168396, 3.721269130706787, 3.8523497581481934, 3.9834301471710205, 4.114510536193848, 4.245591163635254, 4.37667179107666]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 4.0, 5.0, 7.0, 11.0, 13.0, 24.0, 44.0, 70.0, 140.0, 218.0, 518.0, 1327.0, 4544.0, 22632.0, 406810.0, 3684506.0, 61354.0, 8025.0, 2196.0, 892.0, 358.0, 176.0, 107.0, 94.0, 48.0, 34.0, 34.0, 22.0, 23.0, 10.0, 5.0, 9.0, 9.0, 1.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.724609375, -1.643341064453125, -1.56207275390625, -1.480804443359375, -1.3995361328125, -1.318267822265625, -1.23699951171875, -1.155731201171875, -1.074462890625, -0.993194580078125, -0.91192626953125, -0.830657958984375, -0.7493896484375, -0.668121337890625, -0.58685302734375, -0.505584716796875, -0.42431640625, -0.343048095703125, -0.26177978515625, -0.180511474609375, -0.0992431640625, -0.017974853515625, 0.06329345703125, 0.144561767578125, 0.225830078125, 0.307098388671875, 0.38836669921875, 0.469635009765625, 0.5509033203125, 0.632171630859375, 0.71343994140625, 0.794708251953125, 0.8759765625, 0.957244873046875, 1.03851318359375, 1.119781494140625, 1.2010498046875, 1.282318115234375, 1.36358642578125, 1.444854736328125, 1.526123046875, 1.607391357421875, 1.68865966796875, 1.769927978515625, 1.8511962890625, 1.932464599609375, 2.01373291015625, 2.095001220703125, 2.17626953125, 2.257537841796875, 2.33880615234375, 2.420074462890625, 2.5013427734375, 2.582611083984375, 2.66387939453125, 2.745147705078125, 2.826416015625, 2.907684326171875, 2.98895263671875, 3.070220947265625, 3.1514892578125, 3.232757568359375, 3.31402587890625, 3.395294189453125, 3.4765625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 11.0, 7.0, 9.0, 12.0, 22.0, 23.0, 42.0, 50.0, 57.0, 81.0, 80.0, 75.0, 81.0, 75.0, 78.0, 78.0, 55.0, 42.0, 31.0, 19.0, 30.0, 6.0, 12.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12005615234375, -0.11443424224853516, -0.10881233215332031, -0.10319042205810547, -0.09756851196289062, -0.09194660186767578, -0.08632469177246094, -0.0807027816772461, -0.07508087158203125, -0.0694589614868164, -0.06383705139160156, -0.05821514129638672, -0.052593231201171875, -0.04697132110595703, -0.04134941101074219, -0.035727500915527344, -0.0301055908203125, -0.024483680725097656, -0.018861770629882812, -0.013239860534667969, -0.007617950439453125, -0.0019960403442382812, 0.0036258697509765625, 0.009247779846191406, 0.01486968994140625, 0.020491600036621094, 0.026113510131835938, 0.03173542022705078, 0.037357330322265625, 0.04297924041748047, 0.04860115051269531, 0.054223060607910156, 0.059844970703125, 0.06546688079833984, 0.07108879089355469, 0.07671070098876953, 0.08233261108398438, 0.08795452117919922, 0.09357643127441406, 0.0991983413696289, 0.10482025146484375, 0.1104421615600586, 0.11606407165527344, 0.12168598175048828, 0.12730789184570312, 0.13292980194091797, 0.1385517120361328, 0.14417362213134766, 0.1497955322265625, 0.15541744232177734, 0.1610393524169922, 0.16666126251220703, 0.17228317260742188, 0.17790508270263672, 0.18352699279785156, 0.1891489028930664, 0.19477081298828125, 0.2003927230834961, 0.20601463317871094, 0.21163654327392578, 0.21725845336914062, 0.22288036346435547, 0.2285022735595703, 0.23412418365478516, 0.23974609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 10.0, 9.0, 15.0, 9.0, 24.0, 20.0, 27.0, 33.0, 27.0, 32.0, 57.0, 98.0, 205.0, 816.0, 5181.0, 153554.0, 3992956.0, 37213.0, 2941.0, 516.0, 176.0, 69.0, 54.0, 47.0, 38.0, 27.0, 20.0, 25.0, 18.0, 13.0, 9.0, 11.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.0859375, -4.91827392578125, -4.7506103515625, -4.58294677734375, -4.415283203125, -4.24761962890625, -4.0799560546875, -3.91229248046875, -3.74462890625, -3.57696533203125, -3.4093017578125, -3.24163818359375, -3.073974609375, -2.90631103515625, -2.7386474609375, -2.57098388671875, -2.4033203125, -2.23565673828125, -2.0679931640625, -1.90032958984375, -1.732666015625, -1.56500244140625, -1.3973388671875, -1.22967529296875, -1.06201171875, -0.89434814453125, -0.7266845703125, -0.55902099609375, -0.391357421875, -0.22369384765625, -0.0560302734375, 0.11163330078125, 0.279296875, 0.44696044921875, 0.6146240234375, 0.78228759765625, 0.949951171875, 1.11761474609375, 1.2852783203125, 1.45294189453125, 1.62060546875, 1.78826904296875, 1.9559326171875, 2.12359619140625, 2.291259765625, 2.45892333984375, 2.6265869140625, 2.79425048828125, 2.9619140625, 3.12957763671875, 3.2972412109375, 3.46490478515625, 3.632568359375, 3.80023193359375, 3.9678955078125, 4.13555908203125, 4.30322265625, 4.47088623046875, 4.6385498046875, 4.80621337890625, 4.973876953125, 5.14154052734375, 5.3092041015625, 5.47686767578125, 5.64453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 11.0, 5.0, 11.0, 13.0, 25.0, 33.0, 39.0, 51.0, 70.0, 97.0, 187.0, 279.0, 545.0, 1182.0, 587.0, 310.0, 178.0, 146.0, 73.0, 58.0, 36.0, 26.0, 22.0, 13.0, 18.0, 9.0, 10.0, 13.0, 2.0, 6.0, 2.0, 4.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3408203125, -0.32967376708984375, -0.3185272216796875, -0.30738067626953125, -0.296234130859375, -0.28508758544921875, -0.2739410400390625, -0.26279449462890625, -0.25164794921875, -0.24050140380859375, -0.2293548583984375, -0.21820831298828125, -0.207061767578125, -0.19591522216796875, -0.1847686767578125, -0.17362213134765625, -0.1624755859375, -0.15132904052734375, -0.1401824951171875, -0.12903594970703125, -0.117889404296875, -0.10674285888671875, -0.0955963134765625, -0.08444976806640625, -0.07330322265625, -0.06215667724609375, -0.0510101318359375, -0.03986358642578125, -0.028717041015625, -0.01757049560546875, -0.0064239501953125, 0.00472259521484375, 0.015869140625, 0.02701568603515625, 0.0381622314453125, 0.04930877685546875, 0.060455322265625, 0.07160186767578125, 0.0827484130859375, 0.09389495849609375, 0.10504150390625, 0.11618804931640625, 0.1273345947265625, 0.13848114013671875, 0.149627685546875, 0.16077423095703125, 0.1719207763671875, 0.18306732177734375, 0.1942138671875, 0.20536041259765625, 0.2165069580078125, 0.22765350341796875, 0.238800048828125, 0.24994659423828125, 0.2610931396484375, 0.27223968505859375, 0.28338623046875, 0.29453277587890625, 0.3056793212890625, 0.31682586669921875, 0.327972412109375, 0.33911895751953125, 0.3502655029296875, 0.36141204833984375, 0.37255859375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 18.0, 84.0, 423.0, 395.0, 78.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6830472946167, -14.208569526672363, -13.734091758728027, -13.259613990783691, -12.785136222839355, -12.31065845489502, -11.836181640625, -11.361703872680664, -10.887226104736328, -10.412748336791992, -9.938270568847656, -9.46379280090332, -8.989315032958984, -8.514837265014648, -8.040359497070312, -7.565882205963135, -7.091403961181641, -6.616926193237305, -6.142448425292969, -5.667970657348633, -5.193492889404297, -4.719015121459961, -4.244537830352783, -3.7700600624084473, -3.2955822944641113, -2.8211045265197754, -2.3466267585754395, -1.8721492290496826, -1.3976714611053467, -0.9231936931610107, -0.4487161636352539, 0.02576160430908203, 0.500239372253418, 0.9747170805931091, 1.4491947889328003, 1.9236724376678467, 2.3981502056121826, 2.8726279735565186, 3.3471055030822754, 3.8215832710266113, 4.296061038970947, 4.770538806915283, 5.245016574859619, 5.719493865966797, 6.193971633911133, 6.668449401855469, 7.142927169799805, 7.617404937744141, 8.091882705688477, 8.566360473632812, 9.040838241577148, 9.515316009521484, 9.98979377746582, 10.464271545410156, 10.938749313354492, 11.413227081298828, 11.887704849243164, 12.3621826171875, 12.836660385131836, 13.311138153076172, 13.785615921020508, 14.260093688964844, 14.73457145690918, 15.209049224853516, 15.683526039123535]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 5.0, 6.0, 8.0, 22.0, 26.0, 39.0, 37.0, 52.0, 51.0, 64.0, 62.0, 74.0, 77.0, 59.0, 79.0, 63.0, 55.0, 48.0, 32.0, 32.0, 26.0, 23.0, 8.0, 16.0, 14.0, 7.0, 11.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.913069009780884, -2.8365015983581543, -2.759934425354004, -2.6833670139312744, -2.606799602508545, -2.5302324295043945, -2.453665018081665, -2.3770976066589355, -2.300530433654785, -2.2239630222320557, -2.1473958492279053, -2.070828437805176, -1.9942611455917358, -1.917693853378296, -1.8411264419555664, -1.7645591497421265, -1.6879918575286865, -1.6114245653152466, -1.5348572731018066, -1.4582898616790771, -1.3817225694656372, -1.3051552772521973, -1.2285878658294678, -1.1520205736160278, -1.075453281402588, -0.998885989189148, -0.9223186373710632, -0.8457512855529785, -0.7691839933395386, -0.6926167011260986, -0.6160493493080139, -0.5394819974899292, -0.4629148244857788, -0.3863475024700165, -0.30978018045425415, -0.23321285843849182, -0.1566455364227295, -0.08007821440696716, -0.003510892391204834, 0.07305645942687988, 0.14962375164031982, 0.22619107365608215, 0.3027583956718445, 0.3793257176876068, 0.45589303970336914, 0.5324603319168091, 0.6090276837348938, 0.6855950355529785, 0.7621623277664185, 0.8387296199798584, 0.9152969717979431, 0.9918643236160278, 1.0684316158294678, 1.1449989080429077, 1.2215662002563477, 1.2981336116790771, 1.374700903892517, 1.451268196105957, 1.5278356075286865, 1.6044028997421265, 1.6809701919555664, 1.7575374841690063, 1.8341047763824463, 1.9106721878051758, 1.9872394800186157]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 4.0, 3.0, 5.0, 2.0, 7.0, 6.0, 12.0, 14.0, 17.0, 13.0, 15.0, 23.0, 36.0, 46.0, 56.0, 105.0, 187.0, 327.0, 540.0, 1123.0, 2548.0, 7209.0, 22945.0, 78779.0, 236355.0, 379308.0, 216795.0, 70423.0, 20536.0, 6603.0, 2268.0, 964.0, 513.0, 281.0, 153.0, 91.0, 62.0, 36.0, 38.0, 25.0, 16.0, 17.0, 13.0, 9.0, 8.0, 7.0, 3.0, 5.0, 4.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.1552734375, -1.1146697998046875, -1.074066162109375, -1.0334625244140625, -0.99285888671875, -0.9522552490234375, -0.911651611328125, -0.8710479736328125, -0.8304443359375, -0.7898406982421875, -0.749237060546875, -0.7086334228515625, -0.66802978515625, -0.6274261474609375, -0.586822509765625, -0.5462188720703125, -0.505615234375, -0.4650115966796875, -0.424407958984375, -0.3838043212890625, -0.34320068359375, -0.3025970458984375, -0.261993408203125, -0.2213897705078125, -0.1807861328125, -0.1401824951171875, -0.099578857421875, -0.0589752197265625, -0.01837158203125, 0.0222320556640625, 0.062835693359375, 0.1034393310546875, 0.14404296875, 0.1846466064453125, 0.225250244140625, 0.2658538818359375, 0.30645751953125, 0.3470611572265625, 0.387664794921875, 0.4282684326171875, 0.4688720703125, 0.5094757080078125, 0.550079345703125, 0.5906829833984375, 0.63128662109375, 0.6718902587890625, 0.712493896484375, 0.7530975341796875, 0.793701171875, 0.8343048095703125, 0.874908447265625, 0.9155120849609375, 0.95611572265625, 0.9967193603515625, 1.037322998046875, 1.0779266357421875, 1.1185302734375, 1.1591339111328125, 1.199737548828125, 1.2403411865234375, 1.28094482421875, 1.3215484619140625, 1.362152099609375, 1.4027557373046875, 1.443359375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 9.0, 11.0, 14.0, 22.0, 23.0, 24.0, 34.0, 42.0, 48.0, 54.0, 47.0, 68.0, 80.0, 56.0, 73.0, 62.0, 57.0, 47.0, 50.0, 34.0, 38.0, 21.0, 14.0, 17.0, 10.0, 9.0, 10.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1663818359375, -0.16049957275390625, -0.1546173095703125, -0.14873504638671875, -0.142852783203125, -0.13697052001953125, -0.1310882568359375, -0.12520599365234375, -0.11932373046875, -0.11344146728515625, -0.1075592041015625, -0.10167694091796875, -0.095794677734375, -0.08991241455078125, -0.0840301513671875, -0.07814788818359375, -0.072265625, -0.06638336181640625, -0.0605010986328125, -0.05461883544921875, -0.048736572265625, -0.04285430908203125, -0.0369720458984375, -0.03108978271484375, -0.02520751953125, -0.01932525634765625, -0.0134429931640625, -0.00756072998046875, -0.001678466796875, 0.00420379638671875, 0.0100860595703125, 0.01596832275390625, 0.0218505859375, 0.02773284912109375, 0.0336151123046875, 0.03949737548828125, 0.045379638671875, 0.05126190185546875, 0.0571441650390625, 0.06302642822265625, 0.06890869140625, 0.07479095458984375, 0.0806732177734375, 0.08655548095703125, 0.092437744140625, 0.09832000732421875, 0.1042022705078125, 0.11008453369140625, 0.115966796875, 0.12184906005859375, 0.1277313232421875, 0.13361358642578125, 0.139495849609375, 0.14537811279296875, 0.1512603759765625, 0.15714263916015625, 0.16302490234375, 0.16890716552734375, 0.1747894287109375, 0.18067169189453125, 0.186553955078125, 0.19243621826171875, 0.1983184814453125, 0.20420074462890625, 0.2100830078125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 6.0, 10.0, 14.0, 14.0, 23.0, 25.0, 27.0, 52.0, 64.0, 124.0, 193.0, 250.0, 486.0, 846.0, 1569.0, 3042.0, 6039.0, 13819.0, 32642.0, 79714.0, 189655.0, 308975.0, 231680.0, 104050.0, 41909.0, 17554.0, 7653.0, 3707.0, 1899.0, 1044.0, 541.0, 325.0, 196.0, 118.0, 84.0, 50.0, 45.0, 25.0, 32.0, 9.0, 8.0, 5.0, 8.0, 4.0, 8.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.0693359375, -1.0375518798828125, -1.005767822265625, -0.9739837646484375, -0.94219970703125, -0.9104156494140625, -0.878631591796875, -0.8468475341796875, -0.8150634765625, -0.7832794189453125, -0.751495361328125, -0.7197113037109375, -0.68792724609375, -0.6561431884765625, -0.624359130859375, -0.5925750732421875, -0.560791015625, -0.5290069580078125, -0.497222900390625, -0.4654388427734375, -0.43365478515625, -0.4018707275390625, -0.370086669921875, -0.3383026123046875, -0.3065185546875, -0.2747344970703125, -0.242950439453125, -0.2111663818359375, -0.17938232421875, -0.1475982666015625, -0.115814208984375, -0.0840301513671875, -0.05224609375, -0.0204620361328125, 0.011322021484375, 0.0431060791015625, 0.07489013671875, 0.1066741943359375, 0.138458251953125, 0.1702423095703125, 0.2020263671875, 0.2338104248046875, 0.265594482421875, 0.2973785400390625, 0.32916259765625, 0.3609466552734375, 0.392730712890625, 0.4245147705078125, 0.456298828125, 0.4880828857421875, 0.519866943359375, 0.5516510009765625, 0.58343505859375, 0.6152191162109375, 0.647003173828125, 0.6787872314453125, 0.7105712890625, 0.7423553466796875, 0.774139404296875, 0.8059234619140625, 0.83770751953125, 0.8694915771484375, 0.901275634765625, 0.9330596923828125, 0.96484375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 4.0, 11.0, 3.0, 6.0, 17.0, 22.0, 10.0, 15.0, 18.0, 24.0, 28.0, 29.0, 28.0, 34.0, 42.0, 49.0, 55.0, 52.0, 57.0, 43.0, 47.0, 48.0, 50.0, 44.0, 34.0, 36.0, 26.0, 28.0, 25.0, 22.0, 17.0, 13.0, 11.0, 11.0, 13.0, 2.0, 4.0, 8.0, 2.0, 3.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.873046875, -0.8458328247070312, -0.8186187744140625, -0.7914047241210938, -0.764190673828125, -0.7369766235351562, -0.7097625732421875, -0.6825485229492188, -0.65533447265625, -0.6281204223632812, -0.6009063720703125, -0.5736923217773438, -0.546478271484375, -0.5192642211914062, -0.4920501708984375, -0.46483612060546875, -0.4376220703125, -0.41040802001953125, -0.3831939697265625, -0.35597991943359375, -0.328765869140625, -0.30155181884765625, -0.2743377685546875, -0.24712371826171875, -0.21990966796875, -0.19269561767578125, -0.1654815673828125, -0.13826751708984375, -0.111053466796875, -0.08383941650390625, -0.0566253662109375, -0.02941131591796875, -0.002197265625, 0.02501678466796875, 0.0522308349609375, 0.07944488525390625, 0.106658935546875, 0.13387298583984375, 0.1610870361328125, 0.18830108642578125, 0.21551513671875, 0.24272918701171875, 0.2699432373046875, 0.29715728759765625, 0.324371337890625, 0.35158538818359375, 0.3787994384765625, 0.40601348876953125, 0.4332275390625, 0.46044158935546875, 0.4876556396484375, 0.5148696899414062, 0.542083740234375, 0.5692977905273438, 0.5965118408203125, 0.6237258911132812, 0.65093994140625, 0.6781539916992188, 0.7053680419921875, 0.7325820922851562, 0.759796142578125, 0.7870101928710938, 0.8142242431640625, 0.8414382934570312, 0.86865234375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 3.0, 7.0, 12.0, 13.0, 22.0, 20.0, 29.0, 61.0, 57.0, 91.0, 138.0, 209.0, 280.0, 423.0, 713.0, 1128.0, 2026.0, 3903.0, 7543.0, 16396.0, 37540.0, 100707.0, 292909.0, 357765.0, 137367.0, 49126.0, 20101.0, 9194.0, 4629.0, 2451.0, 1325.0, 850.0, 504.0, 342.0, 201.0, 124.0, 112.0, 57.0, 46.0, 28.0, 24.0, 27.0, 13.0, 12.0, 7.0, 1.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.6005859375, -0.581298828125, -0.56201171875, -0.542724609375, -0.5234375, -0.504150390625, -0.48486328125, -0.465576171875, -0.4462890625, -0.427001953125, -0.40771484375, -0.388427734375, -0.369140625, -0.349853515625, -0.33056640625, -0.311279296875, -0.2919921875, -0.272705078125, -0.25341796875, -0.234130859375, -0.21484375, -0.195556640625, -0.17626953125, -0.156982421875, -0.1376953125, -0.118408203125, -0.09912109375, -0.079833984375, -0.060546875, -0.041259765625, -0.02197265625, -0.002685546875, 0.0166015625, 0.035888671875, 0.05517578125, 0.074462890625, 0.09375, 0.113037109375, 0.13232421875, 0.151611328125, 0.1708984375, 0.190185546875, 0.20947265625, 0.228759765625, 0.248046875, 0.267333984375, 0.28662109375, 0.305908203125, 0.3251953125, 0.344482421875, 0.36376953125, 0.383056640625, 0.40234375, 0.421630859375, 0.44091796875, 0.460205078125, 0.4794921875, 0.498779296875, 0.51806640625, 0.537353515625, 0.556640625, 0.575927734375, 0.59521484375, 0.614501953125, 0.6337890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 2.0, 3.0, 8.0, 6.0, 12.0, 9.0, 17.0, 30.0, 26.0, 31.0, 39.0, 51.0, 64.0, 81.0, 101.0, 92.0, 85.0, 75.0, 58.0, 45.0, 39.0, 28.0, 30.0, 14.0, 16.0, 13.0, 12.0, 6.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001418590545654297, -0.00013804808259010315, -0.0001342371106147766, -0.00013042613863945007, -0.00012661516666412354, -0.000122804194688797, -0.00011899322271347046, -0.00011518225073814392, -0.00011137127876281738, -0.00010756030678749084, -0.0001037493348121643, -9.993836283683777e-05, -9.612739086151123e-05, -9.231641888618469e-05, -8.850544691085815e-05, -8.469447493553162e-05, -8.088350296020508e-05, -7.707253098487854e-05, -7.3261559009552e-05, -6.945058703422546e-05, -6.563961505889893e-05, -6.182864308357239e-05, -5.801767110824585e-05, -5.420669913291931e-05, -5.0395727157592773e-05, -4.6584755182266235e-05, -4.27737832069397e-05, -3.896281123161316e-05, -3.515183925628662e-05, -3.134086728096008e-05, -2.7529895305633545e-05, -2.3718923330307007e-05, -1.990795135498047e-05, -1.609697937965393e-05, -1.2286007404327393e-05, -8.475035429000854e-06, -4.664063453674316e-06, -8.530914783477783e-07, 2.9578804969787598e-06, 6.768852472305298e-06, 1.0579824447631836e-05, 1.4390796422958374e-05, 1.8201768398284912e-05, 2.201274037361145e-05, 2.5823712348937988e-05, 2.9634684324264526e-05, 3.3445656299591064e-05, 3.72566282749176e-05, 4.106760025024414e-05, 4.487857222557068e-05, 4.868954420089722e-05, 5.2500516176223755e-05, 5.631148815155029e-05, 6.012246012687683e-05, 6.393343210220337e-05, 6.774440407752991e-05, 7.155537605285645e-05, 7.536634802818298e-05, 7.917732000350952e-05, 8.298829197883606e-05, 8.67992639541626e-05, 9.061023592948914e-05, 9.442120790481567e-05, 9.823217988014221e-05, 0.00010204315185546875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 13.0, 13.0, 13.0, 23.0, 42.0, 54.0, 60.0, 133.0, 212.0, 343.0, 618.0, 1253.0, 2428.0, 5538.0, 13814.0, 38098.0, 129074.0, 443054.0, 296282.0, 75227.0, 24866.0, 9406.0, 3991.0, 1791.0, 930.0, 484.0, 295.0, 186.0, 104.0, 68.0, 54.0, 28.0, 18.0, 11.0, 11.0, 3.0, 1.0, 3.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.89013671875, -0.8645553588867188, -0.8389739990234375, -0.8133926391601562, -0.787811279296875, -0.7622299194335938, -0.7366485595703125, -0.7110671997070312, -0.68548583984375, -0.6599044799804688, -0.6343231201171875, -0.6087417602539062, -0.583160400390625, -0.5575790405273438, -0.5319976806640625, -0.5064163208007812, -0.4808349609375, -0.45525360107421875, -0.4296722412109375, -0.40409088134765625, -0.378509521484375, -0.35292816162109375, -0.3273468017578125, -0.30176544189453125, -0.27618408203125, -0.25060272216796875, -0.2250213623046875, -0.19944000244140625, -0.173858642578125, -0.14827728271484375, -0.1226959228515625, -0.09711456298828125, -0.071533203125, -0.04595184326171875, -0.0203704833984375, 0.00521087646484375, 0.030792236328125, 0.05637359619140625, 0.0819549560546875, 0.10753631591796875, 0.13311767578125, 0.15869903564453125, 0.1842803955078125, 0.20986175537109375, 0.235443115234375, 0.26102447509765625, 0.2866058349609375, 0.31218719482421875, 0.3377685546875, 0.36334991455078125, 0.3889312744140625, 0.41451263427734375, 0.440093994140625, 0.46567535400390625, 0.4912567138671875, 0.5168380737304688, 0.54241943359375, 0.5680007934570312, 0.5935821533203125, 0.6191635131835938, 0.644744873046875, 0.6703262329101562, 0.6959075927734375, 0.7214889526367188, 0.7470703125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 7.0, 12.0, 3.0, 13.0, 10.0, 11.0, 17.0, 31.0, 25.0, 20.0, 49.0, 56.0, 76.0, 77.0, 87.0, 69.0, 77.0, 62.0, 59.0, 45.0, 37.0, 25.0, 25.0, 23.0, 14.0, 12.0, 11.0, 13.0, 5.0, 2.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6611328125, -0.6427764892578125, -0.624420166015625, -0.6060638427734375, -0.58770751953125, -0.5693511962890625, -0.550994873046875, -0.5326385498046875, -0.5142822265625, -0.4959259033203125, -0.477569580078125, -0.4592132568359375, -0.44085693359375, -0.4225006103515625, -0.404144287109375, -0.3857879638671875, -0.367431640625, -0.3490753173828125, -0.330718994140625, -0.3123626708984375, -0.29400634765625, -0.2756500244140625, -0.257293701171875, -0.2389373779296875, -0.2205810546875, -0.2022247314453125, -0.183868408203125, -0.1655120849609375, -0.14715576171875, -0.1287994384765625, -0.110443115234375, -0.0920867919921875, -0.07373046875, -0.0553741455078125, -0.037017822265625, -0.0186614990234375, -0.00030517578125, 0.0180511474609375, 0.036407470703125, 0.0547637939453125, 0.0731201171875, 0.0914764404296875, 0.109832763671875, 0.1281890869140625, 0.14654541015625, 0.1649017333984375, 0.183258056640625, 0.2016143798828125, 0.219970703125, 0.2383270263671875, 0.256683349609375, 0.2750396728515625, 0.29339599609375, 0.3117523193359375, 0.330108642578125, 0.3484649658203125, 0.3668212890625, 0.3851776123046875, 0.403533935546875, 0.4218902587890625, 0.44024658203125, 0.4586029052734375, 0.476959228515625, 0.4953155517578125, 0.513671875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 12.0, 11.0, 14.0, 21.0, 33.0, 45.0, 66.0, 100.0, 117.0, 131.0, 128.0, 115.0, 75.0, 43.0, 31.0, 26.0, 18.0, 12.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.284219741821289, -8.961447715759277, -8.638676643371582, -8.31590461730957, -7.993132591247559, -7.670361042022705, -7.347589492797852, -7.02481746673584, -6.702045440673828, -6.379273891448975, -6.056501865386963, -5.733730316162109, -5.410958290100098, -5.088186740875244, -4.765415191650391, -4.442643165588379, -4.119871616363525, -3.7970998287200928, -3.47432804107666, -3.1515564918518066, -2.828784465789795, -2.5060129165649414, -2.183241128921509, -1.8604693412780762, -1.5376975536346436, -1.214925765991211, -0.8921540379524231, -0.5693823099136353, -0.24661052227020264, 0.07616126537322998, 0.39893293380737305, 0.7217047214508057, 1.0444765090942383, 1.367248296737671, 1.6900200843811035, 2.012791633605957, 2.3355636596679688, 2.6583352088928223, 2.981106996536255, 3.3038787841796875, 3.62665057182312, 3.9494223594665527, 4.272193908691406, 4.594965934753418, 4.9177374839782715, 5.240509510040283, 5.563281059265137, 5.886053085327148, 6.208824634552002, 6.5315961837768555, 6.854368209838867, 7.177139759063721, 7.499911785125732, 7.822683334350586, 8.145455360412598, 8.46822738647461, 8.790998458862305, 9.113770484924316, 9.436541557312012, 9.759313583374023, 10.082085609436035, 10.404857635498047, 10.727628707885742, 11.050400733947754, 11.373172760009766]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 14.0, 16.0, 15.0, 17.0, 18.0, 30.0, 32.0, 40.0, 37.0, 50.0, 61.0, 65.0, 57.0, 54.0, 55.0, 81.0, 59.0, 60.0, 52.0, 33.0, 27.0, 24.0, 22.0, 13.0, 15.0, 12.0, 13.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.217851638793945, -7.992817401885986, -7.767783164978027, -7.542749404907227, -7.317715167999268, -7.092680931091309, -6.867647171020508, -6.642612934112549, -6.41757869720459, -6.192544460296631, -5.967510223388672, -5.742476463317871, -5.517442226409912, -5.292407989501953, -5.067374229431152, -4.842339992523193, -4.617305755615234, -4.392271518707275, -4.167237281799316, -3.9422035217285156, -3.7171692848205566, -3.4921350479125977, -3.2671010494232178, -3.042067050933838, -2.817032814025879, -2.59199857711792, -2.36696457862854, -2.14193058013916, -1.9168963432312012, -1.6918622255325317, -1.4668281078338623, -1.2417939901351929, -1.0167598724365234, -0.791725754737854, -0.5666916370391846, -0.34165751934051514, -0.1166234016418457, 0.10841071605682373, 0.33344483375549316, 0.5584789514541626, 0.783513069152832, 1.0085471868515015, 1.233581304550171, 1.4586154222488403, 1.6836495399475098, 1.9086836576461792, 2.1337177753448486, 2.3587517738342285, 2.5837860107421875, 2.8088202476501465, 3.0338542461395264, 3.2588882446289062, 3.4839224815368652, 3.708956718444824, 3.933990716934204, 4.159024715423584, 4.384058952331543, 4.609093189239502, 4.834127426147461, 5.059161186218262, 5.284195423126221, 5.50922966003418, 5.7342634201049805, 5.9592976570129395, 6.184331893920898]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 4.0, 7.0, 5.0, 12.0, 9.0, 18.0, 25.0, 55.0, 62.0, 127.0, 259.0, 497.0, 1026.0, 2514.0, 7024.0, 22697.0, 96953.0, 887000.0, 2965083.0, 162871.0, 32754.0, 9089.0, 3226.0, 1323.0, 623.0, 333.0, 225.0, 112.0, 83.0, 50.0, 45.0, 47.0, 31.0, 17.0, 15.0, 15.0, 8.0, 6.0, 6.0, 5.0, 10.0, 3.0, 4.0, 3.0, 7.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.006683349609375, -0.95672607421875, -0.906768798828125, -0.8568115234375, -0.806854248046875, -0.75689697265625, -0.706939697265625, -0.656982421875, -0.607025146484375, -0.55706787109375, -0.507110595703125, -0.4571533203125, -0.407196044921875, -0.35723876953125, -0.307281494140625, -0.25732421875, -0.207366943359375, -0.15740966796875, -0.107452392578125, -0.0574951171875, -0.007537841796875, 0.04241943359375, 0.092376708984375, 0.142333984375, 0.192291259765625, 0.24224853515625, 0.292205810546875, 0.3421630859375, 0.392120361328125, 0.44207763671875, 0.492034912109375, 0.5419921875, 0.591949462890625, 0.64190673828125, 0.691864013671875, 0.7418212890625, 0.791778564453125, 0.84173583984375, 0.891693115234375, 0.941650390625, 0.991607666015625, 1.04156494140625, 1.091522216796875, 1.1414794921875, 1.191436767578125, 1.24139404296875, 1.291351318359375, 1.34130859375, 1.391265869140625, 1.44122314453125, 1.491180419921875, 1.5411376953125, 1.591094970703125, 1.64105224609375, 1.691009521484375, 1.740966796875, 1.790924072265625, 1.84088134765625, 1.890838623046875, 1.9407958984375, 1.990753173828125, 2.04071044921875, 2.090667724609375, 2.140625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 9.0, 6.0, 6.0, 10.0, 15.0, 15.0, 21.0, 27.0, 26.0, 49.0, 37.0, 53.0, 61.0, 62.0, 61.0, 58.0, 55.0, 62.0, 61.0, 55.0, 46.0, 32.0, 38.0, 33.0, 25.0, 16.0, 20.0, 9.0, 11.0, 5.0, 8.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.20556640625, -0.19947242736816406, -0.19337844848632812, -0.1872844696044922, -0.18119049072265625, -0.1750965118408203, -0.16900253295898438, -0.16290855407714844, -0.1568145751953125, -0.15072059631347656, -0.14462661743164062, -0.1385326385498047, -0.13243865966796875, -0.1263446807861328, -0.12025070190429688, -0.11415672302246094, -0.108062744140625, -0.10196876525878906, -0.09587478637695312, -0.08978080749511719, -0.08368682861328125, -0.07759284973144531, -0.07149887084960938, -0.06540489196777344, -0.0593109130859375, -0.05321693420410156, -0.047122955322265625, -0.04102897644042969, -0.03493499755859375, -0.028841018676757812, -0.022747039794921875, -0.016653060913085938, -0.01055908203125, -0.0044651031494140625, 0.001628875732421875, 0.0077228546142578125, 0.01381683349609375, 0.019910812377929688, 0.026004791259765625, 0.03209877014160156, 0.0381927490234375, 0.04428672790527344, 0.050380706787109375, 0.05647468566894531, 0.06256866455078125, 0.06866264343261719, 0.07475662231445312, 0.08085060119628906, 0.086944580078125, 0.09303855895996094, 0.09913253784179688, 0.10522651672363281, 0.11132049560546875, 0.11741447448730469, 0.12350845336914062, 0.12960243225097656, 0.1356964111328125, 0.14179039001464844, 0.14788436889648438, 0.1539783477783203, 0.16007232666015625, 0.1661663055419922, 0.17226028442382812, 0.17835426330566406, 0.1844482421875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 7.0, 11.0, 10.0, 19.0, 36.0, 58.0, 82.0, 219.0, 654.0, 2658.0, 15641.0, 272579.0, 3787929.0, 102069.0, 9221.0, 1993.0, 582.0, 212.0, 95.0, 62.0, 42.0, 30.0, 24.0, 19.0, 10.0, 7.0, 4.0, 10.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.35546875, -5.231964111328125, -5.10845947265625, -4.984954833984375, -4.8614501953125, -4.737945556640625, -4.61444091796875, -4.490936279296875, -4.367431640625, -4.243927001953125, -4.12042236328125, -3.996917724609375, -3.8734130859375, -3.749908447265625, -3.62640380859375, -3.502899169921875, -3.37939453125, -3.255889892578125, -3.13238525390625, -3.008880615234375, -2.8853759765625, -2.761871337890625, -2.63836669921875, -2.514862060546875, -2.391357421875, -2.267852783203125, -2.14434814453125, -2.020843505859375, -1.8973388671875, -1.773834228515625, -1.65032958984375, -1.526824951171875, -1.4033203125, -1.279815673828125, -1.15631103515625, -1.032806396484375, -0.9093017578125, -0.785797119140625, -0.66229248046875, -0.538787841796875, -0.415283203125, -0.291778564453125, -0.16827392578125, -0.044769287109375, 0.0787353515625, 0.202239990234375, 0.32574462890625, 0.449249267578125, 0.57275390625, 0.696258544921875, 0.81976318359375, 0.943267822265625, 1.0667724609375, 1.190277099609375, 1.31378173828125, 1.437286376953125, 1.560791015625, 1.684295654296875, 1.80780029296875, 1.931304931640625, 2.0548095703125, 2.178314208984375, 2.30181884765625, 2.425323486328125, 2.548828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 9.0, 12.0, 10.0, 18.0, 26.0, 57.0, 110.0, 168.0, 387.0, 978.0, 1359.0, 455.0, 193.0, 126.0, 73.0, 37.0, 23.0, 14.0, 7.0, 7.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4619140625, -0.4314727783203125, -0.401031494140625, -0.3705902099609375, -0.34014892578125, -0.3097076416015625, -0.279266357421875, -0.2488250732421875, -0.2183837890625, -0.1879425048828125, -0.157501220703125, -0.1270599365234375, -0.09661865234375, -0.0661773681640625, -0.035736083984375, -0.0052947998046875, 0.025146484375, 0.0555877685546875, 0.086029052734375, 0.1164703369140625, 0.14691162109375, 0.1773529052734375, 0.207794189453125, 0.2382354736328125, 0.2686767578125, 0.2991180419921875, 0.329559326171875, 0.3600006103515625, 0.39044189453125, 0.4208831787109375, 0.451324462890625, 0.4817657470703125, 0.51220703125, 0.5426483154296875, 0.573089599609375, 0.6035308837890625, 0.63397216796875, 0.6644134521484375, 0.694854736328125, 0.7252960205078125, 0.7557373046875, 0.7861785888671875, 0.816619873046875, 0.8470611572265625, 0.87750244140625, 0.9079437255859375, 0.938385009765625, 0.9688262939453125, 0.999267578125, 1.0297088623046875, 1.060150146484375, 1.0905914306640625, 1.12103271484375, 1.1514739990234375, 1.181915283203125, 1.2123565673828125, 1.2427978515625, 1.2732391357421875, 1.303680419921875, 1.3341217041015625, 1.36456298828125, 1.3950042724609375, 1.425445556640625, 1.4558868408203125, 1.486328125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 17.0, 24.0, 40.0, 50.0, 70.0, 83.0, 98.0, 108.0, 102.0, 104.0, 86.0, 57.0, 47.0, 24.0, 22.0, 15.0, 11.0, 9.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.0123467445373535, -3.8656444549560547, -3.7189419269561768, -3.572239398956299, -3.425537109375, -3.278834819793701, -3.1321322917938232, -2.9854297637939453, -2.8387274742126465, -2.6920251846313477, -2.5453226566314697, -2.398620128631592, -2.251917839050293, -2.105215549468994, -1.9585130214691162, -1.8118106126785278, -1.6651082038879395, -1.518405795097351, -1.3717033863067627, -1.2250009775161743, -1.078298568725586, -0.9315961599349976, -0.7848937511444092, -0.6381913423538208, -0.4914889335632324, -0.34478652477264404, -0.19808411598205566, -0.051381707191467285, 0.0953207015991211, 0.24202311038970947, 0.38872551918029785, 0.5354279279708862, 0.6821298599243164, 0.8288322687149048, 0.9755346775054932, 1.1222370862960815, 1.26893949508667, 1.4156419038772583, 1.5623443126678467, 1.709046721458435, 1.8557491302490234, 2.0024514198303223, 2.1491539478302, 2.295856475830078, 2.442558765411377, 2.589261054992676, 2.7359635829925537, 2.8826661109924316, 3.0293684005737305, 3.1760706901550293, 3.3227732181549072, 3.469475746154785, 3.616178035736084, 3.762880325317383, 3.9095828533172607, 4.056285381317139, 4.2029876708984375, 4.349689960479736, 4.496392250061035, 4.643095016479492, 4.789797306060791, 4.93649959564209, 5.083202362060547, 5.229904651641846, 5.3766069412231445]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 10.0, 10.0, 12.0, 16.0, 27.0, 26.0, 29.0, 40.0, 57.0, 64.0, 57.0, 49.0, 77.0, 60.0, 62.0, 53.0, 49.0, 48.0, 48.0, 56.0, 43.0, 29.0, 21.0, 17.0, 13.0, 13.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9530105590820312, -3.8373780250549316, -3.721745491027832, -3.6061131954193115, -3.490480661392212, -3.3748481273651123, -3.259215831756592, -3.143583297729492, -3.0279507637023926, -2.912318229675293, -2.7966856956481934, -2.681053400039673, -2.5654208660125732, -2.4497883319854736, -2.334156036376953, -2.2185235023498535, -2.102890968322754, -1.9872584342956543, -1.8716260194778442, -1.7559936046600342, -1.6403610706329346, -1.524728536605835, -1.409096121788025, -1.2934637069702148, -1.1778311729431152, -1.0621986389160156, -0.9465662240982056, -0.8309337496757507, -0.7153012752532959, -0.5996688008308411, -0.48403632640838623, -0.3684038519859314, -0.25277161598205566, -0.13713914155960083, -0.021506667137145996, 0.09412580728530884, 0.20975828170776367, 0.3253907561302185, 0.44102323055267334, 0.5566557049751282, 0.672288179397583, 0.7879206538200378, 0.9035531282424927, 1.0191855430603027, 1.1348180770874023, 1.250450611114502, 1.366083025932312, 1.481715440750122, 1.5973479747772217, 1.7129805088043213, 1.8286129236221313, 1.9442453384399414, 2.059877872467041, 2.1755104064941406, 2.2911429405212402, 2.4067752361297607, 2.5224077701568604, 2.63804030418396, 2.7536725997924805, 2.86930513381958, 2.9849376678466797, 3.1005702018737793, 3.216202735900879, 3.3318350315093994, 3.447467565536499]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 4.0, 7.0, 9.0, 7.0, 13.0, 12.0, 6.0, 21.0, 27.0, 31.0, 59.0, 91.0, 137.0, 188.0, 319.0, 552.0, 1057.0, 2152.0, 4661.0, 11564.0, 30070.0, 80789.0, 197025.0, 315773.0, 235287.0, 103598.0, 38947.0, 14546.0, 6073.0, 2520.0, 1294.0, 651.0, 390.0, 215.0, 139.0, 94.0, 61.0, 46.0, 27.0, 23.0, 18.0, 18.0, 16.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1640625, -1.12725830078125, -1.0904541015625, -1.05364990234375, -1.016845703125, -0.98004150390625, -0.9432373046875, -0.90643310546875, -0.86962890625, -0.83282470703125, -0.7960205078125, -0.75921630859375, -0.722412109375, -0.68560791015625, -0.6488037109375, -0.61199951171875, -0.5751953125, -0.53839111328125, -0.5015869140625, -0.46478271484375, -0.427978515625, -0.39117431640625, -0.3543701171875, -0.31756591796875, -0.28076171875, -0.24395751953125, -0.2071533203125, -0.17034912109375, -0.133544921875, -0.09674072265625, -0.0599365234375, -0.02313232421875, 0.013671875, 0.05047607421875, 0.0872802734375, 0.12408447265625, 0.160888671875, 0.19769287109375, 0.2344970703125, 0.27130126953125, 0.30810546875, 0.34490966796875, 0.3817138671875, 0.41851806640625, 0.455322265625, 0.49212646484375, 0.5289306640625, 0.56573486328125, 0.6025390625, 0.63934326171875, 0.6761474609375, 0.71295166015625, 0.749755859375, 0.78656005859375, 0.8233642578125, 0.86016845703125, 0.89697265625, 0.93377685546875, 0.9705810546875, 1.00738525390625, 1.044189453125, 1.08099365234375, 1.1177978515625, 1.15460205078125, 1.19140625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 4.0, 6.0, 22.0, 18.0, 22.0, 48.0, 63.0, 58.0, 62.0, 69.0, 73.0, 69.0, 85.0, 74.0, 53.0, 76.0, 35.0, 45.0, 37.0, 23.0, 16.0, 8.0, 8.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2105712890625, -0.20199012756347656, -0.19340896606445312, -0.1848278045654297, -0.17624664306640625, -0.1676654815673828, -0.15908432006835938, -0.15050315856933594, -0.1419219970703125, -0.13334083557128906, -0.12475967407226562, -0.11617851257324219, -0.10759735107421875, -0.09901618957519531, -0.09043502807617188, -0.08185386657714844, -0.073272705078125, -0.06469154357910156, -0.056110382080078125, -0.04752922058105469, -0.03894805908203125, -0.030366897583007812, -0.021785736083984375, -0.013204574584960938, -0.0046234130859375, 0.0039577484130859375, 0.012538909912109375, 0.021120071411132812, 0.02970123291015625, 0.03828239440917969, 0.046863555908203125, 0.05544471740722656, 0.06402587890625, 0.07260704040527344, 0.08118820190429688, 0.08976936340332031, 0.09835052490234375, 0.10693168640136719, 0.11551284790039062, 0.12409400939941406, 0.1326751708984375, 0.14125633239746094, 0.14983749389648438, 0.1584186553955078, 0.16699981689453125, 0.1755809783935547, 0.18416213989257812, 0.19274330139160156, 0.201324462890625, 0.20990562438964844, 0.21848678588867188, 0.2270679473876953, 0.23564910888671875, 0.2442302703857422, 0.2528114318847656, 0.26139259338378906, 0.2699737548828125, 0.27855491638183594, 0.2871360778808594, 0.2957172393798828, 0.30429840087890625, 0.3128795623779297, 0.3214607238769531, 0.33004188537597656, 0.338623046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 3.0, 6.0, 5.0, 5.0, 4.0, 5.0, 11.0, 17.0, 17.0, 16.0, 34.0, 44.0, 66.0, 95.0, 143.0, 201.0, 407.0, 606.0, 1021.0, 1763.0, 3360.0, 6225.0, 11922.0, 23837.0, 47795.0, 93942.0, 172013.0, 241568.0, 202057.0, 118177.0, 60429.0, 30205.0, 15112.0, 7717.0, 4180.0, 2248.0, 1277.0, 782.0, 437.0, 281.0, 164.0, 118.0, 58.0, 57.0, 32.0, 26.0, 17.0, 15.0, 7.0, 10.0, 4.0, 7.0, 4.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.85400390625, -0.8270416259765625, -0.800079345703125, -0.7731170654296875, -0.74615478515625, -0.7191925048828125, -0.692230224609375, -0.6652679443359375, -0.6383056640625, -0.6113433837890625, -0.584381103515625, -0.5574188232421875, -0.53045654296875, -0.5034942626953125, -0.476531982421875, -0.4495697021484375, -0.422607421875, -0.3956451416015625, -0.368682861328125, -0.3417205810546875, -0.31475830078125, -0.2877960205078125, -0.260833740234375, -0.2338714599609375, -0.2069091796875, -0.1799468994140625, -0.152984619140625, -0.1260223388671875, -0.09906005859375, -0.0720977783203125, -0.045135498046875, -0.0181732177734375, 0.0087890625, 0.0357513427734375, 0.062713623046875, 0.0896759033203125, 0.11663818359375, 0.1436004638671875, 0.170562744140625, 0.1975250244140625, 0.2244873046875, 0.2514495849609375, 0.278411865234375, 0.3053741455078125, 0.33233642578125, 0.3592987060546875, 0.386260986328125, 0.4132232666015625, 0.440185546875, 0.4671478271484375, 0.494110107421875, 0.5210723876953125, 0.54803466796875, 0.5749969482421875, 0.601959228515625, 0.6289215087890625, 0.6558837890625, 0.6828460693359375, 0.709808349609375, 0.7367706298828125, 0.76373291015625, 0.7906951904296875, 0.817657470703125, 0.8446197509765625, 0.87158203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 9.0, 9.0, 9.0, 15.0, 19.0, 12.0, 23.0, 23.0, 16.0, 22.0, 22.0, 33.0, 24.0, 48.0, 42.0, 41.0, 55.0, 49.0, 57.0, 42.0, 48.0, 46.0, 51.0, 34.0, 39.0, 28.0, 31.0, 24.0, 22.0, 18.0, 17.0, 15.0, 8.0, 11.0, 7.0, 11.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84912109375, -0.8178024291992188, -0.7864837646484375, -0.7551651000976562, -0.723846435546875, -0.6925277709960938, -0.6612091064453125, -0.6298904418945312, -0.59857177734375, -0.5672531127929688, -0.5359344482421875, -0.5046157836914062, -0.473297119140625, -0.44197845458984375, -0.4106597900390625, -0.37934112548828125, -0.3480224609375, -0.31670379638671875, -0.2853851318359375, -0.25406646728515625, -0.222747802734375, -0.19142913818359375, -0.1601104736328125, -0.12879180908203125, -0.09747314453125, -0.06615447998046875, -0.0348358154296875, -0.00351715087890625, 0.027801513671875, 0.05912017822265625, 0.0904388427734375, 0.12175750732421875, 0.153076171875, 0.18439483642578125, 0.2157135009765625, 0.24703216552734375, 0.278350830078125, 0.30966949462890625, 0.3409881591796875, 0.37230682373046875, 0.40362548828125, 0.43494415283203125, 0.4662628173828125, 0.49758148193359375, 0.528900146484375, 0.5602188110351562, 0.5915374755859375, 0.6228561401367188, 0.6541748046875, 0.6854934692382812, 0.7168121337890625, 0.7481307983398438, 0.779449462890625, 0.8107681274414062, 0.8420867919921875, 0.8734054565429688, 0.90472412109375, 0.9360427856445312, 0.9673614501953125, 0.9986801147460938, 1.029998779296875, 1.0613174438476562, 1.0926361083984375, 1.1239547729492188, 1.1552734375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 9.0, 10.0, 20.0, 23.0, 39.0, 72.0, 114.0, 170.0, 347.0, 575.0, 1172.0, 2416.0, 5317.0, 16983.0, 94254.0, 705152.0, 183890.0, 24841.0, 7186.0, 2966.0, 1450.0, 665.0, 365.0, 195.0, 113.0, 81.0, 40.0, 32.0, 11.0, 12.0, 11.0, 4.0, 5.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.75, -1.6946868896484375, -1.639373779296875, -1.5840606689453125, -1.52874755859375, -1.4734344482421875, -1.418121337890625, -1.3628082275390625, -1.3074951171875, -1.2521820068359375, -1.196868896484375, -1.1415557861328125, -1.08624267578125, -1.0309295654296875, -0.975616455078125, -0.9203033447265625, -0.864990234375, -0.8096771240234375, -0.754364013671875, -0.6990509033203125, -0.64373779296875, -0.5884246826171875, -0.533111572265625, -0.4777984619140625, -0.4224853515625, -0.3671722412109375, -0.311859130859375, -0.2565460205078125, -0.20123291015625, -0.1459197998046875, -0.090606689453125, -0.0352935791015625, 0.02001953125, 0.0753326416015625, 0.130645751953125, 0.1859588623046875, 0.24127197265625, 0.2965850830078125, 0.351898193359375, 0.4072113037109375, 0.4625244140625, 0.5178375244140625, 0.573150634765625, 0.6284637451171875, 0.68377685546875, 0.7390899658203125, 0.794403076171875, 0.8497161865234375, 0.905029296875, 0.9603424072265625, 1.015655517578125, 1.0709686279296875, 1.12628173828125, 1.1815948486328125, 1.236907958984375, 1.2922210693359375, 1.3475341796875, 1.4028472900390625, 1.458160400390625, 1.5134735107421875, 1.56878662109375, 1.6240997314453125, 1.679412841796875, 1.7347259521484375, 1.7900390625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 5.0, 10.0, 20.0, 29.0, 32.0, 53.0, 80.0, 155.0, 230.0, 157.0, 77.0, 44.0, 37.0, 22.0, 14.0, 8.0, 1.0, 2.0, 1.0, 4.0, 6.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002586841583251953, -0.0002511851489543915, -0.00024368613958358765, -0.0002361871302127838, -0.00022868812084197998, -0.00022118911147117615, -0.00021369010210037231, -0.00020619109272956848, -0.00019869208335876465, -0.00019119307398796082, -0.00018369406461715698, -0.00017619505524635315, -0.00016869604587554932, -0.00016119703650474548, -0.00015369802713394165, -0.00014619901776313782, -0.00013870000839233398, -0.00013120099902153015, -0.00012370198965072632, -0.00011620298027992249, -0.00010870397090911865, -0.00010120496153831482, -9.370595216751099e-05, -8.620694279670715e-05, -7.870793342590332e-05, -7.120892405509949e-05, -6.370991468429565e-05, -5.621090531349182e-05, -4.871189594268799e-05, -4.1212886571884155e-05, -3.371387720108032e-05, -2.621486783027649e-05, -1.8715858459472656e-05, -1.1216849088668823e-05, -3.7178397178649902e-06, 3.7811696529388428e-06, 1.1280179023742676e-05, 1.877918839454651e-05, 2.6278197765350342e-05, 3.3777207136154175e-05, 4.127621650695801e-05, 4.877522587776184e-05, 5.6274235248565674e-05, 6.377324461936951e-05, 7.127225399017334e-05, 7.877126336097717e-05, 8.6270272731781e-05, 9.376928210258484e-05, 0.00010126829147338867, 0.0001087673008441925, 0.00011626631021499634, 0.00012376531958580017, 0.000131264328956604, 0.00013876333832740784, 0.00014626234769821167, 0.0001537613570690155, 0.00016126036643981934, 0.00016875937581062317, 0.000176258385181427, 0.00018375739455223083, 0.00019125640392303467, 0.0001987554132938385, 0.00020625442266464233, 0.00021375343203544617, 0.00022125244140625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 8.0, 6.0, 4.0, 9.0, 20.0, 36.0, 44.0, 68.0, 102.0, 173.0, 217.0, 434.0, 894.0, 2239.0, 6827.0, 31691.0, 426068.0, 530239.0, 37419.0, 7634.0, 2316.0, 929.0, 444.0, 264.0, 158.0, 112.0, 78.0, 49.0, 19.0, 18.0, 12.0, 14.0, 1.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.8671875, -2.7937469482421875, -2.720306396484375, -2.6468658447265625, -2.57342529296875, -2.4999847412109375, -2.426544189453125, -2.3531036376953125, -2.2796630859375, -2.2062225341796875, -2.132781982421875, -2.0593414306640625, -1.98590087890625, -1.9124603271484375, -1.839019775390625, -1.7655792236328125, -1.692138671875, -1.6186981201171875, -1.545257568359375, -1.4718170166015625, -1.39837646484375, -1.3249359130859375, -1.251495361328125, -1.1780548095703125, -1.1046142578125, -1.0311737060546875, -0.957733154296875, -0.8842926025390625, -0.81085205078125, -0.7374114990234375, -0.663970947265625, -0.5905303955078125, -0.51708984375, -0.4436492919921875, -0.370208740234375, -0.2967681884765625, -0.22332763671875, -0.1498870849609375, -0.076446533203125, -0.0030059814453125, 0.0704345703125, 0.1438751220703125, 0.217315673828125, 0.2907562255859375, 0.36419677734375, 0.4376373291015625, 0.511077880859375, 0.5845184326171875, 0.657958984375, 0.7313995361328125, 0.804840087890625, 0.8782806396484375, 0.95172119140625, 1.0251617431640625, 1.098602294921875, 1.1720428466796875, 1.2454833984375, 1.3189239501953125, 1.392364501953125, 1.4658050537109375, 1.53924560546875, 1.6126861572265625, 1.686126708984375, 1.7595672607421875, 1.8330078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 2.0, 11.0, 19.0, 20.0, 35.0, 82.0, 133.0, 240.0, 221.0, 103.0, 68.0, 29.0, 13.0, 5.0, 4.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.306640625, -2.2403564453125, -2.174072265625, -2.1077880859375, -2.04150390625, -1.9752197265625, -1.908935546875, -1.8426513671875, -1.7763671875, -1.7100830078125, -1.643798828125, -1.5775146484375, -1.51123046875, -1.4449462890625, -1.378662109375, -1.3123779296875, -1.24609375, -1.1798095703125, -1.113525390625, -1.0472412109375, -0.98095703125, -0.9146728515625, -0.848388671875, -0.7821044921875, -0.7158203125, -0.6495361328125, -0.583251953125, -0.5169677734375, -0.45068359375, -0.3843994140625, -0.318115234375, -0.2518310546875, -0.185546875, -0.1192626953125, -0.052978515625, 0.0133056640625, 0.07958984375, 0.1458740234375, 0.212158203125, 0.2784423828125, 0.3447265625, 0.4110107421875, 0.477294921875, 0.5435791015625, 0.60986328125, 0.6761474609375, 0.742431640625, 0.8087158203125, 0.875, 0.9412841796875, 1.007568359375, 1.0738525390625, 1.14013671875, 1.2064208984375, 1.272705078125, 1.3389892578125, 1.4052734375, 1.4715576171875, 1.537841796875, 1.6041259765625, 1.67041015625, 1.7366943359375, 1.802978515625, 1.8692626953125, 1.935546875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 4.0, 14.0, 17.0, 31.0, 46.0, 67.0, 118.0, 110.0, 131.0, 134.0, 117.0, 70.0, 56.0, 36.0, 23.0, 10.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.224872589111328, -18.815414428710938, -18.405956268310547, -17.996498107910156, -17.587039947509766, -17.177581787109375, -16.768123626708984, -16.358665466308594, -15.949207305908203, -15.539749145507812, -15.130290985107422, -14.720832824707031, -14.31137466430664, -13.90191650390625, -13.49245834350586, -13.083000183105469, -12.673542022705078, -12.264083862304688, -11.854625701904297, -11.445167541503906, -11.035709381103516, -10.626251220703125, -10.216793060302734, -9.807334899902344, -9.397876739501953, -8.988418579101562, -8.578960418701172, -8.169502258300781, -7.760044097900391, -7.3505859375, -6.941127777099609, -6.531669616699219, -6.1222124099731445, -5.712754249572754, -5.303296089172363, -4.893837928771973, -4.484379768371582, -4.074921607971191, -3.665463447570801, -3.25600528717041, -2.8465471267700195, -2.437088966369629, -2.0276308059692383, -1.6181726455688477, -1.208714485168457, -0.7992563247680664, -0.3897981643676758, 0.019659996032714844, 0.42911815643310547, 0.8385763168334961, 1.2480344772338867, 1.6574926376342773, 2.066950798034668, 2.4764089584350586, 2.885867118835449, 3.29532527923584, 3.7047834396362305, 4.114241600036621, 4.523699760437012, 4.933157920837402, 5.342616081237793, 5.752074241638184, 6.161532402038574, 6.570990562438965, 6.9804487228393555]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 3.0, 4.0, 7.0, 14.0, 15.0, 11.0, 19.0, 16.0, 27.0, 25.0, 38.0, 33.0, 41.0, 42.0, 47.0, 49.0, 52.0, 58.0, 48.0, 58.0, 54.0, 50.0, 39.0, 44.0, 30.0, 28.0, 23.0, 25.0, 16.0, 15.0, 16.0, 11.0, 12.0, 9.0, 5.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8691511154174805, -5.654601097106934, -5.440051078796387, -5.22550106048584, -5.010951042175293, -4.796401023864746, -4.581851005554199, -4.367300987243652, -4.1527509689331055, -3.9382009506225586, -3.7236509323120117, -3.509100914001465, -3.294550895690918, -3.080000877380371, -2.865450859069824, -2.6509008407592773, -2.4363510608673096, -2.2218010425567627, -2.007251024246216, -1.792701005935669, -1.578150987625122, -1.3636010885238647, -1.1490510702133179, -0.934501051902771, -0.7199510335922241, -0.5054010152816772, -0.29085102677345276, -0.07630103826522827, 0.1382489800453186, 0.3527989387512207, 0.5673489570617676, 0.7818989753723145, 0.9964489936828613, 1.2109990119934082, 1.425549030303955, 1.640099048614502, 1.8546490669250488, 2.0691990852355957, 2.2837491035461426, 2.4982991218566895, 2.7128491401672363, 2.927399158477783, 3.14194917678833, 3.356499195098877, 3.571049213409424, 3.7855992317199707, 4.000149250030518, 4.2146992683410645, 4.429248809814453, 4.643798828125, 4.858348846435547, 5.072898864746094, 5.287448883056641, 5.5019989013671875, 5.716548919677734, 5.931098937988281, 6.145648956298828, 6.360198974609375, 6.574748992919922, 6.789299011230469, 7.003849029541016, 7.2183990478515625, 7.432949066162109, 7.647499084472656, 7.862049102783203]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 14.0, 24.0, 16.0, 25.0, 65.0, 107.0, 240.0, 406.0, 772.0, 1826.0, 4013.0, 10623.0, 35096.0, 163026.0, 3070956.0, 784718.0, 87604.0, 21707.0, 7313.0, 2845.0, 1313.0, 639.0, 337.0, 185.0, 110.0, 73.0, 52.0, 40.0, 27.0, 28.0, 17.0, 15.0, 10.0, 9.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130859375, -1.0833892822265625, -1.035919189453125, -0.9884490966796875, -0.94097900390625, -0.8935089111328125, -0.846038818359375, -0.7985687255859375, -0.7510986328125, -0.7036285400390625, -0.656158447265625, -0.6086883544921875, -0.56121826171875, -0.5137481689453125, -0.466278076171875, -0.4188079833984375, -0.371337890625, -0.3238677978515625, -0.276397705078125, -0.2289276123046875, -0.18145751953125, -0.1339874267578125, -0.086517333984375, -0.0390472412109375, 0.0084228515625, 0.0558929443359375, 0.103363037109375, 0.1508331298828125, 0.19830322265625, 0.2457733154296875, 0.293243408203125, 0.3407135009765625, 0.38818359375, 0.4356536865234375, 0.483123779296875, 0.5305938720703125, 0.57806396484375, 0.6255340576171875, 0.673004150390625, 0.7204742431640625, 0.7679443359375, 0.8154144287109375, 0.862884521484375, 0.9103546142578125, 0.95782470703125, 1.0052947998046875, 1.052764892578125, 1.1002349853515625, 1.147705078125, 1.1951751708984375, 1.242645263671875, 1.2901153564453125, 1.33758544921875, 1.3850555419921875, 1.432525634765625, 1.4799957275390625, 1.5274658203125, 1.5749359130859375, 1.622406005859375, 1.6698760986328125, 1.71734619140625, 1.7648162841796875, 1.812286376953125, 1.8597564697265625, 1.9072265625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 11.0, 8.0, 10.0, 22.0, 25.0, 59.0, 57.0, 52.0, 75.0, 78.0, 79.0, 77.0, 86.0, 71.0, 53.0, 60.0, 54.0, 46.0, 35.0, 19.0, 6.0, 9.0, 4.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2041015625, -0.1935272216796875, -0.182952880859375, -0.1723785400390625, -0.16180419921875, -0.1512298583984375, -0.140655517578125, -0.1300811767578125, -0.1195068359375, -0.1089324951171875, -0.098358154296875, -0.0877838134765625, -0.07720947265625, -0.0666351318359375, -0.056060791015625, -0.0454864501953125, -0.034912109375, -0.0243377685546875, -0.013763427734375, -0.0031890869140625, 0.00738525390625, 0.0179595947265625, 0.028533935546875, 0.0391082763671875, 0.0496826171875, 0.0602569580078125, 0.070831298828125, 0.0814056396484375, 0.09197998046875, 0.1025543212890625, 0.113128662109375, 0.1237030029296875, 0.13427734375, 0.1448516845703125, 0.155426025390625, 0.1660003662109375, 0.17657470703125, 0.1871490478515625, 0.197723388671875, 0.2082977294921875, 0.2188720703125, 0.2294464111328125, 0.240020751953125, 0.2505950927734375, 0.26116943359375, 0.2717437744140625, 0.282318115234375, 0.2928924560546875, 0.303466796875, 0.3140411376953125, 0.324615478515625, 0.3351898193359375, 0.34576416015625, 0.3563385009765625, 0.366912841796875, 0.3774871826171875, 0.3880615234375, 0.3986358642578125, 0.409210205078125, 0.4197845458984375, 0.43035888671875, 0.4409332275390625, 0.451507568359375, 0.4620819091796875, 0.47265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 6.0, 6.0, 10.0, 7.0, 13.0, 11.0, 13.0, 14.0, 20.0, 19.0, 20.0, 33.0, 48.0, 45.0, 75.0, 102.0, 219.0, 550.0, 1768.0, 6901.0, 35463.0, 328365.0, 3522094.0, 259044.0, 30655.0, 6139.0, 1577.0, 480.0, 190.0, 112.0, 70.0, 46.0, 37.0, 35.0, 18.0, 10.0, 11.0, 13.0, 13.0, 13.0, 4.0, 4.0, 4.0, 3.0, 0.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.623046875, -2.53399658203125, -2.4449462890625, -2.35589599609375, -2.266845703125, -2.17779541015625, -2.0887451171875, -1.99969482421875, -1.91064453125, -1.82159423828125, -1.7325439453125, -1.64349365234375, -1.554443359375, -1.46539306640625, -1.3763427734375, -1.28729248046875, -1.1982421875, -1.10919189453125, -1.0201416015625, -0.93109130859375, -0.842041015625, -0.75299072265625, -0.6639404296875, -0.57489013671875, -0.48583984375, -0.39678955078125, -0.3077392578125, -0.21868896484375, -0.129638671875, -0.04058837890625, 0.0484619140625, 0.13751220703125, 0.2265625, 0.31561279296875, 0.4046630859375, 0.49371337890625, 0.582763671875, 0.67181396484375, 0.7608642578125, 0.84991455078125, 0.93896484375, 1.02801513671875, 1.1170654296875, 1.20611572265625, 1.295166015625, 1.38421630859375, 1.4732666015625, 1.56231689453125, 1.6513671875, 1.74041748046875, 1.8294677734375, 1.91851806640625, 2.007568359375, 2.09661865234375, 2.1856689453125, 2.27471923828125, 2.36376953125, 2.45281982421875, 2.5418701171875, 2.63092041015625, 2.719970703125, 2.80902099609375, 2.8980712890625, 2.98712158203125, 3.076171875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 9.0, 9.0, 14.0, 22.0, 51.0, 79.0, 149.0, 306.0, 800.0, 1590.0, 512.0, 243.0, 113.0, 65.0, 41.0, 31.0, 17.0, 10.0, 5.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.453125, -1.421051025390625, -1.38897705078125, -1.356903076171875, -1.3248291015625, -1.292755126953125, -1.26068115234375, -1.228607177734375, -1.196533203125, -1.164459228515625, -1.13238525390625, -1.100311279296875, -1.0682373046875, -1.036163330078125, -1.00408935546875, -0.972015380859375, -0.93994140625, -0.907867431640625, -0.87579345703125, -0.843719482421875, -0.8116455078125, -0.779571533203125, -0.74749755859375, -0.715423583984375, -0.683349609375, -0.651275634765625, -0.61920166015625, -0.587127685546875, -0.5550537109375, -0.522979736328125, -0.49090576171875, -0.458831787109375, -0.4267578125, -0.394683837890625, -0.36260986328125, -0.330535888671875, -0.2984619140625, -0.266387939453125, -0.23431396484375, -0.202239990234375, -0.170166015625, -0.138092041015625, -0.10601806640625, -0.073944091796875, -0.0418701171875, -0.009796142578125, 0.02227783203125, 0.054351806640625, 0.08642578125, 0.118499755859375, 0.15057373046875, 0.182647705078125, 0.2147216796875, 0.246795654296875, 0.27886962890625, 0.310943603515625, 0.343017578125, 0.375091552734375, 0.40716552734375, 0.439239501953125, 0.4713134765625, 0.503387451171875, 0.53546142578125, 0.567535400390625, 0.599609375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 16.0, 19.0, 39.0, 57.0, 103.0, 138.0, 169.0, 128.0, 113.0, 78.0, 62.0, 28.0, 27.0, 3.0, 5.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.663496494293213, -4.448001861572266, -4.23250675201416, -4.017012119293213, -3.8015174865722656, -3.5860226154327393, -3.370527744293213, -3.1550331115722656, -2.9395382404327393, -2.724043369293213, -2.5085487365722656, -2.2930538654327393, -2.077558994293213, -1.8620643615722656, -1.6465694904327393, -1.4310747385025024, -1.2155799865722656, -1.0000852346420288, -0.7845904231071472, -0.5690956115722656, -0.3536008596420288, -0.138106107711792, 0.07738876342773438, 0.2928835153579712, 0.508378267288208, 0.7238730192184448, 0.9393678307533264, 1.154862642288208, 1.3703573942184448, 1.5858521461486816, 1.801347017288208, 2.0168418884277344, 2.23233699798584, 2.447831869125366, 2.6633265018463135, 2.87882137298584, 3.094316005706787, 3.3098108768463135, 3.52530574798584, 3.740800380706787, 3.9562952518463135, 4.17179012298584, 4.387284755706787, 4.602779388427734, 4.81827449798584, 5.033769130706787, 5.249263763427734, 5.46475887298584, 5.680253505706787, 5.895748138427734, 6.11124324798584, 6.326737880706787, 6.542232513427734, 6.75772762298584, 6.973222255706787, 7.188716888427734, 7.40421199798584, 7.619706630706787, 7.835201740264893, 8.05069637298584, 8.266191482543945, 8.481685638427734, 8.69718074798584, 8.912675857543945, 9.128170013427734]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 7.0, 7.0, 8.0, 16.0, 20.0, 24.0, 31.0, 40.0, 43.0, 56.0, 63.0, 60.0, 60.0, 58.0, 63.0, 60.0, 62.0, 53.0, 56.0, 58.0, 28.0, 32.0, 27.0, 25.0, 17.0, 12.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.532818555831909, -3.417773723602295, -3.3027286529541016, -3.187683582305908, -3.072638750076294, -2.9575939178466797, -2.8425488471984863, -2.727503776550293, -2.6124589443206787, -2.4974141120910645, -2.382369041442871, -2.2673239707946777, -2.1522791385650635, -2.037234306335449, -1.9221892356872559, -1.807144284248352, -1.6920993328094482, -1.5770543813705444, -1.4620094299316406, -1.3469644784927368, -1.231919527053833, -1.1168745756149292, -1.0018296241760254, -0.8867846727371216, -0.7717397212982178, -0.656694769859314, -0.5416498184204102, -0.42660486698150635, -0.31155991554260254, -0.19651496410369873, -0.08147001266479492, 0.03357493877410889, 0.1486196517944336, 0.2636646032333374, 0.3787095546722412, 0.493754506111145, 0.6087994575500488, 0.7238444089889526, 0.8388893604278564, 0.9539343118667603, 1.068979263305664, 1.1840242147445679, 1.2990691661834717, 1.4141141176223755, 1.5291590690612793, 1.644204020500183, 1.759248971939087, 1.8742939233779907, 1.9893388748168945, 2.104383945465088, 2.219428777694702, 2.3344736099243164, 2.4495186805725098, 2.564563751220703, 2.6796085834503174, 2.7946534156799316, 2.909698486328125, 3.0247435569763184, 3.1397883892059326, 3.254833221435547, 3.3698782920837402, 3.4849233627319336, 3.599968194961548, 3.715013027191162, 3.8300580978393555]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 10.0, 13.0, 25.0, 36.0, 59.0, 85.0, 161.0, 299.0, 527.0, 994.0, 1949.0, 3876.0, 7969.0, 16832.0, 37506.0, 83274.0, 169758.0, 257766.0, 228224.0, 128303.0, 59930.0, 26776.0, 12349.0, 5769.0, 2897.0, 1428.0, 803.0, 349.0, 250.0, 132.0, 64.0, 41.0, 34.0, 18.0, 22.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.328125, -1.291015625, -1.25390625, -1.216796875, -1.1796875, -1.142578125, -1.10546875, -1.068359375, -1.03125, -0.994140625, -0.95703125, -0.919921875, -0.8828125, -0.845703125, -0.80859375, -0.771484375, -0.734375, -0.697265625, -0.66015625, -0.623046875, -0.5859375, -0.548828125, -0.51171875, -0.474609375, -0.4375, -0.400390625, -0.36328125, -0.326171875, -0.2890625, -0.251953125, -0.21484375, -0.177734375, -0.140625, -0.103515625, -0.06640625, -0.029296875, 0.0078125, 0.044921875, 0.08203125, 0.119140625, 0.15625, 0.193359375, 0.23046875, 0.267578125, 0.3046875, 0.341796875, 0.37890625, 0.416015625, 0.453125, 0.490234375, 0.52734375, 0.564453125, 0.6015625, 0.638671875, 0.67578125, 0.712890625, 0.75, 0.787109375, 0.82421875, 0.861328125, 0.8984375, 0.935546875, 0.97265625, 1.009765625, 1.046875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 8.0, 5.0, 9.0, 9.0, 7.0, 18.0, 20.0, 28.0, 26.0, 28.0, 31.0, 43.0, 43.0, 38.0, 45.0, 50.0, 45.0, 51.0, 51.0, 57.0, 32.0, 46.0, 36.0, 27.0, 42.0, 48.0, 22.0, 25.0, 22.0, 22.0, 15.0, 9.0, 11.0, 13.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.188232421875, -0.18152999877929688, -0.17482757568359375, -0.16812515258789062, -0.1614227294921875, -0.15472030639648438, -0.14801788330078125, -0.14131546020507812, -0.134613037109375, -0.12791061401367188, -0.12120819091796875, -0.11450576782226562, -0.1078033447265625, -0.10110092163085938, -0.09439849853515625, -0.08769607543945312, -0.08099365234375, -0.07429122924804688, -0.06758880615234375, -0.060886383056640625, -0.0541839599609375, -0.047481536865234375, -0.04077911376953125, -0.034076690673828125, -0.027374267578125, -0.020671844482421875, -0.01396942138671875, -0.007266998291015625, -0.0005645751953125, 0.006137847900390625, 0.01284027099609375, 0.019542694091796875, 0.0262451171875, 0.032947540283203125, 0.03964996337890625, 0.046352386474609375, 0.0530548095703125, 0.059757232666015625, 0.06645965576171875, 0.07316207885742188, 0.079864501953125, 0.08656692504882812, 0.09326934814453125, 0.09997177124023438, 0.1066741943359375, 0.11337661743164062, 0.12007904052734375, 0.12678146362304688, 0.13348388671875, 0.14018630981445312, 0.14688873291015625, 0.15359115600585938, 0.1602935791015625, 0.16699600219726562, 0.17369842529296875, 0.18040084838867188, 0.187103271484375, 0.19380569458007812, 0.20050811767578125, 0.20721054077148438, 0.2139129638671875, 0.22061538696289062, 0.22731781005859375, 0.23402023315429688, 0.24072265625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 2.0, 5.0, 5.0, 12.0, 10.0, 17.0, 25.0, 39.0, 42.0, 52.0, 108.0, 158.0, 276.0, 444.0, 794.0, 1618.0, 3291.0, 7204.0, 17029.0, 39815.0, 91519.0, 187401.0, 274476.0, 219718.0, 114554.0, 50376.0, 21627.0, 9350.0, 4206.0, 2025.0, 1026.0, 511.0, 308.0, 157.0, 121.0, 70.0, 47.0, 24.0, 21.0, 21.0, 18.0, 11.0, 8.0, 9.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.2158203125, -1.18072509765625, -1.1456298828125, -1.11053466796875, -1.075439453125, -1.04034423828125, -1.0052490234375, -0.97015380859375, -0.93505859375, -0.89996337890625, -0.8648681640625, -0.82977294921875, -0.794677734375, -0.75958251953125, -0.7244873046875, -0.68939208984375, -0.654296875, -0.61920166015625, -0.5841064453125, -0.54901123046875, -0.513916015625, -0.47882080078125, -0.4437255859375, -0.40863037109375, -0.37353515625, -0.33843994140625, -0.3033447265625, -0.26824951171875, -0.233154296875, -0.19805908203125, -0.1629638671875, -0.12786865234375, -0.0927734375, -0.05767822265625, -0.0225830078125, 0.01251220703125, 0.047607421875, 0.08270263671875, 0.1177978515625, 0.15289306640625, 0.18798828125, 0.22308349609375, 0.2581787109375, 0.29327392578125, 0.328369140625, 0.36346435546875, 0.3985595703125, 0.43365478515625, 0.46875, 0.50384521484375, 0.5389404296875, 0.57403564453125, 0.609130859375, 0.64422607421875, 0.6793212890625, 0.71441650390625, 0.74951171875, 0.78460693359375, 0.8197021484375, 0.85479736328125, 0.889892578125, 0.92498779296875, 0.9600830078125, 0.99517822265625, 1.0302734375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 8.0, 9.0, 8.0, 5.0, 12.0, 14.0, 24.0, 24.0, 19.0, 31.0, 28.0, 33.0, 39.0, 37.0, 37.0, 42.0, 50.0, 43.0, 52.0, 49.0, 46.0, 47.0, 42.0, 37.0, 41.0, 37.0, 34.0, 29.0, 21.0, 21.0, 20.0, 16.0, 15.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1796875, -1.143218994140625, -1.10675048828125, -1.070281982421875, -1.0338134765625, -0.997344970703125, -0.96087646484375, -0.924407958984375, -0.887939453125, -0.851470947265625, -0.81500244140625, -0.778533935546875, -0.7420654296875, -0.705596923828125, -0.66912841796875, -0.632659912109375, -0.59619140625, -0.559722900390625, -0.52325439453125, -0.486785888671875, -0.4503173828125, -0.413848876953125, -0.37738037109375, -0.340911865234375, -0.304443359375, -0.267974853515625, -0.23150634765625, -0.195037841796875, -0.1585693359375, -0.122100830078125, -0.08563232421875, -0.049163818359375, -0.0126953125, 0.023773193359375, 0.06024169921875, 0.096710205078125, 0.1331787109375, 0.169647216796875, 0.20611572265625, 0.242584228515625, 0.279052734375, 0.315521240234375, 0.35198974609375, 0.388458251953125, 0.4249267578125, 0.461395263671875, 0.49786376953125, 0.534332275390625, 0.57080078125, 0.607269287109375, 0.64373779296875, 0.680206298828125, 0.7166748046875, 0.753143310546875, 0.78961181640625, 0.826080322265625, 0.862548828125, 0.899017333984375, 0.93548583984375, 0.971954345703125, 1.0084228515625, 1.044891357421875, 1.08135986328125, 1.117828369140625, 1.154296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 5.0, 13.0, 12.0, 8.0, 17.0, 23.0, 42.0, 61.0, 72.0, 147.0, 280.0, 603.0, 1281.0, 2956.0, 8106.0, 25443.0, 129981.0, 693327.0, 144733.0, 27135.0, 8658.0, 3020.0, 1267.0, 645.0, 280.0, 166.0, 98.0, 56.0, 38.0, 14.0, 17.0, 10.0, 11.0, 6.0, 5.0, 4.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6630859375, -1.6047821044921875, -1.546478271484375, -1.4881744384765625, -1.42987060546875, -1.3715667724609375, -1.313262939453125, -1.2549591064453125, -1.1966552734375, -1.1383514404296875, -1.080047607421875, -1.0217437744140625, -0.96343994140625, -0.9051361083984375, -0.846832275390625, -0.7885284423828125, -0.730224609375, -0.6719207763671875, -0.613616943359375, -0.5553131103515625, -0.49700927734375, -0.4387054443359375, -0.380401611328125, -0.3220977783203125, -0.2637939453125, -0.2054901123046875, -0.147186279296875, -0.0888824462890625, -0.03057861328125, 0.0277252197265625, 0.086029052734375, 0.1443328857421875, 0.20263671875, 0.2609405517578125, 0.319244384765625, 0.3775482177734375, 0.43585205078125, 0.4941558837890625, 0.552459716796875, 0.6107635498046875, 0.6690673828125, 0.7273712158203125, 0.785675048828125, 0.8439788818359375, 0.90228271484375, 0.9605865478515625, 1.018890380859375, 1.0771942138671875, 1.135498046875, 1.1938018798828125, 1.252105712890625, 1.3104095458984375, 1.36871337890625, 1.4270172119140625, 1.485321044921875, 1.5436248779296875, 1.6019287109375, 1.6602325439453125, 1.718536376953125, 1.7768402099609375, 1.83514404296875, 1.8934478759765625, 1.951751708984375, 2.0100555419921875, 2.068359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 8.0, 2.0, 3.0, 12.0, 7.0, 13.0, 22.0, 24.0, 22.0, 39.0, 74.0, 95.0, 131.0, 164.0, 101.0, 70.0, 66.0, 42.0, 31.0, 17.0, 10.0, 14.0, 9.0, 8.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00021159648895263672, -0.00020560063421726227, -0.00019960477948188782, -0.00019360892474651337, -0.00018761307001113892, -0.00018161721527576447, -0.00017562136054039001, -0.00016962550580501556, -0.0001636296510696411, -0.00015763379633426666, -0.0001516379415988922, -0.00014564208686351776, -0.0001396462321281433, -0.00013365037739276886, -0.0001276545226573944, -0.00012165866792201996, -0.00011566281318664551, -0.00010966695845127106, -0.0001036711037158966, -9.767524898052216e-05, -9.16793942451477e-05, -8.568353950977325e-05, -7.96876847743988e-05, -7.369183003902435e-05, -6.76959753036499e-05, -6.170012056827545e-05, -5.5704265832901e-05, -4.970841109752655e-05, -4.37125563621521e-05, -3.771670162677765e-05, -3.17208468914032e-05, -2.5724992156028748e-05, -1.9729137420654297e-05, -1.3733282685279846e-05, -7.737427949905396e-06, -1.7415732145309448e-06, 4.254281520843506e-06, 1.0250136256217957e-05, 1.6245990991592407e-05, 2.2241845726966858e-05, 2.823770046234131e-05, 3.423355519771576e-05, 4.022940993309021e-05, 4.622526466846466e-05, 5.222111940383911e-05, 5.821697413921356e-05, 6.421282887458801e-05, 7.020868360996246e-05, 7.620453834533691e-05, 8.220039308071136e-05, 8.819624781608582e-05, 9.419210255146027e-05, 0.00010018795728683472, 0.00010618381202220917, 0.00011217966675758362, 0.00011817552149295807, 0.00012417137622833252, 0.00013016723096370697, 0.00013616308569908142, 0.00014215894043445587, 0.00014815479516983032, 0.00015415064990520477, 0.00016014650464057922, 0.00016614235937595367, 0.00017213821411132812]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 14.0, 16.0, 25.0, 40.0, 88.0, 131.0, 222.0, 442.0, 1067.0, 2778.0, 8369.0, 37165.0, 583482.0, 374039.0, 29180.0, 7190.0, 2372.0, 985.0, 450.0, 225.0, 119.0, 46.0, 29.0, 21.0, 12.0, 16.0, 3.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.970703125, -3.86871337890625, -3.7667236328125, -3.66473388671875, -3.562744140625, -3.46075439453125, -3.3587646484375, -3.25677490234375, -3.15478515625, -3.05279541015625, -2.9508056640625, -2.84881591796875, -2.746826171875, -2.64483642578125, -2.5428466796875, -2.44085693359375, -2.3388671875, -2.23687744140625, -2.1348876953125, -2.03289794921875, -1.930908203125, -1.82891845703125, -1.7269287109375, -1.62493896484375, -1.52294921875, -1.42095947265625, -1.3189697265625, -1.21697998046875, -1.114990234375, -1.01300048828125, -0.9110107421875, -0.80902099609375, -0.70703125, -0.60504150390625, -0.5030517578125, -0.40106201171875, -0.299072265625, -0.19708251953125, -0.0950927734375, 0.00689697265625, 0.10888671875, 0.21087646484375, 0.3128662109375, 0.41485595703125, 0.516845703125, 0.61883544921875, 0.7208251953125, 0.82281494140625, 0.9248046875, 1.02679443359375, 1.1287841796875, 1.23077392578125, 1.332763671875, 1.43475341796875, 1.5367431640625, 1.63873291015625, 1.74072265625, 1.84271240234375, 1.9447021484375, 2.04669189453125, 2.148681640625, 2.25067138671875, 2.3526611328125, 2.45465087890625, 2.556640625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 3.0, 9.0, 5.0, 10.0, 13.0, 15.0, 23.0, 23.0, 57.0, 82.0, 172.0, 193.0, 153.0, 90.0, 47.0, 27.0, 24.0, 16.0, 6.0, 4.0, 7.0, 7.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.720703125, -1.662322998046875, -1.60394287109375, -1.545562744140625, -1.4871826171875, -1.428802490234375, -1.37042236328125, -1.312042236328125, -1.253662109375, -1.195281982421875, -1.13690185546875, -1.078521728515625, -1.0201416015625, -0.961761474609375, -0.90338134765625, -0.845001220703125, -0.78662109375, -0.728240966796875, -0.66986083984375, -0.611480712890625, -0.5531005859375, -0.494720458984375, -0.43634033203125, -0.377960205078125, -0.319580078125, -0.261199951171875, -0.20281982421875, -0.144439697265625, -0.0860595703125, -0.027679443359375, 0.03070068359375, 0.089080810546875, 0.1474609375, 0.205841064453125, 0.26422119140625, 0.322601318359375, 0.3809814453125, 0.439361572265625, 0.49774169921875, 0.556121826171875, 0.614501953125, 0.672882080078125, 0.73126220703125, 0.789642333984375, 0.8480224609375, 0.906402587890625, 0.96478271484375, 1.023162841796875, 1.08154296875, 1.139923095703125, 1.19830322265625, 1.256683349609375, 1.3150634765625, 1.373443603515625, 1.43182373046875, 1.490203857421875, 1.548583984375, 1.606964111328125, 1.66534423828125, 1.723724365234375, 1.7821044921875, 1.840484619140625, 1.89886474609375, 1.957244873046875, 2.015625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 12.0, 18.0, 18.0, 38.0, 48.0, 83.0, 117.0, 124.0, 136.0, 130.0, 93.0, 70.0, 45.0, 25.0, 11.0, 15.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.825067520141602, -7.345456123352051, -6.865845203399658, -6.386234283447266, -5.906622886657715, -5.427011489868164, -4.9474005699157715, -4.467789649963379, -3.988178253173828, -3.5085670948028564, -3.0289559364318848, -2.549344778060913, -2.0697336196899414, -1.5901224613189697, -1.110511302947998, -0.6309001445770264, -0.1512889862060547, 0.328322172164917, 0.8079333305358887, 1.2875444889068604, 1.767155647277832, 2.2467668056488037, 2.7263779640197754, 3.205989122390747, 3.6856002807617188, 4.1652116775512695, 4.644822597503662, 5.124433517456055, 5.6040449142456055, 6.083656311035156, 6.563267230987549, 7.042878150939941, 7.522489547729492, 8.002100944519043, 8.481712341308594, 8.961322784423828, 9.440934181213379, 9.92054557800293, 10.400156021118164, 10.879767417907715, 11.359378814697266, 11.838990211486816, 12.318601608276367, 12.798212051391602, 13.277823448181152, 13.757434844970703, 14.237045288085938, 14.716656684875488, 15.196268081665039, 15.67587947845459, 16.15549087524414, 16.635101318359375, 17.11471176147461, 17.594324111938477, 18.07393455505371, 18.553546905517578, 19.033157348632812, 19.512767791748047, 19.992380142211914, 20.47199058532715, 20.951602935791016, 21.43121337890625, 21.910823822021484, 22.39043617248535, 22.870046615600586]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 4.0, 5.0, 9.0, 7.0, 12.0, 16.0, 17.0, 26.0, 27.0, 30.0, 32.0, 37.0, 31.0, 37.0, 33.0, 44.0, 44.0, 53.0, 44.0, 51.0, 49.0, 46.0, 54.0, 29.0, 44.0, 40.0, 29.0, 32.0, 20.0, 15.0, 14.0, 16.0, 10.0, 10.0, 8.0, 3.0, 6.0, 3.0, 6.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.124210357666016, -7.890478134155273, -7.6567463874816895, -7.423014163970947, -7.189282417297363, -6.955550193786621, -6.721817970275879, -6.488086223602295, -6.254354476928711, -6.020622253417969, -5.786890506744385, -5.553158283233643, -5.319426536560059, -5.085694313049316, -4.851962089538574, -4.61823034286499, -4.384498119354248, -4.150765895843506, -3.917034149169922, -3.6833019256591797, -3.4495701789855957, -3.2158379554748535, -2.9821059703826904, -2.7483739852905273, -2.5146420001983643, -2.280910015106201, -2.047178030014038, -1.8134459257125854, -1.5797139406204224, -1.3459819555282593, -1.1122498512268066, -0.8785178661346436, -0.6447858810424805, -0.411053866147995, -0.17732185125350952, 0.05641019344329834, 0.2901421785354614, 0.5238741636276245, 0.7576062679290771, 0.9913382530212402, 1.2250702381134033, 1.4588022232055664, 1.6925342082977295, 1.9262663125991821, 2.1599984169006348, 2.3937301635742188, 2.627462387084961, 2.861194372177124, 3.094926357269287, 3.32865834236145, 3.5623903274536133, 3.7961225509643555, 4.0298542976379395, 4.263586521148682, 4.497318267822266, 4.731050491333008, 4.96478271484375, 5.198514938354492, 5.432246685028076, 5.665978908538818, 5.899710655212402, 6.1334428787231445, 6.367175102233887, 6.600906848907471, 6.834638595581055]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 7.0, 15.0, 23.0, 36.0, 54.0, 77.0, 165.0, 305.0, 602.0, 1316.0, 3250.0, 8962.0, 31670.0, 169860.0, 3437754.0, 461259.0, 56512.0, 14073.0, 4653.0, 1840.0, 793.0, 424.0, 250.0, 124.0, 96.0, 52.0, 34.0, 25.0, 16.0, 8.0, 10.0, 2.0, 7.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.171875, -2.1110382080078125, -2.050201416015625, -1.9893646240234375, -1.92852783203125, -1.8676910400390625, -1.806854248046875, -1.7460174560546875, -1.6851806640625, -1.6243438720703125, -1.563507080078125, -1.5026702880859375, -1.44183349609375, -1.3809967041015625, -1.320159912109375, -1.2593231201171875, -1.198486328125, -1.1376495361328125, -1.076812744140625, -1.0159759521484375, -0.95513916015625, -0.8943023681640625, -0.833465576171875, -0.7726287841796875, -0.7117919921875, -0.6509552001953125, -0.590118408203125, -0.5292816162109375, -0.46844482421875, -0.4076080322265625, -0.346771240234375, -0.2859344482421875, -0.22509765625, -0.1642608642578125, -0.103424072265625, -0.0425872802734375, 0.01824951171875, 0.0790863037109375, 0.139923095703125, 0.2007598876953125, 0.2615966796875, 0.3224334716796875, 0.383270263671875, 0.4441070556640625, 0.50494384765625, 0.5657806396484375, 0.626617431640625, 0.6874542236328125, 0.748291015625, 0.8091278076171875, 0.869964599609375, 0.9308013916015625, 0.99163818359375, 1.0524749755859375, 1.113311767578125, 1.1741485595703125, 1.2349853515625, 1.2958221435546875, 1.356658935546875, 1.4174957275390625, 1.47833251953125, 1.5391693115234375, 1.600006103515625, 1.6608428955078125, 1.7216796875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 8.0, 4.0, 7.0, 9.0, 17.0, 20.0, 23.0, 36.0, 46.0, 40.0, 42.0, 73.0, 81.0, 60.0, 51.0, 78.0, 57.0, 74.0, 48.0, 59.0, 38.0, 39.0, 33.0, 20.0, 15.0, 11.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2467041015625, -0.2362537384033203, -0.22580337524414062, -0.21535301208496094, -0.20490264892578125, -0.19445228576660156, -0.18400192260742188, -0.1735515594482422, -0.1631011962890625, -0.1526508331298828, -0.14220046997070312, -0.13175010681152344, -0.12129974365234375, -0.11084938049316406, -0.10039901733398438, -0.08994865417480469, -0.079498291015625, -0.06904792785644531, -0.058597564697265625, -0.04814720153808594, -0.03769683837890625, -0.027246475219726562, -0.016796112060546875, -0.0063457489013671875, 0.0041046142578125, 0.014554977416992188, 0.025005340576171875, 0.03545570373535156, 0.04590606689453125, 0.05635643005371094, 0.06680679321289062, 0.07725715637207031, 0.08770751953125, 0.09815788269042969, 0.10860824584960938, 0.11905860900878906, 0.12950897216796875, 0.13995933532714844, 0.15040969848632812, 0.1608600616455078, 0.1713104248046875, 0.1817607879638672, 0.19221115112304688, 0.20266151428222656, 0.21311187744140625, 0.22356224060058594, 0.23401260375976562, 0.2444629669189453, 0.254913330078125, 0.2653636932373047, 0.2758140563964844, 0.28626441955566406, 0.29671478271484375, 0.30716514587402344, 0.3176155090332031, 0.3280658721923828, 0.3385162353515625, 0.3489665985107422, 0.3594169616699219, 0.36986732482910156, 0.38031768798828125, 0.39076805114746094, 0.4012184143066406, 0.4116687774658203, 0.422119140625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 4.0, 8.0, 14.0, 24.0, 31.0, 63.0, 80.0, 162.0, 294.0, 646.0, 1439.0, 3518.0, 9227.0, 28187.0, 108464.0, 745142.0, 2971666.0, 246890.0, 52381.0, 15956.0, 5720.0, 2353.0, 989.0, 438.0, 267.0, 144.0, 79.0, 52.0, 23.0, 13.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.302734375, -1.2384033203125, -1.174072265625, -1.1097412109375, -1.04541015625, -0.9810791015625, -0.916748046875, -0.8524169921875, -0.7880859375, -0.7237548828125, -0.659423828125, -0.5950927734375, -0.53076171875, -0.4664306640625, -0.402099609375, -0.3377685546875, -0.2734375, -0.2091064453125, -0.144775390625, -0.0804443359375, -0.01611328125, 0.0482177734375, 0.112548828125, 0.1768798828125, 0.2412109375, 0.3055419921875, 0.369873046875, 0.4342041015625, 0.49853515625, 0.5628662109375, 0.627197265625, 0.6915283203125, 0.755859375, 0.8201904296875, 0.884521484375, 0.9488525390625, 1.01318359375, 1.0775146484375, 1.141845703125, 1.2061767578125, 1.2705078125, 1.3348388671875, 1.399169921875, 1.4635009765625, 1.52783203125, 1.5921630859375, 1.656494140625, 1.7208251953125, 1.78515625, 1.8494873046875, 1.913818359375, 1.9781494140625, 2.04248046875, 2.1068115234375, 2.171142578125, 2.2354736328125, 2.2998046875, 2.3641357421875, 2.428466796875, 2.4927978515625, 2.55712890625, 2.6214599609375, 2.685791015625, 2.7501220703125, 2.814453125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 7.0, 15.0, 15.0, 21.0, 18.0, 31.0, 35.0, 50.0, 97.0, 134.0, 176.0, 290.0, 617.0, 1210.0, 580.0, 274.0, 139.0, 107.0, 69.0, 49.0, 32.0, 25.0, 14.0, 13.0, 10.0, 7.0, 3.0, 7.0, 6.0, 6.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.751953125, -0.7272415161132812, -0.7025299072265625, -0.6778182983398438, -0.653106689453125, -0.6283950805664062, -0.6036834716796875, -0.5789718627929688, -0.55426025390625, -0.5295486450195312, -0.5048370361328125, -0.48012542724609375, -0.455413818359375, -0.43070220947265625, -0.4059906005859375, -0.38127899169921875, -0.3565673828125, -0.33185577392578125, -0.3071441650390625, -0.28243255615234375, -0.257720947265625, -0.23300933837890625, -0.2082977294921875, -0.18358612060546875, -0.15887451171875, -0.13416290283203125, -0.1094512939453125, -0.08473968505859375, -0.060028076171875, -0.03531646728515625, -0.0106048583984375, 0.01410675048828125, 0.038818359375, 0.06352996826171875, 0.0882415771484375, 0.11295318603515625, 0.137664794921875, 0.16237640380859375, 0.1870880126953125, 0.21179962158203125, 0.23651123046875, 0.26122283935546875, 0.2859344482421875, 0.31064605712890625, 0.335357666015625, 0.36006927490234375, 0.3847808837890625, 0.40949249267578125, 0.4342041015625, 0.45891571044921875, 0.4836273193359375, 0.5083389282226562, 0.533050537109375, 0.5577621459960938, 0.5824737548828125, 0.6071853637695312, 0.63189697265625, 0.6566085815429688, 0.6813201904296875, 0.7060317993164062, 0.730743408203125, 0.7554550170898438, 0.7801666259765625, 0.8048782348632812, 0.82958984375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 5.0, 7.0, 11.0, 16.0, 19.0, 30.0, 45.0, 52.0, 83.0, 105.0, 100.0, 121.0, 109.0, 62.0, 73.0, 43.0, 24.0, 27.0, 31.0, 12.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.115675449371338, -4.941844940185547, -4.768013954162598, -4.594183444976807, -4.420352935791016, -4.246521949768066, -4.072691440582275, -3.8988606929779053, -3.725029945373535, -3.551199197769165, -3.377368688583374, -3.203537940979004, -3.029707193374634, -2.8558764457702637, -2.6820459365844727, -2.5082151889801025, -2.3343846797943115, -2.1605539321899414, -1.9867233037948608, -1.8128926753997803, -1.6390619277954102, -1.4652312994003296, -1.291400671005249, -1.117569923400879, -0.9437392950057983, -0.769908607006073, -0.5960779190063477, -0.4222472906112671, -0.24841660261154175, -0.0745859146118164, 0.09924471378326416, 0.2730754613876343, 0.44690608978271484, 0.6207367777824402, 0.7945674657821655, 0.9683980941772461, 1.1422288417816162, 1.3160594701766968, 1.4898900985717773, 1.6637208461761475, 1.837551474571228, 2.0113821029663086, 2.1852128505706787, 2.359043598175049, 2.53287410736084, 2.70670485496521, 2.88053560256958, 3.054366111755371, 3.228196859359741, 3.4020276069641113, 3.5758581161499023, 3.7496888637542725, 3.9235196113586426, 4.097350120544434, 4.271181106567383, 4.445011615753174, 4.618842124938965, 4.792672634124756, 4.966503620147705, 5.140334129333496, 5.314164638519287, 5.487995624542236, 5.661826133728027, 5.835657119750977, 6.009487628936768]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 9.0, 7.0, 10.0, 15.0, 11.0, 21.0, 25.0, 29.0, 39.0, 51.0, 47.0, 66.0, 60.0, 60.0, 73.0, 57.0, 65.0, 50.0, 59.0, 47.0, 47.0, 36.0, 24.0, 32.0, 23.0, 17.0, 8.0, 9.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.532545566558838, -4.389682769775391, -4.246819496154785, -4.10395622253418, -3.9610934257507324, -3.818230390548706, -3.6753673553466797, -3.5325043201446533, -3.389641284942627, -3.2467782497406006, -3.103915214538574, -2.961052179336548, -2.8181891441345215, -2.675326108932495, -2.5324630737304688, -2.3896000385284424, -2.246737003326416, -2.1038739681243896, -1.9610109329223633, -1.818147897720337, -1.6752848625183105, -1.5324218273162842, -1.3895587921142578, -1.2466957569122314, -1.103832721710205, -0.9609696865081787, -0.8181066513061523, -0.675243616104126, -0.5323805809020996, -0.38951754570007324, -0.24665451049804688, -0.10379147529602051, 0.039071083068847656, 0.18193411827087402, 0.3247971534729004, 0.46766018867492676, 0.6105232238769531, 0.7533862590789795, 0.8962492942810059, 1.0391123294830322, 1.1819753646850586, 1.324838399887085, 1.4677014350891113, 1.6105644702911377, 1.753427505493164, 1.8962905406951904, 2.039153575897217, 2.182016611099243, 2.3248796463012695, 2.467742681503296, 2.6106057167053223, 2.7534687519073486, 2.896331787109375, 3.0391948223114014, 3.1820578575134277, 3.324920892715454, 3.4677839279174805, 3.610646963119507, 3.753509998321533, 3.8963730335235596, 4.039236068725586, 4.182099342346191, 4.324962139129639, 4.467824935913086, 4.610688209533691]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 13.0, 15.0, 40.0, 80.0, 170.0, 444.0, 1145.0, 3688.0, 13168.0, 51892.0, 211809.0, 465086.0, 225604.0, 55515.0, 13888.0, 3900.0, 1295.0, 457.0, 184.0, 69.0, 38.0, 28.0, 11.0, 4.0, 5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.080078125, -2.011932373046875, -1.94378662109375, -1.875640869140625, -1.8074951171875, -1.739349365234375, -1.67120361328125, -1.603057861328125, -1.534912109375, -1.466766357421875, -1.39862060546875, -1.330474853515625, -1.2623291015625, -1.194183349609375, -1.12603759765625, -1.057891845703125, -0.98974609375, -0.921600341796875, -0.85345458984375, -0.785308837890625, -0.7171630859375, -0.649017333984375, -0.58087158203125, -0.512725830078125, -0.444580078125, -0.376434326171875, -0.30828857421875, -0.240142822265625, -0.1719970703125, -0.103851318359375, -0.03570556640625, 0.032440185546875, 0.1005859375, 0.168731689453125, 0.23687744140625, 0.305023193359375, 0.3731689453125, 0.441314697265625, 0.50946044921875, 0.577606201171875, 0.645751953125, 0.713897705078125, 0.78204345703125, 0.850189208984375, 0.9183349609375, 0.986480712890625, 1.05462646484375, 1.122772216796875, 1.19091796875, 1.259063720703125, 1.32720947265625, 1.395355224609375, 1.4635009765625, 1.531646728515625, 1.59979248046875, 1.667938232421875, 1.736083984375, 1.804229736328125, 1.87237548828125, 1.940521240234375, 2.0086669921875, 2.076812744140625, 2.14495849609375, 2.213104248046875, 2.28125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 4.0, 17.0, 13.0, 11.0, 18.0, 18.0, 16.0, 22.0, 24.0, 36.0, 33.0, 28.0, 37.0, 50.0, 43.0, 36.0, 39.0, 40.0, 52.0, 48.0, 47.0, 37.0, 35.0, 34.0, 42.0, 25.0, 30.0, 28.0, 13.0, 17.0, 20.0, 22.0, 14.0, 13.0, 5.0, 8.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2529296875, -0.2456340789794922, -0.23833847045898438, -0.23104286193847656, -0.22374725341796875, -0.21645164489746094, -0.20915603637695312, -0.2018604278564453, -0.1945648193359375, -0.1872692108154297, -0.17997360229492188, -0.17267799377441406, -0.16538238525390625, -0.15808677673339844, -0.15079116821289062, -0.1434955596923828, -0.136199951171875, -0.1289043426513672, -0.12160873413085938, -0.11431312561035156, -0.10701751708984375, -0.09972190856933594, -0.09242630004882812, -0.08513069152832031, -0.0778350830078125, -0.07053947448730469, -0.06324386596679688, -0.05594825744628906, -0.04865264892578125, -0.04135704040527344, -0.034061431884765625, -0.026765823364257812, -0.01947021484375, -0.012174606323242188, -0.004878997802734375, 0.0024166107177734375, 0.00971221923828125, 0.017007827758789062, 0.024303436279296875, 0.03159904479980469, 0.0388946533203125, 0.04619026184082031, 0.053485870361328125, 0.06078147888183594, 0.06807708740234375, 0.07537269592285156, 0.08266830444335938, 0.08996391296386719, 0.097259521484375, 0.10455513000488281, 0.11185073852539062, 0.11914634704589844, 0.12644195556640625, 0.13373756408691406, 0.14103317260742188, 0.1483287811279297, 0.1556243896484375, 0.1629199981689453, 0.17021560668945312, 0.17751121520996094, 0.18480682373046875, 0.19210243225097656, 0.19939804077148438, 0.2066936492919922, 0.2139892578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 11.0, 11.0, 25.0, 23.0, 45.0, 44.0, 58.0, 99.0, 138.0, 231.0, 381.0, 682.0, 1215.0, 2375.0, 4346.0, 8386.0, 17384.0, 38183.0, 87716.0, 194897.0, 300218.0, 213173.0, 97893.0, 42254.0, 19082.0, 9232.0, 4712.0, 2521.0, 1327.0, 746.0, 414.0, 232.0, 141.0, 114.0, 66.0, 50.0, 26.0, 34.0, 17.0, 12.0, 12.0, 9.0, 1.0, 7.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-1.380859375, -1.340911865234375, -1.30096435546875, -1.261016845703125, -1.2210693359375, -1.181121826171875, -1.14117431640625, -1.101226806640625, -1.061279296875, -1.021331787109375, -0.98138427734375, -0.941436767578125, -0.9014892578125, -0.861541748046875, -0.82159423828125, -0.781646728515625, -0.74169921875, -0.701751708984375, -0.66180419921875, -0.621856689453125, -0.5819091796875, -0.541961669921875, -0.50201416015625, -0.462066650390625, -0.422119140625, -0.382171630859375, -0.34222412109375, -0.302276611328125, -0.2623291015625, -0.222381591796875, -0.18243408203125, -0.142486572265625, -0.1025390625, -0.062591552734375, -0.02264404296875, 0.017303466796875, 0.0572509765625, 0.097198486328125, 0.13714599609375, 0.177093505859375, 0.217041015625, 0.256988525390625, 0.29693603515625, 0.336883544921875, 0.3768310546875, 0.416778564453125, 0.45672607421875, 0.496673583984375, 0.53662109375, 0.576568603515625, 0.61651611328125, 0.656463623046875, 0.6964111328125, 0.736358642578125, 0.77630615234375, 0.816253662109375, 0.856201171875, 0.896148681640625, 0.93609619140625, 0.976043701171875, 1.0159912109375, 1.055938720703125, 1.09588623046875, 1.135833740234375, 1.17578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 3.0, 8.0, 10.0, 12.0, 10.0, 12.0, 14.0, 16.0, 23.0, 22.0, 23.0, 39.0, 36.0, 39.0, 45.0, 41.0, 41.0, 45.0, 36.0, 36.0, 56.0, 57.0, 41.0, 42.0, 31.0, 29.0, 31.0, 31.0, 28.0, 21.0, 20.0, 17.0, 12.0, 13.0, 9.0, 6.0, 12.0, 6.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.25390625, -1.2167205810546875, -1.179534912109375, -1.1423492431640625, -1.10516357421875, -1.0679779052734375, -1.030792236328125, -0.9936065673828125, -0.9564208984375, -0.9192352294921875, -0.882049560546875, -0.8448638916015625, -0.80767822265625, -0.7704925537109375, -0.733306884765625, -0.6961212158203125, -0.658935546875, -0.6217498779296875, -0.584564208984375, -0.5473785400390625, -0.51019287109375, -0.4730072021484375, -0.435821533203125, -0.3986358642578125, -0.3614501953125, -0.3242645263671875, -0.287078857421875, -0.2498931884765625, -0.21270751953125, -0.1755218505859375, -0.138336181640625, -0.1011505126953125, -0.06396484375, -0.0267791748046875, 0.010406494140625, 0.0475921630859375, 0.08477783203125, 0.1219635009765625, 0.159149169921875, 0.1963348388671875, 0.2335205078125, 0.2707061767578125, 0.307891845703125, 0.3450775146484375, 0.38226318359375, 0.4194488525390625, 0.456634521484375, 0.4938201904296875, 0.531005859375, 0.5681915283203125, 0.605377197265625, 0.6425628662109375, 0.67974853515625, 0.7169342041015625, 0.754119873046875, 0.7913055419921875, 0.8284912109375, 0.8656768798828125, 0.902862548828125, 0.9400482177734375, 0.97723388671875, 1.0144195556640625, 1.051605224609375, 1.0887908935546875, 1.1259765625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 7.0, 18.0, 22.0, 42.0, 74.0, 97.0, 163.0, 372.0, 873.0, 2665.0, 10151.0, 65149.0, 859688.0, 91760.0, 12459.0, 3154.0, 958.0, 405.0, 196.0, 120.0, 69.0, 34.0, 27.0, 19.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.205078125, -2.1304931640625, -2.055908203125, -1.9813232421875, -1.90673828125, -1.8321533203125, -1.757568359375, -1.6829833984375, -1.6083984375, -1.5338134765625, -1.459228515625, -1.3846435546875, -1.31005859375, -1.2354736328125, -1.160888671875, -1.0863037109375, -1.01171875, -0.9371337890625, -0.862548828125, -0.7879638671875, -0.71337890625, -0.6387939453125, -0.564208984375, -0.4896240234375, -0.4150390625, -0.3404541015625, -0.265869140625, -0.1912841796875, -0.11669921875, -0.0421142578125, 0.032470703125, 0.1070556640625, 0.181640625, 0.2562255859375, 0.330810546875, 0.4053955078125, 0.47998046875, 0.5545654296875, 0.629150390625, 0.7037353515625, 0.7783203125, 0.8529052734375, 0.927490234375, 1.0020751953125, 1.07666015625, 1.1512451171875, 1.225830078125, 1.3004150390625, 1.375, 1.4495849609375, 1.524169921875, 1.5987548828125, 1.67333984375, 1.7479248046875, 1.822509765625, 1.8970947265625, 1.9716796875, 2.0462646484375, 2.120849609375, 2.1954345703125, 2.27001953125, 2.3446044921875, 2.419189453125, 2.4937744140625, 2.568359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 10.0, 6.0, 12.0, 18.0, 24.0, 45.0, 89.0, 284.0, 280.0, 89.0, 44.0, 23.0, 14.0, 13.0, 7.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002455711364746094, -0.00023612752556800842, -0.00022668391466140747, -0.00021724030375480652, -0.00020779669284820557, -0.00019835308194160461, -0.00018890947103500366, -0.0001794658601284027, -0.00017002224922180176, -0.0001605786383152008, -0.00015113502740859985, -0.0001416914165019989, -0.00013224780559539795, -0.000122804194688797, -0.00011336058378219604, -0.00010391697287559509, -9.447336196899414e-05, -8.502975106239319e-05, -7.558614015579224e-05, -6.614252924919128e-05, -5.669891834259033e-05, -4.725530743598938e-05, -3.781169652938843e-05, -2.8368085622787476e-05, -1.8924474716186523e-05, -9.480863809585571e-06, -3.725290298461914e-08, 9.406358003616333e-06, 1.8849968910217285e-05, 2.8293579816818237e-05, 3.773719072341919e-05, 4.718080163002014e-05, 5.6624412536621094e-05, 6.606802344322205e-05, 7.5511634349823e-05, 8.495524525642395e-05, 9.43988561630249e-05, 0.00010384246706962585, 0.0001132860779762268, 0.00012272968888282776, 0.0001321732997894287, 0.00014161691069602966, 0.00015106052160263062, 0.00016050413250923157, 0.00016994774341583252, 0.00017939135432243347, 0.00018883496522903442, 0.00019827857613563538, 0.00020772218704223633, 0.00021716579794883728, 0.00022660940885543823, 0.00023605301976203918, 0.00024549663066864014, 0.0002549402415752411, 0.00026438385248184204, 0.000273827463388443, 0.00028327107429504395, 0.0002927146852016449, 0.00030215829610824585, 0.0003116019070148468, 0.00032104551792144775, 0.0003304891288280487, 0.00033993273973464966, 0.0003493763506412506, 0.00035881996154785156]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 5.0, 5.0, 17.0, 13.0, 18.0, 30.0, 45.0, 62.0, 88.0, 162.0, 213.0, 376.0, 612.0, 971.0, 1818.0, 3107.0, 5627.0, 10352.0, 21140.0, 59200.0, 506405.0, 350907.0, 47227.0, 18961.0, 9369.0, 4971.0, 2774.0, 1598.0, 920.0, 549.0, 339.0, 225.0, 142.0, 99.0, 65.0, 42.0, 26.0, 23.0, 23.0, 12.0, 2.0, 2.0, 6.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3388671875, -1.2993927001953125, -1.259918212890625, -1.2204437255859375, -1.18096923828125, -1.1414947509765625, -1.102020263671875, -1.0625457763671875, -1.0230712890625, -0.9835968017578125, -0.944122314453125, -0.9046478271484375, -0.86517333984375, -0.8256988525390625, -0.786224365234375, -0.7467498779296875, -0.707275390625, -0.6678009033203125, -0.628326416015625, -0.5888519287109375, -0.54937744140625, -0.5099029541015625, -0.470428466796875, -0.4309539794921875, -0.3914794921875, -0.3520050048828125, -0.312530517578125, -0.2730560302734375, -0.23358154296875, -0.1941070556640625, -0.154632568359375, -0.1151580810546875, -0.07568359375, -0.0362091064453125, 0.003265380859375, 0.0427398681640625, 0.08221435546875, 0.1216888427734375, 0.161163330078125, 0.2006378173828125, 0.2401123046875, 0.2795867919921875, 0.319061279296875, 0.3585357666015625, 0.39801025390625, 0.4374847412109375, 0.476959228515625, 0.5164337158203125, 0.555908203125, 0.5953826904296875, 0.634857177734375, 0.6743316650390625, 0.71380615234375, 0.7532806396484375, 0.792755126953125, 0.8322296142578125, 0.8717041015625, 0.9111785888671875, 0.950653076171875, 0.9901275634765625, 1.02960205078125, 1.0690765380859375, 1.108551025390625, 1.1480255126953125, 1.1875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 2.0, 9.0, 10.0, 8.0, 15.0, 13.0, 16.0, 30.0, 40.0, 77.0, 131.0, 154.0, 148.0, 117.0, 59.0, 41.0, 19.0, 17.0, 17.0, 6.0, 8.0, 6.0, 6.0, 7.0, 3.0, 9.0, 5.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.021484375, -0.9912796020507812, -0.9610748291015625, -0.9308700561523438, -0.900665283203125, -0.8704605102539062, -0.8402557373046875, -0.8100509643554688, -0.77984619140625, -0.7496414184570312, -0.7194366455078125, -0.6892318725585938, -0.659027099609375, -0.6288223266601562, -0.5986175537109375, -0.5684127807617188, -0.5382080078125, -0.5080032348632812, -0.4777984619140625, -0.44759368896484375, -0.417388916015625, -0.38718414306640625, -0.3569793701171875, -0.32677459716796875, -0.29656982421875, -0.26636505126953125, -0.2361602783203125, -0.20595550537109375, -0.175750732421875, -0.14554595947265625, -0.1153411865234375, -0.08513641357421875, -0.054931640625, -0.02472686767578125, 0.0054779052734375, 0.03568267822265625, 0.065887451171875, 0.09609222412109375, 0.1262969970703125, 0.15650177001953125, 0.18670654296875, 0.21691131591796875, 0.2471160888671875, 0.27732086181640625, 0.307525634765625, 0.33773040771484375, 0.3679351806640625, 0.39813995361328125, 0.4283447265625, 0.45854949951171875, 0.4887542724609375, 0.5189590454101562, 0.549163818359375, 0.5793685913085938, 0.6095733642578125, 0.6397781372070312, 0.66998291015625, 0.7001876831054688, 0.7303924560546875, 0.7605972290039062, 0.790802001953125, 0.8210067749023438, 0.8512115478515625, 0.8814163208007812, 0.91162109375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 7.0, 4.0, 8.0, 12.0, 10.0, 14.0, 17.0, 21.0, 43.0, 35.0, 51.0, 46.0, 70.0, 54.0, 69.0, 64.0, 72.0, 61.0, 63.0, 47.0, 50.0, 47.0, 37.0, 19.0, 15.0, 18.0, 9.0, 6.0, 9.0, 10.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.198774337768555, -10.923103332519531, -10.647431373596191, -10.371760368347168, -10.096089363098145, -9.820417404174805, -9.544746398925781, -9.269075393676758, -8.993404388427734, -8.717733383178711, -8.442061424255371, -8.166390419006348, -7.890719413757324, -7.615047931671143, -7.339376449584961, -7.0637054443359375, -6.788033485412598, -6.512362003326416, -6.236690998077393, -5.961019515991211, -5.6853485107421875, -5.409677028656006, -5.134005546569824, -4.858334541320801, -4.582663059234619, -4.3069915771484375, -4.031320571899414, -3.7556490898132324, -3.47997784614563, -3.2043066024780273, -2.9286351203918457, -2.652963876724243, -2.3772926330566406, -2.101621389389038, -1.825950026512146, -1.550278663635254, -1.2746074199676514, -0.9989361763000488, -0.7232648134231567, -0.44759345054626465, -0.1719222068786621, 0.1037490963935852, 0.3794203996658325, 0.6550917029380798, 0.9307630062103271, 1.2064342498779297, 1.4821056127548218, 1.7577769756317139, 2.0334482192993164, 2.309119462966919, 2.5847907066345215, 2.860462188720703, 3.1361334323883057, 3.411804676055908, 3.68747615814209, 3.9631474018096924, 4.238818645477295, 4.514490127563477, 4.7901611328125, 5.065832614898682, 5.341504096984863, 5.617175102233887, 5.892846584320068, 6.16851806640625, 6.444189071655273]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 5.0, 6.0, 10.0, 12.0, 8.0, 13.0, 16.0, 24.0, 19.0, 18.0, 22.0, 28.0, 41.0, 38.0, 44.0, 44.0, 42.0, 45.0, 54.0, 33.0, 46.0, 43.0, 39.0, 35.0, 50.0, 43.0, 44.0, 22.0, 21.0, 19.0, 16.0, 12.0, 19.0, 15.0, 14.0, 11.0, 7.0, 2.0, 4.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.468884468078613, -5.259416580200195, -5.049948692321777, -4.840480804443359, -4.631012916564941, -4.421545028686523, -4.212076663970947, -4.002608776092529, -3.7931408882141113, -3.5836730003356934, -3.3742051124572754, -3.1647369861602783, -2.9552690982818604, -2.7458012104034424, -2.5363330841064453, -2.3268651962280273, -2.1173973083496094, -1.9079294204711914, -1.6984614133834839, -1.4889934062957764, -1.2795255184173584, -1.0700576305389404, -0.8605896234512329, -0.6511216163635254, -0.4416537284851074, -0.23218578100204468, -0.022717833518981934, 0.1867501139640808, 0.39621806144714355, 0.6056859493255615, 0.815153956413269, 1.0246219635009766, 1.2340898513793945, 1.4435577392578125, 1.65302574634552, 1.8624937534332275, 2.0719616413116455, 2.2814295291900635, 2.4908976554870605, 2.7003655433654785, 2.9098334312438965, 3.1193013191223145, 3.3287692070007324, 3.5382373332977295, 3.7477052211761475, 3.9571731090545654, 4.1666412353515625, 4.3761091232299805, 4.585577011108398, 4.795044898986816, 5.004512786865234, 5.213980674743652, 5.42344856262207, 5.632916450500488, 5.8423848152160645, 6.051852703094482, 6.2613205909729, 6.470788478851318, 6.680256366729736, 6.889724254608154, 7.0991926193237305, 7.308660507202148, 7.518128395080566, 7.727596282958984, 7.937064170837402]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 5.0, 12.0, 11.0, 23.0, 31.0, 47.0, 53.0, 88.0, 139.0, 227.0, 324.0, 559.0, 936.0, 1487.0, 2585.0, 4486.0, 8207.0, 16308.0, 36226.0, 97723.0, 436158.0, 3189987.0, 266070.0, 73455.0, 28991.0, 13528.0, 7015.0, 3778.0, 2171.0, 1367.0, 837.0, 503.0, 301.0, 194.0, 133.0, 82.0, 75.0, 38.0, 37.0, 21.0, 11.0, 16.0, 10.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.2109375, -1.1710662841796875, -1.131195068359375, -1.0913238525390625, -1.05145263671875, -1.0115814208984375, -0.971710205078125, -0.9318389892578125, -0.8919677734375, -0.8520965576171875, -0.812225341796875, -0.7723541259765625, -0.73248291015625, -0.6926116943359375, -0.652740478515625, -0.6128692626953125, -0.572998046875, -0.5331268310546875, -0.493255615234375, -0.4533843994140625, -0.41351318359375, -0.3736419677734375, -0.333770751953125, -0.2938995361328125, -0.2540283203125, -0.2141571044921875, -0.174285888671875, -0.1344146728515625, -0.09454345703125, -0.0546722412109375, -0.014801025390625, 0.0250701904296875, 0.06494140625, 0.1048126220703125, 0.144683837890625, 0.1845550537109375, 0.22442626953125, 0.2642974853515625, 0.304168701171875, 0.3440399169921875, 0.3839111328125, 0.4237823486328125, 0.463653564453125, 0.5035247802734375, 0.54339599609375, 0.5832672119140625, 0.623138427734375, 0.6630096435546875, 0.702880859375, 0.7427520751953125, 0.782623291015625, 0.8224945068359375, 0.86236572265625, 0.9022369384765625, 0.942108154296875, 0.9819793701171875, 1.0218505859375, 1.0617218017578125, 1.101593017578125, 1.1414642333984375, 1.18133544921875, 1.2212066650390625, 1.261077880859375, 1.3009490966796875, 1.3408203125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 11.0, 10.0, 8.0, 15.0, 10.0, 21.0, 14.0, 23.0, 22.0, 18.0, 29.0, 37.0, 31.0, 36.0, 50.0, 33.0, 39.0, 35.0, 49.0, 42.0, 44.0, 30.0, 44.0, 27.0, 35.0, 36.0, 34.0, 35.0, 34.0, 24.0, 18.0, 21.0, 9.0, 13.0, 17.0, 6.0, 8.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.25048828125, -0.2428722381591797, -0.23525619506835938, -0.22764015197753906, -0.22002410888671875, -0.21240806579589844, -0.20479202270507812, -0.1971759796142578, -0.1895599365234375, -0.1819438934326172, -0.17432785034179688, -0.16671180725097656, -0.15909576416015625, -0.15147972106933594, -0.14386367797851562, -0.1362476348876953, -0.128631591796875, -0.12101554870605469, -0.11339950561523438, -0.10578346252441406, -0.09816741943359375, -0.09055137634277344, -0.08293533325195312, -0.07531929016113281, -0.0677032470703125, -0.06008720397949219, -0.052471160888671875, -0.04485511779785156, -0.03723907470703125, -0.029623031616210938, -0.022006988525390625, -0.014390945434570312, -0.00677490234375, 0.0008411407470703125, 0.008457183837890625, 0.016073226928710938, 0.02368927001953125, 0.03130531311035156, 0.038921356201171875, 0.04653739929199219, 0.0541534423828125, 0.06176948547363281, 0.06938552856445312, 0.07700157165527344, 0.08461761474609375, 0.09223365783691406, 0.09984970092773438, 0.10746574401855469, 0.115081787109375, 0.12269783020019531, 0.13031387329101562, 0.13792991638183594, 0.14554595947265625, 0.15316200256347656, 0.16077804565429688, 0.1683940887451172, 0.1760101318359375, 0.1836261749267578, 0.19124221801757812, 0.19885826110839844, 0.20647430419921875, 0.21409034729003906, 0.22170639038085938, 0.2293224334716797, 0.2369384765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 9.0, 7.0, 27.0, 24.0, 55.0, 90.0, 147.0, 281.0, 523.0, 977.0, 1877.0, 4044.0, 8980.0, 23615.0, 79191.0, 496123.0, 3261151.0, 237214.0, 50402.0, 16497.0, 6771.0, 3086.0, 1491.0, 729.0, 410.0, 238.0, 131.0, 74.0, 44.0, 32.0, 22.0, 7.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.162109375, -2.093109130859375, -2.02410888671875, -1.955108642578125, -1.8861083984375, -1.817108154296875, -1.74810791015625, -1.679107666015625, -1.610107421875, -1.541107177734375, -1.47210693359375, -1.403106689453125, -1.3341064453125, -1.265106201171875, -1.19610595703125, -1.127105712890625, -1.05810546875, -0.989105224609375, -0.92010498046875, -0.851104736328125, -0.7821044921875, -0.713104248046875, -0.64410400390625, -0.575103759765625, -0.506103515625, -0.437103271484375, -0.36810302734375, -0.299102783203125, -0.2301025390625, -0.161102294921875, -0.09210205078125, -0.023101806640625, 0.0458984375, 0.114898681640625, 0.18389892578125, 0.252899169921875, 0.3218994140625, 0.390899658203125, 0.45989990234375, 0.528900146484375, 0.597900390625, 0.666900634765625, 0.73590087890625, 0.804901123046875, 0.8739013671875, 0.942901611328125, 1.01190185546875, 1.080902099609375, 1.14990234375, 1.218902587890625, 1.28790283203125, 1.356903076171875, 1.4259033203125, 1.494903564453125, 1.56390380859375, 1.632904052734375, 1.701904296875, 1.770904541015625, 1.83990478515625, 1.908905029296875, 1.9779052734375, 2.046905517578125, 2.11590576171875, 2.184906005859375, 2.25390625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 7.0, 12.0, 7.0, 7.0, 18.0, 19.0, 29.0, 32.0, 35.0, 84.0, 91.0, 166.0, 341.0, 968.0, 1317.0, 367.0, 222.0, 114.0, 73.0, 46.0, 26.0, 17.0, 23.0, 10.0, 10.0, 10.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68505859375, -0.659759521484375, -0.63446044921875, -0.609161376953125, -0.5838623046875, -0.558563232421875, -0.53326416015625, -0.507965087890625, -0.482666015625, -0.457366943359375, -0.43206787109375, -0.406768798828125, -0.3814697265625, -0.356170654296875, -0.33087158203125, -0.305572509765625, -0.2802734375, -0.254974365234375, -0.22967529296875, -0.204376220703125, -0.1790771484375, -0.153778076171875, -0.12847900390625, -0.103179931640625, -0.077880859375, -0.052581787109375, -0.02728271484375, -0.001983642578125, 0.0233154296875, 0.048614501953125, 0.07391357421875, 0.099212646484375, 0.12451171875, 0.149810791015625, 0.17510986328125, 0.200408935546875, 0.2257080078125, 0.251007080078125, 0.27630615234375, 0.301605224609375, 0.326904296875, 0.352203369140625, 0.37750244140625, 0.402801513671875, 0.4281005859375, 0.453399658203125, 0.47869873046875, 0.503997802734375, 0.529296875, 0.554595947265625, 0.57989501953125, 0.605194091796875, 0.6304931640625, 0.655792236328125, 0.68109130859375, 0.706390380859375, 0.731689453125, 0.756988525390625, 0.78228759765625, 0.807586669921875, 0.8328857421875, 0.858184814453125, 0.88348388671875, 0.908782958984375, 0.93408203125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 6.0, 4.0, 8.0, 13.0, 13.0, 17.0, 23.0, 25.0, 30.0, 43.0, 45.0, 64.0, 45.0, 75.0, 67.0, 70.0, 62.0, 57.0, 57.0, 57.0, 48.0, 35.0, 26.0, 26.0, 11.0, 19.0, 14.0, 9.0, 9.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.328150272369385, -4.226039886474609, -4.123929500579834, -4.021819591522217, -3.9197092056274414, -3.817598819732666, -3.7154884338378906, -3.6133782863616943, -3.511268138885498, -3.4091577529907227, -3.3070476055145264, -3.204937219619751, -3.1028270721435547, -3.0007166862487793, -2.898606300354004, -2.7964961528778076, -2.6943857669830322, -2.592275381088257, -2.4901652336120605, -2.388054847717285, -2.285944700241089, -2.1838343143463135, -2.081724166870117, -1.9796137809753418, -1.877503514289856, -1.7753932476043701, -1.6732829809188843, -1.5711727142333984, -1.469062328338623, -1.3669521808624268, -1.2648417949676514, -1.1627315282821655, -1.0606215000152588, -0.958511233329773, -0.8564009666442871, -0.7542906403541565, -0.6521803736686707, -0.5500701069831848, -0.4479597806930542, -0.34584951400756836, -0.24373924732208252, -0.14162896573543549, -0.03951868414878845, 0.06259161233901978, 0.16470187902450562, 0.26681214570999146, 0.36892247200012207, 0.4710327386856079, 0.5731430053710938, 0.6752532720565796, 0.7773635387420654, 0.879473865032196, 0.9815841317176819, 1.0836944580078125, 1.1858047246932983, 1.2879149913787842, 1.39002525806427, 1.4921355247497559, 1.5942457914352417, 1.6963560581207275, 1.798466444015503, 1.9005765914916992, 2.0026869773864746, 2.10479736328125, 2.2069075107574463]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 9.0, 8.0, 18.0, 18.0, 16.0, 29.0, 21.0, 26.0, 30.0, 25.0, 36.0, 33.0, 42.0, 55.0, 47.0, 39.0, 38.0, 42.0, 41.0, 44.0, 42.0, 39.0, 38.0, 34.0, 32.0, 25.0, 29.0, 24.0, 15.0, 20.0, 19.0, 11.0, 12.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0], "bins": [-3.1044154167175293, -3.0217201709747314, -2.9390249252319336, -2.8563296794891357, -2.773634433746338, -2.69093918800354, -2.608243942260742, -2.5255489349365234, -2.4428534507751465, -2.3601582050323486, -2.277462959289551, -2.194767713546753, -2.112072467803955, -2.0293772220611572, -1.946682095527649, -1.863986849784851, -1.7812917232513428, -1.698596477508545, -1.615901231765747, -1.5332059860229492, -1.4505107402801514, -1.3678154945373535, -1.2851203680038452, -1.2024251222610474, -1.1197298765182495, -1.0370346307754517, -0.9543393850326538, -0.8716441988945007, -0.7889489531517029, -0.706253707408905, -0.623558521270752, -0.5408632755279541, -0.45816779136657715, -0.3754725456237793, -0.29277732968330383, -0.21008209884166718, -0.12738686800003052, -0.044691622257232666, 0.0380035936832428, 0.12069880962371826, 0.2033940553665161, 0.28608930110931396, 0.36878451704978943, 0.4514797329902649, 0.5341749787330627, 0.6168702244758606, 0.6995654106140137, 0.7822606563568115, 0.8649559020996094, 0.9476511478424072, 1.030346393585205, 1.113041639328003, 1.1957368850708008, 1.2784321308135986, 1.361127257347107, 1.4438225030899048, 1.5265177488327026, 1.6092129945755005, 1.6919082403182983, 1.7746034860610962, 1.8572986125946045, 1.9399938583374023, 2.0226891040802, 2.105384349822998, 2.188079595565796]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 13.0, 17.0, 17.0, 19.0, 30.0, 48.0, 59.0, 68.0, 120.0, 164.0, 238.0, 374.0, 662.0, 1044.0, 1852.0, 3337.0, 5748.0, 10523.0, 19458.0, 36863.0, 69646.0, 126796.0, 203247.0, 223386.0, 154976.0, 87871.0, 46924.0, 24781.0, 13333.0, 7087.0, 3928.0, 2333.0, 1401.0, 762.0, 498.0, 281.0, 190.0, 140.0, 81.0, 61.0, 48.0, 28.0, 29.0, 18.0, 10.0, 15.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-1.0888671875, -1.0550384521484375, -1.021209716796875, -0.9873809814453125, -0.95355224609375, -0.9197235107421875, -0.885894775390625, -0.8520660400390625, -0.8182373046875, -0.7844085693359375, -0.750579833984375, -0.7167510986328125, -0.68292236328125, -0.6490936279296875, -0.615264892578125, -0.5814361572265625, -0.547607421875, -0.5137786865234375, -0.479949951171875, -0.4461212158203125, -0.41229248046875, -0.3784637451171875, -0.344635009765625, -0.3108062744140625, -0.2769775390625, -0.2431488037109375, -0.209320068359375, -0.1754913330078125, -0.14166259765625, -0.1078338623046875, -0.074005126953125, -0.0401763916015625, -0.00634765625, 0.0274810791015625, 0.061309814453125, 0.0951385498046875, 0.12896728515625, 0.1627960205078125, 0.196624755859375, 0.2304534912109375, 0.2642822265625, 0.2981109619140625, 0.331939697265625, 0.3657684326171875, 0.39959716796875, 0.4334259033203125, 0.467254638671875, 0.5010833740234375, 0.534912109375, 0.5687408447265625, 0.602569580078125, 0.6363983154296875, 0.67022705078125, 0.7040557861328125, 0.737884521484375, 0.7717132568359375, 0.8055419921875, 0.8393707275390625, 0.873199462890625, 0.9070281982421875, 0.94085693359375, 0.9746856689453125, 1.008514404296875, 1.0423431396484375, 1.076171875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 1.0, 5.0, 2.0, 8.0, 11.0, 13.0, 12.0, 8.0, 16.0, 15.0, 17.0, 16.0, 32.0, 16.0, 29.0, 20.0, 34.0, 36.0, 29.0, 35.0, 30.0, 32.0, 33.0, 37.0, 46.0, 40.0, 30.0, 30.0, 31.0, 37.0, 33.0, 30.0, 31.0, 20.0, 31.0, 19.0, 21.0, 18.0, 17.0, 10.0, 8.0, 13.0, 13.0, 9.0, 11.0, 7.0, 8.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20166015625, -0.19451522827148438, -0.18737030029296875, -0.18022537231445312, -0.1730804443359375, -0.16593551635742188, -0.15879058837890625, -0.15164566040039062, -0.144500732421875, -0.13735580444335938, -0.13021087646484375, -0.12306594848632812, -0.1159210205078125, -0.10877609252929688, -0.10163116455078125, -0.09448623657226562, -0.08734130859375, -0.08019638061523438, -0.07305145263671875, -0.06590652465820312, -0.0587615966796875, -0.051616668701171875, -0.04447174072265625, -0.037326812744140625, -0.030181884765625, -0.023036956787109375, -0.01589202880859375, -0.008747100830078125, -0.0016021728515625, 0.005542755126953125, 0.01268768310546875, 0.019832611083984375, 0.0269775390625, 0.034122467041015625, 0.04126739501953125, 0.048412322998046875, 0.0555572509765625, 0.06270217895507812, 0.06984710693359375, 0.07699203491210938, 0.084136962890625, 0.09128189086914062, 0.09842681884765625, 0.10557174682617188, 0.1127166748046875, 0.11986160278320312, 0.12700653076171875, 0.13415145874023438, 0.14129638671875, 0.14844131469726562, 0.15558624267578125, 0.16273117065429688, 0.1698760986328125, 0.17702102661132812, 0.18416595458984375, 0.19131088256835938, 0.198455810546875, 0.20560073852539062, 0.21274566650390625, 0.21989059448242188, 0.2270355224609375, 0.23418045043945312, 0.24132537841796875, 0.24847030639648438, 0.255615234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 2.0, 7.0, 8.0, 11.0, 8.0, 23.0, 31.0, 43.0, 74.0, 127.0, 169.0, 294.0, 552.0, 926.0, 1554.0, 3033.0, 5540.0, 10183.0, 19854.0, 38814.0, 77846.0, 150821.0, 250533.0, 225658.0, 128323.0, 65510.0, 32642.0, 16848.0, 8744.0, 4544.0, 2485.0, 1346.0, 786.0, 469.0, 262.0, 166.0, 116.0, 61.0, 49.0, 23.0, 15.0, 13.0, 15.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.0341796875, -0.9995574951171875, -0.964935302734375, -0.9303131103515625, -0.89569091796875, -0.8610687255859375, -0.826446533203125, -0.7918243408203125, -0.7572021484375, -0.7225799560546875, -0.687957763671875, -0.6533355712890625, -0.61871337890625, -0.5840911865234375, -0.549468994140625, -0.5148468017578125, -0.480224609375, -0.4456024169921875, -0.410980224609375, -0.3763580322265625, -0.34173583984375, -0.3071136474609375, -0.272491455078125, -0.2378692626953125, -0.2032470703125, -0.1686248779296875, -0.134002685546875, -0.0993804931640625, -0.06475830078125, -0.0301361083984375, 0.004486083984375, 0.0391082763671875, 0.07373046875, 0.1083526611328125, 0.142974853515625, 0.1775970458984375, 0.21221923828125, 0.2468414306640625, 0.281463623046875, 0.3160858154296875, 0.3507080078125, 0.3853302001953125, 0.419952392578125, 0.4545745849609375, 0.48919677734375, 0.5238189697265625, 0.558441162109375, 0.5930633544921875, 0.627685546875, 0.6623077392578125, 0.696929931640625, 0.7315521240234375, 0.76617431640625, 0.8007965087890625, 0.835418701171875, 0.8700408935546875, 0.9046630859375, 0.9392852783203125, 0.973907470703125, 1.0085296630859375, 1.04315185546875, 1.0777740478515625, 1.112396240234375, 1.1470184326171875, 1.181640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 0.0, 8.0, 10.0, 8.0, 16.0, 8.0, 12.0, 5.0, 14.0, 18.0, 15.0, 17.0, 26.0, 25.0, 32.0, 37.0, 46.0, 33.0, 37.0, 51.0, 44.0, 42.0, 39.0, 41.0, 33.0, 33.0, 38.0, 41.0, 31.0, 31.0, 31.0, 16.0, 21.0, 18.0, 18.0, 18.0, 9.0, 17.0, 13.0, 6.0, 11.0, 8.0, 9.0, 5.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0791015625, -1.0430145263671875, -1.006927490234375, -0.9708404541015625, -0.93475341796875, -0.8986663818359375, -0.862579345703125, -0.8264923095703125, -0.7904052734375, -0.7543182373046875, -0.718231201171875, -0.6821441650390625, -0.64605712890625, -0.6099700927734375, -0.573883056640625, -0.5377960205078125, -0.501708984375, -0.4656219482421875, -0.429534912109375, -0.3934478759765625, -0.35736083984375, -0.3212738037109375, -0.285186767578125, -0.2490997314453125, -0.2130126953125, -0.1769256591796875, -0.140838623046875, -0.1047515869140625, -0.06866455078125, -0.0325775146484375, 0.003509521484375, 0.0395965576171875, 0.07568359375, 0.1117706298828125, 0.147857666015625, 0.1839447021484375, 0.22003173828125, 0.2561187744140625, 0.292205810546875, 0.3282928466796875, 0.3643798828125, 0.4004669189453125, 0.436553955078125, 0.4726409912109375, 0.50872802734375, 0.5448150634765625, 0.580902099609375, 0.6169891357421875, 0.653076171875, 0.6891632080078125, 0.725250244140625, 0.7613372802734375, 0.79742431640625, 0.8335113525390625, 0.869598388671875, 0.9056854248046875, 0.9417724609375, 0.9778594970703125, 1.013946533203125, 1.0500335693359375, 1.08612060546875, 1.1222076416015625, 1.158294677734375, 1.1943817138671875, 1.23046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 10.0, 23.0, 43.0, 86.0, 204.0, 578.0, 1800.0, 7378.0, 51751.0, 748020.0, 215024.0, 18565.0, 3520.0, 1006.0, 300.0, 134.0, 53.0, 29.0, 12.0, 7.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.365234375, -1.314208984375, -1.26318359375, -1.212158203125, -1.1611328125, -1.110107421875, -1.05908203125, -1.008056640625, -0.95703125, -0.906005859375, -0.85498046875, -0.803955078125, -0.7529296875, -0.701904296875, -0.65087890625, -0.599853515625, -0.548828125, -0.497802734375, -0.44677734375, -0.395751953125, -0.3447265625, -0.293701171875, -0.24267578125, -0.191650390625, -0.140625, -0.089599609375, -0.03857421875, 0.012451171875, 0.0634765625, 0.114501953125, 0.16552734375, 0.216552734375, 0.267578125, 0.318603515625, 0.36962890625, 0.420654296875, 0.4716796875, 0.522705078125, 0.57373046875, 0.624755859375, 0.67578125, 0.726806640625, 0.77783203125, 0.828857421875, 0.8798828125, 0.930908203125, 0.98193359375, 1.032958984375, 1.083984375, 1.135009765625, 1.18603515625, 1.237060546875, 1.2880859375, 1.339111328125, 1.39013671875, 1.441162109375, 1.4921875, 1.543212890625, 1.59423828125, 1.645263671875, 1.6962890625, 1.747314453125, 1.79833984375, 1.849365234375, 1.900390625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 2.0, 7.0, 9.0, 11.0, 21.0, 32.0, 70.0, 142.0, 289.0, 215.0, 71.0, 41.0, 27.0, 23.0, 13.0, 7.0, 5.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002932548522949219, -0.00028453394770622253, -0.0002758130431175232, -0.00026709213852882385, -0.0002583712339401245, -0.00024965032935142517, -0.00024092942476272583, -0.0002322085201740265, -0.00022348761558532715, -0.0002147667109966278, -0.00020604580640792847, -0.00019732490181922913, -0.00018860399723052979, -0.00017988309264183044, -0.0001711621880531311, -0.00016244128346443176, -0.00015372037887573242, -0.00014499947428703308, -0.00013627856969833374, -0.0001275576651096344, -0.00011883676052093506, -0.00011011585593223572, -0.00010139495134353638, -9.267404675483704e-05, -8.39531421661377e-05, -7.523223757743835e-05, -6.651133298873901e-05, -5.779042840003967e-05, -4.906952381134033e-05, -4.034861922264099e-05, -3.162771463394165e-05, -2.290681004524231e-05, -1.4185905456542969e-05, -5.465000867843628e-06, 3.255903720855713e-06, 1.1976808309555054e-05, 2.0697712898254395e-05, 2.9418617486953735e-05, 3.8139522075653076e-05, 4.686042666435242e-05, 5.558133125305176e-05, 6.43022358417511e-05, 7.302314043045044e-05, 8.174404501914978e-05, 9.046494960784912e-05, 9.918585419654846e-05, 0.0001079067587852478, 0.00011662766337394714, 0.00012534856796264648, 0.00013406947255134583, 0.00014279037714004517, 0.0001515112817287445, 0.00016023218631744385, 0.0001689530909061432, 0.00017767399549484253, 0.00018639490008354187, 0.0001951158046722412, 0.00020383670926094055, 0.0002125576138496399, 0.00022127851843833923, 0.00022999942302703857, 0.00023872032761573792, 0.00024744123220443726, 0.0002561621367931366, 0.00026488304138183594]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 13.0, 7.0, 15.0, 19.0, 28.0, 55.0, 86.0, 151.0, 251.0, 476.0, 1052.0, 2481.0, 6818.0, 20610.0, 83100.0, 634492.0, 241774.0, 38537.0, 11499.0, 4021.0, 1523.0, 701.0, 355.0, 183.0, 113.0, 67.0, 43.0, 31.0, 19.0, 11.0, 9.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.248046875, -1.2158355712890625, -1.183624267578125, -1.1514129638671875, -1.11920166015625, -1.0869903564453125, -1.054779052734375, -1.0225677490234375, -0.9903564453125, -0.9581451416015625, -0.925933837890625, -0.8937225341796875, -0.86151123046875, -0.8292999267578125, -0.797088623046875, -0.7648773193359375, -0.732666015625, -0.7004547119140625, -0.668243408203125, -0.6360321044921875, -0.60382080078125, -0.5716094970703125, -0.539398193359375, -0.5071868896484375, -0.4749755859375, -0.4427642822265625, -0.410552978515625, -0.3783416748046875, -0.34613037109375, -0.3139190673828125, -0.281707763671875, -0.2494964599609375, -0.21728515625, -0.1850738525390625, -0.152862548828125, -0.1206512451171875, -0.08843994140625, -0.0562286376953125, -0.024017333984375, 0.0081939697265625, 0.0404052734375, 0.0726165771484375, 0.104827880859375, 0.1370391845703125, 0.16925048828125, 0.2014617919921875, 0.233673095703125, 0.2658843994140625, 0.298095703125, 0.3303070068359375, 0.362518310546875, 0.3947296142578125, 0.42694091796875, 0.4591522216796875, 0.491363525390625, 0.5235748291015625, 0.5557861328125, 0.5879974365234375, 0.620208740234375, 0.6524200439453125, 0.68463134765625, 0.7168426513671875, 0.749053955078125, 0.7812652587890625, 0.8134765625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 5.0, 10.0, 7.0, 18.0, 19.0, 39.0, 70.0, 106.0, 183.0, 172.0, 137.0, 80.0, 50.0, 19.0, 10.0, 20.0, 10.0, 9.0, 10.0, 8.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84765625, -0.81524658203125, -0.7828369140625, -0.75042724609375, -0.718017578125, -0.68560791015625, -0.6531982421875, -0.62078857421875, -0.58837890625, -0.55596923828125, -0.5235595703125, -0.49114990234375, -0.458740234375, -0.42633056640625, -0.3939208984375, -0.36151123046875, -0.3291015625, -0.29669189453125, -0.2642822265625, -0.23187255859375, -0.199462890625, -0.16705322265625, -0.1346435546875, -0.10223388671875, -0.06982421875, -0.03741455078125, -0.0050048828125, 0.02740478515625, 0.059814453125, 0.09222412109375, 0.1246337890625, 0.15704345703125, 0.189453125, 0.22186279296875, 0.2542724609375, 0.28668212890625, 0.319091796875, 0.35150146484375, 0.3839111328125, 0.41632080078125, 0.44873046875, 0.48114013671875, 0.5135498046875, 0.54595947265625, 0.578369140625, 0.61077880859375, 0.6431884765625, 0.67559814453125, 0.7080078125, 0.74041748046875, 0.7728271484375, 0.80523681640625, 0.837646484375, 0.87005615234375, 0.9024658203125, 0.93487548828125, 0.96728515625, 0.99969482421875, 1.0321044921875, 1.06451416015625, 1.096923828125, 1.12933349609375, 1.1617431640625, 1.19415283203125, 1.2265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 9.0, 16.0, 25.0, 54.0, 96.0, 115.0, 139.0, 169.0, 137.0, 112.0, 70.0, 31.0, 21.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-28.753450393676758, -28.191926956176758, -27.63040542602539, -27.06888198852539, -26.50735855102539, -25.945837020874023, -25.384313583374023, -24.822790145874023, -24.261268615722656, -23.699745178222656, -23.13822364807129, -22.57670021057129, -22.01517677307129, -21.453655242919922, -20.892131805419922, -20.330608367919922, -19.769084930419922, -19.207561492919922, -18.646039962768555, -18.084516525268555, -17.522993087768555, -16.961471557617188, -16.399948120117188, -15.838425636291504, -15.27690315246582, -14.715380668640137, -14.153857231140137, -13.592334747314453, -13.03081226348877, -12.469289779663086, -11.907766342163086, -11.346243858337402, -10.784721374511719, -10.223198890686035, -9.661675453186035, -9.100152969360352, -8.538630485534668, -7.977107524871826, -7.415584564208984, -6.854062080383301, -6.292539119720459, -5.731016159057617, -5.169493675231934, -4.607970714569092, -4.04644775390625, -3.4849252700805664, -2.9234023094177246, -2.361879587173462, -1.8003568649291992, -1.2388341426849365, -0.6773113012313843, -0.11578845977783203, 0.44573426246643066, 1.0072569847106934, 1.5687799453735352, 2.130302667617798, 2.6918253898620605, 3.2533481121063232, 3.814870834350586, 4.376393795013428, 4.9379167556762695, 5.499439239501953, 6.060962200164795, 6.622485160827637, 7.18400764465332]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 8.0, 8.0, 9.0, 5.0, 11.0, 9.0, 14.0, 13.0, 15.0, 27.0, 30.0, 17.0, 33.0, 36.0, 33.0, 35.0, 29.0, 32.0, 44.0, 46.0, 42.0, 46.0, 44.0, 41.0, 40.0, 29.0, 51.0, 31.0, 28.0, 34.0, 30.0, 26.0, 12.0, 14.0, 30.0, 6.0, 12.0, 5.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.959728240966797, -5.770707607269287, -5.581686973571777, -5.392666339874268, -5.203645706176758, -5.014625072479248, -4.825604438781738, -4.6365838050842285, -4.447563171386719, -4.258542537689209, -4.069521903991699, -3.8805012702941895, -3.6914806365966797, -3.50246000289917, -3.31343936920166, -3.1244187355041504, -2.9353981018066406, -2.746377468109131, -2.557356834411621, -2.3683362007141113, -2.1793155670166016, -1.9902949333190918, -1.801274299621582, -1.6122536659240723, -1.4232330322265625, -1.2342123985290527, -1.045191764831543, -0.8561711311340332, -0.6671504974365234, -0.47812986373901367, -0.2891092300415039, -0.10008859634399414, 0.08893203735351562, 0.2779526710510254, 0.46697330474853516, 0.6559939384460449, 0.8450145721435547, 1.0340352058410645, 1.2230558395385742, 1.412076473236084, 1.6010971069335938, 1.7901177406311035, 1.9791383743286133, 2.168159008026123, 2.357179641723633, 2.5462002754211426, 2.7352209091186523, 2.924241542816162, 3.113262176513672, 3.3022828102111816, 3.4913034439086914, 3.680324077606201, 3.869344711303711, 4.058365345001221, 4.2473859786987305, 4.43640661239624, 4.62542724609375, 4.81444787979126, 5.0034685134887695, 5.192489147186279, 5.381509780883789, 5.570530414581299, 5.759551048278809, 5.948571681976318, 6.137592315673828]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 11.0, 24.0, 36.0, 54.0, 83.0, 177.0, 340.0, 579.0, 1228.0, 2761.0, 6489.0, 20546.0, 101028.0, 3738070.0, 270123.0, 35697.0, 9990.0, 3677.0, 1620.0, 813.0, 391.0, 211.0, 124.0, 92.0, 47.0, 23.0, 19.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4921875, -3.38201904296875, -3.2718505859375, -3.16168212890625, -3.051513671875, -2.94134521484375, -2.8311767578125, -2.72100830078125, -2.61083984375, -2.50067138671875, -2.3905029296875, -2.28033447265625, -2.170166015625, -2.05999755859375, -1.9498291015625, -1.83966064453125, -1.7294921875, -1.61932373046875, -1.5091552734375, -1.39898681640625, -1.288818359375, -1.17864990234375, -1.0684814453125, -0.95831298828125, -0.84814453125, -0.73797607421875, -0.6278076171875, -0.51763916015625, -0.407470703125, -0.29730224609375, -0.1871337890625, -0.07696533203125, 0.033203125, 0.14337158203125, 0.2535400390625, 0.36370849609375, 0.473876953125, 0.58404541015625, 0.6942138671875, 0.80438232421875, 0.91455078125, 1.02471923828125, 1.1348876953125, 1.24505615234375, 1.355224609375, 1.46539306640625, 1.5755615234375, 1.68572998046875, 1.7958984375, 1.90606689453125, 2.0162353515625, 2.12640380859375, 2.236572265625, 2.34674072265625, 2.4569091796875, 2.56707763671875, 2.67724609375, 2.78741455078125, 2.8975830078125, 3.00775146484375, 3.117919921875, 3.22808837890625, 3.3382568359375, 3.44842529296875, 3.55859375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 7.0, 5.0, 7.0, 12.0, 12.0, 19.0, 26.0, 24.0, 19.0, 35.0, 31.0, 27.0, 32.0, 39.0, 35.0, 45.0, 58.0, 37.0, 45.0, 53.0, 57.0, 51.0, 46.0, 42.0, 39.0, 33.0, 29.0, 22.0, 25.0, 19.0, 14.0, 11.0, 9.0, 9.0, 10.0, 10.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.343994140625, -0.3344917297363281, -0.32498931884765625, -0.3154869079589844, -0.3059844970703125, -0.2964820861816406, -0.28697967529296875, -0.2774772644042969, -0.267974853515625, -0.2584724426269531, -0.24897003173828125, -0.23946762084960938, -0.2299652099609375, -0.22046279907226562, -0.21096038818359375, -0.20145797729492188, -0.19195556640625, -0.18245315551757812, -0.17295074462890625, -0.16344833374023438, -0.1539459228515625, -0.14444351196289062, -0.13494110107421875, -0.12543869018554688, -0.115936279296875, -0.10643386840820312, -0.09693145751953125, -0.08742904663085938, -0.0779266357421875, -0.06842422485351562, -0.05892181396484375, -0.049419403076171875, -0.0399169921875, -0.030414581298828125, -0.02091217041015625, -0.011409759521484375, -0.0019073486328125, 0.007595062255859375, 0.01709747314453125, 0.026599884033203125, 0.036102294921875, 0.045604705810546875, 0.05510711669921875, 0.06460952758789062, 0.0741119384765625, 0.08361434936523438, 0.09311676025390625, 0.10261917114257812, 0.11212158203125, 0.12162399291992188, 0.13112640380859375, 0.14062881469726562, 0.1501312255859375, 0.15963363647460938, 0.16913604736328125, 0.17863845825195312, 0.188140869140625, 0.19764328002929688, 0.20714569091796875, 0.21664810180664062, 0.2261505126953125, 0.23565292358398438, 0.24515533447265625, 0.2546577453613281, 0.26416015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 7.0, 12.0, 16.0, 19.0, 23.0, 37.0, 56.0, 69.0, 83.0, 151.0, 199.0, 331.0, 609.0, 1062.0, 1861.0, 3544.0, 6819.0, 14313.0, 32458.0, 82920.0, 316917.0, 3289035.0, 302814.0, 80638.0, 31262.0, 14007.0, 6847.0, 3449.0, 1917.0, 1083.0, 634.0, 373.0, 236.0, 158.0, 79.0, 81.0, 48.0, 28.0, 24.0, 17.0, 9.0, 9.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.869140625, -1.809783935546875, -1.75042724609375, -1.691070556640625, -1.6317138671875, -1.572357177734375, -1.51300048828125, -1.453643798828125, -1.394287109375, -1.334930419921875, -1.27557373046875, -1.216217041015625, -1.1568603515625, -1.097503662109375, -1.03814697265625, -0.978790283203125, -0.91943359375, -0.860076904296875, -0.80072021484375, -0.741363525390625, -0.6820068359375, -0.622650146484375, -0.56329345703125, -0.503936767578125, -0.444580078125, -0.385223388671875, -0.32586669921875, -0.266510009765625, -0.2071533203125, -0.147796630859375, -0.08843994140625, -0.029083251953125, 0.0302734375, 0.089630126953125, 0.14898681640625, 0.208343505859375, 0.2677001953125, 0.327056884765625, 0.38641357421875, 0.445770263671875, 0.505126953125, 0.564483642578125, 0.62384033203125, 0.683197021484375, 0.7425537109375, 0.801910400390625, 0.86126708984375, 0.920623779296875, 0.97998046875, 1.039337158203125, 1.09869384765625, 1.158050537109375, 1.2174072265625, 1.276763916015625, 1.33612060546875, 1.395477294921875, 1.454833984375, 1.514190673828125, 1.57354736328125, 1.632904052734375, 1.6922607421875, 1.751617431640625, 1.81097412109375, 1.870330810546875, 1.9296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 6.0, 19.0, 16.0, 16.0, 38.0, 36.0, 65.0, 89.0, 132.0, 224.0, 678.0, 1986.0, 322.0, 146.0, 91.0, 52.0, 28.0, 30.0, 24.0, 12.0, 8.0, 11.0, 5.0, 7.0, 7.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6923828125, -0.6649169921875, -0.637451171875, -0.6099853515625, -0.58251953125, -0.5550537109375, -0.527587890625, -0.5001220703125, -0.47265625, -0.4451904296875, -0.417724609375, -0.3902587890625, -0.36279296875, -0.3353271484375, -0.307861328125, -0.2803955078125, -0.2529296875, -0.2254638671875, -0.197998046875, -0.1705322265625, -0.14306640625, -0.1156005859375, -0.088134765625, -0.0606689453125, -0.033203125, -0.0057373046875, 0.021728515625, 0.0491943359375, 0.07666015625, 0.1041259765625, 0.131591796875, 0.1590576171875, 0.1865234375, 0.2139892578125, 0.241455078125, 0.2689208984375, 0.29638671875, 0.3238525390625, 0.351318359375, 0.3787841796875, 0.40625, 0.4337158203125, 0.461181640625, 0.4886474609375, 0.51611328125, 0.5435791015625, 0.571044921875, 0.5985107421875, 0.6259765625, 0.6534423828125, 0.680908203125, 0.7083740234375, 0.73583984375, 0.7633056640625, 0.790771484375, 0.8182373046875, 0.845703125, 0.8731689453125, 0.900634765625, 0.9281005859375, 0.95556640625, 0.9830322265625, 1.010498046875, 1.0379638671875, 1.0654296875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 11.0, 47.0, 138.0, 301.0, 298.0, 143.0, 54.0, 12.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.898653030395508, -10.404745101928711, -9.910837173461914, -9.416929244995117, -8.92302131652832, -8.429113388061523, -7.935205936431885, -7.441298484802246, -6.947390556335449, -6.453482627868652, -5.9595746994018555, -5.465666770935059, -4.97175931930542, -4.477851390838623, -3.983943462371826, -3.4900357723236084, -2.9961276054382324, -2.5022196769714355, -2.0083119869232178, -1.514404058456421, -1.0204962491989136, -0.5265884399414062, -0.032680511474609375, 0.4612271785736084, 0.9551351070404053, 1.4490429162979126, 1.94295072555542, 2.436858654022217, 2.9307665824890137, 3.4246742725372314, 3.9185822010040283, 4.412489891052246, 4.906397819519043, 5.40030574798584, 5.894213676452637, 6.388121604919434, 6.882029056549072, 7.375936985015869, 7.869844913482666, 8.363752365112305, 8.857660293579102, 9.351568222045898, 9.845476150512695, 10.339384078979492, 10.833292007446289, 11.327199935913086, 11.821107864379883, 12.315014839172363, 12.808923721313477, 13.302831649780273, 13.79673957824707, 14.290647506713867, 14.784555435180664, 15.278463363647461, 15.772371292114258, 16.266279220581055, 16.76018524169922, 17.254093170166016, 17.748001098632812, 18.24190902709961, 18.735816955566406, 19.229724884033203, 19.7236328125, 20.217540740966797, 20.711448669433594]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 10.0, 7.0, 8.0, 14.0, 11.0, 14.0, 21.0, 31.0, 21.0, 22.0, 37.0, 42.0, 43.0, 41.0, 56.0, 49.0, 44.0, 63.0, 39.0, 56.0, 50.0, 39.0, 44.0, 47.0, 29.0, 31.0, 22.0, 27.0, 22.0, 14.0, 12.0, 7.0, 7.0, 7.0, 8.0, 2.0, 2.0, 0.0, 7.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.75396466255188, -2.663573741912842, -2.5731828212738037, -2.4827919006347656, -2.3924009799957275, -2.3020100593566895, -2.2116193771362305, -2.1212282180786133, -2.0308375358581543, -1.9404466152191162, -1.8500556945800781, -1.75966477394104, -1.669273853302002, -1.5788829326629639, -1.4884921312332153, -1.3981012105941772, -1.3077101707458496, -1.2173192501068115, -1.1269283294677734, -1.0365374088287354, -0.946146547794342, -0.855755627155304, -0.7653647661209106, -0.6749738454818726, -0.5845829248428345, -0.4941920042037964, -0.4038011133670807, -0.313410222530365, -0.2230193018913269, -0.13262838125228882, -0.04223752021789551, 0.04815340042114258, 0.13854455947875977, 0.22893546521663666, 0.31932637095451355, 0.40971726179122925, 0.5001081824302673, 0.5904991030693054, 0.6808899641036987, 0.7712808847427368, 0.8616718053817749, 0.952062726020813, 1.042453646659851, 1.1328444480895996, 1.2232353687286377, 1.3136262893676758, 1.4040172100067139, 1.494408130645752, 1.58479905128479, 1.6751899719238281, 1.7655808925628662, 1.8559718132019043, 1.9463627338409424, 2.0367536544799805, 2.1271443367004395, 2.2175354957580566, 2.3079261779785156, 2.3983170986175537, 2.488708019256592, 2.57909893989563, 2.669489860534668, 2.759880781173706, 2.850271701812744, 2.940662384033203, 3.0310535430908203]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 15.0, 11.0, 7.0, 16.0, 19.0, 28.0, 36.0, 52.0, 86.0, 128.0, 206.0, 292.0, 456.0, 703.0, 1111.0, 1858.0, 3100.0, 5299.0, 9341.0, 17311.0, 31690.0, 59031.0, 108830.0, 186555.0, 232705.0, 172814.0, 98263.0, 53408.0, 28457.0, 15676.0, 8808.0, 4855.0, 2761.0, 1656.0, 1027.0, 660.0, 456.0, 253.0, 165.0, 127.0, 93.0, 54.0, 34.0, 30.0, 19.0, 16.0, 6.0, 10.0, 9.0, 8.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3701171875, -1.326507568359375, -1.28289794921875, -1.239288330078125, -1.1956787109375, -1.152069091796875, -1.10845947265625, -1.064849853515625, -1.021240234375, -0.977630615234375, -0.93402099609375, -0.890411376953125, -0.8468017578125, -0.803192138671875, -0.75958251953125, -0.715972900390625, -0.67236328125, -0.628753662109375, -0.58514404296875, -0.541534423828125, -0.4979248046875, -0.454315185546875, -0.41070556640625, -0.367095947265625, -0.323486328125, -0.279876708984375, -0.23626708984375, -0.192657470703125, -0.1490478515625, -0.105438232421875, -0.06182861328125, -0.018218994140625, 0.025390625, 0.069000244140625, 0.11260986328125, 0.156219482421875, 0.1998291015625, 0.243438720703125, 0.28704833984375, 0.330657958984375, 0.374267578125, 0.417877197265625, 0.46148681640625, 0.505096435546875, 0.5487060546875, 0.592315673828125, 0.63592529296875, 0.679534912109375, 0.72314453125, 0.766754150390625, 0.81036376953125, 0.853973388671875, 0.8975830078125, 0.941192626953125, 0.98480224609375, 1.028411865234375, 1.072021484375, 1.115631103515625, 1.15924072265625, 1.202850341796875, 1.2464599609375, 1.290069580078125, 1.33367919921875, 1.377288818359375, 1.4208984375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 5.0, 6.0, 9.0, 7.0, 8.0, 13.0, 15.0, 16.0, 20.0, 26.0, 27.0, 23.0, 27.0, 31.0, 31.0, 34.0, 30.0, 45.0, 36.0, 45.0, 46.0, 53.0, 50.0, 40.0, 38.0, 36.0, 33.0, 28.0, 29.0, 29.0, 25.0, 28.0, 27.0, 12.0, 15.0, 16.0, 7.0, 5.0, 3.0, 4.0, 6.0, 7.0, 3.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.287841796875, -0.2790565490722656, -0.27027130126953125, -0.2614860534667969, -0.2527008056640625, -0.24391555786132812, -0.23513031005859375, -0.22634506225585938, -0.217559814453125, -0.20877456665039062, -0.19998931884765625, -0.19120407104492188, -0.1824188232421875, -0.17363357543945312, -0.16484832763671875, -0.15606307983398438, -0.14727783203125, -0.13849258422851562, -0.12970733642578125, -0.12092208862304688, -0.1121368408203125, -0.10335159301757812, -0.09456634521484375, -0.08578109741210938, -0.076995849609375, -0.06821060180664062, -0.05942535400390625, -0.050640106201171875, -0.0418548583984375, -0.033069610595703125, -0.02428436279296875, -0.015499114990234375, -0.0067138671875, 0.002071380615234375, 0.01085662841796875, 0.019641876220703125, 0.0284271240234375, 0.037212371826171875, 0.04599761962890625, 0.054782867431640625, 0.063568115234375, 0.07235336303710938, 0.08113861083984375, 0.08992385864257812, 0.0987091064453125, 0.10749435424804688, 0.11627960205078125, 0.12506484985351562, 0.13385009765625, 0.14263534545898438, 0.15142059326171875, 0.16020584106445312, 0.1689910888671875, 0.17777633666992188, 0.18656158447265625, 0.19534683227539062, 0.204132080078125, 0.21291732788085938, 0.22170257568359375, 0.23048782348632812, 0.2392730712890625, 0.24805831909179688, 0.25684356689453125, 0.2656288146972656, 0.2744140625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 9.0, 14.0, 14.0, 18.0, 42.0, 52.0, 62.0, 120.0, 190.0, 310.0, 481.0, 823.0, 1328.0, 2422.0, 4194.0, 7693.0, 14093.0, 27047.0, 50763.0, 96730.0, 173101.0, 244552.0, 191508.0, 108891.0, 58163.0, 30266.0, 15881.0, 8527.0, 4659.0, 2708.0, 1576.0, 872.0, 530.0, 349.0, 183.0, 149.0, 85.0, 54.0, 30.0, 32.0, 11.0, 11.0, 9.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.14453125, -1.1094207763671875, -1.074310302734375, -1.0391998291015625, -1.00408935546875, -0.9689788818359375, -0.933868408203125, -0.8987579345703125, -0.8636474609375, -0.8285369873046875, -0.793426513671875, -0.7583160400390625, -0.72320556640625, -0.6880950927734375, -0.652984619140625, -0.6178741455078125, -0.582763671875, -0.5476531982421875, -0.512542724609375, -0.4774322509765625, -0.44232177734375, -0.4072113037109375, -0.372100830078125, -0.3369903564453125, -0.3018798828125, -0.2667694091796875, -0.231658935546875, -0.1965484619140625, -0.16143798828125, -0.1263275146484375, -0.091217041015625, -0.0561065673828125, -0.02099609375, 0.0141143798828125, 0.049224853515625, 0.0843353271484375, 0.11944580078125, 0.1545562744140625, 0.189666748046875, 0.2247772216796875, 0.2598876953125, 0.2949981689453125, 0.330108642578125, 0.3652191162109375, 0.40032958984375, 0.4354400634765625, 0.470550537109375, 0.5056610107421875, 0.540771484375, 0.5758819580078125, 0.610992431640625, 0.6461029052734375, 0.68121337890625, 0.7163238525390625, 0.751434326171875, 0.7865447998046875, 0.8216552734375, 0.8567657470703125, 0.891876220703125, 0.9269866943359375, 0.96209716796875, 0.9972076416015625, 1.032318115234375, 1.0674285888671875, 1.1025390625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 5.0, 6.0, 15.0, 11.0, 13.0, 19.0, 18.0, 21.0, 17.0, 25.0, 31.0, 35.0, 37.0, 34.0, 39.0, 34.0, 35.0, 27.0, 42.0, 54.0, 55.0, 55.0, 40.0, 30.0, 28.0, 32.0, 37.0, 26.0, 20.0, 28.0, 18.0, 19.0, 19.0, 11.0, 6.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 4.0], "bins": [-1.6357421875, -1.5903778076171875, -1.545013427734375, -1.4996490478515625, -1.45428466796875, -1.4089202880859375, -1.363555908203125, -1.3181915283203125, -1.2728271484375, -1.2274627685546875, -1.182098388671875, -1.1367340087890625, -1.09136962890625, -1.0460052490234375, -1.000640869140625, -0.9552764892578125, -0.909912109375, -0.8645477294921875, -0.819183349609375, -0.7738189697265625, -0.72845458984375, -0.6830902099609375, -0.637725830078125, -0.5923614501953125, -0.5469970703125, -0.5016326904296875, -0.456268310546875, -0.4109039306640625, -0.36553955078125, -0.3201751708984375, -0.274810791015625, -0.2294464111328125, -0.18408203125, -0.1387176513671875, -0.093353271484375, -0.0479888916015625, -0.00262451171875, 0.0427398681640625, 0.088104248046875, 0.1334686279296875, 0.1788330078125, 0.2241973876953125, 0.269561767578125, 0.3149261474609375, 0.36029052734375, 0.4056549072265625, 0.451019287109375, 0.4963836669921875, 0.541748046875, 0.5871124267578125, 0.632476806640625, 0.6778411865234375, 0.72320556640625, 0.7685699462890625, 0.813934326171875, 0.8592987060546875, 0.9046630859375, 0.9500274658203125, 0.995391845703125, 1.0407562255859375, 1.08612060546875, 1.1314849853515625, 1.176849365234375, 1.2222137451171875, 1.267578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 6.0, 19.0, 16.0, 20.0, 29.0, 53.0, 86.0, 113.0, 201.0, 348.0, 562.0, 1018.0, 1961.0, 3956.0, 8663.0, 20669.0, 53097.0, 164585.0, 503917.0, 188867.0, 59384.0, 22287.0, 9476.0, 4326.0, 2187.0, 1108.0, 633.0, 400.0, 199.0, 130.0, 70.0, 49.0, 43.0, 23.0, 11.0, 11.0, 6.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2451171875, -1.2080078125, -1.1708984375, -1.1337890625, -1.0966796875, -1.0595703125, -1.0224609375, -0.9853515625, -0.9482421875, -0.9111328125, -0.8740234375, -0.8369140625, -0.7998046875, -0.7626953125, -0.7255859375, -0.6884765625, -0.6513671875, -0.6142578125, -0.5771484375, -0.5400390625, -0.5029296875, -0.4658203125, -0.4287109375, -0.3916015625, -0.3544921875, -0.3173828125, -0.2802734375, -0.2431640625, -0.2060546875, -0.1689453125, -0.1318359375, -0.0947265625, -0.0576171875, -0.0205078125, 0.0166015625, 0.0537109375, 0.0908203125, 0.1279296875, 0.1650390625, 0.2021484375, 0.2392578125, 0.2763671875, 0.3134765625, 0.3505859375, 0.3876953125, 0.4248046875, 0.4619140625, 0.4990234375, 0.5361328125, 0.5732421875, 0.6103515625, 0.6474609375, 0.6845703125, 0.7216796875, 0.7587890625, 0.7958984375, 0.8330078125, 0.8701171875, 0.9072265625, 0.9443359375, 0.9814453125, 1.0185546875, 1.0556640625, 1.0927734375, 1.1298828125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 8.0, 13.0, 15.0, 16.0, 23.0, 34.0, 39.0, 43.0, 47.0, 74.0, 103.0, 141.0, 107.0, 82.0, 55.0, 36.0, 30.0, 32.0, 14.0, 14.0, 15.0, 11.0, 3.0, 5.0, 5.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.00018930435180664062, -0.0001830998808145523, -0.000176895409822464, -0.00017069093883037567, -0.00016448646783828735, -0.00015828199684619904, -0.00015207752585411072, -0.0001458730548620224, -0.00013966858386993408, -0.00013346411287784576, -0.00012725964188575745, -0.00012105517089366913, -0.00011485069990158081, -0.00010864622890949249, -0.00010244175791740417, -9.623728692531586e-05, -9.003281593322754e-05, -8.382834494113922e-05, -7.76238739490509e-05, -7.141940295696259e-05, -6.521493196487427e-05, -5.901046097278595e-05, -5.280598998069763e-05, -4.6601518988609314e-05, -4.0397047996520996e-05, -3.419257700443268e-05, -2.798810601234436e-05, -2.1783635020256042e-05, -1.5579164028167725e-05, -9.374693036079407e-06, -3.170222043991089e-06, 3.034248948097229e-06, 9.238719940185547e-06, 1.5443190932273865e-05, 2.1647661924362183e-05, 2.78521329164505e-05, 3.405660390853882e-05, 4.0261074900627136e-05, 4.6465545892715454e-05, 5.267001688480377e-05, 5.887448787689209e-05, 6.507895886898041e-05, 7.128342986106873e-05, 7.748790085315704e-05, 8.369237184524536e-05, 8.989684283733368e-05, 9.6101313829422e-05, 0.00010230578482151031, 0.00010851025581359863, 0.00011471472680568695, 0.00012091919779777527, 0.00012712366878986359, 0.0001333281397819519, 0.00013953261077404022, 0.00014573708176612854, 0.00015194155275821686, 0.00015814602375030518, 0.0001643504947423935, 0.0001705549657344818, 0.00017675943672657013, 0.00018296390771865845, 0.00018916837871074677, 0.00019537284970283508, 0.0002015773206949234, 0.00020778179168701172]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 5.0, 9.0, 12.0, 13.0, 28.0, 26.0, 39.0, 69.0, 98.0, 136.0, 197.0, 262.0, 386.0, 556.0, 933.0, 1381.0, 2269.0, 3496.0, 6575.0, 12545.0, 27861.0, 73809.0, 260394.0, 457160.0, 120635.0, 41594.0, 17327.0, 8543.0, 4584.0, 2639.0, 1622.0, 1096.0, 712.0, 476.0, 317.0, 228.0, 162.0, 115.0, 77.0, 44.0, 39.0, 32.0, 12.0, 19.0, 9.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.224609375, -1.1853790283203125, -1.146148681640625, -1.1069183349609375, -1.06768798828125, -1.0284576416015625, -0.989227294921875, -0.9499969482421875, -0.9107666015625, -0.8715362548828125, -0.832305908203125, -0.7930755615234375, -0.75384521484375, -0.7146148681640625, -0.675384521484375, -0.6361541748046875, -0.596923828125, -0.5576934814453125, -0.518463134765625, -0.4792327880859375, -0.44000244140625, -0.4007720947265625, -0.361541748046875, -0.3223114013671875, -0.2830810546875, -0.2438507080078125, -0.204620361328125, -0.1653900146484375, -0.12615966796875, -0.0869293212890625, -0.047698974609375, -0.0084686279296875, 0.03076171875, 0.0699920654296875, 0.109222412109375, 0.1484527587890625, 0.18768310546875, 0.2269134521484375, 0.266143798828125, 0.3053741455078125, 0.3446044921875, 0.3838348388671875, 0.423065185546875, 0.4622955322265625, 0.50152587890625, 0.5407562255859375, 0.579986572265625, 0.6192169189453125, 0.658447265625, 0.6976776123046875, 0.736907958984375, 0.7761383056640625, 0.81536865234375, 0.8545989990234375, 0.893829345703125, 0.9330596923828125, 0.9722900390625, 1.0115203857421875, 1.050750732421875, 1.0899810791015625, 1.12921142578125, 1.1684417724609375, 1.207672119140625, 1.2469024658203125, 1.2861328125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 8.0, 10.0, 9.0, 11.0, 18.0, 13.0, 16.0, 23.0, 38.0, 25.0, 41.0, 64.0, 91.0, 109.0, 115.0, 89.0, 77.0, 43.0, 33.0, 37.0, 25.0, 16.0, 14.0, 10.0, 7.0, 5.0, 7.0, 12.0, 8.0, 1.0, 6.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3525390625, -1.312652587890625, -1.27276611328125, -1.232879638671875, -1.1929931640625, -1.153106689453125, -1.11322021484375, -1.073333740234375, -1.033447265625, -0.993560791015625, -0.95367431640625, -0.913787841796875, -0.8739013671875, -0.834014892578125, -0.79412841796875, -0.754241943359375, -0.71435546875, -0.674468994140625, -0.63458251953125, -0.594696044921875, -0.5548095703125, -0.514923095703125, -0.47503662109375, -0.435150146484375, -0.395263671875, -0.355377197265625, -0.31549072265625, -0.275604248046875, -0.2357177734375, -0.195831298828125, -0.15594482421875, -0.116058349609375, -0.076171875, -0.036285400390625, 0.00360107421875, 0.043487548828125, 0.0833740234375, 0.123260498046875, 0.16314697265625, 0.203033447265625, 0.242919921875, 0.282806396484375, 0.32269287109375, 0.362579345703125, 0.4024658203125, 0.442352294921875, 0.48223876953125, 0.522125244140625, 0.56201171875, 0.601898193359375, 0.64178466796875, 0.681671142578125, 0.7215576171875, 0.761444091796875, 0.80133056640625, 0.841217041015625, 0.881103515625, 0.920989990234375, 0.96087646484375, 1.000762939453125, 1.0406494140625, 1.080535888671875, 1.12042236328125, 1.160308837890625, 1.2001953125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 17.0, 38.0, 75.0, 128.0, 196.0, 190.0, 155.0, 93.0, 65.0, 23.0, 15.0, 9.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.437450408935547, -9.413684844970703, -8.389920234680176, -7.36615514755249, -6.342390060424805, -5.318624973297119, -4.294859886169434, -3.271094799041748, -2.2473297119140625, -1.223564624786377, -0.1997995376586914, 0.8239655494689941, 1.8477306365966797, 2.8714957237243652, 3.895260810852051, 4.919025897979736, 5.942790985107422, 6.966556072235107, 7.990321159362793, 9.01408576965332, 10.037851333618164, 11.061616897583008, 12.085381507873535, 13.109146118164062, 14.132911682128906, 15.15667724609375, 16.180442810058594, 17.204206466674805, 18.22797203063965, 19.251737594604492, 20.275501251220703, 21.299266815185547, 22.32303237915039, 23.346797943115234, 24.370563507080078, 25.39432716369629, 26.418092727661133, 27.441858291625977, 28.465621948242188, 29.48938751220703, 30.513153076171875, 31.53691864013672, 32.56068420410156, 33.584449768066406, 34.60821533203125, 35.63197708129883, 36.65574264526367, 37.679508209228516, 38.70327377319336, 39.7270393371582, 40.75080490112305, 41.77457046508789, 42.79833221435547, 43.82209777832031, 44.845863342285156, 45.86962890625, 46.893394470214844, 47.91716003417969, 48.94092559814453, 49.964691162109375, 50.98845672607422, 52.0122184753418, 53.03598403930664, 54.059749603271484, 55.08351516723633]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 8.0, 7.0, 9.0, 10.0, 12.0, 16.0, 20.0, 20.0, 25.0, 14.0, 24.0, 41.0, 23.0, 13.0, 46.0, 40.0, 41.0, 38.0, 47.0, 39.0, 48.0, 27.0, 37.0, 44.0, 34.0, 42.0, 35.0, 34.0, 27.0, 24.0, 21.0, 21.0, 15.0, 20.0, 7.0, 13.0, 8.0, 4.0, 9.0, 10.0, 3.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.209246635437012, -7.943666934967041, -7.67808723449707, -7.4125075340271, -7.146927833557129, -6.881348133087158, -6.6157684326171875, -6.350189208984375, -6.084609031677246, -5.819029331207275, -5.553449630737305, -5.287869930267334, -5.022290229797363, -4.756710529327393, -4.491130828857422, -4.225551605224609, -3.9599719047546387, -3.694392204284668, -3.4288125038146973, -3.1632328033447266, -2.897653102874756, -2.632073402404785, -2.3664939403533936, -2.100914239883423, -1.8353345394134521, -1.5697548389434814, -1.3041751384735107, -1.0385955572128296, -0.7730158567428589, -0.5074361562728882, -0.24185657501220703, 0.023723125457763672, 0.2893028259277344, 0.5548825263977051, 0.820462167263031, 1.086041808128357, 1.3516215085983276, 1.6172012090682983, 1.8827807903289795, 2.14836049079895, 2.413940191268921, 2.6795198917388916, 2.9450995922088623, 3.210679054260254, 3.4762587547302246, 3.7418384552001953, 4.007418155670166, 4.272997856140137, 4.538577556610107, 4.804157257080078, 5.069736957550049, 5.3353166580200195, 5.60089635848999, 5.866476058959961, 6.132055282592773, 6.397635459899902, 6.663214683532715, 6.9287943840026855, 7.194374084472656, 7.459953784942627, 7.725533485412598, 7.991113185882568, 8.256692886352539, 8.522272109985352, 8.78785228729248]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 6.0, 11.0, 7.0, 18.0, 21.0, 37.0, 34.0, 32.0, 64.0, 95.0, 103.0, 179.0, 252.0, 359.0, 576.0, 1043.0, 1886.0, 3800.0, 9242.0, 27234.0, 120351.0, 3044613.0, 869560.0, 80453.0, 20009.0, 7136.0, 3126.0, 1502.0, 918.0, 501.0, 332.0, 226.0, 154.0, 102.0, 75.0, 65.0, 44.0, 29.0, 16.0, 15.0, 17.0, 10.0, 7.0, 6.0, 6.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.505859375, -3.392333984375, -3.27880859375, -3.165283203125, -3.0517578125, -2.938232421875, -2.82470703125, -2.711181640625, -2.59765625, -2.484130859375, -2.37060546875, -2.257080078125, -2.1435546875, -2.030029296875, -1.91650390625, -1.802978515625, -1.689453125, -1.575927734375, -1.46240234375, -1.348876953125, -1.2353515625, -1.121826171875, -1.00830078125, -0.894775390625, -0.78125, -0.667724609375, -0.55419921875, -0.440673828125, -0.3271484375, -0.213623046875, -0.10009765625, 0.013427734375, 0.126953125, 0.240478515625, 0.35400390625, 0.467529296875, 0.5810546875, 0.694580078125, 0.80810546875, 0.921630859375, 1.03515625, 1.148681640625, 1.26220703125, 1.375732421875, 1.4892578125, 1.602783203125, 1.71630859375, 1.829833984375, 1.943359375, 2.056884765625, 2.17041015625, 2.283935546875, 2.3974609375, 2.510986328125, 2.62451171875, 2.738037109375, 2.8515625, 2.965087890625, 3.07861328125, 3.192138671875, 3.3056640625, 3.419189453125, 3.53271484375, 3.646240234375, 3.759765625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 11.0, 8.0, 13.0, 18.0, 21.0, 23.0, 33.0, 26.0, 40.0, 34.0, 60.0, 55.0, 43.0, 61.0, 49.0, 47.0, 53.0, 37.0, 50.0, 52.0, 30.0, 35.0, 33.0, 24.0, 24.0, 17.0, 17.0, 16.0, 14.0, 9.0, 10.0, 7.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341064453125, -0.32967376708984375, -0.3182830810546875, -0.30689239501953125, -0.295501708984375, -0.28411102294921875, -0.2727203369140625, -0.26132965087890625, -0.24993896484375, -0.23854827880859375, -0.2271575927734375, -0.21576690673828125, -0.204376220703125, -0.19298553466796875, -0.1815948486328125, -0.17020416259765625, -0.1588134765625, -0.14742279052734375, -0.1360321044921875, -0.12464141845703125, -0.113250732421875, -0.10186004638671875, -0.0904693603515625, -0.07907867431640625, -0.06768798828125, -0.05629730224609375, -0.0449066162109375, -0.03351593017578125, -0.022125244140625, -0.01073455810546875, 0.0006561279296875, 0.01204681396484375, 0.0234375, 0.03482818603515625, 0.0462188720703125, 0.05760955810546875, 0.069000244140625, 0.08039093017578125, 0.0917816162109375, 0.10317230224609375, 0.11456298828125, 0.12595367431640625, 0.1373443603515625, 0.14873504638671875, 0.160125732421875, 0.17151641845703125, 0.1829071044921875, 0.19429779052734375, 0.2056884765625, 0.21707916259765625, 0.2284698486328125, 0.23986053466796875, 0.251251220703125, 0.26264190673828125, 0.2740325927734375, 0.28542327880859375, 0.29681396484375, 0.30820465087890625, 0.3195953369140625, 0.33098602294921875, 0.342376708984375, 0.35376739501953125, 0.3651580810546875, 0.37654876708984375, 0.387939453125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 7.0, 14.0, 14.0, 29.0, 47.0, 92.0, 134.0, 228.0, 419.0, 715.0, 1407.0, 2789.0, 6476.0, 16590.0, 53358.0, 263125.0, 3166903.0, 556136.0, 85732.0, 23736.0, 8692.0, 3761.0, 1839.0, 914.0, 452.0, 298.0, 141.0, 101.0, 62.0, 26.0, 23.0, 13.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.73046875, -2.628082275390625, -2.52569580078125, -2.423309326171875, -2.3209228515625, -2.218536376953125, -2.11614990234375, -2.013763427734375, -1.911376953125, -1.808990478515625, -1.70660400390625, -1.604217529296875, -1.5018310546875, -1.399444580078125, -1.29705810546875, -1.194671630859375, -1.09228515625, -0.989898681640625, -0.88751220703125, -0.785125732421875, -0.6827392578125, -0.580352783203125, -0.47796630859375, -0.375579833984375, -0.273193359375, -0.170806884765625, -0.06842041015625, 0.033966064453125, 0.1363525390625, 0.238739013671875, 0.34112548828125, 0.443511962890625, 0.5458984375, 0.648284912109375, 0.75067138671875, 0.853057861328125, 0.9554443359375, 1.057830810546875, 1.16021728515625, 1.262603759765625, 1.364990234375, 1.467376708984375, 1.56976318359375, 1.672149658203125, 1.7745361328125, 1.876922607421875, 1.97930908203125, 2.081695556640625, 2.18408203125, 2.286468505859375, 2.38885498046875, 2.491241455078125, 2.5936279296875, 2.696014404296875, 2.79840087890625, 2.900787353515625, 3.003173828125, 3.105560302734375, 3.20794677734375, 3.310333251953125, 3.4127197265625, 3.515106201171875, 3.61749267578125, 3.719879150390625, 3.822265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 3.0, 10.0, 6.0, 12.0, 19.0, 23.0, 35.0, 56.0, 80.0, 153.0, 196.0, 406.0, 1400.0, 811.0, 358.0, 174.0, 92.0, 80.0, 38.0, 27.0, 23.0, 18.0, 17.0, 10.0, 5.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3984375, -1.348175048828125, -1.29791259765625, -1.247650146484375, -1.1973876953125, -1.147125244140625, -1.09686279296875, -1.046600341796875, -0.996337890625, -0.946075439453125, -0.89581298828125, -0.845550537109375, -0.7952880859375, -0.745025634765625, -0.69476318359375, -0.644500732421875, -0.59423828125, -0.543975830078125, -0.49371337890625, -0.443450927734375, -0.3931884765625, -0.342926025390625, -0.29266357421875, -0.242401123046875, -0.192138671875, -0.141876220703125, -0.09161376953125, -0.041351318359375, 0.0089111328125, 0.059173583984375, 0.10943603515625, 0.159698486328125, 0.2099609375, 0.260223388671875, 0.31048583984375, 0.360748291015625, 0.4110107421875, 0.461273193359375, 0.51153564453125, 0.561798095703125, 0.612060546875, 0.662322998046875, 0.71258544921875, 0.762847900390625, 0.8131103515625, 0.863372802734375, 0.91363525390625, 0.963897705078125, 1.01416015625, 1.064422607421875, 1.11468505859375, 1.164947509765625, 1.2152099609375, 1.265472412109375, 1.31573486328125, 1.365997314453125, 1.416259765625, 1.466522216796875, 1.51678466796875, 1.567047119140625, 1.6173095703125, 1.667572021484375, 1.71783447265625, 1.768096923828125, 1.818359375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 16.0, 26.0, 56.0, 114.0, 151.0, 221.0, 207.0, 129.0, 48.0, 24.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.397632598876953, -30.68122673034668, -29.964818954467773, -29.2484130859375, -28.532007217407227, -27.815601348876953, -27.099193572998047, -26.382787704467773, -25.6663818359375, -24.949975967407227, -24.23356819152832, -23.517162322998047, -22.800756454467773, -22.0843505859375, -21.367942810058594, -20.65153694152832, -19.935129165649414, -19.21872329711914, -18.502315521240234, -17.78590965270996, -17.069503784179688, -16.35309600830078, -15.636690139770508, -14.920284271240234, -14.203877449035645, -13.487470626831055, -12.771064758300781, -12.054657936096191, -11.338251113891602, -10.621845245361328, -9.905438423156738, -9.189031600952148, -8.472627639770508, -7.756221294403076, -7.0398149490356445, -6.323408126831055, -5.607001781463623, -4.890595436096191, -4.174188613891602, -3.45778226852417, -2.7413759231567383, -2.0249695777893066, -1.308562994003296, -0.5921564102172852, 0.12424993515014648, 0.8406562805175781, 1.557063102722168, 2.2734694480895996, 2.9898757934570312, 3.706282138824463, 4.4226884841918945, 5.139095306396484, 5.855501651763916, 6.571907997131348, 7.2883148193359375, 8.004720687866211, 8.7211275100708, 9.43753433227539, 10.153940200805664, 10.870347023010254, 11.586753845214844, 12.303159713745117, 13.019566535949707, 13.735973358154297, 14.45237922668457]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 7.0, 6.0, 7.0, 7.0, 5.0, 15.0, 21.0, 22.0, 31.0, 26.0, 28.0, 26.0, 38.0, 47.0, 47.0, 47.0, 48.0, 54.0, 62.0, 46.0, 38.0, 47.0, 45.0, 34.0, 45.0, 40.0, 27.0, 26.0, 22.0, 20.0, 12.0, 18.0, 7.0, 12.0, 6.0, 3.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.977465629577637, -6.752467155456543, -6.527468681335449, -6.3024702072143555, -6.077471733093262, -5.852473258972168, -5.627474784851074, -5.4024763107299805, -5.177477836608887, -4.952479362487793, -4.727480888366699, -4.5024824142456055, -4.277483940124512, -4.052485466003418, -3.8274872303009033, -3.6024887561798096, -3.377490520477295, -3.152492046356201, -2.9274935722351074, -2.7024950981140137, -2.47749662399292, -2.252498149871826, -2.0274999141693115, -1.8025014400482178, -1.577502965927124, -1.3525044918060303, -1.1275060176849365, -0.9025076627731323, -0.6775091886520386, -0.4525107145309448, -0.22751235961914062, -0.002513885498046875, 0.22248411178588867, 0.44748255610466003, 0.6724810004234314, 0.8974794149398804, 1.1224778890609741, 1.3474763631820679, 1.572474718093872, 1.7974731922149658, 2.0224716663360596, 2.2474701404571533, 2.472468614578247, 2.6974668502807617, 2.9224653244018555, 3.147463798522949, 3.372462272644043, 3.5974607467651367, 3.8224592208862305, 4.047457695007324, 4.272456169128418, 4.497454643249512, 4.7224531173706055, 4.947451591491699, 5.172450065612793, 5.397448539733887, 5.6224470138549805, 5.847445487976074, 6.072443962097168, 6.297442436218262, 6.5224409103393555, 6.747439384460449, 6.972437858581543, 7.197436332702637, 7.422434329986572]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 16.0, 17.0, 20.0, 38.0, 37.0, 91.0, 124.0, 218.0, 367.0, 625.0, 1107.0, 1923.0, 3486.0, 6353.0, 12029.0, 23025.0, 44556.0, 85773.0, 151268.0, 214547.0, 206973.0, 137234.0, 75509.0, 39108.0, 20207.0, 10667.0, 5928.0, 3078.0, 1769.0, 1035.0, 541.0, 360.0, 216.0, 120.0, 65.0, 38.0, 28.0, 17.0, 21.0, 8.0, 8.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.505859375, -1.44989013671875, -1.3939208984375, -1.33795166015625, -1.281982421875, -1.22601318359375, -1.1700439453125, -1.11407470703125, -1.05810546875, -1.00213623046875, -0.9461669921875, -0.89019775390625, -0.834228515625, -0.77825927734375, -0.7222900390625, -0.66632080078125, -0.6103515625, -0.55438232421875, -0.4984130859375, -0.44244384765625, -0.386474609375, -0.33050537109375, -0.2745361328125, -0.21856689453125, -0.16259765625, -0.10662841796875, -0.0506591796875, 0.00531005859375, 0.061279296875, 0.11724853515625, 0.1732177734375, 0.22918701171875, 0.28515625, 0.34112548828125, 0.3970947265625, 0.45306396484375, 0.509033203125, 0.56500244140625, 0.6209716796875, 0.67694091796875, 0.73291015625, 0.78887939453125, 0.8448486328125, 0.90081787109375, 0.956787109375, 1.01275634765625, 1.0687255859375, 1.12469482421875, 1.1806640625, 1.23663330078125, 1.2926025390625, 1.34857177734375, 1.404541015625, 1.46051025390625, 1.5164794921875, 1.57244873046875, 1.62841796875, 1.68438720703125, 1.7403564453125, 1.79632568359375, 1.852294921875, 1.90826416015625, 1.9642333984375, 2.02020263671875, 2.076171875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 10.0, 9.0, 7.0, 14.0, 15.0, 29.0, 27.0, 31.0, 31.0, 29.0, 36.0, 31.0, 36.0, 44.0, 42.0, 46.0, 58.0, 35.0, 45.0, 43.0, 33.0, 29.0, 37.0, 44.0, 27.0, 25.0, 24.0, 25.0, 21.0, 18.0, 22.0, 13.0, 14.0, 11.0, 12.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.463134765625, -0.44911956787109375, -0.4351043701171875, -0.42108917236328125, -0.407073974609375, -0.39305877685546875, -0.3790435791015625, -0.36502838134765625, -0.35101318359375, -0.33699798583984375, -0.3229827880859375, -0.30896759033203125, -0.294952392578125, -0.28093719482421875, -0.2669219970703125, -0.25290679931640625, -0.2388916015625, -0.22487640380859375, -0.2108612060546875, -0.19684600830078125, -0.182830810546875, -0.16881561279296875, -0.1548004150390625, -0.14078521728515625, -0.12677001953125, -0.11275482177734375, -0.0987396240234375, -0.08472442626953125, -0.070709228515625, -0.05669403076171875, -0.0426788330078125, -0.02866363525390625, -0.0146484375, -0.00063323974609375, 0.0133819580078125, 0.02739715576171875, 0.041412353515625, 0.05542755126953125, 0.0694427490234375, 0.08345794677734375, 0.09747314453125, 0.11148834228515625, 0.1255035400390625, 0.13951873779296875, 0.153533935546875, 0.16754913330078125, 0.1815643310546875, 0.19557952880859375, 0.2095947265625, 0.22360992431640625, 0.2376251220703125, 0.25164031982421875, 0.265655517578125, 0.27967071533203125, 0.2936859130859375, 0.30770111083984375, 0.32171630859375, 0.33573150634765625, 0.3497467041015625, 0.36376190185546875, 0.377777099609375, 0.39179229736328125, 0.4058074951171875, 0.41982269287109375, 0.433837890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 5.0, 2.0, 6.0, 20.0, 24.0, 26.0, 64.0, 99.0, 173.0, 309.0, 640.0, 1373.0, 2894.0, 6925.0, 17121.0, 45622.0, 127851.0, 307619.0, 319468.0, 137732.0, 48717.0, 18356.0, 7335.0, 3255.0, 1437.0, 673.0, 336.0, 208.0, 89.0, 63.0, 28.0, 22.0, 20.0, 12.0, 6.0, 7.0, 8.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-3.24609375, -3.158447265625, -3.07080078125, -2.983154296875, -2.8955078125, -2.807861328125, -2.72021484375, -2.632568359375, -2.544921875, -2.457275390625, -2.36962890625, -2.281982421875, -2.1943359375, -2.106689453125, -2.01904296875, -1.931396484375, -1.84375, -1.756103515625, -1.66845703125, -1.580810546875, -1.4931640625, -1.405517578125, -1.31787109375, -1.230224609375, -1.142578125, -1.054931640625, -0.96728515625, -0.879638671875, -0.7919921875, -0.704345703125, -0.61669921875, -0.529052734375, -0.44140625, -0.353759765625, -0.26611328125, -0.178466796875, -0.0908203125, -0.003173828125, 0.08447265625, 0.172119140625, 0.259765625, 0.347412109375, 0.43505859375, 0.522705078125, 0.6103515625, 0.697998046875, 0.78564453125, 0.873291015625, 0.9609375, 1.048583984375, 1.13623046875, 1.223876953125, 1.3115234375, 1.399169921875, 1.48681640625, 1.574462890625, 1.662109375, 1.749755859375, 1.83740234375, 1.925048828125, 2.0126953125, 2.100341796875, 2.18798828125, 2.275634765625, 2.36328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 9.0, 6.0, 5.0, 7.0, 7.0, 8.0, 12.0, 25.0, 11.0, 26.0, 18.0, 32.0, 42.0, 46.0, 37.0, 43.0, 50.0, 48.0, 37.0, 49.0, 49.0, 55.0, 54.0, 46.0, 36.0, 42.0, 30.0, 29.0, 28.0, 23.0, 27.0, 18.0, 10.0, 15.0, 8.0, 4.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.087890625, -2.987548828125, -2.88720703125, -2.786865234375, -2.6865234375, -2.586181640625, -2.48583984375, -2.385498046875, -2.28515625, -2.184814453125, -2.08447265625, -1.984130859375, -1.8837890625, -1.783447265625, -1.68310546875, -1.582763671875, -1.482421875, -1.382080078125, -1.28173828125, -1.181396484375, -1.0810546875, -0.980712890625, -0.88037109375, -0.780029296875, -0.6796875, -0.579345703125, -0.47900390625, -0.378662109375, -0.2783203125, -0.177978515625, -0.07763671875, 0.022705078125, 0.123046875, 0.223388671875, 0.32373046875, 0.424072265625, 0.5244140625, 0.624755859375, 0.72509765625, 0.825439453125, 0.92578125, 1.026123046875, 1.12646484375, 1.226806640625, 1.3271484375, 1.427490234375, 1.52783203125, 1.628173828125, 1.728515625, 1.828857421875, 1.92919921875, 2.029541015625, 2.1298828125, 2.230224609375, 2.33056640625, 2.430908203125, 2.53125, 2.631591796875, 2.73193359375, 2.832275390625, 2.9326171875, 3.032958984375, 3.13330078125, 3.233642578125, 3.333984375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 10.0, 8.0, 12.0, 24.0, 31.0, 47.0, 69.0, 114.0, 193.0, 266.0, 506.0, 959.0, 1839.0, 4068.0, 9321.0, 25825.0, 79521.0, 278755.0, 436963.0, 140783.0, 42559.0, 15129.0, 5977.0, 2598.0, 1315.0, 661.0, 375.0, 228.0, 143.0, 79.0, 59.0, 30.0, 23.0, 16.0, 15.0, 14.0, 10.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.068359375, -2.0061187744140625, -1.943878173828125, -1.8816375732421875, -1.81939697265625, -1.7571563720703125, -1.694915771484375, -1.6326751708984375, -1.5704345703125, -1.5081939697265625, -1.445953369140625, -1.3837127685546875, -1.32147216796875, -1.2592315673828125, -1.196990966796875, -1.1347503662109375, -1.072509765625, -1.0102691650390625, -0.948028564453125, -0.8857879638671875, -0.82354736328125, -0.7613067626953125, -0.699066162109375, -0.6368255615234375, -0.5745849609375, -0.5123443603515625, -0.450103759765625, -0.3878631591796875, -0.32562255859375, -0.2633819580078125, -0.201141357421875, -0.1389007568359375, -0.07666015625, -0.0144195556640625, 0.047821044921875, 0.1100616455078125, 0.17230224609375, 0.2345428466796875, 0.296783447265625, 0.3590240478515625, 0.4212646484375, 0.4835052490234375, 0.545745849609375, 0.6079864501953125, 0.67022705078125, 0.7324676513671875, 0.794708251953125, 0.8569488525390625, 0.919189453125, 0.9814300537109375, 1.043670654296875, 1.1059112548828125, 1.16815185546875, 1.2303924560546875, 1.292633056640625, 1.3548736572265625, 1.4171142578125, 1.4793548583984375, 1.541595458984375, 1.6038360595703125, 1.66607666015625, 1.7283172607421875, 1.790557861328125, 1.8527984619140625, 1.9150390625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 6.0, 9.0, 14.0, 11.0, 27.0, 42.0, 67.0, 80.0, 138.0, 115.0, 131.0, 118.0, 70.0, 60.0, 36.0, 28.0, 12.0, 12.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004096031188964844, -0.0003966912627220154, -0.0003837794065475464, -0.0003708675503730774, -0.0003579556941986084, -0.0003450438380241394, -0.0003321319818496704, -0.0003192201256752014, -0.0003063082695007324, -0.00029339641332626343, -0.00028048455715179443, -0.00026757270097732544, -0.00025466084480285645, -0.00024174898862838745, -0.00022883713245391846, -0.00021592527627944946, -0.00020301342010498047, -0.00019010156393051147, -0.00017718970775604248, -0.00016427785158157349, -0.0001513659954071045, -0.0001384541392326355, -0.0001255422830581665, -0.00011263042688369751, -9.971857070922852e-05, -8.680671453475952e-05, -7.389485836029053e-05, -6.098300218582153e-05, -4.807114601135254e-05, -3.5159289836883545e-05, -2.224743366241455e-05, -9.335577487945557e-06, 3.5762786865234375e-06, 1.648813486099243e-05, 2.9399991035461426e-05, 4.231184720993042e-05, 5.5223703384399414e-05, 6.813555955886841e-05, 8.10474157333374e-05, 9.39592719078064e-05, 0.00010687112808227539, 0.00011978298425674438, 0.00013269484043121338, 0.00014560669660568237, 0.00015851855278015137, 0.00017143040895462036, 0.00018434226512908936, 0.00019725412130355835, 0.00021016597747802734, 0.00022307783365249634, 0.00023598968982696533, 0.0002489015460014343, 0.0002618134021759033, 0.0002747252583503723, 0.0002876371145248413, 0.0003005489706993103, 0.0003134608268737793, 0.0003263726830482483, 0.0003392845392227173, 0.0003521963953971863, 0.0003651082515716553, 0.00037802010774612427, 0.00039093196392059326, 0.00040384382009506226, 0.00041675567626953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 8.0, 15.0, 21.0, 24.0, 44.0, 47.0, 75.0, 130.0, 206.0, 383.0, 680.0, 1192.0, 2518.0, 6024.0, 17227.0, 62198.0, 278503.0, 500194.0, 129521.0, 31985.0, 9849.0, 3870.0, 1725.0, 882.0, 464.0, 286.0, 149.0, 100.0, 59.0, 44.0, 50.0, 20.0, 15.0, 11.0, 5.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.517578125, -2.43951416015625, -2.3614501953125, -2.28338623046875, -2.205322265625, -2.12725830078125, -2.0491943359375, -1.97113037109375, -1.89306640625, -1.81500244140625, -1.7369384765625, -1.65887451171875, -1.580810546875, -1.50274658203125, -1.4246826171875, -1.34661865234375, -1.2685546875, -1.19049072265625, -1.1124267578125, -1.03436279296875, -0.956298828125, -0.87823486328125, -0.8001708984375, -0.72210693359375, -0.64404296875, -0.56597900390625, -0.4879150390625, -0.40985107421875, -0.331787109375, -0.25372314453125, -0.1756591796875, -0.09759521484375, -0.01953125, 0.05853271484375, 0.1365966796875, 0.21466064453125, 0.292724609375, 0.37078857421875, 0.4488525390625, 0.52691650390625, 0.60498046875, 0.68304443359375, 0.7611083984375, 0.83917236328125, 0.917236328125, 0.99530029296875, 1.0733642578125, 1.15142822265625, 1.2294921875, 1.30755615234375, 1.3856201171875, 1.46368408203125, 1.541748046875, 1.61981201171875, 1.6978759765625, 1.77593994140625, 1.85400390625, 1.93206787109375, 2.0101318359375, 2.08819580078125, 2.166259765625, 2.24432373046875, 2.3223876953125, 2.40045166015625, 2.478515625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 4.0, 5.0, 4.0, 10.0, 13.0, 20.0, 15.0, 34.0, 41.0, 40.0, 35.0, 62.0, 69.0, 66.0, 79.0, 80.0, 76.0, 68.0, 59.0, 37.0, 27.0, 29.0, 17.0, 16.0, 18.0, 16.0, 12.0, 9.0, 6.0, 4.0, 2.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.31640625, -2.2507781982421875, -2.185150146484375, -2.1195220947265625, -2.05389404296875, -1.9882659912109375, -1.922637939453125, -1.8570098876953125, -1.7913818359375, -1.7257537841796875, -1.660125732421875, -1.5944976806640625, -1.52886962890625, -1.4632415771484375, -1.397613525390625, -1.3319854736328125, -1.266357421875, -1.2007293701171875, -1.135101318359375, -1.0694732666015625, -1.00384521484375, -0.9382171630859375, -0.872589111328125, -0.8069610595703125, -0.7413330078125, -0.6757049560546875, -0.610076904296875, -0.5444488525390625, -0.47882080078125, -0.4131927490234375, -0.347564697265625, -0.2819366455078125, -0.21630859375, -0.1506805419921875, -0.085052490234375, -0.0194244384765625, 0.04620361328125, 0.1118316650390625, 0.177459716796875, 0.2430877685546875, 0.3087158203125, 0.3743438720703125, 0.439971923828125, 0.5055999755859375, 0.57122802734375, 0.6368560791015625, 0.702484130859375, 0.7681121826171875, 0.833740234375, 0.8993682861328125, 0.964996337890625, 1.0306243896484375, 1.09625244140625, 1.1618804931640625, 1.227508544921875, 1.2931365966796875, 1.3587646484375, 1.4243927001953125, 1.490020751953125, 1.5556488037109375, 1.62127685546875, 1.6869049072265625, 1.752532958984375, 1.8181610107421875, 1.8837890625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 10.0, 12.0, 28.0, 60.0, 106.0, 154.0, 176.0, 183.0, 130.0, 66.0, 42.0, 26.0, 8.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.78036880493164, -51.22138595581055, -49.66239929199219, -48.103416442871094, -46.54443359375, -44.985450744628906, -43.42646408081055, -41.86748123168945, -40.308494567871094, -38.74951171875, -37.19052505493164, -35.63154220581055, -34.07255935668945, -32.513572692871094, -30.95458984375, -29.395606994628906, -27.836624145507812, -26.277639389038086, -24.718656539916992, -23.159671783447266, -21.600688934326172, -20.041704177856445, -18.48271942138672, -16.923736572265625, -15.364751815795898, -13.805768013000488, -12.246784210205078, -10.687799453735352, -9.128815650939941, -7.569831848144531, -6.010847091674805, -4.4518632888793945, -2.8928794860839844, -1.3338954448699951, 0.22508859634399414, 1.7840728759765625, 3.3430566787719727, 4.902040481567383, 6.461025238037109, 8.02000904083252, 9.57899284362793, 11.13797664642334, 12.69696044921875, 14.255945205688477, 15.814929008483887, 17.373912811279297, 18.932897567749023, 20.49188232421875, 22.050865173339844, 23.60984992980957, 25.168832778930664, 26.72781753540039, 28.286800384521484, 29.84578514099121, 31.404769897460938, 32.96375274658203, 34.522735595703125, 36.08171844482422, 37.64070510864258, 39.19968795776367, 40.758670806884766, 42.317657470703125, 43.87664031982422, 45.43562316894531, 46.99460983276367]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 7.0, 5.0, 8.0, 10.0, 8.0, 18.0, 15.0, 15.0, 19.0, 30.0, 33.0, 34.0, 50.0, 34.0, 50.0, 40.0, 49.0, 39.0, 47.0, 56.0, 45.0, 43.0, 46.0, 37.0, 38.0, 32.0, 36.0, 26.0, 16.0, 16.0, 22.0, 12.0, 12.0, 12.0, 5.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.704089164733887, -15.125262260437012, -14.54643440246582, -13.967607498168945, -13.388779640197754, -12.809952735900879, -12.231124877929688, -11.652297973632812, -11.073471069335938, -10.494644165039062, -9.915816307067871, -9.336989402770996, -8.758161544799805, -8.17933464050293, -7.6005072593688965, -7.021679878234863, -6.442852020263672, -5.864024639129639, -5.2851972579956055, -4.7063703536987305, -4.127542495727539, -3.548715353012085, -2.969888210296631, -2.3910608291625977, -1.8122334480285645, -1.2334060668945312, -0.6545788049697876, -0.07575154304504395, 0.5030758380889893, 1.0819032192230225, 1.6607303619384766, 2.2395577430725098, 2.8183841705322266, 3.3972115516662598, 3.976038932800293, 4.554865837097168, 5.133693695068359, 5.712520599365234, 6.291347980499268, 6.870175361633301, 7.449002742767334, 8.027830123901367, 8.606657028198242, 9.185484886169434, 9.764311790466309, 10.3431396484375, 10.921966552734375, 11.50079345703125, 12.079621315002441, 12.658448219299316, 13.237276077270508, 13.816102981567383, 14.394930839538574, 14.97375774383545, 15.55258560180664, 16.131412506103516, 16.71023941040039, 17.289066314697266, 17.86789321899414, 18.44672203063965, 19.025548934936523, 19.6043758392334, 20.183202743530273, 20.76203155517578, 21.340858459472656]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 8.0, 7.0, 10.0, 20.0, 15.0, 35.0, 36.0, 78.0, 124.0, 194.0, 306.0, 561.0, 1298.0, 3555.0, 11944.0, 108054.0, 4029156.0, 28693.0, 6079.0, 2039.0, 915.0, 442.0, 234.0, 153.0, 100.0, 73.0, 34.0, 24.0, 24.0, 18.0, 11.0, 12.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.65625, -5.44866943359375, -5.2410888671875, -5.03350830078125, -4.825927734375, -4.61834716796875, -4.4107666015625, -4.20318603515625, -3.99560546875, -3.78802490234375, -3.5804443359375, -3.37286376953125, -3.165283203125, -2.95770263671875, -2.7501220703125, -2.54254150390625, -2.3349609375, -2.12738037109375, -1.9197998046875, -1.71221923828125, -1.504638671875, -1.29705810546875, -1.0894775390625, -0.88189697265625, -0.67431640625, -0.46673583984375, -0.2591552734375, -0.05157470703125, 0.156005859375, 0.36358642578125, 0.5711669921875, 0.77874755859375, 0.986328125, 1.19390869140625, 1.4014892578125, 1.60906982421875, 1.816650390625, 2.02423095703125, 2.2318115234375, 2.43939208984375, 2.64697265625, 2.85455322265625, 3.0621337890625, 3.26971435546875, 3.477294921875, 3.68487548828125, 3.8924560546875, 4.10003662109375, 4.3076171875, 4.51519775390625, 4.7227783203125, 4.93035888671875, 5.137939453125, 5.34552001953125, 5.5531005859375, 5.76068115234375, 5.96826171875, 6.17584228515625, 6.3834228515625, 6.59100341796875, 6.798583984375, 7.00616455078125, 7.2137451171875, 7.42132568359375, 7.62890625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 3.0, 10.0, 6.0, 13.0, 16.0, 11.0, 13.0, 14.0, 33.0, 34.0, 56.0, 56.0, 59.0, 59.0, 64.0, 61.0, 72.0, 65.0, 58.0, 42.0, 46.0, 33.0, 33.0, 29.0, 27.0, 21.0, 14.0, 7.0, 13.0, 7.0, 4.0, 10.0, 5.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81640625, -0.790069580078125, -0.76373291015625, -0.737396240234375, -0.7110595703125, -0.684722900390625, -0.65838623046875, -0.632049560546875, -0.605712890625, -0.579376220703125, -0.55303955078125, -0.526702880859375, -0.5003662109375, -0.474029541015625, -0.44769287109375, -0.421356201171875, -0.39501953125, -0.368682861328125, -0.34234619140625, -0.316009521484375, -0.2896728515625, -0.263336181640625, -0.23699951171875, -0.210662841796875, -0.184326171875, -0.157989501953125, -0.13165283203125, -0.105316162109375, -0.0789794921875, -0.052642822265625, -0.02630615234375, 3.0517578125e-05, 0.0263671875, 0.052703857421875, 0.07904052734375, 0.105377197265625, 0.1317138671875, 0.158050537109375, 0.18438720703125, 0.210723876953125, 0.237060546875, 0.263397216796875, 0.28973388671875, 0.316070556640625, 0.3424072265625, 0.368743896484375, 0.39508056640625, 0.421417236328125, 0.44775390625, 0.474090576171875, 0.50042724609375, 0.526763916015625, 0.5531005859375, 0.579437255859375, 0.60577392578125, 0.632110595703125, 0.658447265625, 0.684783935546875, 0.71112060546875, 0.737457275390625, 0.7637939453125, 0.790130615234375, 0.81646728515625, 0.842803955078125, 0.869140625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 9.0, 5.0, 12.0, 16.0, 26.0, 37.0, 51.0, 54.0, 84.0, 116.0, 152.0, 222.0, 315.0, 479.0, 746.0, 1205.0, 1989.0, 3558.0, 7333.0, 18410.0, 68337.0, 3814283.0, 218033.0, 34663.0, 11810.0, 5176.0, 2741.0, 1516.0, 942.0, 618.0, 409.0, 291.0, 182.0, 145.0, 79.0, 68.0, 49.0, 39.0, 32.0, 13.0, 15.0, 10.0, 7.0, 5.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.31640625, -3.1925048828125, -3.068603515625, -2.9447021484375, -2.82080078125, -2.6968994140625, -2.572998046875, -2.4490966796875, -2.3251953125, -2.2012939453125, -2.077392578125, -1.9534912109375, -1.82958984375, -1.7056884765625, -1.581787109375, -1.4578857421875, -1.333984375, -1.2100830078125, -1.086181640625, -0.9622802734375, -0.83837890625, -0.7144775390625, -0.590576171875, -0.4666748046875, -0.3427734375, -0.2188720703125, -0.094970703125, 0.0289306640625, 0.15283203125, 0.2767333984375, 0.400634765625, 0.5245361328125, 0.6484375, 0.7723388671875, 0.896240234375, 1.0201416015625, 1.14404296875, 1.2679443359375, 1.391845703125, 1.5157470703125, 1.6396484375, 1.7635498046875, 1.887451171875, 2.0113525390625, 2.13525390625, 2.2591552734375, 2.383056640625, 2.5069580078125, 2.630859375, 2.7547607421875, 2.878662109375, 3.0025634765625, 3.12646484375, 3.2503662109375, 3.374267578125, 3.4981689453125, 3.6220703125, 3.7459716796875, 3.869873046875, 3.9937744140625, 4.11767578125, 4.2415771484375, 4.365478515625, 4.4893798828125, 4.61328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 9.0, 5.0, 13.0, 25.0, 27.0, 45.0, 111.0, 434.0, 3103.0, 123.0, 48.0, 47.0, 25.0, 15.0, 13.0, 4.0, 4.0, 2.0, 4.0, 2.0, 7.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0654296875, -1.0341720581054688, -1.0029144287109375, -0.9716567993164062, -0.940399169921875, -0.9091415405273438, -0.8778839111328125, -0.8466262817382812, -0.81536865234375, -0.7841110229492188, -0.7528533935546875, -0.7215957641601562, -0.690338134765625, -0.6590805053710938, -0.6278228759765625, -0.5965652465820312, -0.5653076171875, -0.5340499877929688, -0.5027923583984375, -0.47153472900390625, -0.440277099609375, -0.40901947021484375, -0.3777618408203125, -0.34650421142578125, -0.31524658203125, -0.28398895263671875, -0.2527313232421875, -0.22147369384765625, -0.190216064453125, -0.15895843505859375, -0.1277008056640625, -0.09644317626953125, -0.065185546875, -0.03392791748046875, -0.0026702880859375, 0.02858734130859375, 0.059844970703125, 0.09110260009765625, 0.1223602294921875, 0.15361785888671875, 0.18487548828125, 0.21613311767578125, 0.2473907470703125, 0.27864837646484375, 0.309906005859375, 0.34116363525390625, 0.3724212646484375, 0.40367889404296875, 0.4349365234375, 0.46619415283203125, 0.4974517822265625, 0.5287094116210938, 0.559967041015625, 0.5912246704101562, 0.6224822998046875, 0.6537399291992188, 0.68499755859375, 0.7162551879882812, 0.7475128173828125, 0.7787704467773438, 0.810028076171875, 0.8412857055664062, 0.8725433349609375, 0.9038009643554688, 0.93505859375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 12.0, 16.0, 23.0, 45.0, 61.0, 72.0, 107.0, 119.0, 100.0, 106.0, 102.0, 70.0, 51.0, 39.0, 28.0, 16.0, 13.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.894130229949951, -3.7724692821502686, -3.650808095932007, -3.529147148132324, -3.4074859619140625, -3.28582501411438, -3.1641640663146973, -3.0425028800964355, -2.920841693878174, -2.799180746078491, -2.6775195598602295, -2.555858612060547, -2.434197425842285, -2.3125364780426025, -2.19087553024292, -2.069214344024658, -1.9475533962249756, -1.8258923292160034, -1.7042312622070312, -1.5825703144073486, -1.460909128189087, -1.3392481803894043, -1.2175871133804321, -1.09592604637146, -0.9742649793624878, -0.8526039123535156, -0.7309428453445435, -0.6092818379402161, -0.4876207709312439, -0.36595970392227173, -0.24429869651794434, -0.12263762950897217, -0.0009763240814208984, 0.12068472802639008, 0.24234578013420105, 0.36400681734085083, 0.485667884349823, 0.6073289513587952, 0.7289899587631226, 0.8506510257720947, 0.9723120927810669, 1.093973159790039, 1.2156342267990112, 1.3372952938079834, 1.458956241607666, 1.5806174278259277, 1.7022783756256104, 1.8239394426345825, 1.9456005096435547, 2.0672614574432373, 2.188922643661499, 2.3105835914611816, 2.4322447776794434, 2.553905725479126, 2.6755666732788086, 2.7972278594970703, 2.918889045715332, 3.0405499935150146, 3.1622111797332764, 3.283872127532959, 3.4055333137512207, 3.5271942615509033, 3.648855209350586, 3.7705163955688477, 3.8921773433685303]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 6.0, 7.0, 10.0, 8.0, 10.0, 30.0, 14.0, 19.0, 27.0, 22.0, 39.0, 33.0, 28.0, 36.0, 39.0, 30.0, 46.0, 34.0, 44.0, 39.0, 33.0, 43.0, 41.0, 39.0, 30.0, 39.0, 28.0, 31.0, 34.0, 19.0, 26.0, 15.0, 10.0, 17.0, 15.0, 8.0, 5.0, 10.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.7558159828186035, -1.7032572031021118, -1.6506985425949097, -1.598139762878418, -1.5455811023712158, -1.4930223226547241, -1.4404635429382324, -1.3879048824310303, -1.3353462219238281, -1.2827874422073364, -1.2302287817001343, -1.1776700019836426, -1.1251113414764404, -1.0725525617599487, -1.019993782043457, -0.9674351215362549, -0.9148763418197632, -0.8623176217079163, -0.8097589015960693, -0.7572001218795776, -0.7046414613723755, -0.6520826816558838, -0.5995239615440369, -0.5469652414321899, -0.494406521320343, -0.4418478012084961, -0.38928908109664917, -0.33673033118247986, -0.28417161107063293, -0.231612890958786, -0.1790541410446167, -0.12649542093276978, -0.0739368200302124, -0.02137809246778488, 0.03118063509464264, 0.08373937010765076, 0.13629809021949768, 0.1888568103313446, 0.24141556024551392, 0.29397428035736084, 0.34653300046920776, 0.3990917205810547, 0.4516504406929016, 0.5042091608047485, 0.5567679405212402, 0.6093266010284424, 0.6618853807449341, 0.714444100856781, 0.7670028209686279, 0.8195615410804749, 0.8721202611923218, 0.9246790409088135, 0.9772377014160156, 1.0297964811325073, 1.082355260848999, 1.1349139213562012, 1.1874725818634033, 1.240031361579895, 1.2925900220870972, 1.3451488018035889, 1.397707462310791, 1.4502662420272827, 1.5028250217437744, 1.5553836822509766, 1.6079424619674683]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 8.0, 6.0, 11.0, 21.0, 30.0, 44.0, 59.0, 79.0, 170.0, 231.0, 434.0, 727.0, 1244.0, 2477.0, 4764.0, 9683.0, 20640.0, 44440.0, 94012.0, 176927.0, 249534.0, 211599.0, 120380.0, 58584.0, 26827.0, 12682.0, 6034.0, 3022.0, 1717.0, 884.0, 487.0, 277.0, 172.0, 113.0, 77.0, 46.0, 27.0, 31.0, 18.0, 7.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-2.376953125, -2.310333251953125, -2.24371337890625, -2.177093505859375, -2.1104736328125, -2.043853759765625, -1.97723388671875, -1.910614013671875, -1.843994140625, -1.777374267578125, -1.71075439453125, -1.644134521484375, -1.5775146484375, -1.510894775390625, -1.44427490234375, -1.377655029296875, -1.31103515625, -1.244415283203125, -1.17779541015625, -1.111175537109375, -1.0445556640625, -0.977935791015625, -0.91131591796875, -0.844696044921875, -0.778076171875, -0.711456298828125, -0.64483642578125, -0.578216552734375, -0.5115966796875, -0.444976806640625, -0.37835693359375, -0.311737060546875, -0.2451171875, -0.178497314453125, -0.11187744140625, -0.045257568359375, 0.0213623046875, 0.087982177734375, 0.15460205078125, 0.221221923828125, 0.287841796875, 0.354461669921875, 0.42108154296875, 0.487701416015625, 0.5543212890625, 0.620941162109375, 0.68756103515625, 0.754180908203125, 0.82080078125, 0.887420654296875, 0.95404052734375, 1.020660400390625, 1.0872802734375, 1.153900146484375, 1.22052001953125, 1.287139892578125, 1.353759765625, 1.420379638671875, 1.48699951171875, 1.553619384765625, 1.6202392578125, 1.686859130859375, 1.75347900390625, 1.820098876953125, 1.88671875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 6.0, 11.0, 18.0, 15.0, 14.0, 17.0, 16.0, 28.0, 51.0, 40.0, 55.0, 63.0, 61.0, 62.0, 87.0, 64.0, 41.0, 69.0, 35.0, 43.0, 39.0, 33.0, 28.0, 24.0, 19.0, 13.0, 10.0, 12.0, 6.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71484375, -0.6880035400390625, -0.661163330078125, -0.6343231201171875, -0.60748291015625, -0.5806427001953125, -0.553802490234375, -0.5269622802734375, -0.5001220703125, -0.4732818603515625, -0.446441650390625, -0.4196014404296875, -0.39276123046875, -0.3659210205078125, -0.339080810546875, -0.3122406005859375, -0.285400390625, -0.2585601806640625, -0.231719970703125, -0.2048797607421875, -0.17803955078125, -0.1511993408203125, -0.124359130859375, -0.0975189208984375, -0.0706787109375, -0.0438385009765625, -0.016998291015625, 0.0098419189453125, 0.03668212890625, 0.0635223388671875, 0.090362548828125, 0.1172027587890625, 0.14404296875, 0.1708831787109375, 0.197723388671875, 0.2245635986328125, 0.25140380859375, 0.2782440185546875, 0.305084228515625, 0.3319244384765625, 0.3587646484375, 0.3856048583984375, 0.412445068359375, 0.4392852783203125, 0.46612548828125, 0.4929656982421875, 0.519805908203125, 0.5466461181640625, 0.573486328125, 0.6003265380859375, 0.627166748046875, 0.6540069580078125, 0.68084716796875, 0.7076873779296875, 0.734527587890625, 0.7613677978515625, 0.7882080078125, 0.8150482177734375, 0.841888427734375, 0.8687286376953125, 0.89556884765625, 0.9224090576171875, 0.949249267578125, 0.9760894775390625, 1.0029296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 5.0, 5.0, 6.0, 13.0, 7.0, 28.0, 51.0, 85.0, 141.0, 314.0, 658.0, 1579.0, 4688.0, 16133.0, 61923.0, 246363.0, 484694.0, 172202.0, 42542.0, 11330.0, 3465.0, 1234.0, 545.0, 262.0, 126.0, 67.0, 44.0, 21.0, 11.0, 10.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.57421875, -3.46026611328125, -3.3463134765625, -3.23236083984375, -3.118408203125, -3.00445556640625, -2.8905029296875, -2.77655029296875, -2.66259765625, -2.54864501953125, -2.4346923828125, -2.32073974609375, -2.206787109375, -2.09283447265625, -1.9788818359375, -1.86492919921875, -1.7509765625, -1.63702392578125, -1.5230712890625, -1.40911865234375, -1.295166015625, -1.18121337890625, -1.0672607421875, -0.95330810546875, -0.83935546875, -0.72540283203125, -0.6114501953125, -0.49749755859375, -0.383544921875, -0.26959228515625, -0.1556396484375, -0.04168701171875, 0.072265625, 0.18621826171875, 0.3001708984375, 0.41412353515625, 0.528076171875, 0.64202880859375, 0.7559814453125, 0.86993408203125, 0.98388671875, 1.09783935546875, 1.2117919921875, 1.32574462890625, 1.439697265625, 1.55364990234375, 1.6676025390625, 1.78155517578125, 1.8955078125, 2.00946044921875, 2.1234130859375, 2.23736572265625, 2.351318359375, 2.46527099609375, 2.5792236328125, 2.69317626953125, 2.80712890625, 2.92108154296875, 3.0350341796875, 3.14898681640625, 3.262939453125, 3.37689208984375, 3.4908447265625, 3.60479736328125, 3.71875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 11.0, 13.0, 15.0, 15.0, 27.0, 34.0, 34.0, 36.0, 43.0, 49.0, 48.0, 59.0, 65.0, 71.0, 62.0, 66.0, 59.0, 60.0, 38.0, 45.0, 25.0, 27.0, 27.0, 18.0, 9.0, 15.0, 8.0, 10.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.65582275390625, -4.4874267578125, -4.31903076171875, -4.150634765625, -3.98223876953125, -3.8138427734375, -3.64544677734375, -3.47705078125, -3.30865478515625, -3.1402587890625, -2.97186279296875, -2.803466796875, -2.63507080078125, -2.4666748046875, -2.29827880859375, -2.1298828125, -1.96148681640625, -1.7930908203125, -1.62469482421875, -1.456298828125, -1.28790283203125, -1.1195068359375, -0.95111083984375, -0.78271484375, -0.61431884765625, -0.4459228515625, -0.27752685546875, -0.109130859375, 0.05926513671875, 0.2276611328125, 0.39605712890625, 0.564453125, 0.73284912109375, 0.9012451171875, 1.06964111328125, 1.238037109375, 1.40643310546875, 1.5748291015625, 1.74322509765625, 1.91162109375, 2.08001708984375, 2.2484130859375, 2.41680908203125, 2.585205078125, 2.75360107421875, 2.9219970703125, 3.09039306640625, 3.2587890625, 3.42718505859375, 3.5955810546875, 3.76397705078125, 3.932373046875, 4.10076904296875, 4.2691650390625, 4.43756103515625, 4.60595703125, 4.77435302734375, 4.9427490234375, 5.11114501953125, 5.279541015625, 5.44793701171875, 5.6163330078125, 5.78472900390625, 5.953125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 5.0, 11.0, 8.0, 18.0, 21.0, 39.0, 61.0, 72.0, 137.0, 207.0, 363.0, 669.0, 1226.0, 2342.0, 4859.0, 11715.0, 30694.0, 95218.0, 345323.0, 390755.0, 107428.0, 33928.0, 12590.0, 5361.0, 2493.0, 1316.0, 667.0, 355.0, 237.0, 146.0, 77.0, 67.0, 35.0, 28.0, 21.0, 8.0, 13.0, 10.0, 3.0, 3.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.6865234375, -1.6284637451171875, -1.570404052734375, -1.5123443603515625, -1.45428466796875, -1.3962249755859375, -1.338165283203125, -1.2801055908203125, -1.2220458984375, -1.1639862060546875, -1.105926513671875, -1.0478668212890625, -0.98980712890625, -0.9317474365234375, -0.873687744140625, -0.8156280517578125, -0.757568359375, -0.6995086669921875, -0.641448974609375, -0.5833892822265625, -0.52532958984375, -0.4672698974609375, -0.409210205078125, -0.3511505126953125, -0.2930908203125, -0.2350311279296875, -0.176971435546875, -0.1189117431640625, -0.06085205078125, -0.0027923583984375, 0.055267333984375, 0.1133270263671875, 0.17138671875, 0.2294464111328125, 0.287506103515625, 0.3455657958984375, 0.40362548828125, 0.4616851806640625, 0.519744873046875, 0.5778045654296875, 0.6358642578125, 0.6939239501953125, 0.751983642578125, 0.8100433349609375, 0.86810302734375, 0.9261627197265625, 0.984222412109375, 1.0422821044921875, 1.100341796875, 1.1584014892578125, 1.216461181640625, 1.2745208740234375, 1.33258056640625, 1.3906402587890625, 1.448699951171875, 1.5067596435546875, 1.5648193359375, 1.6228790283203125, 1.680938720703125, 1.7389984130859375, 1.79705810546875, 1.8551177978515625, 1.913177490234375, 1.9712371826171875, 2.029296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 2.0, 5.0, 3.0, 10.0, 9.0, 8.0, 26.0, 18.0, 36.0, 29.0, 37.0, 48.0, 45.0, 60.0, 62.0, 72.0, 61.0, 62.0, 67.0, 70.0, 59.0, 40.0, 32.0, 32.0, 21.0, 14.0, 17.0, 11.0, 9.0, 5.0, 5.0, 9.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018978118896484375, -0.00018225610256195068, -0.00017473101615905762, -0.00016720592975616455, -0.00015968084335327148, -0.00015215575695037842, -0.00014463067054748535, -0.00013710558414459229, -0.00012958049774169922, -0.00012205541133880615, -0.00011453032493591309, -0.00010700523853302002, -9.948015213012695e-05, -9.195506572723389e-05, -8.442997932434082e-05, -7.690489292144775e-05, -6.937980651855469e-05, -6.185472011566162e-05, -5.4329633712768555e-05, -4.680454730987549e-05, -3.927946090698242e-05, -3.1754374504089355e-05, -2.422928810119629e-05, -1.6704201698303223e-05, -9.179115295410156e-06, -1.6540288925170898e-06, 5.8710575103759766e-06, 1.3396143913269043e-05, 2.092123031616211e-05, 2.8446316719055176e-05, 3.597140312194824e-05, 4.349648952484131e-05, 5.1021575927734375e-05, 5.854666233062744e-05, 6.607174873352051e-05, 7.359683513641357e-05, 8.112192153930664e-05, 8.864700794219971e-05, 9.617209434509277e-05, 0.00010369718074798584, 0.0001112222671508789, 0.00011874735355377197, 0.00012627243995666504, 0.0001337975263595581, 0.00014132261276245117, 0.00014884769916534424, 0.0001563727855682373, 0.00016389787197113037, 0.00017142295837402344, 0.0001789480447769165, 0.00018647313117980957, 0.00019399821758270264, 0.0002015233039855957, 0.00020904839038848877, 0.00021657347679138184, 0.0002240985631942749, 0.00023162364959716797, 0.00023914873600006104, 0.0002466738224029541, 0.00025419890880584717, 0.00026172399520874023, 0.0002692490816116333, 0.00027677416801452637, 0.00028429925441741943, 0.0002918243408203125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 11.0, 12.0, 16.0, 25.0, 44.0, 67.0, 145.0, 197.0, 311.0, 658.0, 1385.0, 3517.0, 10794.0, 45466.0, 273667.0, 573470.0, 107098.0, 21377.0, 5921.0, 2231.0, 966.0, 481.0, 265.0, 177.0, 89.0, 52.0, 34.0, 27.0, 16.0, 13.0, 7.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.123046875, -3.034454345703125, -2.94586181640625, -2.857269287109375, -2.7686767578125, -2.680084228515625, -2.59149169921875, -2.502899169921875, -2.414306640625, -2.325714111328125, -2.23712158203125, -2.148529052734375, -2.0599365234375, -1.971343994140625, -1.88275146484375, -1.794158935546875, -1.70556640625, -1.616973876953125, -1.52838134765625, -1.439788818359375, -1.3511962890625, -1.262603759765625, -1.17401123046875, -1.085418701171875, -0.996826171875, -0.908233642578125, -0.81964111328125, -0.731048583984375, -0.6424560546875, -0.553863525390625, -0.46527099609375, -0.376678466796875, -0.2880859375, -0.199493408203125, -0.11090087890625, -0.022308349609375, 0.0662841796875, 0.154876708984375, 0.24346923828125, 0.332061767578125, 0.420654296875, 0.509246826171875, 0.59783935546875, 0.686431884765625, 0.7750244140625, 0.863616943359375, 0.95220947265625, 1.040802001953125, 1.12939453125, 1.217987060546875, 1.30657958984375, 1.395172119140625, 1.4837646484375, 1.572357177734375, 1.66094970703125, 1.749542236328125, 1.838134765625, 1.926727294921875, 2.01531982421875, 2.103912353515625, 2.1925048828125, 2.281097412109375, 2.36968994140625, 2.458282470703125, 2.546875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 10.0, 10.0, 13.0, 19.0, 24.0, 44.0, 55.0, 60.0, 83.0, 99.0, 93.0, 93.0, 84.0, 59.0, 52.0, 50.0, 26.0, 38.0, 25.0, 12.0, 11.0, 10.0, 7.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.306640625, -3.199737548828125, -3.09283447265625, -2.985931396484375, -2.8790283203125, -2.772125244140625, -2.66522216796875, -2.558319091796875, -2.451416015625, -2.344512939453125, -2.23760986328125, -2.130706787109375, -2.0238037109375, -1.916900634765625, -1.80999755859375, -1.703094482421875, -1.59619140625, -1.489288330078125, -1.38238525390625, -1.275482177734375, -1.1685791015625, -1.061676025390625, -0.95477294921875, -0.847869873046875, -0.740966796875, -0.634063720703125, -0.52716064453125, -0.420257568359375, -0.3133544921875, -0.206451416015625, -0.09954833984375, 0.007354736328125, 0.1142578125, 0.221160888671875, 0.32806396484375, 0.434967041015625, 0.5418701171875, 0.648773193359375, 0.75567626953125, 0.862579345703125, 0.969482421875, 1.076385498046875, 1.18328857421875, 1.290191650390625, 1.3970947265625, 1.503997802734375, 1.61090087890625, 1.717803955078125, 1.82470703125, 1.931610107421875, 2.03851318359375, 2.145416259765625, 2.2523193359375, 2.359222412109375, 2.46612548828125, 2.573028564453125, 2.679931640625, 2.786834716796875, 2.89373779296875, 3.000640869140625, 3.1075439453125, 3.214447021484375, 3.32135009765625, 3.428253173828125, 3.53515625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 18.0, 10.0, 16.0, 32.0, 38.0, 47.0, 62.0, 75.0, 96.0, 98.0, 109.0, 92.0, 82.0, 74.0, 45.0, 36.0, 19.0, 16.0, 8.0, 8.0, 7.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.350460052490234, -26.484621047973633, -25.61878204345703, -24.75294303894043, -23.887104034423828, -23.021265029907227, -22.155426025390625, -21.28958511352539, -20.423748016357422, -19.55790901184082, -18.69207000732422, -17.826231002807617, -16.960391998291016, -16.094552993774414, -15.228713035583496, -14.362874031066895, -13.497034072875977, -12.631195068359375, -11.765356063842773, -10.899517059326172, -10.03367805480957, -9.167839050292969, -8.30199909210205, -7.436160087585449, -6.570321083068848, -5.704482078552246, -4.8386430740356445, -3.9728035926818848, -3.106964588165283, -2.2411255836486816, -1.3752861022949219, -0.5094470977783203, 0.35639381408691406, 1.2222329378128052, 2.0880720615386963, 2.953911304473877, 3.8197503089904785, 4.68558931350708, 5.55142879486084, 6.417267799377441, 7.283106803894043, 8.148945808410645, 9.014784812927246, 9.880624771118164, 10.746463775634766, 11.612302780151367, 12.478141784667969, 13.34398078918457, 14.209819793701172, 15.075658798217773, 15.941497802734375, 16.807336807250977, 17.673175811767578, 18.53901481628418, 19.40485382080078, 20.270694732666016, 21.136531829833984, 22.002370834350586, 22.868209838867188, 23.73404884338379, 24.59988784790039, 25.465726852416992, 26.331565856933594, 27.197406768798828, 28.06324577331543]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 9.0, 5.0, 4.0, 9.0, 8.0, 17.0, 19.0, 20.0, 19.0, 33.0, 25.0, 21.0, 34.0, 34.0, 37.0, 35.0, 41.0, 44.0, 52.0, 58.0, 51.0, 42.0, 37.0, 48.0, 44.0, 33.0, 33.0, 33.0, 27.0, 22.0, 15.0, 17.0, 11.0, 10.0, 10.0, 10.0, 14.0, 7.0, 3.0, 7.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.75204849243164, -18.084064483642578, -17.416080474853516, -16.748098373413086, -16.080114364624023, -15.412130355834961, -14.744147300720215, -14.076164245605469, -13.408180236816406, -12.740196228027344, -12.072213172912598, -11.404230117797852, -10.736246109008789, -10.068262100219727, -9.40027904510498, -8.732295989990234, -8.064311981201172, -7.396328449249268, -6.728344917297363, -6.060361385345459, -5.392377853393555, -4.72439432144165, -4.056410789489746, -3.388427257537842, -2.7204437255859375, -2.052460193634033, -1.384476661682129, -0.7164931297302246, -0.04850959777832031, 0.619473934173584, 1.2874574661254883, 1.9554409980773926, 2.6234264373779297, 3.291409969329834, 3.9593935012817383, 4.627377033233643, 5.295360565185547, 5.963344097137451, 6.6313276290893555, 7.29931116104126, 7.967294692993164, 8.635278701782227, 9.303261756896973, 9.971244812011719, 10.639228820800781, 11.307212829589844, 11.97519588470459, 12.643178939819336, 13.311162948608398, 13.979146957397461, 14.647130012512207, 15.315113067626953, 15.983097076416016, 16.651081085205078, 17.31906509399414, 17.98704719543457, 18.655031204223633, 19.323015213012695, 19.990997314453125, 20.658981323242188, 21.32696533203125, 21.994949340820312, 22.662933349609375, 23.330915451049805, 23.998899459838867]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 4.0, 5.0, 15.0, 3.0, 16.0, 20.0, 38.0, 60.0, 81.0, 120.0, 162.0, 253.0, 374.0, 652.0, 1177.0, 2087.0, 4901.0, 14463.0, 78891.0, 3987715.0, 79109.0, 14289.0, 4801.0, 2061.0, 1108.0, 681.0, 377.0, 235.0, 159.0, 117.0, 94.0, 72.0, 43.0, 40.0, 14.0, 21.0, 8.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.73828125, -3.60711669921875, -3.4759521484375, -3.34478759765625, -3.213623046875, -3.08245849609375, -2.9512939453125, -2.82012939453125, -2.68896484375, -2.55780029296875, -2.4266357421875, -2.29547119140625, -2.164306640625, -2.03314208984375, -1.9019775390625, -1.77081298828125, -1.6396484375, -1.50848388671875, -1.3773193359375, -1.24615478515625, -1.114990234375, -0.98382568359375, -0.8526611328125, -0.72149658203125, -0.59033203125, -0.45916748046875, -0.3280029296875, -0.19683837890625, -0.065673828125, 0.06549072265625, 0.1966552734375, 0.32781982421875, 0.458984375, 0.59014892578125, 0.7213134765625, 0.85247802734375, 0.983642578125, 1.11480712890625, 1.2459716796875, 1.37713623046875, 1.50830078125, 1.63946533203125, 1.7706298828125, 1.90179443359375, 2.032958984375, 2.16412353515625, 2.2952880859375, 2.42645263671875, 2.5576171875, 2.68878173828125, 2.8199462890625, 2.95111083984375, 3.082275390625, 3.21343994140625, 3.3446044921875, 3.47576904296875, 3.60693359375, 3.73809814453125, 3.8692626953125, 4.00042724609375, 4.131591796875, 4.26275634765625, 4.3939208984375, 4.52508544921875, 4.65625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 11.0, 15.0, 13.0, 28.0, 31.0, 38.0, 42.0, 62.0, 66.0, 61.0, 82.0, 87.0, 89.0, 78.0, 56.0, 48.0, 54.0, 39.0, 32.0, 12.0, 13.0, 11.0, 10.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1474609375, -1.1071014404296875, -1.066741943359375, -1.0263824462890625, -0.98602294921875, -0.9456634521484375, -0.905303955078125, -0.8649444580078125, -0.8245849609375, -0.7842254638671875, -0.743865966796875, -0.7035064697265625, -0.66314697265625, -0.6227874755859375, -0.582427978515625, -0.5420684814453125, -0.501708984375, -0.4613494873046875, -0.420989990234375, -0.3806304931640625, -0.34027099609375, -0.2999114990234375, -0.259552001953125, -0.2191925048828125, -0.1788330078125, -0.1384735107421875, -0.098114013671875, -0.0577545166015625, -0.01739501953125, 0.0229644775390625, 0.063323974609375, 0.1036834716796875, 0.14404296875, 0.1844024658203125, 0.224761962890625, 0.2651214599609375, 0.30548095703125, 0.3458404541015625, 0.386199951171875, 0.4265594482421875, 0.4669189453125, 0.5072784423828125, 0.547637939453125, 0.5879974365234375, 0.62835693359375, 0.6687164306640625, 0.709075927734375, 0.7494354248046875, 0.789794921875, 0.8301544189453125, 0.870513916015625, 0.9108734130859375, 0.95123291015625, 0.9915924072265625, 1.031951904296875, 1.0723114013671875, 1.1126708984375, 1.1530303955078125, 1.193389892578125, 1.2337493896484375, 1.27410888671875, 1.3144683837890625, 1.354827880859375, 1.3951873779296875, 1.435546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 4.0, 6.0, 17.0, 14.0, 40.0, 39.0, 53.0, 90.0, 118.0, 175.0, 236.0, 434.0, 662.0, 1219.0, 2170.0, 4347.0, 10307.0, 27833.0, 108394.0, 3700827.0, 262828.0, 46277.0, 15102.0, 6203.0, 2928.0, 1544.0, 872.0, 540.0, 343.0, 217.0, 158.0, 103.0, 54.0, 52.0, 26.0, 21.0, 11.0, 4.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.82421875, -2.725860595703125, -2.62750244140625, -2.529144287109375, -2.4307861328125, -2.332427978515625, -2.23406982421875, -2.135711669921875, -2.037353515625, -1.938995361328125, -1.84063720703125, -1.742279052734375, -1.6439208984375, -1.545562744140625, -1.44720458984375, -1.348846435546875, -1.25048828125, -1.152130126953125, -1.05377197265625, -0.955413818359375, -0.8570556640625, -0.758697509765625, -0.66033935546875, -0.561981201171875, -0.463623046875, -0.365264892578125, -0.26690673828125, -0.168548583984375, -0.0701904296875, 0.028167724609375, 0.12652587890625, 0.224884033203125, 0.3232421875, 0.421600341796875, 0.51995849609375, 0.618316650390625, 0.7166748046875, 0.815032958984375, 0.91339111328125, 1.011749267578125, 1.110107421875, 1.208465576171875, 1.30682373046875, 1.405181884765625, 1.5035400390625, 1.601898193359375, 1.70025634765625, 1.798614501953125, 1.89697265625, 1.995330810546875, 2.09368896484375, 2.192047119140625, 2.2904052734375, 2.388763427734375, 2.48712158203125, 2.585479736328125, 2.683837890625, 2.782196044921875, 2.88055419921875, 2.978912353515625, 3.0772705078125, 3.175628662109375, 3.27398681640625, 3.372344970703125, 3.470703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 5.0, 6.0, 10.0, 7.0, 19.0, 27.0, 52.0, 72.0, 136.0, 333.0, 2832.0, 239.0, 98.0, 63.0, 60.0, 24.0, 19.0, 23.0, 11.0, 5.0, 2.0, 4.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.853515625, -0.827117919921875, -0.80072021484375, -0.774322509765625, -0.7479248046875, -0.721527099609375, -0.69512939453125, -0.668731689453125, -0.642333984375, -0.615936279296875, -0.58953857421875, -0.563140869140625, -0.5367431640625, -0.510345458984375, -0.48394775390625, -0.457550048828125, -0.43115234375, -0.404754638671875, -0.37835693359375, -0.351959228515625, -0.3255615234375, -0.299163818359375, -0.27276611328125, -0.246368408203125, -0.219970703125, -0.193572998046875, -0.16717529296875, -0.140777587890625, -0.1143798828125, -0.087982177734375, -0.06158447265625, -0.035186767578125, -0.0087890625, 0.017608642578125, 0.04400634765625, 0.070404052734375, 0.0968017578125, 0.123199462890625, 0.14959716796875, 0.175994873046875, 0.202392578125, 0.228790283203125, 0.25518798828125, 0.281585693359375, 0.3079833984375, 0.334381103515625, 0.36077880859375, 0.387176513671875, 0.41357421875, 0.439971923828125, 0.46636962890625, 0.492767333984375, 0.5191650390625, 0.545562744140625, 0.57196044921875, 0.598358154296875, 0.624755859375, 0.651153564453125, 0.67755126953125, 0.703948974609375, 0.7303466796875, 0.756744384765625, 0.78314208984375, 0.809539794921875, 0.8359375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 17.0, 38.0, 76.0, 130.0, 181.0, 185.0, 150.0, 105.0, 62.0, 31.0, 12.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.706099271774292, -3.4369072914123535, -3.167715549468994, -2.8985235691070557, -2.629331588745117, -2.360139846801758, -2.0909478664398193, -1.8217560052871704, -1.5525641441345215, -1.2833722829818726, -1.0141804218292236, -0.7449884414672852, -0.47579658031463623, -0.2066047191619873, 0.06258726119995117, 0.3317791223526001, 0.600970983505249, 0.870162844657898, 1.1393547058105469, 1.4085466861724854, 1.6777385473251343, 1.9469304084777832, 2.2161223888397217, 2.48531436920166, 2.7545061111450195, 3.023698091506958, 3.2928898334503174, 3.562081813812256, 3.8312735557556152, 4.100465774536133, 4.369657516479492, 4.638849258422852, 4.908041954040527, 5.177233695983887, 5.446425914764404, 5.715617656707764, 5.984809398651123, 6.254001617431641, 6.523193359375, 6.792385101318359, 7.061576843261719, 7.330768585205078, 7.599960803985596, 7.869152545928955, 8.138344764709473, 8.407536506652832, 8.676728248596191, 8.94591999053955, 9.215112686157227, 9.484304428100586, 9.753496170043945, 10.022687911987305, 10.29188060760498, 10.56107234954834, 10.8302640914917, 11.099455833435059, 11.368647575378418, 11.637839317321777, 11.907031059265137, 12.176223754882812, 12.445415496826172, 12.714607238769531, 12.98379898071289, 13.25299072265625, 13.52218246459961]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 9.0, 10.0, 3.0, 14.0, 17.0, 16.0, 13.0, 15.0, 23.0, 24.0, 22.0, 28.0, 31.0, 23.0, 27.0, 33.0, 36.0, 43.0, 38.0, 30.0, 45.0, 31.0, 43.0, 37.0, 32.0, 41.0, 44.0, 32.0, 31.0, 25.0, 34.0, 25.0, 24.0, 15.0, 18.0, 11.0, 14.0, 9.0, 5.0, 8.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.5221776962280273, -2.4437906742095947, -2.365403652191162, -2.2870168685913086, -2.208629846572876, -2.1302428245544434, -2.05185604095459, -1.9734690189361572, -1.8950819969177246, -1.816694974899292, -1.738308072090149, -1.6599211692810059, -1.5815341472625732, -1.5031471252441406, -1.4247602224349976, -1.3463733196258545, -1.2679862976074219, -1.1895992755889893, -1.1112123727798462, -1.0328254699707031, -0.9544384479522705, -0.8760514855384827, -0.7976645231246948, -0.719277560710907, -0.6408905982971191, -0.5625036358833313, -0.48411667346954346, -0.4057297110557556, -0.3273427486419678, -0.24895578622817993, -0.1705688238143921, -0.09218186140060425, -0.013794898986816406, 0.06459206342697144, 0.14297902584075928, 0.22136598825454712, 0.29975295066833496, 0.3781399130821228, 0.45652687549591064, 0.5349138379096985, 0.6133008003234863, 0.6916877627372742, 0.770074725151062, 0.8484616875648499, 0.9268486499786377, 1.0052356719970703, 1.0836225748062134, 1.1620094776153564, 1.240396499633789, 1.3187835216522217, 1.3971704244613647, 1.4755573272705078, 1.5539443492889404, 1.632331371307373, 1.7107182741165161, 1.7891051769256592, 1.8674921989440918, 1.9458792209625244, 2.024266242980957, 2.1026530265808105, 2.181040048599243, 2.259427070617676, 2.3378138542175293, 2.416200876235962, 2.4945878982543945]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 15.0, 17.0, 28.0, 25.0, 52.0, 99.0, 192.0, 374.0, 874.0, 2187.0, 6563.0, 22606.0, 99199.0, 401178.0, 389381.0, 93799.0, 21858.0, 6382.0, 2088.0, 834.0, 388.0, 197.0, 100.0, 49.0, 32.0, 13.0, 10.0, 5.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.339691162109375, -4.22235107421875, -4.105010986328125, -3.9876708984375, -3.870330810546875, -3.75299072265625, -3.635650634765625, -3.518310546875, -3.400970458984375, -3.28363037109375, -3.166290283203125, -3.0489501953125, -2.931610107421875, -2.81427001953125, -2.696929931640625, -2.57958984375, -2.462249755859375, -2.34490966796875, -2.227569580078125, -2.1102294921875, -1.992889404296875, -1.87554931640625, -1.758209228515625, -1.640869140625, -1.523529052734375, -1.40618896484375, -1.288848876953125, -1.1715087890625, -1.054168701171875, -0.93682861328125, -0.819488525390625, -0.7021484375, -0.584808349609375, -0.46746826171875, -0.350128173828125, -0.2327880859375, -0.115447998046875, 0.00189208984375, 0.119232177734375, 0.236572265625, 0.353912353515625, 0.47125244140625, 0.588592529296875, 0.7059326171875, 0.823272705078125, 0.94061279296875, 1.057952880859375, 1.17529296875, 1.292633056640625, 1.40997314453125, 1.527313232421875, 1.6446533203125, 1.761993408203125, 1.87933349609375, 1.996673583984375, 2.114013671875, 2.231353759765625, 2.34869384765625, 2.466033935546875, 2.5833740234375, 2.700714111328125, 2.81805419921875, 2.935394287109375, 3.052734375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 8.0, 10.0, 31.0, 25.0, 32.0, 39.0, 36.0, 70.0, 84.0, 88.0, 74.0, 89.0, 86.0, 76.0, 54.0, 66.0, 35.0, 33.0, 28.0, 10.0, 8.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.330078125, -1.2823333740234375, -1.234588623046875, -1.1868438720703125, -1.13909912109375, -1.0913543701171875, -1.043609619140625, -0.9958648681640625, -0.9481201171875, -0.9003753662109375, -0.852630615234375, -0.8048858642578125, -0.75714111328125, -0.7093963623046875, -0.661651611328125, -0.6139068603515625, -0.566162109375, -0.5184173583984375, -0.470672607421875, -0.4229278564453125, -0.37518310546875, -0.3274383544921875, -0.279693603515625, -0.2319488525390625, -0.1842041015625, -0.1364593505859375, -0.088714599609375, -0.0409698486328125, 0.00677490234375, 0.0545196533203125, 0.102264404296875, 0.1500091552734375, 0.19775390625, 0.2454986572265625, 0.293243408203125, 0.3409881591796875, 0.38873291015625, 0.4364776611328125, 0.484222412109375, 0.5319671630859375, 0.5797119140625, 0.6274566650390625, 0.675201416015625, 0.7229461669921875, 0.77069091796875, 0.8184356689453125, 0.866180419921875, 0.9139251708984375, 0.961669921875, 1.0094146728515625, 1.057159423828125, 1.1049041748046875, 1.15264892578125, 1.2003936767578125, 1.248138427734375, 1.2958831787109375, 1.3436279296875, 1.3913726806640625, 1.439117431640625, 1.4868621826171875, 1.53460693359375, 1.5823516845703125, 1.630096435546875, 1.6778411865234375, 1.7255859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 8.0, 5.0, 5.0, 19.0, 23.0, 38.0, 48.0, 82.0, 136.0, 233.0, 445.0, 708.0, 1715.0, 4378.0, 14038.0, 57485.0, 299363.0, 512178.0, 120151.0, 25243.0, 7233.0, 2641.0, 1092.0, 520.0, 308.0, 156.0, 89.0, 67.0, 43.0, 37.0, 28.0, 10.0, 8.0, 9.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.95855712890625, -3.8428955078125, -3.72723388671875, -3.611572265625, -3.49591064453125, -3.3802490234375, -3.26458740234375, -3.14892578125, -3.03326416015625, -2.9176025390625, -2.80194091796875, -2.686279296875, -2.57061767578125, -2.4549560546875, -2.33929443359375, -2.2236328125, -2.10797119140625, -1.9923095703125, -1.87664794921875, -1.760986328125, -1.64532470703125, -1.5296630859375, -1.41400146484375, -1.29833984375, -1.18267822265625, -1.0670166015625, -0.95135498046875, -0.835693359375, -0.72003173828125, -0.6043701171875, -0.48870849609375, -0.373046875, -0.25738525390625, -0.1417236328125, -0.02606201171875, 0.089599609375, 0.20526123046875, 0.3209228515625, 0.43658447265625, 0.55224609375, 0.66790771484375, 0.7835693359375, 0.89923095703125, 1.014892578125, 1.13055419921875, 1.2462158203125, 1.36187744140625, 1.4775390625, 1.59320068359375, 1.7088623046875, 1.82452392578125, 1.940185546875, 2.05584716796875, 2.1715087890625, 2.28717041015625, 2.40283203125, 2.51849365234375, 2.6341552734375, 2.74981689453125, 2.865478515625, 2.98114013671875, 3.0968017578125, 3.21246337890625, 3.328125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 12.0, 7.0, 11.0, 16.0, 13.0, 30.0, 40.0, 35.0, 43.0, 42.0, 50.0, 37.0, 59.0, 63.0, 47.0, 60.0, 52.0, 66.0, 45.0, 47.0, 43.0, 36.0, 31.0, 14.0, 26.0, 15.0, 14.0, 9.0, 7.0, 7.0, 6.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0390625, -5.8702392578125, -5.701416015625, -5.5325927734375, -5.36376953125, -5.1949462890625, -5.026123046875, -4.8572998046875, -4.6884765625, -4.5196533203125, -4.350830078125, -4.1820068359375, -4.01318359375, -3.8443603515625, -3.675537109375, -3.5067138671875, -3.337890625, -3.1690673828125, -3.000244140625, -2.8314208984375, -2.66259765625, -2.4937744140625, -2.324951171875, -2.1561279296875, -1.9873046875, -1.8184814453125, -1.649658203125, -1.4808349609375, -1.31201171875, -1.1431884765625, -0.974365234375, -0.8055419921875, -0.63671875, -0.4678955078125, -0.299072265625, -0.1302490234375, 0.03857421875, 0.2073974609375, 0.376220703125, 0.5450439453125, 0.7138671875, 0.8826904296875, 1.051513671875, 1.2203369140625, 1.38916015625, 1.5579833984375, 1.726806640625, 1.8956298828125, 2.064453125, 2.2332763671875, 2.402099609375, 2.5709228515625, 2.73974609375, 2.9085693359375, 3.077392578125, 3.2462158203125, 3.4150390625, 3.5838623046875, 3.752685546875, 3.9215087890625, 4.09033203125, 4.2591552734375, 4.427978515625, 4.5968017578125, 4.765625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 18.0, 21.0, 22.0, 28.0, 47.0, 66.0, 137.0, 197.0, 401.0, 731.0, 1742.0, 5381.0, 24045.0, 239050.0, 699549.0, 61656.0, 10164.0, 3000.0, 1079.0, 500.0, 288.0, 154.0, 95.0, 58.0, 41.0, 27.0, 16.0, 12.0, 9.0, 6.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.88671875, -2.7723388671875, -2.657958984375, -2.5435791015625, -2.42919921875, -2.3148193359375, -2.200439453125, -2.0860595703125, -1.9716796875, -1.8572998046875, -1.742919921875, -1.6285400390625, -1.51416015625, -1.3997802734375, -1.285400390625, -1.1710205078125, -1.056640625, -0.9422607421875, -0.827880859375, -0.7135009765625, -0.59912109375, -0.4847412109375, -0.370361328125, -0.2559814453125, -0.1416015625, -0.0272216796875, 0.087158203125, 0.2015380859375, 0.31591796875, 0.4302978515625, 0.544677734375, 0.6590576171875, 0.7734375, 0.8878173828125, 1.002197265625, 1.1165771484375, 1.23095703125, 1.3453369140625, 1.459716796875, 1.5740966796875, 1.6884765625, 1.8028564453125, 1.917236328125, 2.0316162109375, 2.14599609375, 2.2603759765625, 2.374755859375, 2.4891357421875, 2.603515625, 2.7178955078125, 2.832275390625, 2.9466552734375, 3.06103515625, 3.1754150390625, 3.289794921875, 3.4041748046875, 3.5185546875, 3.6329345703125, 3.747314453125, 3.8616943359375, 3.97607421875, 4.0904541015625, 4.204833984375, 4.3192138671875, 4.43359375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 0.0, 5.0, 16.0, 11.0, 19.0, 24.0, 36.0, 59.0, 100.0, 126.0, 166.0, 133.0, 100.0, 65.0, 44.0, 34.0, 20.0, 7.0, 7.0, 5.0, 7.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004191398620605469, -0.00040445476770401, -0.00038976967334747314, -0.0003750845789909363, -0.0003603994846343994, -0.00034571439027786255, -0.0003310292959213257, -0.0003163442015647888, -0.00030165910720825195, -0.0002869740128517151, -0.0002722889184951782, -0.00025760382413864136, -0.0002429187297821045, -0.00022823363542556763, -0.00021354854106903076, -0.0001988634467124939, -0.00018417835235595703, -0.00016949325799942017, -0.0001548081636428833, -0.00014012306928634644, -0.00012543797492980957, -0.0001107528805732727, -9.606778621673584e-05, -8.138269186019897e-05, -6.669759750366211e-05, -5.2012503147125244e-05, -3.732740879058838e-05, -2.2642314434051514e-05, -7.957220077514648e-06, 6.727874279022217e-06, 2.1412968635559082e-05, 3.609806299209595e-05, 5.078315734863281e-05, 6.546825170516968e-05, 8.015334606170654e-05, 9.483844041824341e-05, 0.00010952353477478027, 0.00012420862913131714, 0.000138893723487854, 0.00015357881784439087, 0.00016826391220092773, 0.0001829490065574646, 0.00019763410091400146, 0.00021231919527053833, 0.0002270042896270752, 0.00024168938398361206, 0.0002563744783401489, 0.0002710595726966858, 0.00028574466705322266, 0.0003004297614097595, 0.0003151148557662964, 0.00032979995012283325, 0.0003444850444793701, 0.000359170138835907, 0.00037385523319244385, 0.0003885403275489807, 0.0004032254219055176, 0.00041791051626205444, 0.0004325956106185913, 0.0004472807049751282, 0.00046196579933166504, 0.0004766508936882019, 0.0004913359880447388, 0.0005060210824012756, 0.0005207061767578125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 16.0, 26.0, 59.0, 112.0, 263.0, 868.0, 11121.0, 950433.0, 82744.0, 2197.0, 410.0, 152.0, 71.0, 25.0, 26.0, 17.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8515625, -10.5560302734375, -10.260498046875, -9.9649658203125, -9.66943359375, -9.3739013671875, -9.078369140625, -8.7828369140625, -8.4873046875, -8.1917724609375, -7.896240234375, -7.6007080078125, -7.30517578125, -7.0096435546875, -6.714111328125, -6.4185791015625, -6.123046875, -5.8275146484375, -5.531982421875, -5.2364501953125, -4.94091796875, -4.6453857421875, -4.349853515625, -4.0543212890625, -3.7587890625, -3.4632568359375, -3.167724609375, -2.8721923828125, -2.57666015625, -2.2811279296875, -1.985595703125, -1.6900634765625, -1.39453125, -1.0989990234375, -0.803466796875, -0.5079345703125, -0.21240234375, 0.0831298828125, 0.378662109375, 0.6741943359375, 0.9697265625, 1.2652587890625, 1.560791015625, 1.8563232421875, 2.15185546875, 2.4473876953125, 2.742919921875, 3.0384521484375, 3.333984375, 3.6295166015625, 3.925048828125, 4.2205810546875, 4.51611328125, 4.8116455078125, 5.107177734375, 5.4027099609375, 5.6982421875, 5.9937744140625, 6.289306640625, 6.5848388671875, 6.88037109375, 7.1759033203125, 7.471435546875, 7.7669677734375, 8.0625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 4.0, 8.0, 7.0, 16.0, 20.0, 45.0, 116.0, 213.0, 256.0, 162.0, 74.0, 42.0, 22.0, 10.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.546875, -7.31298828125, -7.0791015625, -6.84521484375, -6.611328125, -6.37744140625, -6.1435546875, -5.90966796875, -5.67578125, -5.44189453125, -5.2080078125, -4.97412109375, -4.740234375, -4.50634765625, -4.2724609375, -4.03857421875, -3.8046875, -3.57080078125, -3.3369140625, -3.10302734375, -2.869140625, -2.63525390625, -2.4013671875, -2.16748046875, -1.93359375, -1.69970703125, -1.4658203125, -1.23193359375, -0.998046875, -0.76416015625, -0.5302734375, -0.29638671875, -0.0625, 0.17138671875, 0.4052734375, 0.63916015625, 0.873046875, 1.10693359375, 1.3408203125, 1.57470703125, 1.80859375, 2.04248046875, 2.2763671875, 2.51025390625, 2.744140625, 2.97802734375, 3.2119140625, 3.44580078125, 3.6796875, 3.91357421875, 4.1474609375, 4.38134765625, 4.615234375, 4.84912109375, 5.0830078125, 5.31689453125, 5.55078125, 5.78466796875, 6.0185546875, 6.25244140625, 6.486328125, 6.72021484375, 6.9541015625, 7.18798828125, 7.421875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 11.0, 73.0, 274.0, 380.0, 191.0, 55.0, 15.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.591182708740234, -20.597827911376953, -16.604473114013672, -12.611117362976074, -8.617762565612793, -4.624406814575195, -0.6310520172119141, 3.362302780151367, 7.355657577514648, 11.34901237487793, 15.342367172241211, 19.335723876953125, 23.329078674316406, 27.322433471679688, 31.31578826904297, 35.30914306640625, 39.30249786376953, 43.29585266113281, 47.289207458496094, 51.282562255859375, 55.275917053222656, 59.26927185058594, 63.26262664794922, 67.2559814453125, 71.24933624267578, 75.24269104003906, 79.23604583740234, 83.22940063476562, 87.2227554321289, 91.21611022949219, 95.20946502685547, 99.20281982421875, 103.19617462158203, 107.18952941894531, 111.1828842163086, 115.17623901367188, 119.16959381103516, 123.16294860839844, 127.15630340576172, 131.149658203125, 135.1430206298828, 139.13638305664062, 143.12973022460938, 147.1230926513672, 151.11643981933594, 155.10980224609375, 159.1031494140625, 163.0965118408203, 167.08985900878906, 171.08322143554688, 175.07656860351562, 179.06993103027344, 183.0632781982422, 187.056640625, 191.04998779296875, 195.04335021972656, 199.0366973876953, 203.03005981445312, 207.02340698242188, 211.0167694091797, 215.01011657714844, 219.00347900390625, 222.996826171875, 226.9901885986328, 230.98353576660156]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 11.0, 7.0, 6.0, 13.0, 15.0, 18.0, 11.0, 21.0, 24.0, 35.0, 36.0, 43.0, 36.0, 55.0, 47.0, 51.0, 51.0, 66.0, 53.0, 46.0, 49.0, 37.0, 45.0, 48.0, 32.0, 28.0, 28.0, 16.0, 17.0, 12.0, 7.0, 10.0, 4.0, 4.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0], "bins": [-30.142671585083008, -29.332134246826172, -28.521596908569336, -27.7110595703125, -26.90052032470703, -26.089984893798828, -25.27944564819336, -24.468908309936523, -23.658370971679688, -22.84783363342285, -22.037296295166016, -21.22675895690918, -20.416221618652344, -19.605682373046875, -18.79514503479004, -17.984607696533203, -17.174070358276367, -16.36353302001953, -15.552995681762695, -14.742457389831543, -13.931920051574707, -13.121382713317871, -12.310844421386719, -11.500307083129883, -10.689769744873047, -9.879232406616211, -9.068695068359375, -8.258156776428223, -7.447619438171387, -6.637082099914551, -5.826544284820557, -5.0160064697265625, -4.205471038818359, -3.3949334621429443, -2.5843958854675293, -1.7738583087921143, -0.9633207321166992, -0.15278339385986328, 0.6577544212341309, 1.468292236328125, 2.278829574584961, 3.089367151260376, 3.899904727935791, 4.710442543029785, 5.520979881286621, 6.331517219543457, 7.142055034637451, 7.952592849731445, 8.763130187988281, 9.573667526245117, 10.384204864501953, 11.194743156433105, 12.005280494689941, 12.815817832946777, 13.62635612487793, 14.436893463134766, 15.247430801391602, 16.057968139648438, 16.868505477905273, 17.67904281616211, 18.489582061767578, 19.30011749267578, 20.11065673828125, 20.921194076538086, 21.731731414794922]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 12.0, 11.0, 10.0, 16.0, 27.0, 33.0, 55.0, 75.0, 113.0, 198.0, 310.0, 514.0, 938.0, 1941.0, 4071.0, 11991.0, 70901.0, 4061044.0, 28448.0, 7426.0, 2889.0, 1412.0, 688.0, 426.0, 243.0, 148.0, 109.0, 57.0, 44.0, 34.0, 31.0, 19.0, 13.0, 9.0, 8.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.0, -4.82330322265625, -4.6466064453125, -4.46990966796875, -4.293212890625, -4.11651611328125, -3.9398193359375, -3.76312255859375, -3.58642578125, -3.40972900390625, -3.2330322265625, -3.05633544921875, -2.879638671875, -2.70294189453125, -2.5262451171875, -2.34954833984375, -2.1728515625, -1.99615478515625, -1.8194580078125, -1.64276123046875, -1.466064453125, -1.28936767578125, -1.1126708984375, -0.93597412109375, -0.75927734375, -0.58258056640625, -0.4058837890625, -0.22918701171875, -0.052490234375, 0.12420654296875, 0.3009033203125, 0.47760009765625, 0.654296875, 0.83099365234375, 1.0076904296875, 1.18438720703125, 1.361083984375, 1.53778076171875, 1.7144775390625, 1.89117431640625, 2.06787109375, 2.24456787109375, 2.4212646484375, 2.59796142578125, 2.774658203125, 2.95135498046875, 3.1280517578125, 3.30474853515625, 3.4814453125, 3.65814208984375, 3.8348388671875, 4.01153564453125, 4.188232421875, 4.36492919921875, 4.5416259765625, 4.71832275390625, 4.89501953125, 5.07171630859375, 5.2484130859375, 5.42510986328125, 5.601806640625, 5.77850341796875, 5.9552001953125, 6.13189697265625, 6.30859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 9.0, 10.0, 12.0, 12.0, 25.0, 23.0, 28.0, 32.0, 36.0, 47.0, 55.0, 47.0, 67.0, 67.0, 54.0, 67.0, 72.0, 48.0, 52.0, 44.0, 37.0, 24.0, 25.0, 22.0, 17.0, 18.0, 12.0, 6.0, 8.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.396484375, -1.359893798828125, -1.32330322265625, -1.286712646484375, -1.2501220703125, -1.213531494140625, -1.17694091796875, -1.140350341796875, -1.103759765625, -1.067169189453125, -1.03057861328125, -0.993988037109375, -0.9573974609375, -0.920806884765625, -0.88421630859375, -0.847625732421875, -0.81103515625, -0.774444580078125, -0.73785400390625, -0.701263427734375, -0.6646728515625, -0.628082275390625, -0.59149169921875, -0.554901123046875, -0.518310546875, -0.481719970703125, -0.44512939453125, -0.408538818359375, -0.3719482421875, -0.335357666015625, -0.29876708984375, -0.262176513671875, -0.2255859375, -0.188995361328125, -0.15240478515625, -0.115814208984375, -0.0792236328125, -0.042633056640625, -0.00604248046875, 0.030548095703125, 0.067138671875, 0.103729248046875, 0.14031982421875, 0.176910400390625, 0.2135009765625, 0.250091552734375, 0.28668212890625, 0.323272705078125, 0.35986328125, 0.396453857421875, 0.43304443359375, 0.469635009765625, 0.5062255859375, 0.542816162109375, 0.57940673828125, 0.615997314453125, 0.652587890625, 0.689178466796875, 0.72576904296875, 0.762359619140625, 0.7989501953125, 0.835540771484375, 0.87213134765625, 0.908721923828125, 0.9453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 9.0, 7.0, 17.0, 21.0, 31.0, 37.0, 50.0, 60.0, 114.0, 180.0, 230.0, 342.0, 455.0, 702.0, 1071.0, 1853.0, 3540.0, 8265.0, 24492.0, 149907.0, 3915527.0, 60099.0, 14581.0, 5609.0, 2689.0, 1525.0, 934.0, 556.0, 388.0, 291.0, 192.0, 140.0, 114.0, 81.0, 53.0, 33.0, 26.0, 15.0, 10.0, 14.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.42578125, -4.300384521484375, -4.17498779296875, -4.049591064453125, -3.9241943359375, -3.798797607421875, -3.67340087890625, -3.548004150390625, -3.422607421875, -3.297210693359375, -3.17181396484375, -3.046417236328125, -2.9210205078125, -2.795623779296875, -2.67022705078125, -2.544830322265625, -2.41943359375, -2.294036865234375, -2.16864013671875, -2.043243408203125, -1.9178466796875, -1.792449951171875, -1.66705322265625, -1.541656494140625, -1.416259765625, -1.290863037109375, -1.16546630859375, -1.040069580078125, -0.9146728515625, -0.789276123046875, -0.66387939453125, -0.538482666015625, -0.4130859375, -0.287689208984375, -0.16229248046875, -0.036895751953125, 0.0885009765625, 0.213897705078125, 0.33929443359375, 0.464691162109375, 0.590087890625, 0.715484619140625, 0.84088134765625, 0.966278076171875, 1.0916748046875, 1.217071533203125, 1.34246826171875, 1.467864990234375, 1.59326171875, 1.718658447265625, 1.84405517578125, 1.969451904296875, 2.0948486328125, 2.220245361328125, 2.34564208984375, 2.471038818359375, 2.596435546875, 2.721832275390625, 2.84722900390625, 2.972625732421875, 3.0980224609375, 3.223419189453125, 3.34881591796875, 3.474212646484375, 3.599609375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 17.0, 17.0, 27.0, 46.0, 110.0, 736.0, 2903.0, 94.0, 41.0, 24.0, 16.0, 15.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1181640625, -1.0782470703125, -1.038330078125, -0.9984130859375, -0.95849609375, -0.9185791015625, -0.878662109375, -0.8387451171875, -0.798828125, -0.7589111328125, -0.718994140625, -0.6790771484375, -0.63916015625, -0.5992431640625, -0.559326171875, -0.5194091796875, -0.4794921875, -0.4395751953125, -0.399658203125, -0.3597412109375, -0.31982421875, -0.2799072265625, -0.239990234375, -0.2000732421875, -0.16015625, -0.1202392578125, -0.080322265625, -0.0404052734375, -0.00048828125, 0.0394287109375, 0.079345703125, 0.1192626953125, 0.1591796875, 0.1990966796875, 0.239013671875, 0.2789306640625, 0.31884765625, 0.3587646484375, 0.398681640625, 0.4385986328125, 0.478515625, 0.5184326171875, 0.558349609375, 0.5982666015625, 0.63818359375, 0.6781005859375, 0.718017578125, 0.7579345703125, 0.7978515625, 0.8377685546875, 0.877685546875, 0.9176025390625, 0.95751953125, 0.9974365234375, 1.037353515625, 1.0772705078125, 1.1171875, 1.1571044921875, 1.197021484375, 1.2369384765625, 1.27685546875, 1.3167724609375, 1.356689453125, 1.3966064453125, 1.4365234375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 7.0, 9.0, 14.0, 27.0, 54.0, 118.0, 159.0, 169.0, 176.0, 100.0, 77.0, 43.0, 22.0, 13.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.39766788482666, -10.179049491882324, -9.960430145263672, -9.741811752319336, -9.523192405700684, -9.304574012756348, -9.085954666137695, -8.86733627319336, -8.648716926574707, -8.430098533630371, -8.211479187011719, -7.992860317230225, -7.7742414474487305, -7.555622577667236, -7.337003707885742, -7.118385314941406, -6.899766445159912, -6.681147575378418, -6.462528705596924, -6.24390983581543, -6.0252909660339355, -5.806672096252441, -5.5880537033081055, -5.369434356689453, -5.150815963745117, -4.932197093963623, -4.713578224182129, -4.494959354400635, -4.276340484619141, -4.0577216148376465, -3.8391029834747314, -3.6204841136932373, -3.401864528656006, -3.1832456588745117, -2.9646267890930176, -2.7460079193115234, -2.5273890495300293, -2.308770179748535, -2.09015154838562, -1.871532678604126, -1.6529138088226318, -1.4342949390411377, -1.2156760692596436, -0.997057318687439, -0.7784384489059448, -0.5598195791244507, -0.3412008285522461, -0.12258195877075195, 0.09603691101074219, 0.31465575098991394, 0.5332745909690857, 0.7518934011459351, 0.9705122709274292, 1.1891311407089233, 1.407749891281128, 1.626368761062622, 1.8449876308441162, 2.0636065006256104, 2.2822253704071045, 2.5008440017700195, 2.7194628715515137, 2.938081741333008, 3.156700611114502, 3.375319480895996, 3.5939383506774902]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 2.0, 6.0, 5.0, 6.0, 9.0, 10.0, 17.0, 17.0, 14.0, 21.0, 38.0, 20.0, 28.0, 35.0, 38.0, 47.0, 41.0, 47.0, 45.0, 49.0, 46.0, 49.0, 37.0, 45.0, 50.0, 41.0, 27.0, 27.0, 30.0, 31.0, 17.0, 13.0, 18.0, 19.0, 14.0, 11.0, 8.0, 6.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.252042770385742, -2.1730380058288574, -2.0940334796905518, -2.015028715133667, -1.9360241889953613, -1.8570195436477661, -1.778014898300171, -1.6990101337432861, -1.6200056076049805, -1.5410009622573853, -1.46199631690979, -1.3829916715621948, -1.3039870262145996, -1.2249823808670044, -1.1459777355194092, -1.0669729709625244, -0.9879683256149292, -0.908963680267334, -0.8299590349197388, -0.7509543895721436, -0.6719497442245483, -0.5929450988769531, -0.5139403939247131, -0.4349357485771179, -0.3559311032295227, -0.2769264578819275, -0.19792179763317108, -0.11891713738441467, -0.03991249203681946, 0.03909215331077576, 0.11809682846069336, 0.19710147380828857, 0.2761061191558838, 0.355110764503479, 0.4341154098510742, 0.5131200551986694, 0.5921247005462646, 0.6711293458938599, 0.7501340508460999, 0.8291386961936951, 0.9081433415412903, 0.9871479868888855, 1.0661526918411255, 1.1451573371887207, 1.224161982536316, 1.3031666278839111, 1.3821712732315063, 1.4611759185791016, 1.5401805639266968, 1.619185209274292, 1.6981898546218872, 1.7771944999694824, 1.8561991453170776, 1.9352037906646729, 2.0142085552215576, 2.0932130813598633, 2.172217845916748, 2.251222610473633, 2.3302271366119385, 2.4092319011688232, 2.488236427307129, 2.5672411918640137, 2.6462457180023193, 2.725250482559204, 2.8042550086975098]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 11.0, 18.0, 35.0, 48.0, 80.0, 96.0, 175.0, 290.0, 486.0, 790.0, 1340.0, 2488.0, 4799.0, 9962.0, 21857.0, 49253.0, 115855.0, 240142.0, 294071.0, 170614.0, 74990.0, 32004.0, 14508.0, 6821.0, 3448.0, 1790.0, 999.0, 632.0, 326.0, 229.0, 141.0, 81.0, 49.0, 44.0, 21.0, 19.0, 15.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.982421875, -1.924530029296875, -1.86663818359375, -1.808746337890625, -1.7508544921875, -1.692962646484375, -1.63507080078125, -1.577178955078125, -1.519287109375, -1.461395263671875, -1.40350341796875, -1.345611572265625, -1.2877197265625, -1.229827880859375, -1.17193603515625, -1.114044189453125, -1.05615234375, -0.998260498046875, -0.94036865234375, -0.882476806640625, -0.8245849609375, -0.766693115234375, -0.70880126953125, -0.650909423828125, -0.593017578125, -0.535125732421875, -0.47723388671875, -0.419342041015625, -0.3614501953125, -0.303558349609375, -0.24566650390625, -0.187774658203125, -0.1298828125, -0.071990966796875, -0.01409912109375, 0.043792724609375, 0.1016845703125, 0.159576416015625, 0.21746826171875, 0.275360107421875, 0.333251953125, 0.391143798828125, 0.44903564453125, 0.506927490234375, 0.5648193359375, 0.622711181640625, 0.68060302734375, 0.738494873046875, 0.79638671875, 0.854278564453125, 0.91217041015625, 0.970062255859375, 1.0279541015625, 1.085845947265625, 1.14373779296875, 1.201629638671875, 1.259521484375, 1.317413330078125, 1.37530517578125, 1.433197021484375, 1.4910888671875, 1.548980712890625, 1.60687255859375, 1.664764404296875, 1.72265625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 1.0, 6.0, 2.0, 7.0, 8.0, 12.0, 11.0, 18.0, 20.0, 19.0, 25.0, 38.0, 42.0, 68.0, 58.0, 57.0, 65.0, 79.0, 56.0, 49.0, 57.0, 55.0, 48.0, 41.0, 34.0, 26.0, 17.0, 12.0, 12.0, 19.0, 15.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-1.58203125, -1.5407867431640625, -1.499542236328125, -1.4582977294921875, -1.41705322265625, -1.3758087158203125, -1.334564208984375, -1.2933197021484375, -1.2520751953125, -1.2108306884765625, -1.169586181640625, -1.1283416748046875, -1.08709716796875, -1.0458526611328125, -1.004608154296875, -0.9633636474609375, -0.922119140625, -0.8808746337890625, -0.839630126953125, -0.7983856201171875, -0.75714111328125, -0.7158966064453125, -0.674652099609375, -0.6334075927734375, -0.5921630859375, -0.5509185791015625, -0.509674072265625, -0.4684295654296875, -0.42718505859375, -0.3859405517578125, -0.344696044921875, -0.3034515380859375, -0.26220703125, -0.2209625244140625, -0.179718017578125, -0.1384735107421875, -0.09722900390625, -0.0559844970703125, -0.014739990234375, 0.0265045166015625, 0.0677490234375, 0.1089935302734375, 0.150238037109375, 0.1914825439453125, 0.23272705078125, 0.2739715576171875, 0.315216064453125, 0.3564605712890625, 0.397705078125, 0.4389495849609375, 0.480194091796875, 0.5214385986328125, 0.56268310546875, 0.6039276123046875, 0.645172119140625, 0.6864166259765625, 0.7276611328125, 0.7689056396484375, 0.810150146484375, 0.8513946533203125, 0.89263916015625, 0.9338836669921875, 0.975128173828125, 1.0163726806640625, 1.0576171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 13.0, 5.0, 20.0, 31.0, 53.0, 72.0, 117.0, 221.0, 323.0, 631.0, 1359.0, 3591.0, 14425.0, 93120.0, 610554.0, 277825.0, 35049.0, 6998.0, 2126.0, 887.0, 482.0, 234.0, 136.0, 80.0, 72.0, 45.0, 22.0, 16.0, 12.0, 10.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.578125, -4.4383544921875, -4.298583984375, -4.1588134765625, -4.01904296875, -3.8792724609375, -3.739501953125, -3.5997314453125, -3.4599609375, -3.3201904296875, -3.180419921875, -3.0406494140625, -2.90087890625, -2.7611083984375, -2.621337890625, -2.4815673828125, -2.341796875, -2.2020263671875, -2.062255859375, -1.9224853515625, -1.78271484375, -1.6429443359375, -1.503173828125, -1.3634033203125, -1.2236328125, -1.0838623046875, -0.944091796875, -0.8043212890625, -0.66455078125, -0.5247802734375, -0.385009765625, -0.2452392578125, -0.10546875, 0.0343017578125, 0.174072265625, 0.3138427734375, 0.45361328125, 0.5933837890625, 0.733154296875, 0.8729248046875, 1.0126953125, 1.1524658203125, 1.292236328125, 1.4320068359375, 1.57177734375, 1.7115478515625, 1.851318359375, 1.9910888671875, 2.130859375, 2.2706298828125, 2.410400390625, 2.5501708984375, 2.68994140625, 2.8297119140625, 2.969482421875, 3.1092529296875, 3.2490234375, 3.3887939453125, 3.528564453125, 3.6683349609375, 3.80810546875, 3.9478759765625, 4.087646484375, 4.2274169921875, 4.3671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 15.0, 16.0, 14.0, 21.0, 32.0, 28.0, 45.0, 51.0, 57.0, 57.0, 75.0, 75.0, 64.0, 73.0, 71.0, 49.0, 51.0, 36.0, 43.0, 31.0, 29.0, 18.0, 11.0, 10.0, 9.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3828125, -8.11962890625, -7.8564453125, -7.59326171875, -7.330078125, -7.06689453125, -6.8037109375, -6.54052734375, -6.27734375, -6.01416015625, -5.7509765625, -5.48779296875, -5.224609375, -4.96142578125, -4.6982421875, -4.43505859375, -4.171875, -3.90869140625, -3.6455078125, -3.38232421875, -3.119140625, -2.85595703125, -2.5927734375, -2.32958984375, -2.06640625, -1.80322265625, -1.5400390625, -1.27685546875, -1.013671875, -0.75048828125, -0.4873046875, -0.22412109375, 0.0390625, 0.30224609375, 0.5654296875, 0.82861328125, 1.091796875, 1.35498046875, 1.6181640625, 1.88134765625, 2.14453125, 2.40771484375, 2.6708984375, 2.93408203125, 3.197265625, 3.46044921875, 3.7236328125, 3.98681640625, 4.25, 4.51318359375, 4.7763671875, 5.03955078125, 5.302734375, 5.56591796875, 5.8291015625, 6.09228515625, 6.35546875, 6.61865234375, 6.8818359375, 7.14501953125, 7.408203125, 7.67138671875, 7.9345703125, 8.19775390625, 8.4609375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 19.0, 24.0, 55.0, 159.0, 408.0, 1635.0, 11921.0, 658796.0, 365124.0, 8466.0, 1323.0, 366.0, 120.0, 53.0, 20.0, 12.0, 12.0, 7.0, 6.0, 2.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.75, -4.60125732421875, -4.4525146484375, -4.30377197265625, -4.155029296875, -4.00628662109375, -3.8575439453125, -3.70880126953125, -3.56005859375, -3.41131591796875, -3.2625732421875, -3.11383056640625, -2.965087890625, -2.81634521484375, -2.6676025390625, -2.51885986328125, -2.3701171875, -2.22137451171875, -2.0726318359375, -1.92388916015625, -1.775146484375, -1.62640380859375, -1.4776611328125, -1.32891845703125, -1.18017578125, -1.03143310546875, -0.8826904296875, -0.73394775390625, -0.585205078125, -0.43646240234375, -0.2877197265625, -0.13897705078125, 0.009765625, 0.15850830078125, 0.3072509765625, 0.45599365234375, 0.604736328125, 0.75347900390625, 0.9022216796875, 1.05096435546875, 1.19970703125, 1.34844970703125, 1.4971923828125, 1.64593505859375, 1.794677734375, 1.94342041015625, 2.0921630859375, 2.24090576171875, 2.3896484375, 2.53839111328125, 2.6871337890625, 2.83587646484375, 2.984619140625, 3.13336181640625, 3.2821044921875, 3.43084716796875, 3.57958984375, 3.72833251953125, 3.8770751953125, 4.02581787109375, 4.174560546875, 4.32330322265625, 4.4720458984375, 4.62078857421875, 4.76953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 8.0, 10.0, 20.0, 35.0, 39.0, 57.0, 78.0, 105.0, 123.0, 127.0, 111.0, 100.0, 65.0, 41.0, 39.0, 14.0, 10.0, 11.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002765655517578125, -0.00026598572731018066, -0.00025540590286254883, -0.000244826078414917, -0.00023424625396728516, -0.00022366642951965332, -0.00021308660507202148, -0.00020250678062438965, -0.0001919269561767578, -0.00018134713172912598, -0.00017076730728149414, -0.0001601874828338623, -0.00014960765838623047, -0.00013902783393859863, -0.0001284480094909668, -0.00011786818504333496, -0.00010728836059570312, -9.670853614807129e-05, -8.612871170043945e-05, -7.554888725280762e-05, -6.496906280517578e-05, -5.4389238357543945e-05, -4.380941390991211e-05, -3.3229589462280273e-05, -2.2649765014648438e-05, -1.2069940567016602e-05, -1.4901161193847656e-06, 9.08970832824707e-06, 1.9669532775878906e-05, 3.0249357223510742e-05, 4.082918167114258e-05, 5.1409006118774414e-05, 6.198883056640625e-05, 7.256865501403809e-05, 8.314847946166992e-05, 9.372830390930176e-05, 0.0001043081283569336, 0.00011488795280456543, 0.00012546777725219727, 0.0001360476016998291, 0.00014662742614746094, 0.00015720725059509277, 0.0001677870750427246, 0.00017836689949035645, 0.00018894672393798828, 0.00019952654838562012, 0.00021010637283325195, 0.0002206861972808838, 0.00023126602172851562, 0.00024184584617614746, 0.0002524256706237793, 0.00026300549507141113, 0.00027358531951904297, 0.0002841651439666748, 0.00029474496841430664, 0.0003053247928619385, 0.0003159046173095703, 0.00032648444175720215, 0.000337064266204834, 0.0003476440906524658, 0.00035822391510009766, 0.0003688037395477295, 0.00037938356399536133, 0.00038996338844299316, 0.000400543212890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 8.0, 6.0, 19.0, 28.0, 46.0, 66.0, 116.0, 235.0, 468.0, 1047.0, 2796.0, 11659.0, 149144.0, 817641.0, 54592.0, 7059.0, 2016.0, 777.0, 335.0, 184.0, 117.0, 64.0, 42.0, 24.0, 17.0, 13.0, 7.0, 5.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.46484375, -3.36395263671875, -3.2630615234375, -3.16217041015625, -3.061279296875, -2.96038818359375, -2.8594970703125, -2.75860595703125, -2.65771484375, -2.55682373046875, -2.4559326171875, -2.35504150390625, -2.254150390625, -2.15325927734375, -2.0523681640625, -1.95147705078125, -1.8505859375, -1.74969482421875, -1.6488037109375, -1.54791259765625, -1.447021484375, -1.34613037109375, -1.2452392578125, -1.14434814453125, -1.04345703125, -0.94256591796875, -0.8416748046875, -0.74078369140625, -0.639892578125, -0.53900146484375, -0.4381103515625, -0.33721923828125, -0.236328125, -0.13543701171875, -0.0345458984375, 0.06634521484375, 0.167236328125, 0.26812744140625, 0.3690185546875, 0.46990966796875, 0.57080078125, 0.67169189453125, 0.7725830078125, 0.87347412109375, 0.974365234375, 1.07525634765625, 1.1761474609375, 1.27703857421875, 1.3779296875, 1.47882080078125, 1.5797119140625, 1.68060302734375, 1.781494140625, 1.88238525390625, 1.9832763671875, 2.08416748046875, 2.18505859375, 2.28594970703125, 2.3868408203125, 2.48773193359375, 2.588623046875, 2.68951416015625, 2.7904052734375, 2.89129638671875, 2.9921875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 2.0, 14.0, 26.0, 59.0, 134.0, 209.0, 206.0, 160.0, 77.0, 37.0, 25.0, 15.0, 11.0, 8.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23046875, -6.06329345703125, -5.8961181640625, -5.72894287109375, -5.561767578125, -5.39459228515625, -5.2274169921875, -5.06024169921875, -4.89306640625, -4.72589111328125, -4.5587158203125, -4.39154052734375, -4.224365234375, -4.05718994140625, -3.8900146484375, -3.72283935546875, -3.5556640625, -3.38848876953125, -3.2213134765625, -3.05413818359375, -2.886962890625, -2.71978759765625, -2.5526123046875, -2.38543701171875, -2.21826171875, -2.05108642578125, -1.8839111328125, -1.71673583984375, -1.549560546875, -1.38238525390625, -1.2152099609375, -1.04803466796875, -0.880859375, -0.71368408203125, -0.5465087890625, -0.37933349609375, -0.212158203125, -0.04498291015625, 0.1221923828125, 0.28936767578125, 0.45654296875, 0.62371826171875, 0.7908935546875, 0.95806884765625, 1.125244140625, 1.29241943359375, 1.4595947265625, 1.62677001953125, 1.7939453125, 1.96112060546875, 2.1282958984375, 2.29547119140625, 2.462646484375, 2.62982177734375, 2.7969970703125, 2.96417236328125, 3.13134765625, 3.29852294921875, 3.4656982421875, 3.63287353515625, 3.800048828125, 3.96722412109375, 4.1343994140625, 4.30157470703125, 4.46875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 25.0, 51.0, 90.0, 165.0, 236.0, 190.0, 131.0, 59.0, 24.0, 11.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.26506805419922, -50.616703033447266, -48.96833419799805, -47.319969177246094, -45.671600341796875, -44.02323532104492, -42.37487030029297, -40.72650146484375, -39.07813262939453, -37.42976760864258, -35.78139877319336, -34.133033752441406, -32.48466491699219, -30.836299896240234, -29.18793296813965, -27.539566040039062, -25.89120101928711, -24.242834091186523, -22.594467163085938, -20.946102142333984, -19.297733306884766, -17.649368286132812, -16.001001358032227, -14.35263442993164, -12.704267501831055, -11.055900573730469, -9.407533645629883, -7.759167671203613, -6.110800743103027, -4.462433815002441, -2.814067840576172, -1.165700912475586, 0.482666015625, 2.131032705307007, 3.7793993949890137, 5.427765846252441, 7.076132774353027, 8.724499702453613, 10.372865676879883, 12.021232604980469, 13.669599533081055, 15.31796646118164, 16.966333389282227, 18.614700317382812, 20.263065338134766, 21.911434173583984, 23.559799194335938, 25.208166122436523, 26.85653305053711, 28.504899978637695, 30.15326690673828, 31.801631927490234, 33.45000076293945, 35.098365783691406, 36.746734619140625, 38.39509963989258, 40.04346466064453, 41.691829681396484, 43.3401985168457, 44.988563537597656, 46.636932373046875, 48.28529739379883, 49.93366241455078, 51.58203125, 53.23040008544922]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 3.0, 6.0, 8.0, 10.0, 15.0, 18.0, 14.0, 23.0, 26.0, 28.0, 27.0, 38.0, 34.0, 56.0, 46.0, 49.0, 62.0, 57.0, 54.0, 40.0, 63.0, 46.0, 40.0, 35.0, 29.0, 30.0, 23.0, 15.0, 24.0, 18.0, 15.0, 8.0, 7.0, 6.0, 7.0, 2.0, 5.0, 5.0, 6.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.928848266601562, -25.970550537109375, -25.012252807617188, -24.053955078125, -23.09565544128418, -22.137357711791992, -21.179059982299805, -20.220762252807617, -19.262462615966797, -18.30416488647461, -17.345867156982422, -16.387569427490234, -15.429269790649414, -14.470972061157227, -13.512674331665039, -12.554376602172852, -11.596078872680664, -10.637781143188477, -9.679482460021973, -8.721184730529785, -7.7628865242004395, -6.804588317871094, -5.846290588378906, -4.8879923820495605, -3.929694175720215, -2.971395969390869, -2.0130980014801025, -1.054800033569336, -0.09650182723999023, 0.8617963790893555, 1.820094108581543, 2.7783923149108887, 3.7366905212402344, 4.69498872756958, 5.653286933898926, 6.611584663391113, 7.569882869720459, 8.528181076049805, 9.486478805541992, 10.44477653503418, 11.403075218200684, 12.361372947692871, 13.319671630859375, 14.277969360351562, 15.23626708984375, 16.194564819335938, 17.152862548828125, 18.111162185668945, 19.069459915161133, 20.02775764465332, 20.986055374145508, 21.944355010986328, 22.902652740478516, 23.860950469970703, 24.81924819946289, 25.777545928955078, 26.735843658447266, 27.694141387939453, 28.65243911743164, 29.610736846923828, 30.56903648376465, 31.527334213256836, 32.485633850097656, 33.443931579589844, 34.40222930908203]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 21.0, 15.0, 35.0, 52.0, 102.0, 178.0, 346.0, 754.0, 1700.0, 4899.0, 19374.0, 414369.0, 3721246.0, 22344.0, 5350.0, 1835.0, 777.0, 382.0, 190.0, 101.0, 76.0, 48.0, 18.0, 21.0, 10.0, 7.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.880859375, -3.731842041015625, -3.58282470703125, -3.433807373046875, -3.2847900390625, -3.135772705078125, -2.98675537109375, -2.837738037109375, -2.688720703125, -2.539703369140625, -2.39068603515625, -2.241668701171875, -2.0926513671875, -1.943634033203125, -1.79461669921875, -1.645599365234375, -1.49658203125, -1.347564697265625, -1.19854736328125, -1.049530029296875, -0.9005126953125, -0.751495361328125, -0.60247802734375, -0.453460693359375, -0.304443359375, -0.155426025390625, -0.00640869140625, 0.142608642578125, 0.2916259765625, 0.440643310546875, 0.58966064453125, 0.738677978515625, 0.8876953125, 1.036712646484375, 1.18572998046875, 1.334747314453125, 1.4837646484375, 1.632781982421875, 1.78179931640625, 1.930816650390625, 2.079833984375, 2.228851318359375, 2.37786865234375, 2.526885986328125, 2.6759033203125, 2.824920654296875, 2.97393798828125, 3.122955322265625, 3.27197265625, 3.420989990234375, 3.57000732421875, 3.719024658203125, 3.8680419921875, 4.017059326171875, 4.16607666015625, 4.315093994140625, 4.464111328125, 4.613128662109375, 4.76214599609375, 4.911163330078125, 5.0601806640625, 5.209197998046875, 5.35821533203125, 5.507232666015625, 5.65625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 5.0, 9.0, 6.0, 13.0, 23.0, 21.0, 45.0, 55.0, 61.0, 79.0, 76.0, 107.0, 109.0, 92.0, 81.0, 48.0, 51.0, 37.0, 26.0, 18.0, 9.0, 7.0, 5.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1953125, -2.1303863525390625, -2.065460205078125, -2.0005340576171875, -1.93560791015625, -1.8706817626953125, -1.805755615234375, -1.7408294677734375, -1.6759033203125, -1.6109771728515625, -1.546051025390625, -1.4811248779296875, -1.41619873046875, -1.3512725830078125, -1.286346435546875, -1.2214202880859375, -1.156494140625, -1.0915679931640625, -1.026641845703125, -0.9617156982421875, -0.89678955078125, -0.8318634033203125, -0.766937255859375, -0.7020111083984375, -0.6370849609375, -0.5721588134765625, -0.507232666015625, -0.4423065185546875, -0.37738037109375, -0.3124542236328125, -0.247528076171875, -0.1826019287109375, -0.11767578125, -0.0527496337890625, 0.012176513671875, 0.0771026611328125, 0.14202880859375, 0.2069549560546875, 0.271881103515625, 0.3368072509765625, 0.4017333984375, 0.4666595458984375, 0.531585693359375, 0.5965118408203125, 0.66143798828125, 0.7263641357421875, 0.791290283203125, 0.8562164306640625, 0.921142578125, 0.9860687255859375, 1.050994873046875, 1.1159210205078125, 1.18084716796875, 1.2457733154296875, 1.310699462890625, 1.3756256103515625, 1.4405517578125, 1.5054779052734375, 1.570404052734375, 1.6353302001953125, 1.70025634765625, 1.7651824951171875, 1.830108642578125, 1.8950347900390625, 1.9599609375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 9.0, 6.0, 10.0, 15.0, 20.0, 14.0, 22.0, 34.0, 36.0, 42.0, 67.0, 85.0, 94.0, 165.0, 262.0, 464.0, 951.0, 2092.0, 5890.0, 23144.0, 210250.0, 3870710.0, 61558.0, 11701.0, 3515.0, 1362.0, 649.0, 355.0, 218.0, 126.0, 82.0, 62.0, 48.0, 45.0, 36.0, 27.0, 24.0, 19.0, 14.0, 14.0, 9.0, 9.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0], "bins": [-4.703125, -4.56976318359375, -4.4364013671875, -4.30303955078125, -4.169677734375, -4.03631591796875, -3.9029541015625, -3.76959228515625, -3.63623046875, -3.50286865234375, -3.3695068359375, -3.23614501953125, -3.102783203125, -2.96942138671875, -2.8360595703125, -2.70269775390625, -2.5693359375, -2.43597412109375, -2.3026123046875, -2.16925048828125, -2.035888671875, -1.90252685546875, -1.7691650390625, -1.63580322265625, -1.50244140625, -1.36907958984375, -1.2357177734375, -1.10235595703125, -0.968994140625, -0.83563232421875, -0.7022705078125, -0.56890869140625, -0.435546875, -0.30218505859375, -0.1688232421875, -0.03546142578125, 0.097900390625, 0.23126220703125, 0.3646240234375, 0.49798583984375, 0.63134765625, 0.76470947265625, 0.8980712890625, 1.03143310546875, 1.164794921875, 1.29815673828125, 1.4315185546875, 1.56488037109375, 1.6982421875, 1.83160400390625, 1.9649658203125, 2.09832763671875, 2.231689453125, 2.36505126953125, 2.4984130859375, 2.63177490234375, 2.76513671875, 2.89849853515625, 3.0318603515625, 3.16522216796875, 3.298583984375, 3.43194580078125, 3.5653076171875, 3.69866943359375, 3.83203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 7.0, 3.0, 7.0, 14.0, 28.0, 46.0, 73.0, 217.0, 3089.0, 353.0, 111.0, 43.0, 36.0, 23.0, 7.0, 8.0, 7.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7265625, -2.657684326171875, -2.58880615234375, -2.519927978515625, -2.4510498046875, -2.382171630859375, -2.31329345703125, -2.244415283203125, -2.175537109375, -2.106658935546875, -2.03778076171875, -1.968902587890625, -1.9000244140625, -1.831146240234375, -1.76226806640625, -1.693389892578125, -1.62451171875, -1.555633544921875, -1.48675537109375, -1.417877197265625, -1.3489990234375, -1.280120849609375, -1.21124267578125, -1.142364501953125, -1.073486328125, -1.004608154296875, -0.93572998046875, -0.866851806640625, -0.7979736328125, -0.729095458984375, -0.66021728515625, -0.591339111328125, -0.5224609375, -0.453582763671875, -0.38470458984375, -0.315826416015625, -0.2469482421875, -0.178070068359375, -0.10919189453125, -0.040313720703125, 0.028564453125, 0.097442626953125, 0.16632080078125, 0.235198974609375, 0.3040771484375, 0.372955322265625, 0.44183349609375, 0.510711669921875, 0.57958984375, 0.648468017578125, 0.71734619140625, 0.786224365234375, 0.8551025390625, 0.923980712890625, 0.99285888671875, 1.061737060546875, 1.130615234375, 1.199493408203125, 1.26837158203125, 1.337249755859375, 1.4061279296875, 1.475006103515625, 1.54388427734375, 1.612762451171875, 1.681640625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 18.0, 20.0, 41.0, 58.0, 81.0, 107.0, 125.0, 142.0, 124.0, 93.0, 58.0, 47.0, 31.0, 8.0, 14.0, 8.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9645280838012695, -5.739344596862793, -5.514161109924316, -5.28897762298584, -5.063794136047363, -4.838610649108887, -4.61342716217041, -4.388244152069092, -4.163060665130615, -3.9378771781921387, -3.712693691253662, -3.4875102043151855, -3.262326955795288, -3.0371434688568115, -2.811959981918335, -2.5867767333984375, -2.361593008041382, -2.1364095211029053, -1.9112261533737183, -1.6860426664352417, -1.4608592987060547, -1.2356758117675781, -1.0104923248291016, -0.7853089570999146, -0.560125470161438, -0.3349420428276062, -0.10975858569145203, 0.11542487144470215, 0.34060829877853394, 0.5657917261123657, 0.7909752130508423, 1.0161585807800293, 1.2413420677185059, 1.4665255546569824, 1.6917089223861694, 1.916892409324646, 2.142075777053833, 2.3672592639923096, 2.592442750930786, 2.8176259994506836, 3.04280948638916, 3.2679929733276367, 3.4931764602661133, 3.71835994720459, 3.9435431957244873, 4.168726921081543, 4.3939104080200195, 4.619093418121338, 4.844277381896973, 5.069460868835449, 5.294644355773926, 5.519827842712402, 5.745011329650879, 5.9701948165893555, 6.195378303527832, 6.42056131362915, 6.645744800567627, 6.8709282875061035, 7.09611177444458, 7.321295261383057, 7.546478748321533, 7.771661758422852, 7.996845245361328, 8.222028732299805, 8.447212219238281]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 6.0, 7.0, 4.0, 8.0, 12.0, 6.0, 7.0, 13.0, 21.0, 15.0, 15.0, 26.0, 24.0, 27.0, 24.0, 33.0, 50.0, 41.0, 38.0, 63.0, 29.0, 43.0, 61.0, 48.0, 34.0, 44.0, 26.0, 45.0, 40.0, 20.0, 27.0, 19.0, 21.0, 28.0, 20.0, 14.0, 7.0, 13.0, 8.0, 5.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.343759536743164, -4.226547718048096, -4.109335422515869, -3.9921233654022217, -3.874911308288574, -3.7576992511749268, -3.6404871940612793, -3.523275136947632, -3.4060630798339844, -3.288851022720337, -3.1716389656066895, -3.054426908493042, -2.9372148513793945, -2.820002794265747, -2.7027907371520996, -2.585578680038452, -2.4683666229248047, -2.3511545658111572, -2.2339425086975098, -2.1167304515838623, -1.9995183944702148, -1.8823063373565674, -1.76509428024292, -1.6478822231292725, -1.530670404434204, -1.4134583473205566, -1.2962462902069092, -1.1790342330932617, -1.0618221759796143, -0.9446101784706116, -0.8273981213569641, -0.7101860642433167, -0.5929739475250244, -0.47576189041137695, -0.3585498332977295, -0.24133780598640442, -0.12412574887275696, -0.006913721561431885, 0.11029833555221558, 0.22751039266586304, 0.3447224497795105, 0.46193450689315796, 0.5791465640068054, 0.6963585615158081, 0.8135706186294556, 0.930782675743103, 1.0479947328567505, 1.165206789970398, 1.2824188470840454, 1.3996309041976929, 1.5168429613113403, 1.6340550184249878, 1.7512670755386353, 1.8684790134429932, 1.9856910705566406, 2.102903127670288, 2.2201151847839355, 2.337327241897583, 2.4545392990112305, 2.571751356124878, 2.6889634132385254, 2.806175470352173, 2.9233875274658203, 3.0405995845794678, 3.1578116416931152]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 2.0, 18.0, 12.0, 23.0, 24.0, 50.0, 80.0, 112.0, 184.0, 351.0, 654.0, 1330.0, 3104.0, 8675.0, 29264.0, 124923.0, 461674.0, 318004.0, 71685.0, 18110.0, 5675.0, 2267.0, 1013.0, 553.0, 299.0, 161.0, 111.0, 56.0, 38.0, 28.0, 18.0, 16.0, 9.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.572265625, -3.463409423828125, -3.35455322265625, -3.245697021484375, -3.1368408203125, -3.027984619140625, -2.91912841796875, -2.810272216796875, -2.701416015625, -2.592559814453125, -2.48370361328125, -2.374847412109375, -2.2659912109375, -2.157135009765625, -2.04827880859375, -1.939422607421875, -1.83056640625, -1.721710205078125, -1.61285400390625, -1.503997802734375, -1.3951416015625, -1.286285400390625, -1.17742919921875, -1.068572998046875, -0.959716796875, -0.850860595703125, -0.74200439453125, -0.633148193359375, -0.5242919921875, -0.415435791015625, -0.30657958984375, -0.197723388671875, -0.0888671875, 0.019989013671875, 0.12884521484375, 0.237701416015625, 0.3465576171875, 0.455413818359375, 0.56427001953125, 0.673126220703125, 0.781982421875, 0.890838623046875, 0.99969482421875, 1.108551025390625, 1.2174072265625, 1.326263427734375, 1.43511962890625, 1.543975830078125, 1.65283203125, 1.761688232421875, 1.87054443359375, 1.979400634765625, 2.0882568359375, 2.197113037109375, 2.30596923828125, 2.414825439453125, 2.523681640625, 2.632537841796875, 2.74139404296875, 2.850250244140625, 2.9591064453125, 3.067962646484375, 3.17681884765625, 3.285675048828125, 3.39453125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 8.0, 6.0, 11.0, 13.0, 20.0, 24.0, 26.0, 40.0, 42.0, 62.0, 57.0, 69.0, 100.0, 89.0, 90.0, 84.0, 64.0, 45.0, 37.0, 27.0, 25.0, 11.0, 13.0, 14.0, 7.0, 5.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.98046875, -1.9203338623046875, -1.860198974609375, -1.8000640869140625, -1.73992919921875, -1.6797943115234375, -1.619659423828125, -1.5595245361328125, -1.4993896484375, -1.4392547607421875, -1.379119873046875, -1.3189849853515625, -1.25885009765625, -1.1987152099609375, -1.138580322265625, -1.0784454345703125, -1.018310546875, -0.9581756591796875, -0.898040771484375, -0.8379058837890625, -0.77777099609375, -0.7176361083984375, -0.657501220703125, -0.5973663330078125, -0.5372314453125, -0.4770965576171875, -0.416961669921875, -0.3568267822265625, -0.29669189453125, -0.2365570068359375, -0.176422119140625, -0.1162872314453125, -0.05615234375, 0.0039825439453125, 0.064117431640625, 0.1242523193359375, 0.18438720703125, 0.2445220947265625, 0.304656982421875, 0.3647918701171875, 0.4249267578125, 0.4850616455078125, 0.545196533203125, 0.6053314208984375, 0.66546630859375, 0.7256011962890625, 0.785736083984375, 0.8458709716796875, 0.906005859375, 0.9661407470703125, 1.026275634765625, 1.0864105224609375, 1.14654541015625, 1.2066802978515625, 1.266815185546875, 1.3269500732421875, 1.3870849609375, 1.4472198486328125, 1.507354736328125, 1.5674896240234375, 1.62762451171875, 1.6877593994140625, 1.747894287109375, 1.8080291748046875, 1.8681640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 8.0, 18.0, 23.0, 37.0, 82.0, 139.0, 277.0, 675.0, 1777.0, 7925.0, 88881.0, 833987.0, 103070.0, 8467.0, 1885.0, 656.0, 306.0, 128.0, 90.0, 43.0, 22.0, 16.0, 8.0, 7.0, 2.0, 10.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.61328125, -7.38616943359375, -7.1590576171875, -6.93194580078125, -6.704833984375, -6.47772216796875, -6.2506103515625, -6.02349853515625, -5.79638671875, -5.56927490234375, -5.3421630859375, -5.11505126953125, -4.887939453125, -4.66082763671875, -4.4337158203125, -4.20660400390625, -3.9794921875, -3.75238037109375, -3.5252685546875, -3.29815673828125, -3.071044921875, -2.84393310546875, -2.6168212890625, -2.38970947265625, -2.16259765625, -1.93548583984375, -1.7083740234375, -1.48126220703125, -1.254150390625, -1.02703857421875, -0.7999267578125, -0.57281494140625, -0.345703125, -0.11859130859375, 0.1085205078125, 0.33563232421875, 0.562744140625, 0.78985595703125, 1.0169677734375, 1.24407958984375, 1.47119140625, 1.69830322265625, 1.9254150390625, 2.15252685546875, 2.379638671875, 2.60675048828125, 2.8338623046875, 3.06097412109375, 3.2880859375, 3.51519775390625, 3.7423095703125, 3.96942138671875, 4.196533203125, 4.42364501953125, 4.6507568359375, 4.87786865234375, 5.10498046875, 5.33209228515625, 5.5592041015625, 5.78631591796875, 6.013427734375, 6.24053955078125, 6.4676513671875, 6.69476318359375, 6.921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 8.0, 11.0, 10.0, 16.0, 20.0, 23.0, 23.0, 38.0, 43.0, 35.0, 45.0, 46.0, 58.0, 54.0, 53.0, 51.0, 63.0, 50.0, 58.0, 45.0, 48.0, 36.0, 30.0, 19.0, 25.0, 15.0, 14.0, 23.0, 5.0, 3.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.84375, -6.646240234375, -6.44873046875, -6.251220703125, -6.0537109375, -5.856201171875, -5.65869140625, -5.461181640625, -5.263671875, -5.066162109375, -4.86865234375, -4.671142578125, -4.4736328125, -4.276123046875, -4.07861328125, -3.881103515625, -3.68359375, -3.486083984375, -3.28857421875, -3.091064453125, -2.8935546875, -2.696044921875, -2.49853515625, -2.301025390625, -2.103515625, -1.906005859375, -1.70849609375, -1.510986328125, -1.3134765625, -1.115966796875, -0.91845703125, -0.720947265625, -0.5234375, -0.325927734375, -0.12841796875, 0.069091796875, 0.2666015625, 0.464111328125, 0.66162109375, 0.859130859375, 1.056640625, 1.254150390625, 1.45166015625, 1.649169921875, 1.8466796875, 2.044189453125, 2.24169921875, 2.439208984375, 2.63671875, 2.834228515625, 3.03173828125, 3.229248046875, 3.4267578125, 3.624267578125, 3.82177734375, 4.019287109375, 4.216796875, 4.414306640625, 4.61181640625, 4.809326171875, 5.0068359375, 5.204345703125, 5.40185546875, 5.599365234375, 5.796875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 9.0, 8.0, 17.0, 31.0, 38.0, 76.0, 191.0, 492.0, 1451.0, 7165.0, 103338.0, 877077.0, 51728.0, 4975.0, 1194.0, 393.0, 180.0, 74.0, 39.0, 30.0, 12.0, 8.0, 7.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.50390625, -3.41497802734375, -3.3260498046875, -3.23712158203125, -3.148193359375, -3.05926513671875, -2.9703369140625, -2.88140869140625, -2.79248046875, -2.70355224609375, -2.6146240234375, -2.52569580078125, -2.436767578125, -2.34783935546875, -2.2589111328125, -2.16998291015625, -2.0810546875, -1.99212646484375, -1.9031982421875, -1.81427001953125, -1.725341796875, -1.63641357421875, -1.5474853515625, -1.45855712890625, -1.36962890625, -1.28070068359375, -1.1917724609375, -1.10284423828125, -1.013916015625, -0.92498779296875, -0.8360595703125, -0.74713134765625, -0.658203125, -0.56927490234375, -0.4803466796875, -0.39141845703125, -0.302490234375, -0.21356201171875, -0.1246337890625, -0.03570556640625, 0.05322265625, 0.14215087890625, 0.2310791015625, 0.32000732421875, 0.408935546875, 0.49786376953125, 0.5867919921875, 0.67572021484375, 0.7646484375, 0.85357666015625, 0.9425048828125, 1.03143310546875, 1.120361328125, 1.20928955078125, 1.2982177734375, 1.38714599609375, 1.47607421875, 1.56500244140625, 1.6539306640625, 1.74285888671875, 1.831787109375, 1.92071533203125, 2.0096435546875, 2.09857177734375, 2.1875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 4.0, 4.0, 6.0, 9.0, 10.0, 12.0, 28.0, 40.0, 57.0, 97.0, 147.0, 164.0, 151.0, 86.0, 71.0, 35.0, 29.0, 18.0, 12.0, 10.0, 2.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004734992980957031, -0.00046154484152793884, -0.00044959038496017456, -0.0004376359283924103, -0.000425681471824646, -0.0004137270152568817, -0.00040177255868911743, -0.00038981810212135315, -0.00037786364555358887, -0.0003659091889858246, -0.0003539547324180603, -0.000342000275850296, -0.00033004581928253174, -0.00031809136271476746, -0.0003061369061470032, -0.0002941824495792389, -0.0002822279930114746, -0.00027027353644371033, -0.00025831907987594604, -0.00024636462330818176, -0.00023441016674041748, -0.0002224557101726532, -0.00021050125360488892, -0.00019854679703712463, -0.00018659234046936035, -0.00017463788390159607, -0.0001626834273338318, -0.0001507289707660675, -0.00013877451419830322, -0.00012682005763053894, -0.00011486560106277466, -0.00010291114449501038, -9.09566879272461e-05, -7.900223135948181e-05, -6.704777479171753e-05, -5.509331822395325e-05, -4.3138861656188965e-05, -3.118440508842468e-05, -1.92299485206604e-05, -7.275491952896118e-06, 4.678964614868164e-06, 1.6633421182632446e-05, 2.858787775039673e-05, 4.054233431816101e-05, 5.249679088592529e-05, 6.445124745368958e-05, 7.640570402145386e-05, 8.836016058921814e-05, 0.00010031461715698242, 0.0001122690737247467, 0.00012422353029251099, 0.00013617798686027527, 0.00014813244342803955, 0.00016008689999580383, 0.00017204135656356812, 0.0001839958131313324, 0.00019595026969909668, 0.00020790472626686096, 0.00021985918283462524, 0.00023181363940238953, 0.0002437680959701538, 0.0002557225525379181, 0.0002676770091056824, 0.00027963146567344666, 0.00029158592224121094]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 11.0, 19.0, 23.0, 29.0, 45.0, 77.0, 108.0, 237.0, 479.0, 1252.0, 4024.0, 22143.0, 438541.0, 548688.0, 26084.0, 4441.0, 1297.0, 487.0, 232.0, 110.0, 88.0, 50.0, 22.0, 26.0, 12.0, 8.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.638671875, -2.55364990234375, -2.4686279296875, -2.38360595703125, -2.298583984375, -2.21356201171875, -2.1285400390625, -2.04351806640625, -1.95849609375, -1.87347412109375, -1.7884521484375, -1.70343017578125, -1.618408203125, -1.53338623046875, -1.4483642578125, -1.36334228515625, -1.2783203125, -1.19329833984375, -1.1082763671875, -1.02325439453125, -0.938232421875, -0.85321044921875, -0.7681884765625, -0.68316650390625, -0.59814453125, -0.51312255859375, -0.4281005859375, -0.34307861328125, -0.258056640625, -0.17303466796875, -0.0880126953125, -0.00299072265625, 0.08203125, 0.16705322265625, 0.2520751953125, 0.33709716796875, 0.422119140625, 0.50714111328125, 0.5921630859375, 0.67718505859375, 0.76220703125, 0.84722900390625, 0.9322509765625, 1.01727294921875, 1.102294921875, 1.18731689453125, 1.2723388671875, 1.35736083984375, 1.4423828125, 1.52740478515625, 1.6124267578125, 1.69744873046875, 1.782470703125, 1.86749267578125, 1.9525146484375, 2.03753662109375, 2.12255859375, 2.20758056640625, 2.2926025390625, 2.37762451171875, 2.462646484375, 2.54766845703125, 2.6326904296875, 2.71771240234375, 2.802734375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 1.0, 8.0, 7.0, 12.0, 17.0, 24.0, 36.0, 52.0, 80.0, 80.0, 98.0, 98.0, 114.0, 88.0, 86.0, 58.0, 43.0, 25.0, 19.0, 12.0, 10.0, 10.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9140625, -1.8450927734375, -1.776123046875, -1.7071533203125, -1.63818359375, -1.5692138671875, -1.500244140625, -1.4312744140625, -1.3623046875, -1.2933349609375, -1.224365234375, -1.1553955078125, -1.08642578125, -1.0174560546875, -0.948486328125, -0.8795166015625, -0.810546875, -0.7415771484375, -0.672607421875, -0.6036376953125, -0.53466796875, -0.4656982421875, -0.396728515625, -0.3277587890625, -0.2587890625, -0.1898193359375, -0.120849609375, -0.0518798828125, 0.01708984375, 0.0860595703125, 0.155029296875, 0.2239990234375, 0.29296875, 0.3619384765625, 0.430908203125, 0.4998779296875, 0.56884765625, 0.6378173828125, 0.706787109375, 0.7757568359375, 0.8447265625, 0.9136962890625, 0.982666015625, 1.0516357421875, 1.12060546875, 1.1895751953125, 1.258544921875, 1.3275146484375, 1.396484375, 1.4654541015625, 1.534423828125, 1.6033935546875, 1.67236328125, 1.7413330078125, 1.810302734375, 1.8792724609375, 1.9482421875, 2.0172119140625, 2.086181640625, 2.1551513671875, 2.22412109375, 2.2930908203125, 2.362060546875, 2.4310302734375, 2.5]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 17.0, 82.0, 165.0, 301.0, 272.0, 110.0, 32.0, 11.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.89868927001953, -37.39041519165039, -34.882137298583984, -32.373863220214844, -29.865589141845703, -27.35731315612793, -24.849037170410156, -22.340763092041016, -19.832487106323242, -17.32421112060547, -14.815937042236328, -12.307661056518555, -9.799386024475098, -7.291110992431641, -4.782835006713867, -2.2745609283447266, 0.23371505737304688, 2.741990327835083, 5.250265598297119, 7.758541107177734, 10.266816139221191, 12.775091171264648, 15.283367156982422, 17.791641235351562, 20.299917221069336, 22.80819320678711, 25.31646728515625, 27.824743270874023, 30.333019256591797, 32.84129333496094, 35.349571228027344, 37.85784149169922, 40.366119384765625, 42.874393463134766, 45.38267135620117, 47.89094543457031, 50.39921951293945, 52.907493591308594, 55.415771484375, 57.92404556274414, 60.43231964111328, 62.94059371948242, 65.44886779785156, 67.95714569091797, 70.46542358398438, 72.97369384765625, 75.48197174072266, 77.99024963378906, 80.49851989746094, 83.00679779052734, 85.51506805419922, 88.02334594726562, 90.53162384033203, 93.0398941040039, 95.54817199707031, 98.05644226074219, 100.56472778320312, 103.07300567626953, 105.5812759399414, 108.08955383300781, 110.59783172607422, 113.1061019897461, 115.6143798828125, 118.12265014648438, 120.63092803955078]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 4.0, 7.0, 7.0, 11.0, 9.0, 19.0, 15.0, 27.0, 23.0, 37.0, 40.0, 34.0, 47.0, 53.0, 51.0, 72.0, 58.0, 66.0, 54.0, 58.0, 45.0, 55.0, 27.0, 32.0, 26.0, 24.0, 20.0, 18.0, 23.0, 8.0, 7.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.68877601623535, -25.729816436767578, -24.770858764648438, -23.811899185180664, -22.852941513061523, -21.89398193359375, -20.93502426147461, -19.976064682006836, -19.017105102539062, -18.05814552307129, -17.09918785095215, -16.140228271484375, -15.181270599365234, -14.222311019897461, -13.263352394104004, -12.304393768310547, -11.345436096191406, -10.38647747039795, -9.427518844604492, -8.468559265136719, -7.50960111618042, -6.550642490386963, -5.591683387756348, -4.632724761962891, -3.6737661361694336, -2.7148075103759766, -1.7558486461639404, -0.7968897819519043, 0.16206884384155273, 1.1210274696350098, 2.079986572265625, 3.038945198059082, 3.997905731201172, 4.956864356994629, 5.915822982788086, 6.874782085418701, 7.833740711212158, 8.792699813842773, 9.75165843963623, 10.710617065429688, 11.669575691223145, 12.628534317016602, 13.587492942810059, 14.546451568603516, 15.505411148071289, 16.46436882019043, 17.423328399658203, 18.382286071777344, 19.341245651245117, 20.30020523071289, 21.25916290283203, 22.218122482299805, 23.177080154418945, 24.13603973388672, 25.09499740600586, 26.053956985473633, 27.012916564941406, 27.97187614440918, 28.93083381652832, 29.889793395996094, 30.848751068115234, 31.807710647583008, 32.76667022705078, 33.72562789916992, 34.68458557128906]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 4.0, 16.0, 14.0, 15.0, 18.0, 33.0, 67.0, 116.0, 222.0, 504.0, 1426.0, 5244.0, 28500.0, 556943.0, 3520643.0, 67446.0, 9475.0, 2124.0, 756.0, 300.0, 153.0, 85.0, 51.0, 36.0, 16.0, 15.0, 14.0, 10.0, 7.0, 6.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.814453125, -3.668853759765625, -3.52325439453125, -3.377655029296875, -3.2320556640625, -3.086456298828125, -2.94085693359375, -2.795257568359375, -2.649658203125, -2.504058837890625, -2.35845947265625, -2.212860107421875, -2.0672607421875, -1.921661376953125, -1.77606201171875, -1.630462646484375, -1.48486328125, -1.339263916015625, -1.19366455078125, -1.048065185546875, -0.9024658203125, -0.756866455078125, -0.61126708984375, -0.465667724609375, -0.320068359375, -0.174468994140625, -0.02886962890625, 0.116729736328125, 0.2623291015625, 0.407928466796875, 0.55352783203125, 0.699127197265625, 0.8447265625, 0.990325927734375, 1.13592529296875, 1.281524658203125, 1.4271240234375, 1.572723388671875, 1.71832275390625, 1.863922119140625, 2.009521484375, 2.155120849609375, 2.30072021484375, 2.446319580078125, 2.5919189453125, 2.737518310546875, 2.88311767578125, 3.028717041015625, 3.17431640625, 3.319915771484375, 3.46551513671875, 3.611114501953125, 3.7567138671875, 3.902313232421875, 4.04791259765625, 4.193511962890625, 4.339111328125, 4.484710693359375, 4.63031005859375, 4.775909423828125, 4.9215087890625, 5.067108154296875, 5.21270751953125, 5.358306884765625, 5.50390625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 6.0, 7.0, 8.0, 8.0, 13.0, 13.0, 15.0, 22.0, 30.0, 32.0, 45.0, 42.0, 51.0, 56.0, 69.0, 68.0, 80.0, 76.0, 65.0, 47.0, 53.0, 43.0, 29.0, 31.0, 25.0, 17.0, 13.0, 8.0, 10.0, 5.0, 5.0, 3.0, 4.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1005859375, -1.0566558837890625, -1.012725830078125, -0.9687957763671875, -0.92486572265625, -0.8809356689453125, -0.837005615234375, -0.7930755615234375, -0.7491455078125, -0.7052154541015625, -0.661285400390625, -0.6173553466796875, -0.57342529296875, -0.5294952392578125, -0.485565185546875, -0.4416351318359375, -0.397705078125, -0.3537750244140625, -0.309844970703125, -0.2659149169921875, -0.22198486328125, -0.1780548095703125, -0.134124755859375, -0.0901947021484375, -0.0462646484375, -0.0023345947265625, 0.041595458984375, 0.0855255126953125, 0.12945556640625, 0.1733856201171875, 0.217315673828125, 0.2612457275390625, 0.30517578125, 0.3491058349609375, 0.393035888671875, 0.4369659423828125, 0.48089599609375, 0.5248260498046875, 0.568756103515625, 0.6126861572265625, 0.6566162109375, 0.7005462646484375, 0.744476318359375, 0.7884063720703125, 0.83233642578125, 0.8762664794921875, 0.920196533203125, 0.9641265869140625, 1.008056640625, 1.0519866943359375, 1.095916748046875, 1.1398468017578125, 1.18377685546875, 1.2277069091796875, 1.271636962890625, 1.3155670166015625, 1.3594970703125, 1.4034271240234375, 1.447357177734375, 1.4912872314453125, 1.53521728515625, 1.5791473388671875, 1.623077392578125, 1.6670074462890625, 1.7109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 9.0, 9.0, 10.0, 16.0, 31.0, 47.0, 114.0, 291.0, 976.0, 4258.0, 26682.0, 964094.0, 3153813.0, 37168.0, 5066.0, 1124.0, 302.0, 112.0, 54.0, 18.0, 13.0, 16.0, 6.0, 13.0, 6.0, 4.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.23828125, -6.03759765625, -5.8369140625, -5.63623046875, -5.435546875, -5.23486328125, -5.0341796875, -4.83349609375, -4.6328125, -4.43212890625, -4.2314453125, -4.03076171875, -3.830078125, -3.62939453125, -3.4287109375, -3.22802734375, -3.02734375, -2.82666015625, -2.6259765625, -2.42529296875, -2.224609375, -2.02392578125, -1.8232421875, -1.62255859375, -1.421875, -1.22119140625, -1.0205078125, -0.81982421875, -0.619140625, -0.41845703125, -0.2177734375, -0.01708984375, 0.18359375, 0.38427734375, 0.5849609375, 0.78564453125, 0.986328125, 1.18701171875, 1.3876953125, 1.58837890625, 1.7890625, 1.98974609375, 2.1904296875, 2.39111328125, 2.591796875, 2.79248046875, 2.9931640625, 3.19384765625, 3.39453125, 3.59521484375, 3.7958984375, 3.99658203125, 4.197265625, 4.39794921875, 4.5986328125, 4.79931640625, 5.0, 5.20068359375, 5.4013671875, 5.60205078125, 5.802734375, 6.00341796875, 6.2041015625, 6.40478515625, 6.60546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 8.0, 5.0, 4.0, 6.0, 6.0, 9.0, 12.0, 21.0, 14.0, 23.0, 43.0, 67.0, 101.0, 185.0, 396.0, 872.0, 1148.0, 566.0, 247.0, 129.0, 78.0, 37.0, 19.0, 23.0, 15.0, 8.0, 4.0, 1.0, 4.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.76171875, -3.644805908203125, -3.52789306640625, -3.410980224609375, -3.2940673828125, -3.177154541015625, -3.06024169921875, -2.943328857421875, -2.826416015625, -2.709503173828125, -2.59259033203125, -2.475677490234375, -2.3587646484375, -2.241851806640625, -2.12493896484375, -2.008026123046875, -1.89111328125, -1.774200439453125, -1.65728759765625, -1.540374755859375, -1.4234619140625, -1.306549072265625, -1.18963623046875, -1.072723388671875, -0.955810546875, -0.838897705078125, -0.72198486328125, -0.605072021484375, -0.4881591796875, -0.371246337890625, -0.25433349609375, -0.137420654296875, -0.0205078125, 0.096405029296875, 0.21331787109375, 0.330230712890625, 0.4471435546875, 0.564056396484375, 0.68096923828125, 0.797882080078125, 0.914794921875, 1.031707763671875, 1.14862060546875, 1.265533447265625, 1.3824462890625, 1.499359130859375, 1.61627197265625, 1.733184814453125, 1.85009765625, 1.967010498046875, 2.08392333984375, 2.200836181640625, 2.3177490234375, 2.434661865234375, 2.55157470703125, 2.668487548828125, 2.785400390625, 2.902313232421875, 3.01922607421875, 3.136138916015625, 3.2530517578125, 3.369964599609375, 3.48687744140625, 3.603790283203125, 3.720703125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 20.0, 77.0, 228.0, 360.0, 232.0, 58.0, 16.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0], "bins": [-125.49991607666016, -123.19523620605469, -120.89055633544922, -118.58587646484375, -116.28119659423828, -113.97651672363281, -111.67183685302734, -109.36715698242188, -107.0624771118164, -104.75779724121094, -102.45311737060547, -100.1484375, -97.84375762939453, -95.53907775878906, -93.2343978881836, -90.92971801757812, -88.62503051757812, -86.32035064697266, -84.01567077636719, -81.71099090576172, -79.40631103515625, -77.10163116455078, -74.79695129394531, -72.49227142333984, -70.18759155273438, -67.8829116821289, -65.57823181152344, -63.27355194091797, -60.9688720703125, -58.66419219970703, -56.35951232910156, -54.054832458496094, -51.750152587890625, -49.445472717285156, -47.14079284667969, -44.83611297607422, -42.53143310546875, -40.22675323486328, -37.92207336425781, -35.617393493652344, -33.31270980834961, -31.00802993774414, -28.703350067138672, -26.398670196533203, -24.093990325927734, -21.789310455322266, -19.484628677368164, -17.179948806762695, -14.875268936157227, -12.570589065551758, -10.265909194946289, -7.961228370666504, -5.656548500061035, -3.3518686294555664, -1.0471878051757812, 1.2574920654296875, 3.5621719360351562, 5.866851806640625, 8.171531677246094, 10.476212501525879, 12.780892372131348, 15.085572242736816, 17.3902530670166, 19.69493293762207, 21.99961280822754]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 7.0, 5.0, 9.0, 12.0, 22.0, 25.0, 34.0, 38.0, 34.0, 35.0, 52.0, 59.0, 55.0, 58.0, 61.0, 58.0, 46.0, 59.0, 61.0, 56.0, 38.0, 33.0, 25.0, 29.0, 11.0, 21.0, 20.0, 8.0, 12.0, 5.0, 6.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.92122459411621, -19.30014991760254, -18.6790771484375, -18.058002471923828, -17.43692970275879, -16.815855026245117, -16.194782257080078, -15.573707580566406, -14.95263385772705, -14.331560134887695, -13.71048641204834, -13.089412689208984, -12.468338012695312, -11.847265243530273, -11.226190567016602, -10.605116844177246, -9.98404312133789, -9.362969398498535, -8.74189567565918, -8.120821952819824, -7.4997477531433105, -6.878674030303955, -6.257599830627441, -5.636526107788086, -5.0154523849487305, -4.394378662109375, -3.7733047008514404, -3.152230739593506, -2.5311570167541504, -1.910083293914795, -1.2890093326568604, -0.6679353713989258, -0.04686164855957031, 0.5742121934890747, 1.1952860355377197, 1.8163598775863647, 2.4374337196350098, 3.0585074424743652, 3.6795814037323, 4.300655364990234, 4.92172908782959, 5.542802810668945, 6.163876533508301, 6.7849507331848145, 7.40602445602417, 8.027097702026367, 8.648172378540039, 9.269246101379395, 9.89031982421875, 10.511393547058105, 11.132467269897461, 11.753540992736816, 12.374614715576172, 12.995689392089844, 13.6167631149292, 14.237836837768555, 14.85891056060791, 15.479984283447266, 16.101058959960938, 16.722131729125977, 17.34320640563965, 17.964279174804688, 18.58535385131836, 19.20642852783203, 19.82750129699707]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 6.0, 6.0, 12.0, 10.0, 25.0, 35.0, 52.0, 88.0, 97.0, 162.0, 247.0, 434.0, 681.0, 1156.0, 1945.0, 3230.0, 6117.0, 11308.0, 20981.0, 39857.0, 77925.0, 148075.0, 241422.0, 223828.0, 129024.0, 66547.0, 34520.0, 18096.0, 10016.0, 5200.0, 2935.0, 1767.0, 1026.0, 613.0, 388.0, 224.0, 160.0, 110.0, 62.0, 47.0, 32.0, 17.0, 23.0, 14.0, 15.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-1.6337890625, -1.5869598388671875, -1.540130615234375, -1.4933013916015625, -1.44647216796875, -1.3996429443359375, -1.352813720703125, -1.3059844970703125, -1.2591552734375, -1.2123260498046875, -1.165496826171875, -1.1186676025390625, -1.07183837890625, -1.0250091552734375, -0.978179931640625, -0.9313507080078125, -0.884521484375, -0.8376922607421875, -0.790863037109375, -0.7440338134765625, -0.69720458984375, -0.6503753662109375, -0.603546142578125, -0.5567169189453125, -0.5098876953125, -0.4630584716796875, -0.416229248046875, -0.3694000244140625, -0.32257080078125, -0.2757415771484375, -0.228912353515625, -0.1820831298828125, -0.13525390625, -0.0884246826171875, -0.041595458984375, 0.0052337646484375, 0.05206298828125, 0.0988922119140625, 0.145721435546875, 0.1925506591796875, 0.2393798828125, 0.2862091064453125, 0.333038330078125, 0.3798675537109375, 0.42669677734375, 0.4735260009765625, 0.520355224609375, 0.5671844482421875, 0.614013671875, 0.6608428955078125, 0.707672119140625, 0.7545013427734375, 0.80133056640625, 0.8481597900390625, 0.894989013671875, 0.9418182373046875, 0.9886474609375, 1.0354766845703125, 1.082305908203125, 1.1291351318359375, 1.17596435546875, 1.2227935791015625, 1.269622802734375, 1.3164520263671875, 1.36328125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 5.0, 4.0, 8.0, 6.0, 13.0, 16.0, 12.0, 8.0, 11.0, 20.0, 30.0, 25.0, 30.0, 24.0, 32.0, 38.0, 37.0, 42.0, 54.0, 52.0, 54.0, 53.0, 58.0, 44.0, 51.0, 31.0, 31.0, 33.0, 22.0, 20.0, 22.0, 24.0, 14.0, 17.0, 8.0, 10.0, 7.0, 8.0, 9.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.962890625, -0.931243896484375, -0.89959716796875, -0.867950439453125, -0.8363037109375, -0.804656982421875, -0.77301025390625, -0.741363525390625, -0.709716796875, -0.678070068359375, -0.64642333984375, -0.614776611328125, -0.5831298828125, -0.551483154296875, -0.51983642578125, -0.488189697265625, -0.45654296875, -0.424896240234375, -0.39324951171875, -0.361602783203125, -0.3299560546875, -0.298309326171875, -0.26666259765625, -0.235015869140625, -0.203369140625, -0.171722412109375, -0.14007568359375, -0.108428955078125, -0.0767822265625, -0.045135498046875, -0.01348876953125, 0.018157958984375, 0.0498046875, 0.081451416015625, 0.11309814453125, 0.144744873046875, 0.1763916015625, 0.208038330078125, 0.23968505859375, 0.271331787109375, 0.302978515625, 0.334625244140625, 0.36627197265625, 0.397918701171875, 0.4295654296875, 0.461212158203125, 0.49285888671875, 0.524505615234375, 0.55615234375, 0.587799072265625, 0.61944580078125, 0.651092529296875, 0.6827392578125, 0.714385986328125, 0.74603271484375, 0.777679443359375, 0.809326171875, 0.840972900390625, 0.87261962890625, 0.904266357421875, 0.9359130859375, 0.967559814453125, 0.99920654296875, 1.030853271484375, 1.0625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 12.0, 14.0, 23.0, 20.0, 37.0, 71.0, 135.0, 247.0, 474.0, 960.0, 2461.0, 11111.0, 130822.0, 808439.0, 81736.0, 8131.0, 2115.0, 818.0, 372.0, 230.0, 123.0, 88.0, 41.0, 25.0, 15.0, 11.0, 9.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.99609375, -7.80303955078125, -7.6099853515625, -7.41693115234375, -7.223876953125, -7.03082275390625, -6.8377685546875, -6.64471435546875, -6.45166015625, -6.25860595703125, -6.0655517578125, -5.87249755859375, -5.679443359375, -5.48638916015625, -5.2933349609375, -5.10028076171875, -4.9072265625, -4.71417236328125, -4.5211181640625, -4.32806396484375, -4.135009765625, -3.94195556640625, -3.7489013671875, -3.55584716796875, -3.36279296875, -3.16973876953125, -2.9766845703125, -2.78363037109375, -2.590576171875, -2.39752197265625, -2.2044677734375, -2.01141357421875, -1.818359375, -1.62530517578125, -1.4322509765625, -1.23919677734375, -1.046142578125, -0.85308837890625, -0.6600341796875, -0.46697998046875, -0.27392578125, -0.08087158203125, 0.1121826171875, 0.30523681640625, 0.498291015625, 0.69134521484375, 0.8843994140625, 1.07745361328125, 1.2705078125, 1.46356201171875, 1.6566162109375, 1.84967041015625, 2.042724609375, 2.23577880859375, 2.4288330078125, 2.62188720703125, 2.81494140625, 3.00799560546875, 3.2010498046875, 3.39410400390625, 3.587158203125, 3.78021240234375, 3.9732666015625, 4.16632080078125, 4.359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 3.0, 8.0, 8.0, 12.0, 14.0, 26.0, 16.0, 22.0, 28.0, 25.0, 38.0, 38.0, 34.0, 48.0, 40.0, 46.0, 45.0, 53.0, 41.0, 48.0, 42.0, 49.0, 44.0, 37.0, 31.0, 34.0, 28.0, 17.0, 18.0, 18.0, 23.0, 12.0, 14.0, 6.0, 7.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.64453125, -5.49493408203125, -5.3453369140625, -5.19573974609375, -5.046142578125, -4.89654541015625, -4.7469482421875, -4.59735107421875, -4.44775390625, -4.29815673828125, -4.1485595703125, -3.99896240234375, -3.849365234375, -3.69976806640625, -3.5501708984375, -3.40057373046875, -3.2509765625, -3.10137939453125, -2.9517822265625, -2.80218505859375, -2.652587890625, -2.50299072265625, -2.3533935546875, -2.20379638671875, -2.05419921875, -1.90460205078125, -1.7550048828125, -1.60540771484375, -1.455810546875, -1.30621337890625, -1.1566162109375, -1.00701904296875, -0.857421875, -0.70782470703125, -0.5582275390625, -0.40863037109375, -0.259033203125, -0.10943603515625, 0.0401611328125, 0.18975830078125, 0.33935546875, 0.48895263671875, 0.6385498046875, 0.78814697265625, 0.937744140625, 1.08734130859375, 1.2369384765625, 1.38653564453125, 1.5361328125, 1.68572998046875, 1.8353271484375, 1.98492431640625, 2.134521484375, 2.28411865234375, 2.4337158203125, 2.58331298828125, 2.73291015625, 2.88250732421875, 3.0321044921875, 3.18170166015625, 3.331298828125, 3.48089599609375, 3.6304931640625, 3.78009033203125, 3.9296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 7.0, 7.0, 22.0, 29.0, 79.0, 160.0, 326.0, 953.0, 4037.0, 43929.0, 894425.0, 96262.0, 6313.0, 1239.0, 409.0, 161.0, 81.0, 35.0, 27.0, 11.0, 7.0, 9.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.609375, -2.50335693359375, -2.3973388671875, -2.29132080078125, -2.185302734375, -2.07928466796875, -1.9732666015625, -1.86724853515625, -1.76123046875, -1.65521240234375, -1.5491943359375, -1.44317626953125, -1.337158203125, -1.23114013671875, -1.1251220703125, -1.01910400390625, -0.9130859375, -0.80706787109375, -0.7010498046875, -0.59503173828125, -0.489013671875, -0.38299560546875, -0.2769775390625, -0.17095947265625, -0.06494140625, 0.04107666015625, 0.1470947265625, 0.25311279296875, 0.359130859375, 0.46514892578125, 0.5711669921875, 0.67718505859375, 0.783203125, 0.88922119140625, 0.9952392578125, 1.10125732421875, 1.207275390625, 1.31329345703125, 1.4193115234375, 1.52532958984375, 1.63134765625, 1.73736572265625, 1.8433837890625, 1.94940185546875, 2.055419921875, 2.16143798828125, 2.2674560546875, 2.37347412109375, 2.4794921875, 2.58551025390625, 2.6915283203125, 2.79754638671875, 2.903564453125, 3.00958251953125, 3.1156005859375, 3.22161865234375, 3.32763671875, 3.43365478515625, 3.5396728515625, 3.64569091796875, 3.751708984375, 3.85772705078125, 3.9637451171875, 4.06976318359375, 4.17578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 2.0, 9.0, 11.0, 11.0, 13.0, 21.0, 22.0, 36.0, 45.0, 54.0, 87.0, 90.0, 104.0, 90.0, 76.0, 68.0, 59.0, 45.0, 34.0, 34.0, 19.0, 20.0, 7.0, 11.0, 9.0, 5.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002923011779785156, -0.000282827764749527, -0.00027335435152053833, -0.0002638809382915497, -0.00025440752506256104, -0.0002449341118335724, -0.00023546069860458374, -0.0002259872853755951, -0.00021651387214660645, -0.0002070404589176178, -0.00019756704568862915, -0.0001880936324596405, -0.00017862021923065186, -0.0001691468060016632, -0.00015967339277267456, -0.0001501999795436859, -0.00014072656631469727, -0.00013125315308570862, -0.00012177973985671997, -0.00011230632662773132, -0.00010283291339874268, -9.335950016975403e-05, -8.388608694076538e-05, -7.441267371177673e-05, -6.493926048278809e-05, -5.546584725379944e-05, -4.599243402481079e-05, -3.6519020795822144e-05, -2.7045607566833496e-05, -1.757219433784485e-05, -8.098781108856201e-06, 1.3746321201324463e-06, 1.0848045349121094e-05, 2.032145857810974e-05, 2.979487180709839e-05, 3.9268285036087036e-05, 4.8741698265075684e-05, 5.821511149406433e-05, 6.768852472305298e-05, 7.716193795204163e-05, 8.663535118103027e-05, 9.610876441001892e-05, 0.00010558217763900757, 0.00011505559086799622, 0.00012452900409698486, 0.0001340024173259735, 0.00014347583055496216, 0.0001529492437839508, 0.00016242265701293945, 0.0001718960702419281, 0.00018136948347091675, 0.0001908428966999054, 0.00020031630992889404, 0.0002097897231578827, 0.00021926313638687134, 0.00022873654961585999, 0.00023820996284484863, 0.0002476833760738373, 0.00025715678930282593, 0.0002666302025318146, 0.0002761036157608032, 0.00028557702898979187, 0.0002950504422187805, 0.00030452385544776917, 0.0003139972686767578]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 3.0, 6.0, 10.0, 5.0, 28.0, 35.0, 76.0, 94.0, 143.0, 280.0, 570.0, 1267.0, 3433.0, 13188.0, 91784.0, 766048.0, 146409.0, 17943.0, 4353.0, 1457.0, 679.0, 299.0, 175.0, 90.0, 57.0, 42.0, 27.0, 19.0, 7.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.185546875, -2.1116943359375, -2.037841796875, -1.9639892578125, -1.89013671875, -1.8162841796875, -1.742431640625, -1.6685791015625, -1.5947265625, -1.5208740234375, -1.447021484375, -1.3731689453125, -1.29931640625, -1.2254638671875, -1.151611328125, -1.0777587890625, -1.00390625, -0.9300537109375, -0.856201171875, -0.7823486328125, -0.70849609375, -0.6346435546875, -0.560791015625, -0.4869384765625, -0.4130859375, -0.3392333984375, -0.265380859375, -0.1915283203125, -0.11767578125, -0.0438232421875, 0.030029296875, 0.1038818359375, 0.177734375, 0.2515869140625, 0.325439453125, 0.3992919921875, 0.47314453125, 0.5469970703125, 0.620849609375, 0.6947021484375, 0.7685546875, 0.8424072265625, 0.916259765625, 0.9901123046875, 1.06396484375, 1.1378173828125, 1.211669921875, 1.2855224609375, 1.359375, 1.4332275390625, 1.507080078125, 1.5809326171875, 1.65478515625, 1.7286376953125, 1.802490234375, 1.8763427734375, 1.9501953125, 2.0240478515625, 2.097900390625, 2.1717529296875, 2.24560546875, 2.3194580078125, 2.393310546875, 2.4671630859375, 2.541015625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 6.0, 2.0, 11.0, 11.0, 11.0, 31.0, 24.0, 24.0, 42.0, 57.0, 85.0, 82.0, 108.0, 110.0, 108.0, 73.0, 52.0, 50.0, 24.0, 22.0, 16.0, 15.0, 9.0, 13.0, 3.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.119140625, -2.052490234375, -1.98583984375, -1.919189453125, -1.8525390625, -1.785888671875, -1.71923828125, -1.652587890625, -1.5859375, -1.519287109375, -1.45263671875, -1.385986328125, -1.3193359375, -1.252685546875, -1.18603515625, -1.119384765625, -1.052734375, -0.986083984375, -0.91943359375, -0.852783203125, -0.7861328125, -0.719482421875, -0.65283203125, -0.586181640625, -0.51953125, -0.452880859375, -0.38623046875, -0.319580078125, -0.2529296875, -0.186279296875, -0.11962890625, -0.052978515625, 0.013671875, 0.080322265625, 0.14697265625, 0.213623046875, 0.2802734375, 0.346923828125, 0.41357421875, 0.480224609375, 0.546875, 0.613525390625, 0.68017578125, 0.746826171875, 0.8134765625, 0.880126953125, 0.94677734375, 1.013427734375, 1.080078125, 1.146728515625, 1.21337890625, 1.280029296875, 1.3466796875, 1.413330078125, 1.47998046875, 1.546630859375, 1.61328125, 1.679931640625, 1.74658203125, 1.813232421875, 1.8798828125, 1.946533203125, 2.01318359375, 2.079833984375, 2.146484375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 21.0, 41.0, 59.0, 109.0, 163.0, 200.0, 160.0, 96.0, 58.0, 34.0, 13.0, 10.0, 9.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.785573959350586, -21.672935485839844, -20.56029510498047, -19.447656631469727, -18.33501625061035, -17.22237777709961, -16.109737396240234, -14.997098922729492, -13.884459495544434, -12.771820068359375, -11.659180641174316, -10.546541213989258, -9.433902740478516, -8.32126235961914, -7.208623886108398, -6.09598445892334, -4.983345031738281, -3.8707056045532227, -2.758066415786743, -1.6454272270202637, -0.5327877998352051, 0.5798516273498535, 1.692490577697754, 2.8051300048828125, 3.917769432067871, 5.03040885925293, 6.143048286437988, 7.255687236785889, 8.368326187133789, 9.480966567993164, 10.593605041503906, 11.706244468688965, 12.81888198852539, 13.93152141571045, 15.044160842895508, 16.15679931640625, 17.269439697265625, 18.382078170776367, 19.49471664428711, 20.607357025146484, 21.71999740600586, 22.8326358795166, 23.945276260375977, 25.05791473388672, 26.170555114746094, 27.283193588256836, 28.395832061767578, 29.508472442626953, 30.621110916137695, 31.733749389648438, 32.84638977050781, 33.95903015136719, 35.0716667175293, 36.18430709838867, 37.29694747924805, 38.409584045410156, 39.52222442626953, 40.634864807128906, 41.747501373291016, 42.86014175415039, 43.972782135009766, 45.08542251586914, 46.19805908203125, 47.310699462890625, 48.42333984375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 8.0, 6.0, 8.0, 8.0, 8.0, 16.0, 11.0, 15.0, 27.0, 14.0, 14.0, 21.0, 30.0, 21.0, 30.0, 32.0, 43.0, 39.0, 43.0, 40.0, 46.0, 37.0, 41.0, 58.0, 48.0, 42.0, 37.0, 30.0, 28.0, 25.0, 27.0, 14.0, 19.0, 14.0, 16.0, 11.0, 16.0, 7.0, 14.0, 4.0, 8.0, 5.0, 5.0, 4.0, 7.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-16.410511016845703, -15.905683517456055, -15.40085506439209, -14.896026611328125, -14.391199111938477, -13.886371612548828, -13.381543159484863, -12.876714706420898, -12.37188720703125, -11.867059707641602, -11.362231254577637, -10.857402801513672, -10.352575302124023, -9.847747802734375, -9.34291934967041, -8.838090896606445, -8.333263397216797, -7.82843542098999, -7.323607444763184, -6.818779468536377, -6.31395149230957, -5.809123516082764, -5.304295539855957, -4.79946756362915, -4.294639587402344, -3.789811611175537, -3.2849836349487305, -2.780155658721924, -2.275327682495117, -1.7704997062683105, -1.265671730041504, -0.7608437538146973, -0.2560157775878906, 0.24881219863891602, 0.7536401748657227, 1.2584681510925293, 1.763296127319336, 2.2681241035461426, 2.772952079772949, 3.277780055999756, 3.7826080322265625, 4.287436008453369, 4.792263984680176, 5.297091960906982, 5.801919937133789, 6.306747913360596, 6.811575889587402, 7.316403865814209, 7.821231842041016, 8.326059341430664, 8.830887794494629, 9.335716247558594, 9.840543746948242, 10.34537124633789, 10.850199699401855, 11.35502815246582, 11.859855651855469, 12.364683151245117, 12.869511604309082, 13.374340057373047, 13.879167556762695, 14.383995056152344, 14.888823509216309, 15.393651962280273, 15.898479461669922]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 7.0, 4.0, 6.0, 12.0, 18.0, 35.0, 55.0, 92.0, 180.0, 325.0, 639.0, 1513.0, 4189.0, 13048.0, 55115.0, 652599.0, 3254903.0, 171710.0, 27703.0, 7624.0, 2625.0, 1026.0, 449.0, 197.0, 104.0, 48.0, 31.0, 14.0, 9.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5390625, -3.455352783203125, -3.37164306640625, -3.287933349609375, -3.2042236328125, -3.120513916015625, -3.03680419921875, -2.953094482421875, -2.869384765625, -2.785675048828125, -2.70196533203125, -2.618255615234375, -2.5345458984375, -2.450836181640625, -2.36712646484375, -2.283416748046875, -2.19970703125, -2.115997314453125, -2.03228759765625, -1.948577880859375, -1.8648681640625, -1.781158447265625, -1.69744873046875, -1.613739013671875, -1.530029296875, -1.446319580078125, -1.36260986328125, -1.278900146484375, -1.1951904296875, -1.111480712890625, -1.02777099609375, -0.944061279296875, -0.8603515625, -0.776641845703125, -0.69293212890625, -0.609222412109375, -0.5255126953125, -0.441802978515625, -0.35809326171875, -0.274383544921875, -0.190673828125, -0.106964111328125, -0.02325439453125, 0.060455322265625, 0.1441650390625, 0.227874755859375, 0.31158447265625, 0.395294189453125, 0.47900390625, 0.562713623046875, 0.64642333984375, 0.730133056640625, 0.8138427734375, 0.897552490234375, 0.98126220703125, 1.064971923828125, 1.148681640625, 1.232391357421875, 1.31610107421875, 1.399810791015625, 1.4835205078125, 1.567230224609375, 1.65093994140625, 1.734649658203125, 1.818359375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 12.0, 9.0, 15.0, 25.0, 27.0, 22.0, 48.0, 37.0, 40.0, 68.0, 63.0, 80.0, 86.0, 86.0, 62.0, 63.0, 51.0, 55.0, 31.0, 30.0, 23.0, 16.0, 18.0, 10.0, 9.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.341796875, -1.29461669921875, -1.2474365234375, -1.20025634765625, -1.153076171875, -1.10589599609375, -1.0587158203125, -1.01153564453125, -0.96435546875, -0.91717529296875, -0.8699951171875, -0.82281494140625, -0.775634765625, -0.72845458984375, -0.6812744140625, -0.63409423828125, -0.5869140625, -0.53973388671875, -0.4925537109375, -0.44537353515625, -0.398193359375, -0.35101318359375, -0.3038330078125, -0.25665283203125, -0.20947265625, -0.16229248046875, -0.1151123046875, -0.06793212890625, -0.020751953125, 0.02642822265625, 0.0736083984375, 0.12078857421875, 0.16796875, 0.21514892578125, 0.2623291015625, 0.30950927734375, 0.356689453125, 0.40386962890625, 0.4510498046875, 0.49822998046875, 0.54541015625, 0.59259033203125, 0.6397705078125, 0.68695068359375, 0.734130859375, 0.78131103515625, 0.8284912109375, 0.87567138671875, 0.9228515625, 0.97003173828125, 1.0172119140625, 1.06439208984375, 1.111572265625, 1.15875244140625, 1.2059326171875, 1.25311279296875, 1.30029296875, 1.34747314453125, 1.3946533203125, 1.44183349609375, 1.489013671875, 1.53619384765625, 1.5833740234375, 1.63055419921875, 1.677734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 7.0, 9.0, 10.0, 34.0, 62.0, 97.0, 242.0, 621.0, 1977.0, 7901.0, 47819.0, 1074103.0, 2964904.0, 80672.0, 12017.0, 2534.0, 703.0, 314.0, 118.0, 62.0, 35.0, 21.0, 14.0, 6.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.890625, -5.76007080078125, -5.6295166015625, -5.49896240234375, -5.368408203125, -5.23785400390625, -5.1072998046875, -4.97674560546875, -4.84619140625, -4.71563720703125, -4.5850830078125, -4.45452880859375, -4.323974609375, -4.19342041015625, -4.0628662109375, -3.93231201171875, -3.8017578125, -3.67120361328125, -3.5406494140625, -3.41009521484375, -3.279541015625, -3.14898681640625, -3.0184326171875, -2.88787841796875, -2.75732421875, -2.62677001953125, -2.4962158203125, -2.36566162109375, -2.235107421875, -2.10455322265625, -1.9739990234375, -1.84344482421875, -1.712890625, -1.58233642578125, -1.4517822265625, -1.32122802734375, -1.190673828125, -1.06011962890625, -0.9295654296875, -0.79901123046875, -0.66845703125, -0.53790283203125, -0.4073486328125, -0.27679443359375, -0.146240234375, -0.01568603515625, 0.1148681640625, 0.24542236328125, 0.3759765625, 0.50653076171875, 0.6370849609375, 0.76763916015625, 0.898193359375, 1.02874755859375, 1.1593017578125, 1.28985595703125, 1.42041015625, 1.55096435546875, 1.6815185546875, 1.81207275390625, 1.942626953125, 2.07318115234375, 2.2037353515625, 2.33428955078125, 2.46484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 5.0, 11.0, 9.0, 19.0, 21.0, 29.0, 45.0, 72.0, 116.0, 216.0, 390.0, 801.0, 962.0, 619.0, 312.0, 186.0, 87.0, 59.0, 33.0, 23.0, 20.0, 11.0, 7.0, 4.0, 4.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91796875, -2.821380615234375, -2.72479248046875, -2.628204345703125, -2.5316162109375, -2.435028076171875, -2.33843994140625, -2.241851806640625, -2.145263671875, -2.048675537109375, -1.95208740234375, -1.855499267578125, -1.7589111328125, -1.662322998046875, -1.56573486328125, -1.469146728515625, -1.37255859375, -1.275970458984375, -1.17938232421875, -1.082794189453125, -0.9862060546875, -0.889617919921875, -0.79302978515625, -0.696441650390625, -0.599853515625, -0.503265380859375, -0.40667724609375, -0.310089111328125, -0.2135009765625, -0.116912841796875, -0.02032470703125, 0.076263427734375, 0.1728515625, 0.269439697265625, 0.36602783203125, 0.462615966796875, 0.5592041015625, 0.655792236328125, 0.75238037109375, 0.848968505859375, 0.945556640625, 1.042144775390625, 1.13873291015625, 1.235321044921875, 1.3319091796875, 1.428497314453125, 1.52508544921875, 1.621673583984375, 1.71826171875, 1.814849853515625, 1.91143798828125, 2.008026123046875, 2.1046142578125, 2.201202392578125, 2.29779052734375, 2.394378662109375, 2.490966796875, 2.587554931640625, 2.68414306640625, 2.780731201171875, 2.8773193359375, 2.973907470703125, 3.07049560546875, 3.167083740234375, 3.263671875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 3.0, 15.0, 26.0, 51.0, 87.0, 118.0, 157.0, 172.0, 146.0, 95.0, 41.0, 23.0, 13.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.623659133911133, -21.852252960205078, -21.08084487915039, -20.309438705444336, -19.53803253173828, -18.766626358032227, -17.995220184326172, -17.223812103271484, -16.45240592956543, -15.680999755859375, -14.909592628479004, -14.138185501098633, -13.366779327392578, -12.595373153686523, -11.823966026306152, -11.052558898925781, -10.281152725219727, -9.509746551513672, -8.7383394241333, -7.966932773590088, -7.195526123046875, -6.424119472503662, -5.652712821960449, -4.881306171417236, -4.109899520874023, -3.3384928703308105, -2.5670862197875977, -1.7956795692443848, -1.0242729187011719, -0.252866268157959, 0.5185403823852539, 1.2899470329284668, 2.0613555908203125, 2.8327622413635254, 3.6041688919067383, 4.375575542449951, 5.146982192993164, 5.918388843536377, 6.68979549407959, 7.461202144622803, 8.232608795166016, 9.00401496887207, 9.775422096252441, 10.546829223632812, 11.318235397338867, 12.089641571044922, 12.861048698425293, 13.632455825805664, 14.403861999511719, 15.175268173217773, 15.946675300598145, 16.718082427978516, 17.48948860168457, 18.260894775390625, 19.032302856445312, 19.803709030151367, 20.575115203857422, 21.346521377563477, 22.11792755126953, 22.88933563232422, 23.660741806030273, 24.432147979736328, 25.203556060791016, 25.97496223449707, 26.746368408203125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 9.0, 8.0, 8.0, 14.0, 17.0, 16.0, 23.0, 29.0, 23.0, 40.0, 40.0, 50.0, 43.0, 61.0, 53.0, 52.0, 67.0, 47.0, 47.0, 48.0, 49.0, 41.0, 37.0, 40.0, 25.0, 20.0, 25.0, 13.0, 18.0, 6.0, 8.0, 3.0, 8.0, 9.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.033833503723145, -9.670145034790039, -9.306455612182617, -8.942767143249512, -8.579078674316406, -8.2153902053833, -7.851701259613037, -7.488012313842773, -7.124323844909668, -6.7606353759765625, -6.396946430206299, -6.033257484436035, -5.66956901550293, -5.305880546569824, -4.9421916007995605, -4.578502655029297, -4.214814186096191, -3.851125478744507, -3.4874367713928223, -3.1237480640411377, -2.760059356689453, -2.3963706493377686, -2.032681941986084, -1.6689932346343994, -1.3053045272827148, -0.9416158199310303, -0.5779271125793457, -0.21423840522766113, 0.14945030212402344, 0.513139009475708, 0.8768277168273926, 1.2405164241790771, 1.6042041778564453, 1.9678928852081299, 2.3315815925598145, 2.695270299911499, 3.0589590072631836, 3.422647714614868, 3.7863364219665527, 4.150025367736816, 4.513713836669922, 4.877402305603027, 5.241091251373291, 5.604780197143555, 5.96846866607666, 6.332157135009766, 6.695846080780029, 7.059535026550293, 7.423223495483398, 7.786911964416504, 8.15060043334961, 8.514289855957031, 8.877978324890137, 9.241666793823242, 9.605356216430664, 9.96904468536377, 10.332733154296875, 10.69642162322998, 11.060110092163086, 11.423799514770508, 11.787487983703613, 12.151176452636719, 12.51486587524414, 12.878554344177246, 13.242242813110352]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 4.0, 5.0, 11.0, 13.0, 24.0, 26.0, 48.0, 64.0, 97.0, 189.0, 266.0, 439.0, 806.0, 1295.0, 2263.0, 3994.0, 7203.0, 13369.0, 25938.0, 51050.0, 102881.0, 208309.0, 281819.0, 174231.0, 84796.0, 42475.0, 21599.0, 11311.0, 6045.0, 3311.0, 1850.0, 1088.0, 614.0, 405.0, 246.0, 155.0, 109.0, 66.0, 33.0, 29.0, 22.0, 17.0, 13.0, 8.0, 4.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.505859375, -1.4545745849609375, -1.403289794921875, -1.3520050048828125, -1.30072021484375, -1.2494354248046875, -1.198150634765625, -1.1468658447265625, -1.0955810546875, -1.0442962646484375, -0.993011474609375, -0.9417266845703125, -0.89044189453125, -0.8391571044921875, -0.787872314453125, -0.7365875244140625, -0.685302734375, -0.6340179443359375, -0.582733154296875, -0.5314483642578125, -0.48016357421875, -0.4288787841796875, -0.377593994140625, -0.3263092041015625, -0.2750244140625, -0.2237396240234375, -0.172454833984375, -0.1211700439453125, -0.06988525390625, -0.0186004638671875, 0.032684326171875, 0.0839691162109375, 0.13525390625, 0.1865386962890625, 0.237823486328125, 0.2891082763671875, 0.34039306640625, 0.3916778564453125, 0.442962646484375, 0.4942474365234375, 0.5455322265625, 0.5968170166015625, 0.648101806640625, 0.6993865966796875, 0.75067138671875, 0.8019561767578125, 0.853240966796875, 0.9045257568359375, 0.955810546875, 1.0070953369140625, 1.058380126953125, 1.1096649169921875, 1.16094970703125, 1.2122344970703125, 1.263519287109375, 1.3148040771484375, 1.3660888671875, 1.4173736572265625, 1.468658447265625, 1.5199432373046875, 1.57122802734375, 1.6225128173828125, 1.673797607421875, 1.7250823974609375, 1.7763671875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 9.0, 8.0, 5.0, 8.0, 13.0, 22.0, 18.0, 20.0, 31.0, 28.0, 36.0, 31.0, 27.0, 33.0, 35.0, 61.0, 44.0, 57.0, 42.0, 72.0, 67.0, 37.0, 35.0, 39.0, 25.0, 30.0, 33.0, 24.0, 12.0, 14.0, 12.0, 15.0, 14.0, 7.0, 12.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.001953125, -0.969390869140625, -0.93682861328125, -0.904266357421875, -0.8717041015625, -0.839141845703125, -0.80657958984375, -0.774017333984375, -0.741455078125, -0.708892822265625, -0.67633056640625, -0.643768310546875, -0.6112060546875, -0.578643798828125, -0.54608154296875, -0.513519287109375, -0.48095703125, -0.448394775390625, -0.41583251953125, -0.383270263671875, -0.3507080078125, -0.318145751953125, -0.28558349609375, -0.253021240234375, -0.220458984375, -0.187896728515625, -0.15533447265625, -0.122772216796875, -0.0902099609375, -0.057647705078125, -0.02508544921875, 0.007476806640625, 0.0400390625, 0.072601318359375, 0.10516357421875, 0.137725830078125, 0.1702880859375, 0.202850341796875, 0.23541259765625, 0.267974853515625, 0.300537109375, 0.333099365234375, 0.36566162109375, 0.398223876953125, 0.4307861328125, 0.463348388671875, 0.49591064453125, 0.528472900390625, 0.56103515625, 0.593597412109375, 0.62615966796875, 0.658721923828125, 0.6912841796875, 0.723846435546875, 0.75640869140625, 0.788970947265625, 0.821533203125, 0.854095458984375, 0.88665771484375, 0.919219970703125, 0.9517822265625, 0.984344482421875, 1.01690673828125, 1.049468994140625, 1.08203125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 3.0, 15.0, 11.0, 25.0, 30.0, 44.0, 63.0, 109.0, 137.0, 249.0, 434.0, 887.0, 2124.0, 6308.0, 26329.0, 164524.0, 676360.0, 138709.0, 22657.0, 5625.0, 2016.0, 835.0, 428.0, 234.0, 132.0, 77.0, 63.0, 37.0, 15.0, 15.0, 16.0, 9.0, 11.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1640625, -4.02734375, -3.890625, -3.75390625, -3.6171875, -3.48046875, -3.34375, -3.20703125, -3.0703125, -2.93359375, -2.796875, -2.66015625, -2.5234375, -2.38671875, -2.25, -2.11328125, -1.9765625, -1.83984375, -1.703125, -1.56640625, -1.4296875, -1.29296875, -1.15625, -1.01953125, -0.8828125, -0.74609375, -0.609375, -0.47265625, -0.3359375, -0.19921875, -0.0625, 0.07421875, 0.2109375, 0.34765625, 0.484375, 0.62109375, 0.7578125, 0.89453125, 1.03125, 1.16796875, 1.3046875, 1.44140625, 1.578125, 1.71484375, 1.8515625, 1.98828125, 2.125, 2.26171875, 2.3984375, 2.53515625, 2.671875, 2.80859375, 2.9453125, 3.08203125, 3.21875, 3.35546875, 3.4921875, 3.62890625, 3.765625, 3.90234375, 4.0390625, 4.17578125, 4.3125, 4.44921875, 4.5859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 11.0, 9.0, 4.0, 15.0, 10.0, 12.0, 19.0, 27.0, 18.0, 30.0, 22.0, 31.0, 38.0, 41.0, 40.0, 41.0, 43.0, 43.0, 51.0, 42.0, 44.0, 31.0, 52.0, 39.0, 36.0, 26.0, 22.0, 25.0, 31.0, 14.0, 23.0, 14.0, 13.0, 8.0, 15.0, 9.0, 9.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-3.916015625, -3.798736572265625, -3.68145751953125, -3.564178466796875, -3.4468994140625, -3.329620361328125, -3.21234130859375, -3.095062255859375, -2.977783203125, -2.860504150390625, -2.74322509765625, -2.625946044921875, -2.5086669921875, -2.391387939453125, -2.27410888671875, -2.156829833984375, -2.03955078125, -1.922271728515625, -1.80499267578125, -1.687713623046875, -1.5704345703125, -1.453155517578125, -1.33587646484375, -1.218597412109375, -1.101318359375, -0.984039306640625, -0.86676025390625, -0.749481201171875, -0.6322021484375, -0.514923095703125, -0.39764404296875, -0.280364990234375, -0.1630859375, -0.045806884765625, 0.07147216796875, 0.188751220703125, 0.3060302734375, 0.423309326171875, 0.54058837890625, 0.657867431640625, 0.775146484375, 0.892425537109375, 1.00970458984375, 1.126983642578125, 1.2442626953125, 1.361541748046875, 1.47882080078125, 1.596099853515625, 1.71337890625, 1.830657958984375, 1.94793701171875, 2.065216064453125, 2.1824951171875, 2.299774169921875, 2.41705322265625, 2.534332275390625, 2.651611328125, 2.768890380859375, 2.88616943359375, 3.003448486328125, 3.1207275390625, 3.238006591796875, 3.35528564453125, 3.472564697265625, 3.58984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 7.0, 6.0, 11.0, 19.0, 30.0, 47.0, 96.0, 209.0, 521.0, 1496.0, 6542.0, 75089.0, 868987.0, 85743.0, 7200.0, 1569.0, 493.0, 207.0, 104.0, 73.0, 34.0, 19.0, 15.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.29296875, -3.19171142578125, -3.0904541015625, -2.98919677734375, -2.887939453125, -2.78668212890625, -2.6854248046875, -2.58416748046875, -2.48291015625, -2.38165283203125, -2.2803955078125, -2.17913818359375, -2.077880859375, -1.97662353515625, -1.8753662109375, -1.77410888671875, -1.6728515625, -1.57159423828125, -1.4703369140625, -1.36907958984375, -1.267822265625, -1.16656494140625, -1.0653076171875, -0.96405029296875, -0.86279296875, -0.76153564453125, -0.6602783203125, -0.55902099609375, -0.457763671875, -0.35650634765625, -0.2552490234375, -0.15399169921875, -0.052734375, 0.04852294921875, 0.1497802734375, 0.25103759765625, 0.352294921875, 0.45355224609375, 0.5548095703125, 0.65606689453125, 0.75732421875, 0.85858154296875, 0.9598388671875, 1.06109619140625, 1.162353515625, 1.26361083984375, 1.3648681640625, 1.46612548828125, 1.5673828125, 1.66864013671875, 1.7698974609375, 1.87115478515625, 1.972412109375, 2.07366943359375, 2.1749267578125, 2.27618408203125, 2.37744140625, 2.47869873046875, 2.5799560546875, 2.68121337890625, 2.782470703125, 2.88372802734375, 2.9849853515625, 3.08624267578125, 3.1875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 11.0, 27.0, 44.0, 116.0, 206.0, 259.0, 166.0, 95.0, 34.0, 14.0, 14.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0013294219970703125, -0.0012987032532691956, -0.0012679845094680786, -0.0012372657656669617, -0.0012065470218658447, -0.0011758282780647278, -0.0011451095342636108, -0.001114390790462494, -0.001083672046661377, -0.00105295330286026, -0.001022234559059143, -0.0009915158152580261, -0.0009607970714569092, -0.0009300783276557922, -0.0008993595838546753, -0.0008686408400535583, -0.0008379220962524414, -0.0008072033524513245, -0.0007764846086502075, -0.0007457658648490906, -0.0007150471210479736, -0.0006843283772468567, -0.0006536096334457397, -0.0006228908896446228, -0.0005921721458435059, -0.0005614534020423889, -0.000530734658241272, -0.000500015914440155, -0.0004692971706390381, -0.00043857842683792114, -0.0004078596830368042, -0.00037714093923568726, -0.0003464221954345703, -0.00031570345163345337, -0.0002849847078323364, -0.0002542659640312195, -0.00022354722023010254, -0.0001928284764289856, -0.00016210973262786865, -0.0001313909888267517, -0.00010067224502563477, -6.995350122451782e-05, -3.923475742340088e-05, -8.516013622283936e-06, 2.2202730178833008e-05, 5.292147397994995e-05, 8.36402177810669e-05, 0.00011435896158218384, 0.00014507770538330078, 0.00017579644918441772, 0.00020651519298553467, 0.0002372339367866516, 0.00026795268058776855, 0.0002986714243888855, 0.00032939016819000244, 0.0003601089119911194, 0.00039082765579223633, 0.00042154639959335327, 0.0004522651433944702, 0.00048298388719558716, 0.0005137026309967041, 0.000544421374797821, 0.000575140118598938, 0.0006058588624000549, 0.0006365776062011719]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 10.0, 21.0, 25.0, 47.0, 102.0, 186.0, 367.0, 779.0, 1787.0, 5654.0, 30477.0, 383557.0, 575436.0, 39517.0, 6735.0, 2141.0, 858.0, 381.0, 173.0, 128.0, 67.0, 34.0, 18.0, 12.0, 8.0, 5.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.640625, -2.5653076171875, -2.489990234375, -2.4146728515625, -2.33935546875, -2.2640380859375, -2.188720703125, -2.1134033203125, -2.0380859375, -1.9627685546875, -1.887451171875, -1.8121337890625, -1.73681640625, -1.6614990234375, -1.586181640625, -1.5108642578125, -1.435546875, -1.3602294921875, -1.284912109375, -1.2095947265625, -1.13427734375, -1.0589599609375, -0.983642578125, -0.9083251953125, -0.8330078125, -0.7576904296875, -0.682373046875, -0.6070556640625, -0.53173828125, -0.4564208984375, -0.381103515625, -0.3057861328125, -0.23046875, -0.1551513671875, -0.079833984375, -0.0045166015625, 0.07080078125, 0.1461181640625, 0.221435546875, 0.2967529296875, 0.3720703125, 0.4473876953125, 0.522705078125, 0.5980224609375, 0.67333984375, 0.7486572265625, 0.823974609375, 0.8992919921875, 0.974609375, 1.0499267578125, 1.125244140625, 1.2005615234375, 1.27587890625, 1.3511962890625, 1.426513671875, 1.5018310546875, 1.5771484375, 1.6524658203125, 1.727783203125, 1.8031005859375, 1.87841796875, 1.9537353515625, 2.029052734375, 2.1043701171875, 2.1796875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 7.0, 6.0, 2.0, 10.0, 8.0, 6.0, 14.0, 7.0, 23.0, 29.0, 31.0, 48.0, 56.0, 57.0, 62.0, 73.0, 78.0, 81.0, 90.0, 62.0, 46.0, 41.0, 31.0, 34.0, 22.0, 15.0, 17.0, 9.0, 12.0, 7.0, 4.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4638671875, -1.4189910888671875, -1.374114990234375, -1.3292388916015625, -1.28436279296875, -1.2394866943359375, -1.194610595703125, -1.1497344970703125, -1.1048583984375, -1.0599822998046875, -1.015106201171875, -0.9702301025390625, -0.92535400390625, -0.8804779052734375, -0.835601806640625, -0.7907257080078125, -0.745849609375, -0.7009735107421875, -0.656097412109375, -0.6112213134765625, -0.56634521484375, -0.5214691162109375, -0.476593017578125, -0.4317169189453125, -0.3868408203125, -0.3419647216796875, -0.297088623046875, -0.2522125244140625, -0.20733642578125, -0.1624603271484375, -0.117584228515625, -0.0727081298828125, -0.02783203125, 0.0170440673828125, 0.061920166015625, 0.1067962646484375, 0.15167236328125, 0.1965484619140625, 0.241424560546875, 0.2863006591796875, 0.3311767578125, 0.3760528564453125, 0.420928955078125, 0.4658050537109375, 0.51068115234375, 0.5555572509765625, 0.600433349609375, 0.6453094482421875, 0.690185546875, 0.7350616455078125, 0.779937744140625, 0.8248138427734375, 0.86968994140625, 0.9145660400390625, 0.959442138671875, 1.0043182373046875, 1.0491943359375, 1.0940704345703125, 1.138946533203125, 1.1838226318359375, 1.22869873046875, 1.2735748291015625, 1.318450927734375, 1.3633270263671875, 1.408203125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 16.0, 37.0, 71.0, 157.0, 273.0, 202.0, 128.0, 51.0, 30.0, 17.0, 8.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.772090911865234, -50.32299041748047, -48.87388610839844, -47.424781799316406, -45.97568130493164, -44.526580810546875, -43.077476501464844, -41.62837219238281, -40.17927169799805, -38.73017120361328, -37.28106689453125, -35.83196258544922, -34.38286209106445, -32.93376159667969, -31.484657287597656, -30.035554885864258, -28.58645248413086, -27.13735008239746, -25.688247680664062, -24.239145278930664, -22.790042877197266, -21.340940475463867, -19.89183807373047, -18.44273567199707, -16.993633270263672, -15.544530868530273, -14.095428466796875, -12.646326065063477, -11.197223663330078, -9.74812126159668, -8.299018859863281, -6.849916458129883, -5.40081787109375, -3.9517154693603516, -2.502613067626953, -1.0535106658935547, 0.39559173583984375, 1.8446941375732422, 3.2937965393066406, 4.742898941040039, 6.1920013427734375, 7.641103744506836, 9.090206146240234, 10.539308547973633, 11.988410949707031, 13.43751335144043, 14.886615753173828, 16.335718154907227, 17.784820556640625, 19.233922958374023, 20.683025360107422, 22.13212776184082, 23.58123016357422, 25.030332565307617, 26.479434967041016, 27.928537368774414, 29.377639770507812, 30.82674217224121, 32.27584457397461, 33.724945068359375, 35.174049377441406, 36.62315368652344, 38.0722541809082, 39.52135467529297, 40.970458984375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 12.0, 9.0, 16.0, 16.0, 18.0, 12.0, 19.0, 39.0, 18.0, 17.0, 36.0, 45.0, 39.0, 60.0, 63.0, 62.0, 61.0, 53.0, 59.0, 54.0, 52.0, 36.0, 37.0, 36.0, 18.0, 21.0, 29.0, 12.0, 16.0, 4.0, 3.0, 8.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.26943588256836, -22.633747100830078, -21.99806022644043, -21.36237144470215, -20.7266845703125, -20.09099578857422, -19.45530891418457, -18.81962013244629, -18.18393325805664, -17.54824447631836, -16.91255760192871, -16.27686882019043, -15.641181945800781, -15.0054931640625, -14.369805335998535, -13.73411750793457, -13.098428726196289, -12.462740898132324, -11.82705307006836, -11.191365242004395, -10.55567741394043, -9.919988632202148, -9.284300804138184, -8.648612976074219, -8.012925148010254, -7.377237319946289, -6.741549491882324, -6.105861186981201, -5.470173358917236, -4.8344855308532715, -4.198797225952148, -3.5631093978881836, -2.9274215698242188, -2.291733741760254, -1.65604567527771, -1.0203577280044556, -0.38466978073120117, 0.25101804733276367, 0.8867061138153076, 1.5223941802978516, 2.1580820083618164, 2.7937698364257812, 3.429457902908325, 4.065145969390869, 4.700833797454834, 5.336521625518799, 5.972209930419922, 6.607897758483887, 7.243585586547852, 7.879273414611816, 8.514961242675781, 9.150649070739746, 9.786336898803711, 10.422025680541992, 11.057713508605957, 11.693401336669922, 12.329089164733887, 12.964776992797852, 13.600464820861816, 14.236152648925781, 14.871841430664062, 15.507528305053711, 16.143217086791992, 16.77890396118164, 17.414592742919922]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 9.0, 8.0, 10.0, 16.0, 22.0, 25.0, 42.0, 83.0, 124.0, 200.0, 337.0, 831.0, 2226.0, 6762.0, 27638.0, 171074.0, 2657480.0, 1207781.0, 93223.0, 18255.0, 5069.0, 1783.0, 656.0, 322.0, 130.0, 73.0, 38.0, 21.0, 17.0, 11.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.291015625, -3.212371826171875, -3.13372802734375, -3.055084228515625, -2.9764404296875, -2.897796630859375, -2.81915283203125, -2.740509033203125, -2.661865234375, -2.583221435546875, -2.50457763671875, -2.425933837890625, -2.3472900390625, -2.268646240234375, -2.19000244140625, -2.111358642578125, -2.03271484375, -1.954071044921875, -1.87542724609375, -1.796783447265625, -1.7181396484375, -1.639495849609375, -1.56085205078125, -1.482208251953125, -1.403564453125, -1.324920654296875, -1.24627685546875, -1.167633056640625, -1.0889892578125, -1.010345458984375, -0.93170166015625, -0.853057861328125, -0.7744140625, -0.695770263671875, -0.61712646484375, -0.538482666015625, -0.4598388671875, -0.381195068359375, -0.30255126953125, -0.223907470703125, -0.145263671875, -0.066619873046875, 0.01202392578125, 0.090667724609375, 0.1693115234375, 0.247955322265625, 0.32659912109375, 0.405242919921875, 0.48388671875, 0.562530517578125, 0.64117431640625, 0.719818115234375, 0.7984619140625, 0.877105712890625, 0.95574951171875, 1.034393310546875, 1.113037109375, 1.191680908203125, 1.27032470703125, 1.348968505859375, 1.4276123046875, 1.506256103515625, 1.58489990234375, 1.663543701171875, 1.7421875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 6.0, 16.0, 33.0, 37.0, 61.0, 79.0, 66.0, 99.0, 111.0, 131.0, 101.0, 80.0, 74.0, 40.0, 30.0, 11.0, 16.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.21875, -3.148223876953125, -3.07769775390625, -3.007171630859375, -2.9366455078125, -2.866119384765625, -2.79559326171875, -2.725067138671875, -2.654541015625, -2.584014892578125, -2.51348876953125, -2.442962646484375, -2.3724365234375, -2.301910400390625, -2.23138427734375, -2.160858154296875, -2.09033203125, -2.019805908203125, -1.94927978515625, -1.878753662109375, -1.8082275390625, -1.737701416015625, -1.66717529296875, -1.596649169921875, -1.526123046875, -1.455596923828125, -1.38507080078125, -1.314544677734375, -1.2440185546875, -1.173492431640625, -1.10296630859375, -1.032440185546875, -0.9619140625, -0.891387939453125, -0.82086181640625, -0.750335693359375, -0.6798095703125, -0.609283447265625, -0.53875732421875, -0.468231201171875, -0.397705078125, -0.327178955078125, -0.25665283203125, -0.186126708984375, -0.1156005859375, -0.045074462890625, 0.02545166015625, 0.095977783203125, 0.16650390625, 0.237030029296875, 0.30755615234375, 0.378082275390625, 0.4486083984375, 0.519134521484375, 0.58966064453125, 0.660186767578125, 0.730712890625, 0.801239013671875, 0.87176513671875, 0.942291259765625, 1.0128173828125, 1.083343505859375, 1.15386962890625, 1.224395751953125, 1.294921875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 15.0, 22.0, 26.0, 47.0, 90.0, 166.0, 364.0, 928.0, 3278.0, 13476.0, 81714.0, 1793617.0, 2193075.0, 89238.0, 13573.0, 3049.0, 923.0, 339.0, 147.0, 63.0, 40.0, 31.0, 20.0, 9.0, 9.0, 6.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0, -3.8824462890625, -3.764892578125, -3.6473388671875, -3.52978515625, -3.4122314453125, -3.294677734375, -3.1771240234375, -3.0595703125, -2.9420166015625, -2.824462890625, -2.7069091796875, -2.58935546875, -2.4718017578125, -2.354248046875, -2.2366943359375, -2.119140625, -2.0015869140625, -1.884033203125, -1.7664794921875, -1.64892578125, -1.5313720703125, -1.413818359375, -1.2962646484375, -1.1787109375, -1.0611572265625, -0.943603515625, -0.8260498046875, -0.70849609375, -0.5909423828125, -0.473388671875, -0.3558349609375, -0.23828125, -0.1207275390625, -0.003173828125, 0.1143798828125, 0.23193359375, 0.3494873046875, 0.467041015625, 0.5845947265625, 0.7021484375, 0.8197021484375, 0.937255859375, 1.0548095703125, 1.17236328125, 1.2899169921875, 1.407470703125, 1.5250244140625, 1.642578125, 1.7601318359375, 1.877685546875, 1.9952392578125, 2.11279296875, 2.2303466796875, 2.347900390625, 2.4654541015625, 2.5830078125, 2.7005615234375, 2.818115234375, 2.9356689453125, 3.05322265625, 3.1707763671875, 3.288330078125, 3.4058837890625, 3.5234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 4.0, 8.0, 7.0, 6.0, 13.0, 12.0, 16.0, 13.0, 26.0, 41.0, 58.0, 82.0, 130.0, 192.0, 280.0, 401.0, 621.0, 660.0, 525.0, 311.0, 208.0, 132.0, 75.0, 61.0, 39.0, 33.0, 27.0, 30.0, 8.0, 14.0, 8.0, 7.0, 3.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.548828125, -2.46722412109375, -2.3856201171875, -2.30401611328125, -2.222412109375, -2.14080810546875, -2.0592041015625, -1.97760009765625, -1.89599609375, -1.81439208984375, -1.7327880859375, -1.65118408203125, -1.569580078125, -1.48797607421875, -1.4063720703125, -1.32476806640625, -1.2431640625, -1.16156005859375, -1.0799560546875, -0.99835205078125, -0.916748046875, -0.83514404296875, -0.7535400390625, -0.67193603515625, -0.59033203125, -0.50872802734375, -0.4271240234375, -0.34552001953125, -0.263916015625, -0.18231201171875, -0.1007080078125, -0.01910400390625, 0.0625, 0.14410400390625, 0.2257080078125, 0.30731201171875, 0.388916015625, 0.47052001953125, 0.5521240234375, 0.63372802734375, 0.71533203125, 0.79693603515625, 0.8785400390625, 0.96014404296875, 1.041748046875, 1.12335205078125, 1.2049560546875, 1.28656005859375, 1.3681640625, 1.44976806640625, 1.5313720703125, 1.61297607421875, 1.694580078125, 1.77618408203125, 1.8577880859375, 1.93939208984375, 2.02099609375, 2.10260009765625, 2.1842041015625, 2.26580810546875, 2.347412109375, 2.42901611328125, 2.5106201171875, 2.59222412109375, 2.673828125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 2.0, 8.0, 26.0, 80.0, 137.0, 223.0, 234.0, 149.0, 77.0, 27.0, 11.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.64106750488281, -47.30323791503906, -45.96540451049805, -44.6275749206543, -43.28974533081055, -41.95191192626953, -40.61408233642578, -39.27625274658203, -37.93842315673828, -36.60059356689453, -35.262760162353516, -33.924930572509766, -32.587100982666016, -31.249269485473633, -29.91143798828125, -28.5736083984375, -27.235774993896484, -25.8979434967041, -24.56011390686035, -23.22228240966797, -21.88445281982422, -20.546621322631836, -19.208789825439453, -17.870960235595703, -16.53312873840332, -15.195298194885254, -13.857467651367188, -12.519636154174805, -11.181805610656738, -9.843975067138672, -8.506143569946289, -7.168313026428223, -5.830478668212891, -4.492648124694824, -3.1548171043395996, -1.816986083984375, -0.4791555404663086, 0.8586750030517578, 2.1965065002441406, 3.534337043762207, 4.872167587280273, 6.20999813079834, 7.5478291511535645, 8.885660171508789, 10.223490715026855, 11.561321258544922, 12.899152755737305, 14.236983299255371, 15.574813842773438, 16.91264533996582, 18.25047492980957, 19.588306427001953, 20.926136016845703, 22.263967514038086, 23.60179901123047, 24.93962860107422, 26.2774600982666, 27.615291595458984, 28.953121185302734, 30.290952682495117, 31.6287841796875, 32.96661376953125, 34.304443359375, 35.642276763916016, 36.980106353759766]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 9.0, 15.0, 12.0, 21.0, 5.0, 19.0, 27.0, 26.0, 43.0, 41.0, 48.0, 28.0, 53.0, 45.0, 56.0, 33.0, 50.0, 62.0, 48.0, 39.0, 37.0, 46.0, 43.0, 42.0, 22.0, 17.0, 14.0, 24.0, 16.0, 11.0, 16.0, 8.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.384416580200195, -8.967121124267578, -8.549825668334961, -8.132530212402344, -7.715234279632568, -7.297938823699951, -6.880642890930176, -6.463347434997559, -6.046051979064941, -5.628756523132324, -5.211461067199707, -4.794165134429932, -4.3768696784973145, -3.9595742225646973, -3.542278528213501, -3.1249828338623047, -2.7076873779296875, -2.2903919219970703, -1.873096227645874, -1.4558006525039673, -1.0385050773620605, -0.6212096214294434, -0.20391392707824707, 0.21338176727294922, 0.6306772232055664, 1.0479727983474731, 1.4652683734893799, 1.8825639486312866, 2.2998595237731934, 2.7171549797058105, 3.134450674057007, 3.551746368408203, 3.9690418243408203, 4.3863372802734375, 4.803632736206055, 5.22092866897583, 5.638224124908447, 6.0555195808410645, 6.47281551361084, 6.890110969543457, 7.307406425476074, 7.724701881408691, 8.141997337341309, 8.559292793273926, 8.97658920288086, 9.393884658813477, 9.811180114746094, 10.228475570678711, 10.645771026611328, 11.063066482543945, 11.480361938476562, 11.89765739440918, 12.314952850341797, 12.732248306274414, 13.149544715881348, 13.566840171813965, 13.984135627746582, 14.4014310836792, 14.818726539611816, 15.236021995544434, 15.653318405151367, 16.070613861083984, 16.4879093170166, 16.90520477294922, 17.322500228881836]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 3.0, 5.0, 15.0, 15.0, 16.0, 41.0, 47.0, 81.0, 137.0, 244.0, 425.0, 838.0, 1641.0, 3549.0, 8224.0, 20348.0, 50228.0, 121162.0, 270241.0, 310556.0, 152027.0, 63562.0, 26072.0, 10594.0, 4445.0, 1970.0, 936.0, 500.0, 259.0, 139.0, 90.0, 50.0, 33.0, 15.0, 16.0, 15.0, 5.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.51171875, -2.4440765380859375, -2.376434326171875, -2.3087921142578125, -2.24114990234375, -2.1735076904296875, -2.105865478515625, -2.0382232666015625, -1.9705810546875, -1.9029388427734375, -1.835296630859375, -1.7676544189453125, -1.70001220703125, -1.6323699951171875, -1.564727783203125, -1.4970855712890625, -1.429443359375, -1.3618011474609375, -1.294158935546875, -1.2265167236328125, -1.15887451171875, -1.0912322998046875, -1.023590087890625, -0.9559478759765625, -0.8883056640625, -0.8206634521484375, -0.753021240234375, -0.6853790283203125, -0.61773681640625, -0.5500946044921875, -0.482452392578125, -0.4148101806640625, -0.34716796875, -0.2795257568359375, -0.211883544921875, -0.1442413330078125, -0.07659912109375, -0.0089569091796875, 0.058685302734375, 0.1263275146484375, 0.1939697265625, 0.2616119384765625, 0.329254150390625, 0.3968963623046875, 0.46453857421875, 0.5321807861328125, 0.599822998046875, 0.6674652099609375, 0.735107421875, 0.8027496337890625, 0.870391845703125, 0.9380340576171875, 1.00567626953125, 1.0733184814453125, 1.140960693359375, 1.2086029052734375, 1.2762451171875, 1.3438873291015625, 1.411529541015625, 1.4791717529296875, 1.54681396484375, 1.6144561767578125, 1.682098388671875, 1.7497406005859375, 1.8173828125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 8.0, 7.0, 14.0, 10.0, 13.0, 23.0, 21.0, 33.0, 33.0, 33.0, 43.0, 52.0, 52.0, 60.0, 62.0, 65.0, 54.0, 54.0, 56.0, 47.0, 42.0, 38.0, 30.0, 28.0, 26.0, 27.0, 13.0, 13.0, 15.0, 11.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3486328125, -1.3126678466796875, -1.276702880859375, -1.2407379150390625, -1.20477294921875, -1.1688079833984375, -1.132843017578125, -1.0968780517578125, -1.0609130859375, -1.0249481201171875, -0.988983154296875, -0.9530181884765625, -0.91705322265625, -0.8810882568359375, -0.845123291015625, -0.8091583251953125, -0.773193359375, -0.7372283935546875, -0.701263427734375, -0.6652984619140625, -0.62933349609375, -0.5933685302734375, -0.557403564453125, -0.5214385986328125, -0.4854736328125, -0.4495086669921875, -0.413543701171875, -0.3775787353515625, -0.34161376953125, -0.3056488037109375, -0.269683837890625, -0.2337188720703125, -0.19775390625, -0.1617889404296875, -0.125823974609375, -0.0898590087890625, -0.05389404296875, -0.0179290771484375, 0.018035888671875, 0.0540008544921875, 0.0899658203125, 0.1259307861328125, 0.161895751953125, 0.1978607177734375, 0.23382568359375, 0.2697906494140625, 0.305755615234375, 0.3417205810546875, 0.377685546875, 0.4136505126953125, 0.449615478515625, 0.4855804443359375, 0.52154541015625, 0.5575103759765625, 0.593475341796875, 0.6294403076171875, 0.6654052734375, 0.7013702392578125, 0.737335205078125, 0.7733001708984375, 0.80926513671875, 0.8452301025390625, 0.881195068359375, 0.9171600341796875, 0.953125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 6.0, 3.0, 13.0, 13.0, 18.0, 35.0, 37.0, 69.0, 121.0, 167.0, 272.0, 468.0, 718.0, 1431.0, 3420.0, 12699.0, 103337.0, 758362.0, 143890.0, 15988.0, 3844.0, 1571.0, 770.0, 463.0, 282.0, 196.0, 128.0, 80.0, 51.0, 33.0, 24.0, 18.0, 5.0, 8.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.26953125, -5.10772705078125, -4.9459228515625, -4.78411865234375, -4.622314453125, -4.46051025390625, -4.2987060546875, -4.13690185546875, -3.97509765625, -3.81329345703125, -3.6514892578125, -3.48968505859375, -3.327880859375, -3.16607666015625, -3.0042724609375, -2.84246826171875, -2.6806640625, -2.51885986328125, -2.3570556640625, -2.19525146484375, -2.033447265625, -1.87164306640625, -1.7098388671875, -1.54803466796875, -1.38623046875, -1.22442626953125, -1.0626220703125, -0.90081787109375, -0.739013671875, -0.57720947265625, -0.4154052734375, -0.25360107421875, -0.091796875, 0.07000732421875, 0.2318115234375, 0.39361572265625, 0.555419921875, 0.71722412109375, 0.8790283203125, 1.04083251953125, 1.20263671875, 1.36444091796875, 1.5262451171875, 1.68804931640625, 1.849853515625, 2.01165771484375, 2.1734619140625, 2.33526611328125, 2.4970703125, 2.65887451171875, 2.8206787109375, 2.98248291015625, 3.144287109375, 3.30609130859375, 3.4678955078125, 3.62969970703125, 3.79150390625, 3.95330810546875, 4.1151123046875, 4.27691650390625, 4.438720703125, 4.60052490234375, 4.7623291015625, 4.92413330078125, 5.0859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 7.0, 6.0, 6.0, 10.0, 14.0, 4.0, 13.0, 14.0, 20.0, 25.0, 24.0, 45.0, 28.0, 32.0, 43.0, 49.0, 49.0, 35.0, 42.0, 43.0, 43.0, 38.0, 52.0, 56.0, 40.0, 50.0, 31.0, 28.0, 28.0, 19.0, 18.0, 22.0, 11.0, 10.0, 7.0, 12.0, 7.0, 5.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.49609375, -4.36663818359375, -4.2371826171875, -4.10772705078125, -3.978271484375, -3.84881591796875, -3.7193603515625, -3.58990478515625, -3.46044921875, -3.33099365234375, -3.2015380859375, -3.07208251953125, -2.942626953125, -2.81317138671875, -2.6837158203125, -2.55426025390625, -2.4248046875, -2.29534912109375, -2.1658935546875, -2.03643798828125, -1.906982421875, -1.77752685546875, -1.6480712890625, -1.51861572265625, -1.38916015625, -1.25970458984375, -1.1302490234375, -1.00079345703125, -0.871337890625, -0.74188232421875, -0.6124267578125, -0.48297119140625, -0.353515625, -0.22406005859375, -0.0946044921875, 0.03485107421875, 0.164306640625, 0.29376220703125, 0.4232177734375, 0.55267333984375, 0.68212890625, 0.81158447265625, 0.9410400390625, 1.07049560546875, 1.199951171875, 1.32940673828125, 1.4588623046875, 1.58831787109375, 1.7177734375, 1.84722900390625, 1.9766845703125, 2.10614013671875, 2.235595703125, 2.36505126953125, 2.4945068359375, 2.62396240234375, 2.75341796875, 2.88287353515625, 3.0123291015625, 3.14178466796875, 3.271240234375, 3.40069580078125, 3.5301513671875, 3.65960693359375, 3.7890625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 8.0, 2.0, 13.0, 26.0, 28.0, 43.0, 40.0, 64.0, 122.0, 208.0, 432.0, 944.0, 2922.0, 14002.0, 117470.0, 789149.0, 105709.0, 12769.0, 2710.0, 934.0, 385.0, 217.0, 112.0, 68.0, 46.0, 30.0, 17.0, 28.0, 12.0, 9.0, 4.0, 8.0, 5.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.732421875, -1.66937255859375, -1.6063232421875, -1.54327392578125, -1.480224609375, -1.41717529296875, -1.3541259765625, -1.29107666015625, -1.22802734375, -1.16497802734375, -1.1019287109375, -1.03887939453125, -0.975830078125, -0.91278076171875, -0.8497314453125, -0.78668212890625, -0.7236328125, -0.66058349609375, -0.5975341796875, -0.53448486328125, -0.471435546875, -0.40838623046875, -0.3453369140625, -0.28228759765625, -0.21923828125, -0.15618896484375, -0.0931396484375, -0.03009033203125, 0.032958984375, 0.09600830078125, 0.1590576171875, 0.22210693359375, 0.28515625, 0.34820556640625, 0.4112548828125, 0.47430419921875, 0.537353515625, 0.60040283203125, 0.6634521484375, 0.72650146484375, 0.78955078125, 0.85260009765625, 0.9156494140625, 0.97869873046875, 1.041748046875, 1.10479736328125, 1.1678466796875, 1.23089599609375, 1.2939453125, 1.35699462890625, 1.4200439453125, 1.48309326171875, 1.546142578125, 1.60919189453125, 1.6722412109375, 1.73529052734375, 1.79833984375, 1.86138916015625, 1.9244384765625, 1.98748779296875, 2.050537109375, 2.11358642578125, 2.1766357421875, 2.23968505859375, 2.302734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 3.0, 10.0, 9.0, 9.0, 10.0, 18.0, 23.0, 30.0, 38.0, 41.0, 47.0, 67.0, 93.0, 93.0, 90.0, 78.0, 78.0, 50.0, 40.0, 37.0, 25.0, 25.0, 14.0, 12.0, 17.0, 9.0, 10.0, 5.0, 1.0, 2.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003058910369873047, -0.00029503926634788513, -0.0002841874957084656, -0.000273335725069046, -0.00026248395442962646, -0.0002516321837902069, -0.00024078041315078735, -0.0002299286425113678, -0.00021907687187194824, -0.0002082251012325287, -0.00019737333059310913, -0.00018652155995368958, -0.00017566978931427002, -0.00016481801867485046, -0.0001539662480354309, -0.00014311447739601135, -0.0001322627067565918, -0.00012141093611717224, -0.00011055916547775269, -9.970739483833313e-05, -8.885562419891357e-05, -7.800385355949402e-05, -6.715208292007446e-05, -5.630031228065491e-05, -4.544854164123535e-05, -3.4596771001815796e-05, -2.374500036239624e-05, -1.2893229722976685e-05, -2.041459083557129e-06, 8.810311555862427e-06, 1.9662082195281982e-05, 3.0513852834701538e-05, 4.1365623474121094e-05, 5.221739411354065e-05, 6.30691647529602e-05, 7.392093539237976e-05, 8.477270603179932e-05, 9.562447667121887e-05, 0.00010647624731063843, 0.00011732801795005798, 0.00012817978858947754, 0.0001390315592288971, 0.00014988332986831665, 0.0001607351005077362, 0.00017158687114715576, 0.00018243864178657532, 0.00019329041242599487, 0.00020414218306541443, 0.00021499395370483398, 0.00022584572434425354, 0.0002366974949836731, 0.00024754926562309265, 0.0002584010362625122, 0.00026925280690193176, 0.0002801045775413513, 0.0002909563481807709, 0.00030180811882019043, 0.00031265988945961, 0.00032351166009902954, 0.0003343634307384491, 0.00034521520137786865, 0.0003560669720172882, 0.00036691874265670776, 0.0003777705132961273, 0.0003886222839355469]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 8.0, 13.0, 12.0, 25.0, 56.0, 62.0, 134.0, 247.0, 527.0, 1210.0, 3729.0, 19000.0, 300042.0, 684624.0, 30878.0, 5191.0, 1520.0, 625.0, 274.0, 137.0, 72.0, 55.0, 36.0, 24.0, 10.0, 18.0, 7.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.96484375, -1.88958740234375, -1.8143310546875, -1.73907470703125, -1.663818359375, -1.58856201171875, -1.5133056640625, -1.43804931640625, -1.36279296875, -1.28753662109375, -1.2122802734375, -1.13702392578125, -1.061767578125, -0.98651123046875, -0.9112548828125, -0.83599853515625, -0.7607421875, -0.68548583984375, -0.6102294921875, -0.53497314453125, -0.459716796875, -0.38446044921875, -0.3092041015625, -0.23394775390625, -0.15869140625, -0.08343505859375, -0.0081787109375, 0.06707763671875, 0.142333984375, 0.21759033203125, 0.2928466796875, 0.36810302734375, 0.443359375, 0.51861572265625, 0.5938720703125, 0.66912841796875, 0.744384765625, 0.81964111328125, 0.8948974609375, 0.97015380859375, 1.04541015625, 1.12066650390625, 1.1959228515625, 1.27117919921875, 1.346435546875, 1.42169189453125, 1.4969482421875, 1.57220458984375, 1.6474609375, 1.72271728515625, 1.7979736328125, 1.87322998046875, 1.948486328125, 2.02374267578125, 2.0989990234375, 2.17425537109375, 2.24951171875, 2.32476806640625, 2.4000244140625, 2.47528076171875, 2.550537109375, 2.62579345703125, 2.7010498046875, 2.77630615234375, 2.8515625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 15.0, 10.0, 16.0, 22.0, 21.0, 31.0, 50.0, 76.0, 88.0, 93.0, 115.0, 110.0, 87.0, 78.0, 53.0, 36.0, 29.0, 12.0, 16.0, 8.0, 9.0, 6.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5517578125, -1.498992919921875, -1.44622802734375, -1.393463134765625, -1.3406982421875, -1.287933349609375, -1.23516845703125, -1.182403564453125, -1.129638671875, -1.076873779296875, -1.02410888671875, -0.971343994140625, -0.9185791015625, -0.865814208984375, -0.81304931640625, -0.760284423828125, -0.70751953125, -0.654754638671875, -0.60198974609375, -0.549224853515625, -0.4964599609375, -0.443695068359375, -0.39093017578125, -0.338165283203125, -0.285400390625, -0.232635498046875, -0.17987060546875, -0.127105712890625, -0.0743408203125, -0.021575927734375, 0.03118896484375, 0.083953857421875, 0.13671875, 0.189483642578125, 0.24224853515625, 0.295013427734375, 0.3477783203125, 0.400543212890625, 0.45330810546875, 0.506072998046875, 0.558837890625, 0.611602783203125, 0.66436767578125, 0.717132568359375, 0.7698974609375, 0.822662353515625, 0.87542724609375, 0.928192138671875, 0.98095703125, 1.033721923828125, 1.08648681640625, 1.139251708984375, 1.1920166015625, 1.244781494140625, 1.29754638671875, 1.350311279296875, 1.403076171875, 1.455841064453125, 1.50860595703125, 1.561370849609375, 1.6141357421875, 1.666900634765625, 1.71966552734375, 1.772430419921875, 1.8251953125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 7.0, 10.0, 32.0, 51.0, 90.0, 137.0, 249.0, 206.0, 103.0, 51.0, 32.0, 22.0, 6.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.611814498901367, -26.50395965576172, -25.39610481262207, -24.288249969482422, -23.180395126342773, -22.072540283203125, -20.964683532714844, -19.856830596923828, -18.748973846435547, -17.6411190032959, -16.53326416015625, -15.425409317016602, -14.317554473876953, -13.209699630737305, -12.10184383392334, -10.993988990783691, -9.88613510131836, -8.778280258178711, -7.6704254150390625, -6.562570095062256, -5.454715251922607, -4.346860408782959, -3.2390050888061523, -2.131150245666504, -1.0232954025268555, 0.08455955982208252, 1.1924145221710205, 2.300269603729248, 3.4081244468688965, 4.515979290008545, 5.623834609985352, 6.731689453125, 7.839546203613281, 8.94740104675293, 10.055255889892578, 11.163110733032227, 12.270965576171875, 13.378820419311523, 14.486676216125488, 15.594531059265137, 16.70238494873047, 17.810239791870117, 18.918094635009766, 20.025949478149414, 21.133804321289062, 22.24165916442871, 23.34951400756836, 24.45737075805664, 25.56522560119629, 26.673080444335938, 27.780935287475586, 28.888790130615234, 29.996644973754883, 31.10449981689453, 32.21235656738281, 33.32020950317383, 34.42806625366211, 35.53592300415039, 36.643775939941406, 37.75163269042969, 38.8594856262207, 39.967342376708984, 41.0751953125, 42.18305206298828, 43.2909049987793]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 12.0, 6.0, 8.0, 7.0, 8.0, 7.0, 4.0, 11.0, 20.0, 12.0, 22.0, 25.0, 19.0, 29.0, 26.0, 32.0, 37.0, 42.0, 47.0, 62.0, 57.0, 74.0, 60.0, 54.0, 41.0, 33.0, 25.0, 22.0, 30.0, 28.0, 16.0, 22.0, 18.0, 17.0, 10.0, 6.0, 7.0, 9.0, 8.0, 7.0, 6.0, 4.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.339868545532227, -13.874029159545898, -13.40818977355957, -12.942349433898926, -12.476510047912598, -12.01067066192627, -11.544831275939941, -11.078990936279297, -10.613151550292969, -10.14731216430664, -9.681472778320312, -9.215632438659668, -8.74979305267334, -8.283953666687012, -7.818114280700684, -7.352274417877197, -6.886435031890869, -6.420595645904541, -5.954755783081055, -5.488916397094727, -5.02307653427124, -4.557237148284912, -4.091397285461426, -3.6255578994750977, -3.1597182750701904, -2.693878650665283, -2.228039026260376, -1.7621995210647583, -1.296359896659851, -0.8305203914642334, -0.36468076705932617, 0.10115885734558105, 0.5669984817504883, 1.0328381061553955, 1.4986777305603027, 1.9645172357559204, 2.430356979370117, 2.8961963653564453, 3.3620359897613525, 3.8278756141662598, 4.293715476989746, 4.759554862976074, 5.2253947257995605, 5.691234111785889, 6.157073974609375, 6.622913360595703, 7.088752746582031, 7.554592609405518, 8.020431518554688, 8.486270904541016, 8.952110290527344, 9.417950630187988, 9.883790016174316, 10.349629402160645, 10.815468788146973, 11.281309127807617, 11.747148513793945, 12.212987899780273, 12.678827285766602, 13.144667625427246, 13.610507011413574, 14.076346397399902, 14.54218578338623, 15.008026123046875, 15.473865509033203]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 8.0, 12.0, 23.0, 40.0, 88.0, 120.0, 295.0, 581.0, 1558.0, 4401.0, 15656.0, 73885.0, 785609.0, 2967008.0, 289769.0, 40564.0, 9692.0, 3034.0, 1075.0, 452.0, 214.0, 97.0, 46.0, 29.0, 11.0, 8.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.576171875, -2.508941650390625, -2.44171142578125, -2.374481201171875, -2.3072509765625, -2.240020751953125, -2.17279052734375, -2.105560302734375, -2.038330078125, -1.971099853515625, -1.90386962890625, -1.836639404296875, -1.7694091796875, -1.702178955078125, -1.63494873046875, -1.567718505859375, -1.50048828125, -1.433258056640625, -1.36602783203125, -1.298797607421875, -1.2315673828125, -1.164337158203125, -1.09710693359375, -1.029876708984375, -0.962646484375, -0.895416259765625, -0.82818603515625, -0.760955810546875, -0.6937255859375, -0.626495361328125, -0.55926513671875, -0.492034912109375, -0.4248046875, -0.357574462890625, -0.29034423828125, -0.223114013671875, -0.1558837890625, -0.088653564453125, -0.02142333984375, 0.045806884765625, 0.113037109375, 0.180267333984375, 0.24749755859375, 0.314727783203125, 0.3819580078125, 0.449188232421875, 0.51641845703125, 0.583648681640625, 0.65087890625, 0.718109130859375, 0.78533935546875, 0.852569580078125, 0.9197998046875, 0.987030029296875, 1.05426025390625, 1.121490478515625, 1.188720703125, 1.255950927734375, 1.32318115234375, 1.390411376953125, 1.4576416015625, 1.524871826171875, 1.59210205078125, 1.659332275390625, 1.7265625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 7.0, 9.0, 5.0, 3.0, 14.0, 14.0, 17.0, 17.0, 23.0, 19.0, 20.0, 22.0, 22.0, 38.0, 30.0, 39.0, 45.0, 42.0, 46.0, 51.0, 57.0, 42.0, 39.0, 43.0, 36.0, 32.0, 40.0, 32.0, 32.0, 28.0, 15.0, 28.0, 18.0, 12.0, 7.0, 8.0, 8.0, 9.0, 8.0, 9.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96875, -0.941802978515625, -0.91485595703125, -0.887908935546875, -0.8609619140625, -0.834014892578125, -0.80706787109375, -0.780120849609375, -0.753173828125, -0.726226806640625, -0.69927978515625, -0.672332763671875, -0.6453857421875, -0.618438720703125, -0.59149169921875, -0.564544677734375, -0.53759765625, -0.510650634765625, -0.48370361328125, -0.456756591796875, -0.4298095703125, -0.402862548828125, -0.37591552734375, -0.348968505859375, -0.322021484375, -0.295074462890625, -0.26812744140625, -0.241180419921875, -0.2142333984375, -0.187286376953125, -0.16033935546875, -0.133392333984375, -0.1064453125, -0.079498291015625, -0.05255126953125, -0.025604248046875, 0.0013427734375, 0.028289794921875, 0.05523681640625, 0.082183837890625, 0.109130859375, 0.136077880859375, 0.16302490234375, 0.189971923828125, 0.2169189453125, 0.243865966796875, 0.27081298828125, 0.297760009765625, 0.32470703125, 0.351654052734375, 0.37860107421875, 0.405548095703125, 0.4324951171875, 0.459442138671875, 0.48638916015625, 0.513336181640625, 0.540283203125, 0.567230224609375, 0.59417724609375, 0.621124267578125, 0.6480712890625, 0.675018310546875, 0.70196533203125, 0.728912353515625, 0.755859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 14.0, 14.0, 27.0, 25.0, 38.0, 63.0, 104.0, 140.0, 301.0, 567.0, 1263.0, 3070.0, 9266.0, 30475.0, 139373.0, 1590594.0, 2186464.0, 178415.0, 36563.0, 10638.0, 3728.0, 1506.0, 682.0, 394.0, 195.0, 108.0, 71.0, 45.0, 37.0, 33.0, 12.0, 12.0, 6.0, 3.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.205078125, -2.13409423828125, -2.0631103515625, -1.99212646484375, -1.921142578125, -1.85015869140625, -1.7791748046875, -1.70819091796875, -1.63720703125, -1.56622314453125, -1.4952392578125, -1.42425537109375, -1.353271484375, -1.28228759765625, -1.2113037109375, -1.14031982421875, -1.0693359375, -0.99835205078125, -0.9273681640625, -0.85638427734375, -0.785400390625, -0.71441650390625, -0.6434326171875, -0.57244873046875, -0.50146484375, -0.43048095703125, -0.3594970703125, -0.28851318359375, -0.217529296875, -0.14654541015625, -0.0755615234375, -0.00457763671875, 0.06640625, 0.13739013671875, 0.2083740234375, 0.27935791015625, 0.350341796875, 0.42132568359375, 0.4923095703125, 0.56329345703125, 0.63427734375, 0.70526123046875, 0.7762451171875, 0.84722900390625, 0.918212890625, 0.98919677734375, 1.0601806640625, 1.13116455078125, 1.2021484375, 1.27313232421875, 1.3441162109375, 1.41510009765625, 1.486083984375, 1.55706787109375, 1.6280517578125, 1.69903564453125, 1.77001953125, 1.84100341796875, 1.9119873046875, 1.98297119140625, 2.053955078125, 2.12493896484375, 2.1959228515625, 2.26690673828125, 2.337890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 9.0, 11.0, 8.0, 15.0, 30.0, 34.0, 35.0, 53.0, 83.0, 108.0, 180.0, 282.0, 457.0, 665.0, 674.0, 483.0, 274.0, 199.0, 137.0, 93.0, 63.0, 38.0, 29.0, 27.0, 17.0, 16.0, 7.0, 9.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294921875, -2.221221923828125, -2.14752197265625, -2.073822021484375, -2.0001220703125, -1.926422119140625, -1.85272216796875, -1.779022216796875, -1.705322265625, -1.631622314453125, -1.55792236328125, -1.484222412109375, -1.4105224609375, -1.336822509765625, -1.26312255859375, -1.189422607421875, -1.11572265625, -1.042022705078125, -0.96832275390625, -0.894622802734375, -0.8209228515625, -0.747222900390625, -0.67352294921875, -0.599822998046875, -0.526123046875, -0.452423095703125, -0.37872314453125, -0.305023193359375, -0.2313232421875, -0.157623291015625, -0.08392333984375, -0.010223388671875, 0.0634765625, 0.137176513671875, 0.21087646484375, 0.284576416015625, 0.3582763671875, 0.431976318359375, 0.50567626953125, 0.579376220703125, 0.653076171875, 0.726776123046875, 0.80047607421875, 0.874176025390625, 0.9478759765625, 1.021575927734375, 1.09527587890625, 1.168975830078125, 1.24267578125, 1.316375732421875, 1.39007568359375, 1.463775634765625, 1.5374755859375, 1.611175537109375, 1.68487548828125, 1.758575439453125, 1.832275390625, 1.905975341796875, 1.97967529296875, 2.053375244140625, 2.1270751953125, 2.200775146484375, 2.27447509765625, 2.348175048828125, 2.421875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 34.0, 68.0, 186.0, 272.0, 238.0, 94.0, 55.0, 21.0, 8.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.06241226196289, -38.79749298095703, -37.53257369995117, -36.26765441894531, -35.00273513793945, -33.737815856933594, -32.472896575927734, -31.207977294921875, -29.943058013916016, -28.678138732910156, -27.413219451904297, -26.148300170898438, -24.883380889892578, -23.61846160888672, -22.35354232788086, -21.088623046875, -19.82370376586914, -18.55878448486328, -17.293865203857422, -16.028945922851562, -14.764026641845703, -13.499107360839844, -12.234188079833984, -10.969268798828125, -9.704349517822266, -8.439430236816406, -7.174510955810547, -5.9095916748046875, -4.644672393798828, -3.3797531127929688, -2.1148338317871094, -0.84991455078125, 0.41500091552734375, 1.6799201965332031, 2.9448394775390625, 4.209758758544922, 5.474678039550781, 6.739597320556641, 8.0045166015625, 9.26943588256836, 10.534355163574219, 11.799274444580078, 13.064193725585938, 14.329113006591797, 15.594032287597656, 16.858951568603516, 18.123870849609375, 19.388790130615234, 20.653709411621094, 21.918628692626953, 23.183547973632812, 24.448467254638672, 25.71338653564453, 26.97830581665039, 28.24322509765625, 29.50814437866211, 30.77306365966797, 32.03798294067383, 33.30290222167969, 34.56782150268555, 35.832740783691406, 37.097660064697266, 38.362579345703125, 39.627498626708984, 40.892417907714844]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 6.0, 2.0, 4.0, 5.0, 11.0, 9.0, 22.0, 13.0, 17.0, 16.0, 28.0, 21.0, 13.0, 26.0, 25.0, 37.0, 39.0, 47.0, 26.0, 38.0, 32.0, 44.0, 41.0, 47.0, 33.0, 38.0, 47.0, 32.0, 37.0, 31.0, 29.0, 24.0, 22.0, 24.0, 15.0, 21.0, 11.0, 6.0, 7.0, 15.0, 7.0, 9.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.51646614074707, -8.231355667114258, -7.946244239807129, -7.661133289337158, -7.3760223388671875, -7.090911388397217, -6.805800437927246, -6.520689964294434, -6.235578536987305, -5.950467586517334, -5.665356636047363, -5.380245685577393, -5.095134735107422, -4.810023784637451, -4.5249128341674805, -4.239802360534668, -3.9546914100646973, -3.6695804595947266, -3.384469509124756, -3.099358558654785, -2.8142476081848145, -2.5291366577148438, -2.244025945663452, -1.9589149951934814, -1.6738040447235107, -1.38869309425354, -1.1035821437835693, -0.8184713125228882, -0.5333603620529175, -0.24824941158294678, 0.036861419677734375, 0.3219723701477051, 0.6070833206176758, 0.8921942710876465, 1.1773052215576172, 1.4624160528182983, 1.747527003288269, 2.0326380729675293, 2.317748785018921, 2.6028597354888916, 2.8879706859588623, 3.173081636428833, 3.4581925868988037, 3.7433032989501953, 4.028414249420166, 4.313525199890137, 4.598636150360107, 4.883747100830078, 5.168858051300049, 5.4539690017700195, 5.73907995223999, 6.024190902709961, 6.309301853179932, 6.594412803649902, 6.879523277282715, 7.164634704589844, 7.449745178222656, 7.734856128692627, 8.019967079162598, 8.30507755279541, 8.590188980102539, 8.875299453735352, 9.16041088104248, 9.445521354675293, 9.730632781982422]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 8.0, 10.0, 10.0, 18.0, 32.0, 43.0, 76.0, 107.0, 159.0, 277.0, 459.0, 862.0, 1422.0, 2574.0, 5009.0, 9941.0, 20617.0, 44044.0, 95954.0, 214126.0, 307044.0, 187100.0, 83578.0, 38019.0, 18167.0, 8822.0, 4503.0, 2334.0, 1311.0, 729.0, 457.0, 293.0, 178.0, 81.0, 56.0, 45.0, 25.0, 18.0, 11.0, 8.0, 9.0, 11.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806640625, -1.7509002685546875, -1.695159912109375, -1.6394195556640625, -1.58367919921875, -1.5279388427734375, -1.472198486328125, -1.4164581298828125, -1.3607177734375, -1.3049774169921875, -1.249237060546875, -1.1934967041015625, -1.13775634765625, -1.0820159912109375, -1.026275634765625, -0.9705352783203125, -0.914794921875, -0.8590545654296875, -0.803314208984375, -0.7475738525390625, -0.69183349609375, -0.6360931396484375, -0.580352783203125, -0.5246124267578125, -0.4688720703125, -0.4131317138671875, -0.357391357421875, -0.3016510009765625, -0.24591064453125, -0.1901702880859375, -0.134429931640625, -0.0786895751953125, -0.02294921875, 0.0327911376953125, 0.088531494140625, 0.1442718505859375, 0.20001220703125, 0.2557525634765625, 0.311492919921875, 0.3672332763671875, 0.4229736328125, 0.4787139892578125, 0.534454345703125, 0.5901947021484375, 0.64593505859375, 0.7016754150390625, 0.757415771484375, 0.8131561279296875, 0.868896484375, 0.9246368408203125, 0.980377197265625, 1.0361175537109375, 1.09185791015625, 1.1475982666015625, 1.203338623046875, 1.2590789794921875, 1.3148193359375, 1.3705596923828125, 1.426300048828125, 1.4820404052734375, 1.53778076171875, 1.5935211181640625, 1.649261474609375, 1.7050018310546875, 1.7607421875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 3.0, 6.0, 1.0, 8.0, 10.0, 12.0, 10.0, 11.0, 18.0, 18.0, 16.0, 24.0, 27.0, 26.0, 29.0, 38.0, 38.0, 32.0, 42.0, 40.0, 43.0, 39.0, 52.0, 40.0, 43.0, 39.0, 39.0, 31.0, 33.0, 33.0, 20.0, 18.0, 30.0, 23.0, 25.0, 13.0, 10.0, 9.0, 8.0, 20.0, 4.0, 4.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.91845703125, -0.89208984375, -0.86572265625, -0.83935546875, -0.81298828125, -0.78662109375, -0.76025390625, -0.73388671875, -0.70751953125, -0.68115234375, -0.65478515625, -0.62841796875, -0.60205078125, -0.57568359375, -0.54931640625, -0.52294921875, -0.49658203125, -0.47021484375, -0.44384765625, -0.41748046875, -0.39111328125, -0.36474609375, -0.33837890625, -0.31201171875, -0.28564453125, -0.25927734375, -0.23291015625, -0.20654296875, -0.18017578125, -0.15380859375, -0.12744140625, -0.10107421875, -0.07470703125, -0.04833984375, -0.02197265625, 0.00439453125, 0.03076171875, 0.05712890625, 0.08349609375, 0.10986328125, 0.13623046875, 0.16259765625, 0.18896484375, 0.21533203125, 0.24169921875, 0.26806640625, 0.29443359375, 0.32080078125, 0.34716796875, 0.37353515625, 0.39990234375, 0.42626953125, 0.45263671875, 0.47900390625, 0.50537109375, 0.53173828125, 0.55810546875, 0.58447265625, 0.61083984375, 0.63720703125, 0.66357421875, 0.68994140625, 0.71630859375, 0.74267578125, 0.76904296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 5.0, 12.0, 6.0, 13.0, 26.0, 16.0, 44.0, 51.0, 68.0, 101.0, 148.0, 208.0, 339.0, 480.0, 932.0, 1718.0, 4163.0, 14007.0, 74530.0, 653780.0, 249202.0, 34558.0, 7990.0, 2770.0, 1381.0, 714.0, 399.0, 282.0, 174.0, 137.0, 80.0, 61.0, 38.0, 29.0, 21.0, 20.0, 8.0, 12.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.85546875, -3.7215576171875, -3.587646484375, -3.4537353515625, -3.31982421875, -3.1859130859375, -3.052001953125, -2.9180908203125, -2.7841796875, -2.6502685546875, -2.516357421875, -2.3824462890625, -2.24853515625, -2.1146240234375, -1.980712890625, -1.8468017578125, -1.712890625, -1.5789794921875, -1.445068359375, -1.3111572265625, -1.17724609375, -1.0433349609375, -0.909423828125, -0.7755126953125, -0.6416015625, -0.5076904296875, -0.373779296875, -0.2398681640625, -0.10595703125, 0.0279541015625, 0.161865234375, 0.2957763671875, 0.4296875, 0.5635986328125, 0.697509765625, 0.8314208984375, 0.96533203125, 1.0992431640625, 1.233154296875, 1.3670654296875, 1.5009765625, 1.6348876953125, 1.768798828125, 1.9027099609375, 2.03662109375, 2.1705322265625, 2.304443359375, 2.4383544921875, 2.572265625, 2.7061767578125, 2.840087890625, 2.9739990234375, 3.10791015625, 3.2418212890625, 3.375732421875, 3.5096435546875, 3.6435546875, 3.7774658203125, 3.911376953125, 4.0452880859375, 4.17919921875, 4.3131103515625, 4.447021484375, 4.5809326171875, 4.71484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 7.0, 8.0, 9.0, 5.0, 10.0, 16.0, 9.0, 16.0, 19.0, 19.0, 26.0, 32.0, 41.0, 31.0, 56.0, 40.0, 47.0, 52.0, 49.0, 48.0, 57.0, 57.0, 46.0, 59.0, 32.0, 29.0, 27.0, 26.0, 22.0, 22.0, 19.0, 15.0, 18.0, 9.0, 9.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.578125, -3.45574951171875, -3.3333740234375, -3.21099853515625, -3.088623046875, -2.96624755859375, -2.8438720703125, -2.72149658203125, -2.59912109375, -2.47674560546875, -2.3543701171875, -2.23199462890625, -2.109619140625, -1.98724365234375, -1.8648681640625, -1.74249267578125, -1.6201171875, -1.49774169921875, -1.3753662109375, -1.25299072265625, -1.130615234375, -1.00823974609375, -0.8858642578125, -0.76348876953125, -0.64111328125, -0.51873779296875, -0.3963623046875, -0.27398681640625, -0.151611328125, -0.02923583984375, 0.0931396484375, 0.21551513671875, 0.337890625, 0.46026611328125, 0.5826416015625, 0.70501708984375, 0.827392578125, 0.94976806640625, 1.0721435546875, 1.19451904296875, 1.31689453125, 1.43927001953125, 1.5616455078125, 1.68402099609375, 1.806396484375, 1.92877197265625, 2.0511474609375, 2.17352294921875, 2.2958984375, 2.41827392578125, 2.5406494140625, 2.66302490234375, 2.785400390625, 2.90777587890625, 3.0301513671875, 3.15252685546875, 3.27490234375, 3.39727783203125, 3.5196533203125, 3.64202880859375, 3.764404296875, 3.88677978515625, 4.0091552734375, 4.13153076171875, 4.25390625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 9.0, 3.0, 10.0, 8.0, 19.0, 12.0, 19.0, 29.0, 40.0, 76.0, 101.0, 122.0, 242.0, 426.0, 807.0, 1721.0, 4591.0, 15039.0, 66807.0, 509172.0, 364535.0, 62486.0, 14296.0, 4351.0, 1705.0, 777.0, 423.0, 254.0, 142.0, 100.0, 59.0, 47.0, 24.0, 22.0, 16.0, 12.0, 12.0, 8.0, 6.0, 8.0, 4.0, 2.0, 3.0, 6.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3505859375, -1.31304931640625, -1.2755126953125, -1.23797607421875, -1.200439453125, -1.16290283203125, -1.1253662109375, -1.08782958984375, -1.05029296875, -1.01275634765625, -0.9752197265625, -0.93768310546875, -0.900146484375, -0.86260986328125, -0.8250732421875, -0.78753662109375, -0.75, -0.71246337890625, -0.6749267578125, -0.63739013671875, -0.599853515625, -0.56231689453125, -0.5247802734375, -0.48724365234375, -0.44970703125, -0.41217041015625, -0.3746337890625, -0.33709716796875, -0.299560546875, -0.26202392578125, -0.2244873046875, -0.18695068359375, -0.1494140625, -0.11187744140625, -0.0743408203125, -0.03680419921875, 0.000732421875, 0.03826904296875, 0.0758056640625, 0.11334228515625, 0.15087890625, 0.18841552734375, 0.2259521484375, 0.26348876953125, 0.301025390625, 0.33856201171875, 0.3760986328125, 0.41363525390625, 0.451171875, 0.48870849609375, 0.5262451171875, 0.56378173828125, 0.601318359375, 0.63885498046875, 0.6763916015625, 0.71392822265625, 0.75146484375, 0.78900146484375, 0.8265380859375, 0.86407470703125, 0.901611328125, 0.93914794921875, 0.9766845703125, 1.01422119140625, 1.0517578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 5.0, 1.0, 6.0, 3.0, 6.0, 9.0, 6.0, 11.0, 11.0, 10.0, 24.0, 16.0, 28.0, 35.0, 57.0, 69.0, 84.0, 75.0, 90.0, 81.0, 63.0, 67.0, 49.0, 39.0, 28.0, 28.0, 14.0, 22.0, 17.0, 16.0, 4.0, 5.0, 5.0, 6.0, 0.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0], "bins": [-0.0003638267517089844, -0.00035485997796058655, -0.0003458932042121887, -0.0003369264304637909, -0.00032795965671539307, -0.00031899288296699524, -0.0003100261092185974, -0.0003010593354701996, -0.00029209256172180176, -0.00028312578797340393, -0.0002741590142250061, -0.0002651922404766083, -0.00025622546672821045, -0.0002472586929798126, -0.0002382919192314148, -0.00022932514548301697, -0.00022035837173461914, -0.0002113915979862213, -0.00020242482423782349, -0.00019345805048942566, -0.00018449127674102783, -0.00017552450299263, -0.00016655772924423218, -0.00015759095549583435, -0.00014862418174743652, -0.0001396574079990387, -0.00013069063425064087, -0.00012172386050224304, -0.00011275708675384521, -0.00010379031300544739, -9.482353925704956e-05, -8.585676550865173e-05, -7.68899917602539e-05, -6.792321801185608e-05, -5.895644426345825e-05, -4.9989670515060425e-05, -4.10228967666626e-05, -3.205612301826477e-05, -2.3089349269866943e-05, -1.4122575521469116e-05, -5.155801773071289e-06, 3.810971975326538e-06, 1.2777745723724365e-05, 2.1744519472122192e-05, 3.071129322052002e-05, 3.967806696891785e-05, 4.8644840717315674e-05, 5.76116144657135e-05, 6.657838821411133e-05, 7.554516196250916e-05, 8.451193571090698e-05, 9.347870945930481e-05, 0.00010244548320770264, 0.00011141225695610046, 0.00012037903070449829, 0.00012934580445289612, 0.00013831257820129395, 0.00014727935194969177, 0.0001562461256980896, 0.00016521289944648743, 0.00017417967319488525, 0.00018314644694328308, 0.0001921132206916809, 0.00020107999444007874, 0.00021004676818847656]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 8.0, 12.0, 9.0, 7.0, 26.0, 23.0, 20.0, 33.0, 55.0, 84.0, 152.0, 229.0, 376.0, 711.0, 1285.0, 2802.0, 7152.0, 25327.0, 148800.0, 681394.0, 142707.0, 24523.0, 6942.0, 2833.0, 1357.0, 663.0, 349.0, 223.0, 143.0, 92.0, 65.0, 40.0, 24.0, 15.0, 16.0, 16.0, 4.0, 5.0, 6.0, 4.0, 1.0, 8.0, 2.0, 1.0, 2.0, 3.0, 3.0], "bins": [-1.4130859375, -1.374359130859375, -1.33563232421875, -1.296905517578125, -1.2581787109375, -1.219451904296875, -1.18072509765625, -1.141998291015625, -1.103271484375, -1.064544677734375, -1.02581787109375, -0.987091064453125, -0.9483642578125, -0.909637451171875, -0.87091064453125, -0.832183837890625, -0.79345703125, -0.754730224609375, -0.71600341796875, -0.677276611328125, -0.6385498046875, -0.599822998046875, -0.56109619140625, -0.522369384765625, -0.483642578125, -0.444915771484375, -0.40618896484375, -0.367462158203125, -0.3287353515625, -0.290008544921875, -0.25128173828125, -0.212554931640625, -0.173828125, -0.135101318359375, -0.09637451171875, -0.057647705078125, -0.0189208984375, 0.019805908203125, 0.05853271484375, 0.097259521484375, 0.135986328125, 0.174713134765625, 0.21343994140625, 0.252166748046875, 0.2908935546875, 0.329620361328125, 0.36834716796875, 0.407073974609375, 0.44580078125, 0.484527587890625, 0.52325439453125, 0.561981201171875, 0.6007080078125, 0.639434814453125, 0.67816162109375, 0.716888427734375, 0.755615234375, 0.794342041015625, 0.83306884765625, 0.871795654296875, 0.9105224609375, 0.949249267578125, 0.98797607421875, 1.026702880859375, 1.0654296875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 5.0, 6.0, 9.0, 12.0, 5.0, 18.0, 35.0, 43.0, 43.0, 72.0, 95.0, 90.0, 101.0, 114.0, 90.0, 65.0, 46.0, 30.0, 28.0, 20.0, 18.0, 13.0, 8.0, 5.0, 8.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.248046875, -1.20562744140625, -1.1632080078125, -1.12078857421875, -1.078369140625, -1.03594970703125, -0.9935302734375, -0.95111083984375, -0.90869140625, -0.86627197265625, -0.8238525390625, -0.78143310546875, -0.739013671875, -0.69659423828125, -0.6541748046875, -0.61175537109375, -0.5693359375, -0.52691650390625, -0.4844970703125, -0.44207763671875, -0.399658203125, -0.35723876953125, -0.3148193359375, -0.27239990234375, -0.22998046875, -0.18756103515625, -0.1451416015625, -0.10272216796875, -0.060302734375, -0.01788330078125, 0.0245361328125, 0.06695556640625, 0.109375, 0.15179443359375, 0.1942138671875, 0.23663330078125, 0.279052734375, 0.32147216796875, 0.3638916015625, 0.40631103515625, 0.44873046875, 0.49114990234375, 0.5335693359375, 0.57598876953125, 0.618408203125, 0.66082763671875, 0.7032470703125, 0.74566650390625, 0.7880859375, 0.83050537109375, 0.8729248046875, 0.91534423828125, 0.957763671875, 1.00018310546875, 1.0426025390625, 1.08502197265625, 1.12744140625, 1.16986083984375, 1.2122802734375, 1.25469970703125, 1.297119140625, 1.33953857421875, 1.3819580078125, 1.42437744140625, 1.466796875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 3.0, 7.0, 7.0, 20.0, 49.0, 108.0, 162.0, 303.0, 186.0, 84.0, 32.0, 16.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.440269470214844, -32.2733268737793, -31.106386184692383, -29.939443588256836, -28.772502899169922, -27.605560302734375, -26.438617706298828, -25.271677017211914, -24.104736328125, -22.937793731689453, -21.77085304260254, -20.603910446166992, -19.436969757080078, -18.27002716064453, -17.103084564208984, -15.93614387512207, -14.769201278686523, -13.602259635925293, -12.435317993164062, -11.268375396728516, -10.101434707641602, -8.934492111206055, -7.767550468444824, -6.600608825683594, -5.433667182922363, -4.266725540161133, -3.0997836589813232, -1.9328417778015137, -0.7659001350402832, 0.40104150772094727, 1.567983627319336, 2.7349252700805664, 3.901866912841797, 5.068808555603027, 6.235750198364258, 7.4026923179626465, 8.569633483886719, 9.736576080322266, 10.903517723083496, 12.070459365844727, 13.237401008605957, 14.404342651367188, 15.571284294128418, 16.73822593688965, 17.905168533325195, 19.07210922241211, 20.239051818847656, 21.405994415283203, 22.572935104370117, 23.739877700805664, 24.906818389892578, 26.073760986328125, 27.24070167541504, 28.407644271850586, 29.5745849609375, 30.741527557373047, 31.908470153808594, 33.07541275024414, 34.24235534667969, 35.40929412841797, 36.576236724853516, 37.74317932128906, 38.91012191772461, 40.077064514160156, 41.24400329589844]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 4.0, 9.0, 6.0, 8.0, 10.0, 13.0, 21.0, 15.0, 23.0, 15.0, 22.0, 20.0, 23.0, 31.0, 22.0, 32.0, 44.0, 50.0, 53.0, 66.0, 67.0, 50.0, 41.0, 38.0, 34.0, 34.0, 25.0, 30.0, 27.0, 22.0, 19.0, 23.0, 17.0, 16.0, 7.0, 10.0, 7.0, 6.0, 4.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0], "bins": [-15.456674575805664, -15.016027450561523, -14.5753812789917, -14.134734153747559, -13.694087028503418, -13.253440856933594, -12.812793731689453, -12.372146606445312, -11.931499481201172, -11.490852355957031, -11.050206184387207, -10.609559059143066, -10.168911933898926, -9.728265762329102, -9.287618637084961, -8.84697151184082, -8.40632438659668, -7.965677738189697, -7.525030612945557, -7.084383964538574, -6.643736839294434, -6.203090190887451, -5.762443542480469, -5.321796417236328, -4.881150245666504, -4.4405035972595215, -3.999856472015381, -3.5592098236083984, -3.118562698364258, -2.6779160499572754, -2.237269163131714, -1.7966222763061523, -1.3559751510620117, -0.9153282642364502, -0.47468143701553345, -0.0340346097946167, 0.4066122770309448, 0.8472590446472168, 1.2879059314727783, 1.7285528182983398, 2.1691997051239014, 2.609846591949463, 3.0504934787750244, 3.491140365600586, 3.9317870140075684, 4.372433662414551, 4.813080787658691, 5.253727912902832, 5.6943745613098145, 6.135021209716797, 6.5756683349609375, 7.01631498336792, 7.4569621086120605, 7.897608757019043, 8.338255882263184, 8.778902053833008, 9.219549179077148, 9.660196304321289, 10.100842475891113, 10.541489601135254, 10.982136726379395, 11.422782897949219, 11.86343002319336, 12.3040771484375, 12.74472427368164]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 9.0, 15.0, 25.0, 22.0, 49.0, 65.0, 126.0, 236.0, 431.0, 806.0, 1755.0, 4084.0, 12634.0, 51186.0, 418469.0, 2950189.0, 662034.0, 68229.0, 15118.0, 4940.0, 1889.0, 892.0, 443.0, 253.0, 144.0, 76.0, 56.0, 33.0, 19.0, 16.0, 8.0, 7.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.61328125, -1.5605316162109375, -1.507781982421875, -1.4550323486328125, -1.40228271484375, -1.3495330810546875, -1.296783447265625, -1.2440338134765625, -1.1912841796875, -1.1385345458984375, -1.085784912109375, -1.0330352783203125, -0.98028564453125, -0.9275360107421875, -0.874786376953125, -0.8220367431640625, -0.769287109375, -0.7165374755859375, -0.663787841796875, -0.6110382080078125, -0.55828857421875, -0.5055389404296875, -0.452789306640625, -0.4000396728515625, -0.3472900390625, -0.2945404052734375, -0.241790771484375, -0.1890411376953125, -0.13629150390625, -0.0835418701171875, -0.030792236328125, 0.0219573974609375, 0.07470703125, 0.1274566650390625, 0.180206298828125, 0.2329559326171875, 0.28570556640625, 0.3384552001953125, 0.391204833984375, 0.4439544677734375, 0.4967041015625, 0.5494537353515625, 0.602203369140625, 0.6549530029296875, 0.70770263671875, 0.7604522705078125, 0.813201904296875, 0.8659515380859375, 0.918701171875, 0.9714508056640625, 1.024200439453125, 1.0769500732421875, 1.12969970703125, 1.1824493408203125, 1.235198974609375, 1.2879486083984375, 1.3406982421875, 1.3934478759765625, 1.446197509765625, 1.4989471435546875, 1.55169677734375, 1.6044464111328125, 1.657196044921875, 1.7099456787109375, 1.7626953125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 5.0, 7.0, 11.0, 11.0, 21.0, 18.0, 24.0, 38.0, 31.0, 43.0, 51.0, 42.0, 57.0, 46.0, 48.0, 70.0, 54.0, 52.0, 51.0, 59.0, 47.0, 30.0, 30.0, 33.0, 22.0, 18.0, 13.0, 18.0, 12.0, 5.0, 9.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.0087890625, -0.975616455078125, -0.94244384765625, -0.909271240234375, -0.8760986328125, -0.842926025390625, -0.80975341796875, -0.776580810546875, -0.743408203125, -0.710235595703125, -0.67706298828125, -0.643890380859375, -0.6107177734375, -0.577545166015625, -0.54437255859375, -0.511199951171875, -0.47802734375, -0.444854736328125, -0.41168212890625, -0.378509521484375, -0.3453369140625, -0.312164306640625, -0.27899169921875, -0.245819091796875, -0.212646484375, -0.179473876953125, -0.14630126953125, -0.113128662109375, -0.0799560546875, -0.046783447265625, -0.01361083984375, 0.019561767578125, 0.052734375, 0.085906982421875, 0.11907958984375, 0.152252197265625, 0.1854248046875, 0.218597412109375, 0.25177001953125, 0.284942626953125, 0.318115234375, 0.351287841796875, 0.38446044921875, 0.417633056640625, 0.4508056640625, 0.483978271484375, 0.51715087890625, 0.550323486328125, 0.58349609375, 0.616668701171875, 0.64984130859375, 0.683013916015625, 0.7161865234375, 0.749359130859375, 0.78253173828125, 0.815704345703125, 0.848876953125, 0.882049560546875, 0.91522216796875, 0.948394775390625, 0.9815673828125, 1.014739990234375, 1.04791259765625, 1.081085205078125, 1.1142578125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 10.0, 17.0, 22.0, 59.0, 118.0, 249.0, 661.0, 2872.0, 22820.0, 2072434.0, 2070554.0, 21046.0, 2499.0, 541.0, 221.0, 79.0, 36.0, 23.0, 15.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08203125, -4.9232177734375, -4.764404296875, -4.6055908203125, -4.44677734375, -4.2879638671875, -4.129150390625, -3.9703369140625, -3.8115234375, -3.6527099609375, -3.493896484375, -3.3350830078125, -3.17626953125, -3.0174560546875, -2.858642578125, -2.6998291015625, -2.541015625, -2.3822021484375, -2.223388671875, -2.0645751953125, -1.90576171875, -1.7469482421875, -1.588134765625, -1.4293212890625, -1.2705078125, -1.1116943359375, -0.952880859375, -0.7940673828125, -0.63525390625, -0.4764404296875, -0.317626953125, -0.1588134765625, 0.0, 0.1588134765625, 0.317626953125, 0.4764404296875, 0.63525390625, 0.7940673828125, 0.952880859375, 1.1116943359375, 1.2705078125, 1.4293212890625, 1.588134765625, 1.7469482421875, 1.90576171875, 2.0645751953125, 2.223388671875, 2.3822021484375, 2.541015625, 2.6998291015625, 2.858642578125, 3.0174560546875, 3.17626953125, 3.3350830078125, 3.493896484375, 3.6527099609375, 3.8115234375, 3.9703369140625, 4.129150390625, 4.2879638671875, 4.44677734375, 4.6055908203125, 4.764404296875, 4.9232177734375, 5.08203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 11.0, 17.0, 22.0, 22.0, 32.0, 51.0, 110.0, 212.0, 378.0, 723.0, 949.0, 744.0, 357.0, 185.0, 92.0, 48.0, 35.0, 25.0, 13.0, 11.0, 4.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.421875, -3.328033447265625, -3.23419189453125, -3.140350341796875, -3.0465087890625, -2.952667236328125, -2.85882568359375, -2.764984130859375, -2.671142578125, -2.577301025390625, -2.48345947265625, -2.389617919921875, -2.2957763671875, -2.201934814453125, -2.10809326171875, -2.014251708984375, -1.92041015625, -1.826568603515625, -1.73272705078125, -1.638885498046875, -1.5450439453125, -1.451202392578125, -1.35736083984375, -1.263519287109375, -1.169677734375, -1.075836181640625, -0.98199462890625, -0.888153076171875, -0.7943115234375, -0.700469970703125, -0.60662841796875, -0.512786865234375, -0.4189453125, -0.325103759765625, -0.23126220703125, -0.137420654296875, -0.0435791015625, 0.050262451171875, 0.14410400390625, 0.237945556640625, 0.331787109375, 0.425628662109375, 0.51947021484375, 0.613311767578125, 0.7071533203125, 0.800994873046875, 0.89483642578125, 0.988677978515625, 1.08251953125, 1.176361083984375, 1.27020263671875, 1.364044189453125, 1.4578857421875, 1.551727294921875, 1.64556884765625, 1.739410400390625, 1.833251953125, 1.927093505859375, 2.02093505859375, 2.114776611328125, 2.2086181640625, 2.302459716796875, 2.39630126953125, 2.490142822265625, 2.583984375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 9.0, 9.0, 19.0, 64.0, 217.0, 328.0, 224.0, 75.0, 27.0, 7.0, 9.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.11677551269531, -41.941532135009766, -40.76628875732422, -39.59104919433594, -38.41580581665039, -37.240562438964844, -36.0653190612793, -34.89007568359375, -33.7148323059082, -32.539588928222656, -31.364347457885742, -30.189104080200195, -29.01386070251465, -27.838619232177734, -26.663375854492188, -25.48813247680664, -24.312891006469727, -23.13764762878418, -21.962406158447266, -20.78716278076172, -19.611919403076172, -18.436676025390625, -17.26143455505371, -16.086191177368164, -14.910948753356934, -13.735706329345703, -12.560462951660156, -11.385220527648926, -10.209978103637695, -9.034734725952148, -7.859492301940918, -6.684248924255371, -5.509006500244141, -4.333763599395752, -3.1585209369659424, -1.9832782745361328, -0.8080353736877441, 0.36720752716064453, 1.542449951171875, 2.717693328857422, 3.8929357528686523, 5.068178653717041, 6.24342155456543, 7.41866397857666, 8.59390640258789, 9.769149780273438, 10.944392204284668, 12.119635581970215, 13.294878005981445, 14.470120429992676, 15.645363807678223, 16.820606231689453, 17.995849609375, 19.171092987060547, 20.34633445739746, 21.521577835083008, 22.696819305419922, 23.87206268310547, 25.047304153442383, 26.22254753112793, 27.397790908813477, 28.57303237915039, 29.748275756835938, 30.923519134521484, 32.09876251220703]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 8.0, 9.0, 8.0, 12.0, 12.0, 26.0, 16.0, 18.0, 32.0, 37.0, 36.0, 43.0, 42.0, 40.0, 48.0, 53.0, 52.0, 53.0, 49.0, 49.0, 41.0, 51.0, 44.0, 38.0, 30.0, 24.0, 26.0, 19.0, 14.0, 16.0, 7.0, 7.0, 7.0, 6.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.015947341918945, -10.669189453125, -10.322431564331055, -9.97567367553711, -9.62891674041748, -9.282158851623535, -8.93540096282959, -8.588643074035645, -8.2418851852417, -7.895127296447754, -7.548369884490967, -7.2016119956970215, -6.854854106903076, -6.508096694946289, -6.161338806152344, -5.814580917358398, -5.467823505401611, -5.121065616607666, -4.774308204650879, -4.427550315856934, -4.080792427062988, -3.734034776687622, -3.387277126312256, -3.0405192375183105, -2.6937615871429443, -2.347003936767578, -2.000246047973633, -1.6534883975982666, -1.3067306280136108, -0.9599728584289551, -0.6132152080535889, -0.26645731925964355, 0.08030033111572266, 0.42705807089805603, 0.7738158106803894, 1.1205735206604004, 1.4673312902450562, 1.814089059829712, 2.160846710205078, 2.5076045989990234, 2.8543622493743896, 3.201119899749756, 3.547877788543701, 3.8946354389190674, 4.241393089294434, 4.588150978088379, 4.934908866882324, 5.2816667556762695, 5.628424167633057, 5.975182056427002, 6.321939468383789, 6.668697357177734, 7.01545524597168, 7.362213134765625, 7.708970546722412, 8.055728912353516, 8.402485847473145, 8.74924373626709, 9.096001625061035, 9.442758560180664, 9.78951644897461, 10.136274337768555, 10.4830322265625, 10.829790115356445, 11.17654800415039]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 11.0, 12.0, 20.0, 28.0, 40.0, 67.0, 111.0, 191.0, 381.0, 656.0, 1286.0, 2584.0, 5775.0, 13367.0, 33783.0, 87929.0, 217679.0, 330560.0, 211892.0, 85648.0, 32688.0, 12955.0, 5614.0, 2542.0, 1263.0, 632.0, 342.0, 209.0, 98.0, 60.0, 48.0, 22.0, 21.0, 13.0, 8.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.830078125, -1.77850341796875, -1.7269287109375, -1.67535400390625, -1.623779296875, -1.57220458984375, -1.5206298828125, -1.46905517578125, -1.41748046875, -1.36590576171875, -1.3143310546875, -1.26275634765625, -1.211181640625, -1.15960693359375, -1.1080322265625, -1.05645751953125, -1.0048828125, -0.95330810546875, -0.9017333984375, -0.85015869140625, -0.798583984375, -0.74700927734375, -0.6954345703125, -0.64385986328125, -0.59228515625, -0.54071044921875, -0.4891357421875, -0.43756103515625, -0.385986328125, -0.33441162109375, -0.2828369140625, -0.23126220703125, -0.1796875, -0.12811279296875, -0.0765380859375, -0.02496337890625, 0.026611328125, 0.07818603515625, 0.1297607421875, 0.18133544921875, 0.23291015625, 0.28448486328125, 0.3360595703125, 0.38763427734375, 0.439208984375, 0.49078369140625, 0.5423583984375, 0.59393310546875, 0.6455078125, 0.69708251953125, 0.7486572265625, 0.80023193359375, 0.851806640625, 0.90338134765625, 0.9549560546875, 1.00653076171875, 1.05810546875, 1.10968017578125, 1.1612548828125, 1.21282958984375, 1.264404296875, 1.31597900390625, 1.3675537109375, 1.41912841796875, 1.470703125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 6.0, 10.0, 8.0, 15.0, 15.0, 22.0, 23.0, 16.0, 35.0, 33.0, 41.0, 35.0, 54.0, 51.0, 55.0, 48.0, 53.0, 59.0, 54.0, 50.0, 47.0, 40.0, 33.0, 32.0, 26.0, 21.0, 23.0, 20.0, 20.0, 14.0, 9.0, 9.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.0146484375, -0.9810943603515625, -0.947540283203125, -0.9139862060546875, -0.88043212890625, -0.8468780517578125, -0.813323974609375, -0.7797698974609375, -0.7462158203125, -0.7126617431640625, -0.679107666015625, -0.6455535888671875, -0.61199951171875, -0.5784454345703125, -0.544891357421875, -0.5113372802734375, -0.477783203125, -0.4442291259765625, -0.410675048828125, -0.3771209716796875, -0.34356689453125, -0.3100128173828125, -0.276458740234375, -0.2429046630859375, -0.2093505859375, -0.1757965087890625, -0.142242431640625, -0.1086883544921875, -0.07513427734375, -0.0415802001953125, -0.008026123046875, 0.0255279541015625, 0.05908203125, 0.0926361083984375, 0.126190185546875, 0.1597442626953125, 0.19329833984375, 0.2268524169921875, 0.260406494140625, 0.2939605712890625, 0.3275146484375, 0.3610687255859375, 0.394622802734375, 0.4281768798828125, 0.46173095703125, 0.4952850341796875, 0.528839111328125, 0.5623931884765625, 0.595947265625, 0.6295013427734375, 0.663055419921875, 0.6966094970703125, 0.73016357421875, 0.7637176513671875, 0.797271728515625, 0.8308258056640625, 0.8643798828125, 0.8979339599609375, 0.931488037109375, 0.9650421142578125, 0.99859619140625, 1.0321502685546875, 1.065704345703125, 1.0992584228515625, 1.1328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 9.0, 8.0, 12.0, 15.0, 18.0, 23.0, 39.0, 38.0, 66.0, 81.0, 157.0, 263.0, 525.0, 1148.0, 3154.0, 10109.0, 40381.0, 198270.0, 613605.0, 139126.0, 28890.0, 7969.0, 2514.0, 990.0, 449.0, 236.0, 136.0, 86.0, 64.0, 55.0, 26.0, 19.0, 18.0, 11.0, 11.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.814453125, -2.73016357421875, -2.6458740234375, -2.56158447265625, -2.477294921875, -2.39300537109375, -2.3087158203125, -2.22442626953125, -2.14013671875, -2.05584716796875, -1.9715576171875, -1.88726806640625, -1.802978515625, -1.71868896484375, -1.6343994140625, -1.55010986328125, -1.4658203125, -1.38153076171875, -1.2972412109375, -1.21295166015625, -1.128662109375, -1.04437255859375, -0.9600830078125, -0.87579345703125, -0.79150390625, -0.70721435546875, -0.6229248046875, -0.53863525390625, -0.454345703125, -0.37005615234375, -0.2857666015625, -0.20147705078125, -0.1171875, -0.03289794921875, 0.0513916015625, 0.13568115234375, 0.219970703125, 0.30426025390625, 0.3885498046875, 0.47283935546875, 0.55712890625, 0.64141845703125, 0.7257080078125, 0.80999755859375, 0.894287109375, 0.97857666015625, 1.0628662109375, 1.14715576171875, 1.2314453125, 1.31573486328125, 1.4000244140625, 1.48431396484375, 1.568603515625, 1.65289306640625, 1.7371826171875, 1.82147216796875, 1.90576171875, 1.99005126953125, 2.0743408203125, 2.15863037109375, 2.242919921875, 2.32720947265625, 2.4114990234375, 2.49578857421875, 2.580078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 9.0, 6.0, 10.0, 9.0, 7.0, 16.0, 13.0, 19.0, 24.0, 25.0, 28.0, 30.0, 38.0, 45.0, 45.0, 56.0, 52.0, 55.0, 38.0, 49.0, 46.0, 46.0, 37.0, 44.0, 43.0, 32.0, 30.0, 18.0, 20.0, 18.0, 16.0, 10.0, 16.0, 5.0, 8.0, 3.0, 5.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-3.47265625, -3.358123779296875, -3.24359130859375, -3.129058837890625, -3.0145263671875, -2.899993896484375, -2.78546142578125, -2.670928955078125, -2.556396484375, -2.441864013671875, -2.32733154296875, -2.212799072265625, -2.0982666015625, -1.983734130859375, -1.86920166015625, -1.754669189453125, -1.64013671875, -1.525604248046875, -1.41107177734375, -1.296539306640625, -1.1820068359375, -1.067474365234375, -0.95294189453125, -0.838409423828125, -0.723876953125, -0.609344482421875, -0.49481201171875, -0.380279541015625, -0.2657470703125, -0.151214599609375, -0.03668212890625, 0.077850341796875, 0.1923828125, 0.306915283203125, 0.42144775390625, 0.535980224609375, 0.6505126953125, 0.765045166015625, 0.87957763671875, 0.994110107421875, 1.108642578125, 1.223175048828125, 1.33770751953125, 1.452239990234375, 1.5667724609375, 1.681304931640625, 1.79583740234375, 1.910369873046875, 2.02490234375, 2.139434814453125, 2.25396728515625, 2.368499755859375, 2.4830322265625, 2.597564697265625, 2.71209716796875, 2.826629638671875, 2.941162109375, 3.055694580078125, 3.17022705078125, 3.284759521484375, 3.3992919921875, 3.513824462890625, 3.62835693359375, 3.742889404296875, 3.857421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 6.0, 2.0, 7.0, 3.0, 8.0, 14.0, 13.0, 24.0, 23.0, 29.0, 55.0, 102.0, 142.0, 221.0, 452.0, 803.0, 1567.0, 3511.0, 8053.0, 19921.0, 51996.0, 138199.0, 474404.0, 212587.0, 82538.0, 31564.0, 12374.0, 5151.0, 2278.0, 1143.0, 585.0, 293.0, 176.0, 110.0, 58.0, 38.0, 36.0, 24.0, 12.0, 8.0, 9.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.52197265625, -0.5049896240234375, -0.488006591796875, -0.4710235595703125, -0.45404052734375, -0.4370574951171875, -0.420074462890625, -0.4030914306640625, -0.3861083984375, -0.3691253662109375, -0.352142333984375, -0.3351593017578125, -0.31817626953125, -0.3011932373046875, -0.284210205078125, -0.2672271728515625, -0.250244140625, -0.2332611083984375, -0.216278076171875, -0.1992950439453125, -0.18231201171875, -0.1653289794921875, -0.148345947265625, -0.1313629150390625, -0.1143798828125, -0.0973968505859375, -0.080413818359375, -0.0634307861328125, -0.04644775390625, -0.0294647216796875, -0.012481689453125, 0.0045013427734375, 0.021484375, 0.0384674072265625, 0.055450439453125, 0.0724334716796875, 0.08941650390625, 0.1063995361328125, 0.123382568359375, 0.1403656005859375, 0.1573486328125, 0.1743316650390625, 0.191314697265625, 0.2082977294921875, 0.22528076171875, 0.2422637939453125, 0.259246826171875, 0.2762298583984375, 0.293212890625, 0.3101959228515625, 0.327178955078125, 0.3441619873046875, 0.36114501953125, 0.3781280517578125, 0.395111083984375, 0.4120941162109375, 0.4290771484375, 0.4460601806640625, 0.463043212890625, 0.4800262451171875, 0.49700927734375, 0.5139923095703125, 0.530975341796875, 0.5479583740234375, 0.56494140625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 8.0, 4.0, 6.0, 12.0, 24.0, 17.0, 27.0, 38.0, 46.0, 55.0, 86.0, 93.0, 84.0, 100.0, 80.0, 63.0, 66.0, 52.0, 44.0, 21.0, 16.0, 21.0, 6.0, 8.0, 7.0, 4.0, 4.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002644062042236328, -0.00025657564401626587, -0.0002487450838088989, -0.00024091452360153198, -0.00023308396339416504, -0.0002252534031867981, -0.00021742284297943115, -0.0002095922827720642, -0.00020176172256469727, -0.00019393116235733032, -0.00018610060214996338, -0.00017827004194259644, -0.0001704394817352295, -0.00016260892152786255, -0.0001547783613204956, -0.00014694780111312866, -0.00013911724090576172, -0.00013128668069839478, -0.00012345612049102783, -0.00011562556028366089, -0.00010779500007629395, -9.9964439868927e-05, -9.213387966156006e-05, -8.430331945419312e-05, -7.647275924682617e-05, -6.864219903945923e-05, -6.0811638832092285e-05, -5.298107862472534e-05, -4.51505184173584e-05, -3.7319958209991455e-05, -2.9489398002624512e-05, -2.165883779525757e-05, -1.3828277587890625e-05, -5.997717380523682e-06, 1.8328428268432617e-06, 9.663403034210205e-06, 1.749396324157715e-05, 2.5324523448944092e-05, 3.3155083656311035e-05, 4.098564386367798e-05, 4.881620407104492e-05, 5.6646764278411865e-05, 6.447732448577881e-05, 7.230788469314575e-05, 8.01384449005127e-05, 8.796900510787964e-05, 9.579956531524658e-05, 0.00010363012552261353, 0.00011146068572998047, 0.00011929124593734741, 0.00012712180614471436, 0.0001349523663520813, 0.00014278292655944824, 0.00015061348676681519, 0.00015844404697418213, 0.00016627460718154907, 0.00017410516738891602, 0.00018193572759628296, 0.0001897662878036499, 0.00019759684801101685, 0.0002054274082183838, 0.00021325796842575073, 0.00022108852863311768, 0.00022891908884048462, 0.00023674964904785156]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 3.0, 14.0, 13.0, 15.0, 26.0, 54.0, 101.0, 182.0, 358.0, 823.0, 2350.0, 8392.0, 37623.0, 198368.0, 628185.0, 136437.0, 26229.0, 6134.0, 1859.0, 725.0, 295.0, 152.0, 95.0, 42.0, 28.0, 18.0, 13.0, 9.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1171875, -1.0888214111328125, -1.060455322265625, -1.0320892333984375, -1.00372314453125, -0.9753570556640625, -0.946990966796875, -0.9186248779296875, -0.8902587890625, -0.8618927001953125, -0.833526611328125, -0.8051605224609375, -0.77679443359375, -0.7484283447265625, -0.720062255859375, -0.6916961669921875, -0.663330078125, -0.6349639892578125, -0.606597900390625, -0.5782318115234375, -0.54986572265625, -0.5214996337890625, -0.493133544921875, -0.4647674560546875, -0.4364013671875, -0.4080352783203125, -0.379669189453125, -0.3513031005859375, -0.32293701171875, -0.2945709228515625, -0.266204833984375, -0.2378387451171875, -0.20947265625, -0.1811065673828125, -0.152740478515625, -0.1243743896484375, -0.09600830078125, -0.0676422119140625, -0.039276123046875, -0.0109100341796875, 0.0174560546875, 0.0458221435546875, 0.074188232421875, 0.1025543212890625, 0.13092041015625, 0.1592864990234375, 0.187652587890625, 0.2160186767578125, 0.244384765625, 0.2727508544921875, 0.301116943359375, 0.3294830322265625, 0.35784912109375, 0.3862152099609375, 0.414581298828125, 0.4429473876953125, 0.4713134765625, 0.4996795654296875, 0.528045654296875, 0.5564117431640625, 0.58477783203125, 0.6131439208984375, 0.641510009765625, 0.6698760986328125, 0.6982421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 4.0, 9.0, 8.0, 10.0, 12.0, 17.0, 24.0, 32.0, 23.0, 57.0, 44.0, 69.0, 78.0, 75.0, 79.0, 80.0, 67.0, 69.0, 53.0, 62.0, 33.0, 26.0, 22.0, 15.0, 15.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.0283737182617188, -1.0001068115234375, -0.9718399047851562, -0.943572998046875, -0.9153060913085938, -0.8870391845703125, -0.8587722778320312, -0.83050537109375, -0.8022384643554688, -0.7739715576171875, -0.7457046508789062, -0.717437744140625, -0.6891708374023438, -0.6609039306640625, -0.6326370239257812, -0.6043701171875, -0.5761032104492188, -0.5478363037109375, -0.5195693969726562, -0.491302490234375, -0.46303558349609375, -0.4347686767578125, -0.40650177001953125, -0.37823486328125, -0.34996795654296875, -0.3217010498046875, -0.29343414306640625, -0.265167236328125, -0.23690032958984375, -0.2086334228515625, -0.18036651611328125, -0.152099609375, -0.12383270263671875, -0.0955657958984375, -0.06729888916015625, -0.039031982421875, -0.01076507568359375, 0.0175018310546875, 0.04576873779296875, 0.07403564453125, 0.10230255126953125, 0.1305694580078125, 0.15883636474609375, 0.187103271484375, 0.21537017822265625, 0.2436370849609375, 0.27190399169921875, 0.3001708984375, 0.32843780517578125, 0.3567047119140625, 0.38497161865234375, 0.413238525390625, 0.44150543212890625, 0.4697723388671875, 0.49803924560546875, 0.52630615234375, 0.5545730590820312, 0.5828399658203125, 0.6111068725585938, 0.639373779296875, 0.6676406860351562, 0.6959075927734375, 0.7241744995117188, 0.75244140625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 19.0, 31.0, 62.0, 126.0, 182.0, 281.0, 141.0, 76.0, 36.0, 12.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.8143310546875, -32.04029846191406, -31.266265869140625, -30.492233276367188, -29.71820068359375, -28.94416618347168, -28.170133590698242, -27.396100997924805, -26.622068405151367, -25.84803581237793, -25.074003219604492, -24.299970626831055, -23.525936126708984, -22.751903533935547, -21.97787094116211, -21.203838348388672, -20.429805755615234, -19.655773162841797, -18.88174057006836, -18.107707977294922, -17.333675384521484, -16.559640884399414, -15.785608291625977, -15.011575698852539, -14.237543106079102, -13.463510513305664, -12.689477920532227, -11.915444374084473, -11.141411781311035, -10.367379188537598, -9.593345642089844, -8.819313049316406, -8.045278549194336, -7.271245956420898, -6.497212886810303, -5.723179817199707, -4.9491472244262695, -4.175114631652832, -3.4010815620422363, -2.6270484924316406, -1.8530158996582031, -1.0789830684661865, -0.3049502372741699, 0.4690825939178467, 1.2431154251098633, 2.01714825630188, 2.7911810874938965, 3.565214157104492, 4.33924674987793, 5.113279342651367, 5.887312412261963, 6.661345481872559, 7.435378074645996, 8.209410667419434, 8.983444213867188, 9.757476806640625, 10.531509399414062, 11.3055419921875, 12.079574584960938, 12.853608131408691, 13.627640724182129, 14.401673316955566, 15.17570686340332, 15.949739456176758, 16.723772048950195]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 1.0, 3.0, 7.0, 6.0, 10.0, 9.0, 9.0, 17.0, 22.0, 24.0, 31.0, 31.0, 35.0, 26.0, 37.0, 50.0, 67.0, 84.0, 81.0, 86.0, 82.0, 44.0, 36.0, 31.0, 31.0, 25.0, 22.0, 15.0, 17.0, 10.0, 11.0, 11.0, 7.0, 10.0, 7.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.876969337463379, -13.332551002502441, -12.78813362121582, -12.243715286254883, -11.699296951293945, -11.154878616333008, -10.61046028137207, -10.06604290008545, -9.521624565124512, -8.977206230163574, -8.432788848876953, -7.888370513916016, -7.343952178955078, -6.799533843994141, -6.255115985870361, -5.710698127746582, -5.1662797927856445, -4.621861457824707, -4.077443599700928, -3.5330255031585693, -2.988607406616211, -2.4441893100738525, -1.8997712135314941, -1.3553531169891357, -0.8109350204467773, -0.26651692390441895, 0.27790117263793945, 0.8223192691802979, 1.3667373657226562, 1.9111554622650146, 2.455573558807373, 2.9999916553497314, 3.5444087982177734, 4.088827133178711, 4.63324499130249, 5.1776628494262695, 5.722081184387207, 6.2664995193481445, 6.810917377471924, 7.355335235595703, 7.899753570556641, 8.444171905517578, 8.988590240478516, 9.533007621765137, 10.077425956726074, 10.621844291687012, 11.166261672973633, 11.71068000793457, 12.255098342895508, 12.799516677856445, 13.343935012817383, 13.888352394104004, 14.432770729064941, 14.977189064025879, 15.5216064453125, 16.066024780273438, 16.610443115234375, 17.154861450195312, 17.69927978515625, 18.243698120117188, 18.788116455078125, 19.33253288269043, 19.876951217651367, 20.421369552612305, 20.965787887573242]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 9.0, 13.0, 29.0, 34.0, 65.0, 105.0, 186.0, 384.0, 742.0, 1668.0, 4264.0, 12652.0, 51117.0, 348611.0, 2462476.0, 1143337.0, 131501.0, 25082.0, 7124.0, 2617.0, 1086.0, 548.0, 294.0, 136.0, 72.0, 36.0, 31.0, 24.0, 11.0, 6.0, 6.0, 6.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.439453125, -1.394134521484375, -1.34881591796875, -1.303497314453125, -1.2581787109375, -1.212860107421875, -1.16754150390625, -1.122222900390625, -1.076904296875, -1.031585693359375, -0.98626708984375, -0.940948486328125, -0.8956298828125, -0.850311279296875, -0.80499267578125, -0.759674072265625, -0.71435546875, -0.669036865234375, -0.62371826171875, -0.578399658203125, -0.5330810546875, -0.487762451171875, -0.44244384765625, -0.397125244140625, -0.351806640625, -0.306488037109375, -0.26116943359375, -0.215850830078125, -0.1705322265625, -0.125213623046875, -0.07989501953125, -0.034576416015625, 0.0107421875, 0.056060791015625, 0.10137939453125, 0.146697998046875, 0.1920166015625, 0.237335205078125, 0.28265380859375, 0.327972412109375, 0.373291015625, 0.418609619140625, 0.46392822265625, 0.509246826171875, 0.5545654296875, 0.599884033203125, 0.64520263671875, 0.690521240234375, 0.73583984375, 0.781158447265625, 0.82647705078125, 0.871795654296875, 0.9171142578125, 0.962432861328125, 1.00775146484375, 1.053070068359375, 1.098388671875, 1.143707275390625, 1.18902587890625, 1.234344482421875, 1.2796630859375, 1.324981689453125, 1.37030029296875, 1.415618896484375, 1.4609375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 10.0, 7.0, 5.0, 13.0, 18.0, 14.0, 24.0, 28.0, 28.0, 26.0, 44.0, 38.0, 27.0, 42.0, 43.0, 51.0, 59.0, 63.0, 62.0, 54.0, 47.0, 41.0, 34.0, 41.0, 38.0, 27.0, 21.0, 23.0, 25.0, 11.0, 8.0, 7.0, 5.0, 8.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94140625, -0.910125732421875, -0.87884521484375, -0.847564697265625, -0.8162841796875, -0.785003662109375, -0.75372314453125, -0.722442626953125, -0.691162109375, -0.659881591796875, -0.62860107421875, -0.597320556640625, -0.5660400390625, -0.534759521484375, -0.50347900390625, -0.472198486328125, -0.44091796875, -0.409637451171875, -0.37835693359375, -0.347076416015625, -0.3157958984375, -0.284515380859375, -0.25323486328125, -0.221954345703125, -0.190673828125, -0.159393310546875, -0.12811279296875, -0.096832275390625, -0.0655517578125, -0.034271240234375, -0.00299072265625, 0.028289794921875, 0.0595703125, 0.090850830078125, 0.12213134765625, 0.153411865234375, 0.1846923828125, 0.215972900390625, 0.24725341796875, 0.278533935546875, 0.309814453125, 0.341094970703125, 0.37237548828125, 0.403656005859375, 0.4349365234375, 0.466217041015625, 0.49749755859375, 0.528778076171875, 0.56005859375, 0.591339111328125, 0.62261962890625, 0.653900146484375, 0.6851806640625, 0.716461181640625, 0.74774169921875, 0.779022216796875, 0.810302734375, 0.841583251953125, 0.87286376953125, 0.904144287109375, 0.9354248046875, 0.966705322265625, 0.99798583984375, 1.029266357421875, 1.060546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 8.0, 12.0, 21.0, 28.0, 52.0, 108.0, 169.0, 411.0, 1160.0, 4988.0, 50470.0, 3139061.0, 969772.0, 23422.0, 3074.0, 893.0, 311.0, 149.0, 62.0, 36.0, 27.0, 11.0, 9.0, 8.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.28515625, -3.175140380859375, -3.06512451171875, -2.955108642578125, -2.8450927734375, -2.735076904296875, -2.62506103515625, -2.515045166015625, -2.405029296875, -2.295013427734375, -2.18499755859375, -2.074981689453125, -1.9649658203125, -1.854949951171875, -1.74493408203125, -1.634918212890625, -1.52490234375, -1.414886474609375, -1.30487060546875, -1.194854736328125, -1.0848388671875, -0.974822998046875, -0.86480712890625, -0.754791259765625, -0.644775390625, -0.534759521484375, -0.42474365234375, -0.314727783203125, -0.2047119140625, -0.094696044921875, 0.01531982421875, 0.125335693359375, 0.2353515625, 0.345367431640625, 0.45538330078125, 0.565399169921875, 0.6754150390625, 0.785430908203125, 0.89544677734375, 1.005462646484375, 1.115478515625, 1.225494384765625, 1.33551025390625, 1.445526123046875, 1.5555419921875, 1.665557861328125, 1.77557373046875, 1.885589599609375, 1.99560546875, 2.105621337890625, 2.21563720703125, 2.325653076171875, 2.4356689453125, 2.545684814453125, 2.65570068359375, 2.765716552734375, 2.875732421875, 2.985748291015625, 3.09576416015625, 3.205780029296875, 3.3157958984375, 3.425811767578125, 3.53582763671875, 3.645843505859375, 3.755859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 1.0, 4.0, 10.0, 13.0, 36.0, 33.0, 95.0, 121.0, 206.0, 363.0, 604.0, 911.0, 745.0, 367.0, 231.0, 143.0, 55.0, 37.0, 30.0, 23.0, 20.0, 6.0, 5.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.84765625, -2.767578125, -2.6875, -2.607421875, -2.52734375, -2.447265625, -2.3671875, -2.287109375, -2.20703125, -2.126953125, -2.046875, -1.966796875, -1.88671875, -1.806640625, -1.7265625, -1.646484375, -1.56640625, -1.486328125, -1.40625, -1.326171875, -1.24609375, -1.166015625, -1.0859375, -1.005859375, -0.92578125, -0.845703125, -0.765625, -0.685546875, -0.60546875, -0.525390625, -0.4453125, -0.365234375, -0.28515625, -0.205078125, -0.125, -0.044921875, 0.03515625, 0.115234375, 0.1953125, 0.275390625, 0.35546875, 0.435546875, 0.515625, 0.595703125, 0.67578125, 0.755859375, 0.8359375, 0.916015625, 0.99609375, 1.076171875, 1.15625, 1.236328125, 1.31640625, 1.396484375, 1.4765625, 1.556640625, 1.63671875, 1.716796875, 1.796875, 1.876953125, 1.95703125, 2.037109375, 2.1171875, 2.197265625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 13.0, 10.0, 14.0, 27.0, 62.0, 127.0, 168.0, 204.0, 169.0, 98.0, 57.0, 29.0, 10.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.035877227783203, -29.37553596496582, -28.715192794799805, -28.054851531982422, -27.39451026916504, -26.734169006347656, -26.07382583618164, -25.413484573364258, -24.753143310546875, -24.092802047729492, -23.432458877563477, -22.772117614746094, -22.11177635192871, -21.451435089111328, -20.791091918945312, -20.13075065612793, -19.470409393310547, -18.810068130493164, -18.14972496032715, -17.489383697509766, -16.829042434692383, -16.168701171875, -15.508358001708984, -14.848016738891602, -14.187673568725586, -13.527331352233887, -12.866990089416504, -12.206647872924805, -11.546306610107422, -10.885964393615723, -10.225622177124023, -9.56528091430664, -8.904939651489258, -8.244597434997559, -7.584256172180176, -6.923913955688477, -6.263572692871094, -5.6032304763793945, -4.9428887367248535, -4.2825469970703125, -3.6222052574157715, -2.9618635177612305, -2.3015217781066895, -1.6411798000335693, -0.9808380603790283, -0.3204963207244873, 0.3398456573486328, 1.0001873970031738, 1.6605291366577148, 2.320870876312256, 2.981212615966797, 3.641554594039917, 4.301896095275879, 4.962238311767578, 5.622580051422119, 6.28292179107666, 6.943263530731201, 7.603605270385742, 8.263947486877441, 8.924288749694824, 9.584630966186523, 10.244972229003906, 10.905314445495605, 11.565656661987305, 12.225997924804688]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 2.0, 5.0, 3.0, 3.0, 7.0, 15.0, 19.0, 12.0, 11.0, 21.0, 23.0, 30.0, 25.0, 25.0, 36.0, 27.0, 55.0, 51.0, 51.0, 62.0, 59.0, 52.0, 49.0, 43.0, 39.0, 34.0, 39.0, 30.0, 30.0, 29.0, 19.0, 26.0, 17.0, 13.0, 12.0, 14.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.400609016418457, -8.133339881896973, -7.8660712242126465, -7.59880256652832, -7.331533432006836, -7.06426477432251, -6.796996116638184, -6.529726982116699, -6.262458324432373, -5.995189666748047, -5.7279205322265625, -5.460651874542236, -5.19338321685791, -4.926114082336426, -4.6588454246521, -4.391576766967773, -4.124307632446289, -3.857038736343384, -3.5897698402404785, -3.3225011825561523, -3.055232286453247, -2.787963390350342, -2.5206947326660156, -2.2534258365631104, -1.986156940460205, -1.7188880443572998, -1.451619267463684, -1.1843504905700684, -0.9170815944671631, -0.6498126983642578, -0.3825439214706421, -0.11527514457702637, 0.1519947052001953, 0.4192635416984558, 0.6865323781967163, 0.9538012146949768, 1.2210700511932373, 1.4883389472961426, 1.7556077241897583, 2.022876501083374, 2.2901453971862793, 2.5574142932891846, 2.82468318939209, 3.091951847076416, 3.3592207431793213, 3.6264896392822266, 3.8937582969665527, 4.161026954650879, 4.428296089172363, 4.6955647468566895, 4.962833881378174, 5.2301025390625, 5.497371673583984, 5.7646403312683105, 6.031908988952637, 6.299178123474121, 6.566446781158447, 6.833715438842773, 7.100984573364258, 7.368253231048584, 7.63552188873291, 7.9027910232543945, 8.170060157775879, 8.437328338623047, 8.704597473144531]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 4.0, 14.0, 14.0, 20.0, 38.0, 50.0, 81.0, 117.0, 213.0, 359.0, 625.0, 1079.0, 2147.0, 4231.0, 9502.0, 21327.0, 50646.0, 121996.0, 264954.0, 300955.0, 155241.0, 64896.0, 27269.0, 11627.0, 5376.0, 2634.0, 1323.0, 765.0, 423.0, 216.0, 156.0, 98.0, 48.0, 33.0, 28.0, 16.0, 14.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.46484375, -1.42315673828125, -1.3814697265625, -1.33978271484375, -1.298095703125, -1.25640869140625, -1.2147216796875, -1.17303466796875, -1.13134765625, -1.08966064453125, -1.0479736328125, -1.00628662109375, -0.964599609375, -0.92291259765625, -0.8812255859375, -0.83953857421875, -0.7978515625, -0.75616455078125, -0.7144775390625, -0.67279052734375, -0.631103515625, -0.58941650390625, -0.5477294921875, -0.50604248046875, -0.46435546875, -0.42266845703125, -0.3809814453125, -0.33929443359375, -0.297607421875, -0.25592041015625, -0.2142333984375, -0.17254638671875, -0.130859375, -0.08917236328125, -0.0474853515625, -0.00579833984375, 0.035888671875, 0.07757568359375, 0.1192626953125, 0.16094970703125, 0.20263671875, 0.24432373046875, 0.2860107421875, 0.32769775390625, 0.369384765625, 0.41107177734375, 0.4527587890625, 0.49444580078125, 0.5361328125, 0.57781982421875, 0.6195068359375, 0.66119384765625, 0.702880859375, 0.74456787109375, 0.7862548828125, 0.82794189453125, 0.86962890625, 0.91131591796875, 0.9530029296875, 0.99468994140625, 1.036376953125, 1.07806396484375, 1.1197509765625, 1.16143798828125, 1.203125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 7.0, 8.0, 11.0, 15.0, 19.0, 21.0, 19.0, 20.0, 32.0, 45.0, 34.0, 40.0, 35.0, 45.0, 47.0, 51.0, 62.0, 53.0, 47.0, 60.0, 49.0, 52.0, 42.0, 27.0, 23.0, 29.0, 18.0, 26.0, 15.0, 15.0, 11.0, 2.0, 10.0, 6.0, 2.0, 7.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -1.0063323974609375, -0.973602294921875, -0.9408721923828125, -0.90814208984375, -0.8754119873046875, -0.842681884765625, -0.8099517822265625, -0.7772216796875, -0.7444915771484375, -0.711761474609375, -0.6790313720703125, -0.64630126953125, -0.6135711669921875, -0.580841064453125, -0.5481109619140625, -0.515380859375, -0.4826507568359375, -0.449920654296875, -0.4171905517578125, -0.38446044921875, -0.3517303466796875, -0.319000244140625, -0.2862701416015625, -0.2535400390625, -0.2208099365234375, -0.188079833984375, -0.1553497314453125, -0.12261962890625, -0.0898895263671875, -0.057159423828125, -0.0244293212890625, 0.00830078125, 0.0410308837890625, 0.073760986328125, 0.1064910888671875, 0.13922119140625, 0.1719512939453125, 0.204681396484375, 0.2374114990234375, 0.2701416015625, 0.3028717041015625, 0.335601806640625, 0.3683319091796875, 0.40106201171875, 0.4337921142578125, 0.466522216796875, 0.4992523193359375, 0.531982421875, 0.5647125244140625, 0.597442626953125, 0.6301727294921875, 0.66290283203125, 0.6956329345703125, 0.728363037109375, 0.7610931396484375, 0.7938232421875, 0.8265533447265625, 0.859283447265625, 0.8920135498046875, 0.92474365234375, 0.9574737548828125, 0.990203857421875, 1.0229339599609375, 1.0556640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 6.0, 11.0, 11.0, 12.0, 15.0, 18.0, 35.0, 45.0, 44.0, 69.0, 100.0, 152.0, 145.0, 301.0, 477.0, 833.0, 1743.0, 4549.0, 14415.0, 60374.0, 279584.0, 567801.0, 86932.0, 20197.0, 5885.0, 2085.0, 1002.0, 543.0, 330.0, 236.0, 134.0, 130.0, 87.0, 54.0, 44.0, 37.0, 23.0, 22.0, 10.0, 10.0, 15.0, 6.0, 6.0, 9.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.29022216796875, -2.2210693359375, -2.15191650390625, -2.082763671875, -2.01361083984375, -1.9444580078125, -1.87530517578125, -1.80615234375, -1.73699951171875, -1.6678466796875, -1.59869384765625, -1.529541015625, -1.46038818359375, -1.3912353515625, -1.32208251953125, -1.2529296875, -1.18377685546875, -1.1146240234375, -1.04547119140625, -0.976318359375, -0.90716552734375, -0.8380126953125, -0.76885986328125, -0.69970703125, -0.63055419921875, -0.5614013671875, -0.49224853515625, -0.423095703125, -0.35394287109375, -0.2847900390625, -0.21563720703125, -0.146484375, -0.07733154296875, -0.0081787109375, 0.06097412109375, 0.130126953125, 0.19927978515625, 0.2684326171875, 0.33758544921875, 0.40673828125, 0.47589111328125, 0.5450439453125, 0.61419677734375, 0.683349609375, 0.75250244140625, 0.8216552734375, 0.89080810546875, 0.9599609375, 1.02911376953125, 1.0982666015625, 1.16741943359375, 1.236572265625, 1.30572509765625, 1.3748779296875, 1.44403076171875, 1.51318359375, 1.58233642578125, 1.6514892578125, 1.72064208984375, 1.789794921875, 1.85894775390625, 1.9281005859375, 1.99725341796875, 2.06640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 11.0, 9.0, 15.0, 14.0, 20.0, 30.0, 33.0, 25.0, 31.0, 52.0, 52.0, 53.0, 55.0, 68.0, 63.0, 53.0, 52.0, 66.0, 51.0, 47.0, 33.0, 35.0, 22.0, 28.0, 13.0, 16.0, 8.0, 17.0, 6.0, 8.0, 5.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.24609375, -4.12152099609375, -3.9969482421875, -3.87237548828125, -3.747802734375, -3.62322998046875, -3.4986572265625, -3.37408447265625, -3.24951171875, -3.12493896484375, -3.0003662109375, -2.87579345703125, -2.751220703125, -2.62664794921875, -2.5020751953125, -2.37750244140625, -2.2529296875, -2.12835693359375, -2.0037841796875, -1.87921142578125, -1.754638671875, -1.63006591796875, -1.5054931640625, -1.38092041015625, -1.25634765625, -1.13177490234375, -1.0072021484375, -0.88262939453125, -0.758056640625, -0.63348388671875, -0.5089111328125, -0.38433837890625, -0.259765625, -0.13519287109375, -0.0106201171875, 0.11395263671875, 0.238525390625, 0.36309814453125, 0.4876708984375, 0.61224365234375, 0.73681640625, 0.86138916015625, 0.9859619140625, 1.11053466796875, 1.235107421875, 1.35968017578125, 1.4842529296875, 1.60882568359375, 1.7333984375, 1.85797119140625, 1.9825439453125, 2.10711669921875, 2.231689453125, 2.35626220703125, 2.4808349609375, 2.60540771484375, 2.72998046875, 2.85455322265625, 2.9791259765625, 3.10369873046875, 3.228271484375, 3.35284423828125, 3.4774169921875, 3.60198974609375, 3.7265625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 5.0, 11.0, 12.0, 17.0, 26.0, 38.0, 50.0, 88.0, 121.0, 171.0, 303.0, 575.0, 1243.0, 2648.0, 6616.0, 18526.0, 58594.0, 241817.0, 588186.0, 87409.0, 26238.0, 9151.0, 3561.0, 1408.0, 707.0, 375.0, 208.0, 135.0, 86.0, 61.0, 39.0, 25.0, 26.0, 17.0, 15.0, 15.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7578125, -0.7368545532226562, -0.7158966064453125, -0.6949386596679688, -0.673980712890625, -0.6530227661132812, -0.6320648193359375, -0.6111068725585938, -0.59014892578125, -0.5691909790039062, -0.5482330322265625, -0.5272750854492188, -0.506317138671875, -0.48535919189453125, -0.4644012451171875, -0.44344329833984375, -0.4224853515625, -0.40152740478515625, -0.3805694580078125, -0.35961151123046875, -0.338653564453125, -0.31769561767578125, -0.2967376708984375, -0.27577972412109375, -0.25482177734375, -0.23386383056640625, -0.2129058837890625, -0.19194793701171875, -0.170989990234375, -0.15003204345703125, -0.1290740966796875, -0.10811614990234375, -0.087158203125, -0.06620025634765625, -0.0452423095703125, -0.02428436279296875, -0.003326416015625, 0.01763153076171875, 0.0385894775390625, 0.05954742431640625, 0.08050537109375, 0.10146331787109375, 0.1224212646484375, 0.14337921142578125, 0.164337158203125, 0.18529510498046875, 0.2062530517578125, 0.22721099853515625, 0.2481689453125, 0.26912689208984375, 0.2900848388671875, 0.31104278564453125, 0.332000732421875, 0.35295867919921875, 0.3739166259765625, 0.39487457275390625, 0.41583251953125, 0.43679046630859375, 0.4577484130859375, 0.47870635986328125, 0.499664306640625, 0.5206222534179688, 0.5415802001953125, 0.5625381469726562, 0.58349609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 9.0, 8.0, 10.0, 17.0, 13.0, 19.0, 15.0, 28.0, 31.0, 37.0, 47.0, 71.0, 92.0, 100.0, 105.0, 81.0, 73.0, 44.0, 41.0, 33.0, 28.0, 24.0, 13.0, 11.0, 7.0, 7.0, 9.0, 5.0, 9.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00021982192993164062, -0.00021314993500709534, -0.00020647794008255005, -0.00019980594515800476, -0.00019313395023345947, -0.00018646195530891418, -0.0001797899603843689, -0.0001731179654598236, -0.00016644597053527832, -0.00015977397561073303, -0.00015310198068618774, -0.00014642998576164246, -0.00013975799083709717, -0.00013308599591255188, -0.0001264140009880066, -0.0001197420060634613, -0.00011307001113891602, -0.00010639801621437073, -9.972602128982544e-05, -9.305402636528015e-05, -8.638203144073486e-05, -7.971003651618958e-05, -7.303804159164429e-05, -6.6366046667099e-05, -5.969405174255371e-05, -5.302205681800842e-05, -4.6350061893463135e-05, -3.967806696891785e-05, -3.300607204437256e-05, -2.633407711982727e-05, -1.9662082195281982e-05, -1.2990087270736694e-05, -6.318092346191406e-06, 3.5390257835388184e-07, 7.02589750289917e-06, 1.3697892427444458e-05, 2.0369887351989746e-05, 2.7041882276535034e-05, 3.371387720108032e-05, 4.038587212562561e-05, 4.70578670501709e-05, 5.3729861974716187e-05, 6.0401856899261475e-05, 6.707385182380676e-05, 7.374584674835205e-05, 8.041784167289734e-05, 8.708983659744263e-05, 9.376183152198792e-05, 0.0001004338264465332, 0.00010710582137107849, 0.00011377781629562378, 0.00012044981122016907, 0.00012712180614471436, 0.00013379380106925964, 0.00014046579599380493, 0.00014713779091835022, 0.0001538097858428955, 0.0001604817807674408, 0.00016715377569198608, 0.00017382577061653137, 0.00018049776554107666, 0.00018716976046562195, 0.00019384175539016724, 0.00020051375031471252, 0.0002071857452392578]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 3.0, 8.0, 5.0, 11.0, 8.0, 12.0, 16.0, 21.0, 26.0, 40.0, 46.0, 87.0, 134.0, 220.0, 429.0, 708.0, 1412.0, 3185.0, 8015.0, 23387.0, 82044.0, 572518.0, 266311.0, 60107.0, 17990.0, 6444.0, 2568.0, 1217.0, 622.0, 365.0, 215.0, 140.0, 71.0, 52.0, 28.0, 29.0, 15.0, 10.0, 13.0, 5.0, 11.0, 2.0, 5.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5038070678710938, -0.4827117919921875, -0.46161651611328125, -0.440521240234375, -0.41942596435546875, -0.3983306884765625, -0.37723541259765625, -0.35614013671875, -0.33504486083984375, -0.3139495849609375, -0.29285430908203125, -0.271759033203125, -0.25066375732421875, -0.2295684814453125, -0.20847320556640625, -0.1873779296875, -0.16628265380859375, -0.1451873779296875, -0.12409210205078125, -0.102996826171875, -0.08190155029296875, -0.0608062744140625, -0.03971099853515625, -0.01861572265625, 0.00247955322265625, 0.0235748291015625, 0.04467010498046875, 0.065765380859375, 0.08686065673828125, 0.1079559326171875, 0.12905120849609375, 0.150146484375, 0.17124176025390625, 0.1923370361328125, 0.21343231201171875, 0.234527587890625, 0.25562286376953125, 0.2767181396484375, 0.29781341552734375, 0.31890869140625, 0.34000396728515625, 0.3610992431640625, 0.38219451904296875, 0.403289794921875, 0.42438507080078125, 0.4454803466796875, 0.46657562255859375, 0.4876708984375, 0.5087661743164062, 0.5298614501953125, 0.5509567260742188, 0.572052001953125, 0.5931472778320312, 0.6142425537109375, 0.6353378295898438, 0.65643310546875, 0.6775283813476562, 0.6986236572265625, 0.7197189331054688, 0.740814208984375, 0.7619094848632812, 0.7830047607421875, 0.8041000366210938, 0.8251953125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 6.0, 6.0, 5.0, 14.0, 12.0, 10.0, 20.0, 30.0, 30.0, 55.0, 59.0, 69.0, 66.0, 81.0, 82.0, 85.0, 85.0, 55.0, 49.0, 35.0, 23.0, 34.0, 18.0, 11.0, 14.0, 8.0, 10.0, 9.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6748046875, -0.6509170532226562, -0.6270294189453125, -0.6031417846679688, -0.579254150390625, -0.5553665161132812, -0.5314788818359375, -0.5075912475585938, -0.48370361328125, -0.45981597900390625, -0.4359283447265625, -0.41204071044921875, -0.388153076171875, -0.36426544189453125, -0.3403778076171875, -0.31649017333984375, -0.2926025390625, -0.26871490478515625, -0.2448272705078125, -0.22093963623046875, -0.197052001953125, -0.17316436767578125, -0.1492767333984375, -0.12538909912109375, -0.10150146484375, -0.07761383056640625, -0.0537261962890625, -0.02983856201171875, -0.005950927734375, 0.01793670654296875, 0.0418243408203125, 0.06571197509765625, 0.089599609375, 0.11348724365234375, 0.1373748779296875, 0.16126251220703125, 0.185150146484375, 0.20903778076171875, 0.2329254150390625, 0.25681304931640625, 0.28070068359375, 0.30458831787109375, 0.3284759521484375, 0.35236358642578125, 0.376251220703125, 0.40013885498046875, 0.4240264892578125, 0.44791412353515625, 0.4718017578125, 0.49568939208984375, 0.5195770263671875, 0.5434646606445312, 0.567352294921875, 0.5912399291992188, 0.6151275634765625, 0.6390151977539062, 0.66290283203125, 0.6867904663085938, 0.7106781005859375, 0.7345657348632812, 0.758453369140625, 0.7823410034179688, 0.8062286376953125, 0.8301162719726562, 0.85400390625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 8.0, 15.0, 23.0, 53.0, 102.0, 172.0, 293.0, 126.0, 95.0, 44.0, 25.0, 15.0, 10.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.28775405883789, -27.601970672607422, -26.916189193725586, -26.230405807495117, -25.54462242126465, -24.858840942382812, -24.173057556152344, -23.487274169921875, -22.80149269104004, -22.11570930480957, -21.429927825927734, -20.744144439697266, -20.058361053466797, -19.37257957458496, -18.686796188354492, -18.001014709472656, -17.315231323242188, -16.62944793701172, -15.943665504455566, -15.257883071899414, -14.572100639343262, -13.88631820678711, -13.20053482055664, -12.514752388000488, -11.828968048095703, -11.14318561553955, -10.457402229309082, -9.77161979675293, -9.085837364196777, -8.400054931640625, -7.714271545410156, -7.028489112854004, -6.342706680297852, -5.656923770904541, -4.971141338348389, -4.285358428955078, -3.5995757579803467, -2.9137930870056152, -2.2280101776123047, -1.5422277450561523, -0.8564448356628418, -0.17066210508346558, 0.5151206254959106, 1.2009034156799316, 1.886686086654663, 2.5724687576293945, 3.258251667022705, 3.9440340995788574, 4.629817008972168, 5.3155999183654785, 6.001382350921631, 6.687165260314941, 7.372947692871094, 8.058731079101562, 8.744513511657715, 9.430295944213867, 10.116079330444336, 10.801861763000488, 11.487645149230957, 12.17342758178711, 12.859210014343262, 13.544992446899414, 14.230775833129883, 14.916558265686035, 15.602340698242188]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 0.0, 4.0, 4.0, 8.0, 7.0, 7.0, 16.0, 14.0, 11.0, 12.0, 18.0, 8.0, 25.0, 29.0, 25.0, 33.0, 31.0, 32.0, 32.0, 54.0, 78.0, 91.0, 86.0, 46.0, 46.0, 34.0, 34.0, 24.0, 17.0, 19.0, 20.0, 17.0, 20.0, 15.0, 12.0, 9.0, 10.0, 11.0, 6.0, 9.0, 9.0, 5.0, 5.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.715522766113281, -11.332314491271973, -10.949106216430664, -10.565897941589355, -10.182689666748047, -9.799481391906738, -9.41627311706543, -9.033063888549805, -8.649856567382812, -8.266648292541504, -7.883440017700195, -7.500231742858887, -7.117023468017578, -6.7338151931762695, -6.350606441497803, -5.967398166656494, -5.584189414978027, -5.200981140136719, -4.81777286529541, -4.434564590454102, -4.051356315612793, -3.6681478023529053, -3.2849392890930176, -2.901731014251709, -2.5185227394104004, -2.135314464569092, -1.7521060705184937, -1.3688976764678955, -0.9856894016265869, -0.6024811267852783, -0.21927261352539062, 0.16393566131591797, 0.5471439361572266, 0.9303522706031799, 1.3135606050491333, 1.6967689990997314, 2.07997727394104, 2.4631855487823486, 2.8463940620422363, 3.229602336883545, 3.6128106117248535, 3.996018886566162, 4.379227161407471, 4.7624359130859375, 5.145644187927246, 5.528852462768555, 5.912060737609863, 6.295269012451172, 6.6784772872924805, 7.061685562133789, 7.444893836975098, 7.828102111816406, 8.211310386657715, 8.594518661499023, 8.977727890014648, 9.36093521118164, 9.744144439697266, 10.127352714538574, 10.510560989379883, 10.893769264221191, 11.2769775390625, 11.660185813903809, 12.043394088745117, 12.426603317260742, 12.809810638427734]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 12.0, 9.0, 14.0, 20.0, 32.0, 58.0, 78.0, 160.0, 317.0, 618.0, 1512.0, 3748.0, 10804.0, 40182.0, 211875.0, 1473553.0, 2045022.0, 327913.0, 56078.0, 14198.0, 4676.0, 1758.0, 814.0, 366.0, 205.0, 103.0, 67.0, 35.0, 19.0, 10.0, 9.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2607421875, -1.217437744140625, -1.17413330078125, -1.130828857421875, -1.0875244140625, -1.044219970703125, -1.00091552734375, -0.957611083984375, -0.914306640625, -0.871002197265625, -0.82769775390625, -0.784393310546875, -0.7410888671875, -0.697784423828125, -0.65447998046875, -0.611175537109375, -0.56787109375, -0.524566650390625, -0.48126220703125, -0.437957763671875, -0.3946533203125, -0.351348876953125, -0.30804443359375, -0.264739990234375, -0.221435546875, -0.178131103515625, -0.13482666015625, -0.091522216796875, -0.0482177734375, -0.004913330078125, 0.03839111328125, 0.081695556640625, 0.125, 0.168304443359375, 0.21160888671875, 0.254913330078125, 0.2982177734375, 0.341522216796875, 0.38482666015625, 0.428131103515625, 0.471435546875, 0.514739990234375, 0.55804443359375, 0.601348876953125, 0.6446533203125, 0.687957763671875, 0.73126220703125, 0.774566650390625, 0.81787109375, 0.861175537109375, 0.90447998046875, 0.947784423828125, 0.9910888671875, 1.034393310546875, 1.07769775390625, 1.121002197265625, 1.164306640625, 1.207611083984375, 1.25091552734375, 1.294219970703125, 1.3375244140625, 1.380828857421875, 1.42413330078125, 1.467437744140625, 1.5107421875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 8.0, 7.0, 14.0, 10.0, 15.0, 25.0, 17.0, 27.0, 27.0, 42.0, 45.0, 46.0, 46.0, 49.0, 53.0, 61.0, 65.0, 57.0, 57.0, 53.0, 52.0, 46.0, 29.0, 29.0, 30.0, 12.0, 23.0, 19.0, 10.0, 5.0, 3.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.14453125, -1.1107635498046875, -1.076995849609375, -1.0432281494140625, -1.00946044921875, -0.9756927490234375, -0.941925048828125, -0.9081573486328125, -0.8743896484375, -0.8406219482421875, -0.806854248046875, -0.7730865478515625, -0.73931884765625, -0.7055511474609375, -0.671783447265625, -0.6380157470703125, -0.604248046875, -0.5704803466796875, -0.536712646484375, -0.5029449462890625, -0.46917724609375, -0.4354095458984375, -0.401641845703125, -0.3678741455078125, -0.3341064453125, -0.3003387451171875, -0.266571044921875, -0.2328033447265625, -0.19903564453125, -0.1652679443359375, -0.131500244140625, -0.0977325439453125, -0.06396484375, -0.0301971435546875, 0.003570556640625, 0.0373382568359375, 0.07110595703125, 0.1048736572265625, 0.138641357421875, 0.1724090576171875, 0.2061767578125, 0.2399444580078125, 0.273712158203125, 0.3074798583984375, 0.34124755859375, 0.3750152587890625, 0.408782958984375, 0.4425506591796875, 0.476318359375, 0.5100860595703125, 0.543853759765625, 0.5776214599609375, 0.61138916015625, 0.6451568603515625, 0.678924560546875, 0.7126922607421875, 0.7464599609375, 0.7802276611328125, 0.813995361328125, 0.8477630615234375, 0.88153076171875, 0.9152984619140625, 0.949066162109375, 0.9828338623046875, 1.0166015625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 4.0, 8.0, 9.0, 11.0, 13.0, 9.0, 16.0, 29.0, 39.0, 66.0, 73.0, 153.0, 299.0, 760.0, 2228.0, 9191.0, 65996.0, 1708168.0, 2311154.0, 81625.0, 10294.0, 2488.0, 852.0, 343.0, 147.0, 99.0, 42.0, 39.0, 24.0, 30.0, 10.0, 11.0, 9.0, 8.0, 6.0, 9.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.304168701171875, -2.22747802734375, -2.150787353515625, -2.0740966796875, -1.997406005859375, -1.92071533203125, -1.844024658203125, -1.767333984375, -1.690643310546875, -1.61395263671875, -1.537261962890625, -1.4605712890625, -1.383880615234375, -1.30718994140625, -1.230499267578125, -1.15380859375, -1.077117919921875, -1.00042724609375, -0.923736572265625, -0.8470458984375, -0.770355224609375, -0.69366455078125, -0.616973876953125, -0.540283203125, -0.463592529296875, -0.38690185546875, -0.310211181640625, -0.2335205078125, -0.156829833984375, -0.08013916015625, -0.003448486328125, 0.0732421875, 0.149932861328125, 0.22662353515625, 0.303314208984375, 0.3800048828125, 0.456695556640625, 0.53338623046875, 0.610076904296875, 0.686767578125, 0.763458251953125, 0.84014892578125, 0.916839599609375, 0.9935302734375, 1.070220947265625, 1.14691162109375, 1.223602294921875, 1.30029296875, 1.376983642578125, 1.45367431640625, 1.530364990234375, 1.6070556640625, 1.683746337890625, 1.76043701171875, 1.837127685546875, 1.913818359375, 1.990509033203125, 2.06719970703125, 2.143890380859375, 2.2205810546875, 2.297271728515625, 2.37396240234375, 2.450653076171875, 2.52734375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 4.0, 5.0, 5.0, 19.0, 16.0, 25.0, 35.0, 35.0, 66.0, 65.0, 126.0, 169.0, 257.0, 437.0, 595.0, 579.0, 487.0, 379.0, 253.0, 175.0, 91.0, 85.0, 50.0, 33.0, 29.0, 15.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8408203125, -1.7800445556640625, -1.719268798828125, -1.6584930419921875, -1.59771728515625, -1.5369415283203125, -1.476165771484375, -1.4153900146484375, -1.3546142578125, -1.2938385009765625, -1.233062744140625, -1.1722869873046875, -1.11151123046875, -1.0507354736328125, -0.989959716796875, -0.9291839599609375, -0.868408203125, -0.8076324462890625, -0.746856689453125, -0.6860809326171875, -0.62530517578125, -0.5645294189453125, -0.503753662109375, -0.4429779052734375, -0.3822021484375, -0.3214263916015625, -0.260650634765625, -0.1998748779296875, -0.13909912109375, -0.0783233642578125, -0.017547607421875, 0.0432281494140625, 0.10400390625, 0.1647796630859375, 0.225555419921875, 0.2863311767578125, 0.34710693359375, 0.4078826904296875, 0.468658447265625, 0.5294342041015625, 0.5902099609375, 0.6509857177734375, 0.711761474609375, 0.7725372314453125, 0.83331298828125, 0.8940887451171875, 0.954864501953125, 1.0156402587890625, 1.076416015625, 1.1371917724609375, 1.197967529296875, 1.2587432861328125, 1.31951904296875, 1.3802947998046875, 1.441070556640625, 1.5018463134765625, 1.5626220703125, 1.6233978271484375, 1.684173583984375, 1.7449493408203125, 1.80572509765625, 1.8665008544921875, 1.927276611328125, 1.9880523681640625, 2.048828125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 14.0, 13.0, 18.0, 37.0, 54.0, 76.0, 100.0, 126.0, 113.0, 123.0, 102.0, 68.0, 50.0, 32.0, 14.0, 14.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.516680717468262, -15.084033012390137, -14.651386260986328, -14.218738555908203, -13.786091804504395, -13.35344409942627, -12.920797348022461, -12.488149642944336, -12.055501937866211, -11.622854232788086, -11.190207481384277, -10.757559776306152, -10.324913024902344, -9.892265319824219, -9.459617614746094, -9.026970863342285, -8.594324111938477, -8.161676406860352, -7.729029655456543, -7.296381950378418, -6.863735198974609, -6.431087493896484, -5.998440265655518, -5.565793037414551, -5.133145809173584, -4.700498580932617, -4.26785135269165, -3.8352038860321045, -3.4025566577911377, -2.969909429550171, -2.537261962890625, -2.104614734649658, -1.671966552734375, -1.2393193244934082, -0.8066719770431519, -0.3740246295928955, 0.05862259864807129, 0.4912698268890381, 0.923917293548584, 1.3565645217895508, 1.7892117500305176, 2.2218589782714844, 2.654506206512451, 3.087153673171997, 3.519800901412964, 3.9524481296539307, 4.385095596313477, 4.817742824554443, 5.25039005279541, 5.683037281036377, 6.115684509277344, 6.548332214355469, 6.980978965759277, 7.413626670837402, 7.846273899078369, 8.278921127319336, 8.711568832397461, 9.144216537475586, 9.576863288879395, 10.00951099395752, 10.442157745361328, 10.874805450439453, 11.307453155517578, 11.740099906921387, 12.172746658325195]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 16.0, 10.0, 11.0, 13.0, 16.0, 13.0, 24.0, 28.0, 38.0, 42.0, 49.0, 43.0, 80.0, 62.0, 84.0, 70.0, 64.0, 46.0, 49.0, 43.0, 31.0, 26.0, 24.0, 31.0, 19.0, 20.0, 18.0, 9.0, 8.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.482513427734375, -9.128331184387207, -8.774149894714355, -8.419967651367188, -8.06578540802002, -7.71160364151001, -7.357421875, -7.003239631652832, -6.649057865142822, -6.2948760986328125, -5.9406938552856445, -5.586512088775635, -5.232330322265625, -4.878148078918457, -4.523966312408447, -4.1697845458984375, -3.8156023025512695, -3.4614202976226807, -3.107238292694092, -2.753056526184082, -2.398874521255493, -2.0446925163269043, -1.6905107498168945, -1.3363287448883057, -0.9821467399597168, -0.6279647946357727, -0.2737828493118286, 0.0803990364074707, 0.43458104133605957, 0.7887630462646484, 1.1429448127746582, 1.497126817703247, 1.851308822631836, 2.205490827560425, 2.5596728324890137, 2.9138545989990234, 3.2680366039276123, 3.622218608856201, 3.976400375366211, 4.330582618713379, 4.684764385223389, 5.038946151733398, 5.393128395080566, 5.747310161590576, 6.101491928100586, 6.455674171447754, 6.809855937957764, 7.164037704467773, 7.518219947814941, 7.872401714324951, 8.226583480834961, 8.580765724182129, 8.934947967529297, 9.289129257202148, 9.643311500549316, 9.997493743896484, 10.351675033569336, 10.705857276916504, 11.060038566589355, 11.414220809936523, 11.768403053283691, 12.12258529663086, 12.476766586303711, 12.830948829650879, 13.185131072998047]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 7.0, 9.0, 13.0, 13.0, 39.0, 50.0, 111.0, 150.0, 279.0, 492.0, 914.0, 1713.0, 3523.0, 6970.0, 14775.0, 34582.0, 83851.0, 214683.0, 355328.0, 195718.0, 76705.0, 31750.0, 13807.0, 6292.0, 3170.0, 1612.0, 845.0, 457.0, 256.0, 163.0, 115.0, 62.0, 37.0, 25.0, 14.0, 8.0, 5.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2783203125, -1.23175048828125, -1.1851806640625, -1.13861083984375, -1.092041015625, -1.04547119140625, -0.9989013671875, -0.95233154296875, -0.90576171875, -0.85919189453125, -0.8126220703125, -0.76605224609375, -0.719482421875, -0.67291259765625, -0.6263427734375, -0.57977294921875, -0.533203125, -0.48663330078125, -0.4400634765625, -0.39349365234375, -0.346923828125, -0.30035400390625, -0.2537841796875, -0.20721435546875, -0.16064453125, -0.11407470703125, -0.0675048828125, -0.02093505859375, 0.025634765625, 0.07220458984375, 0.1187744140625, 0.16534423828125, 0.2119140625, 0.25848388671875, 0.3050537109375, 0.35162353515625, 0.398193359375, 0.44476318359375, 0.4913330078125, 0.53790283203125, 0.58447265625, 0.63104248046875, 0.6776123046875, 0.72418212890625, 0.770751953125, 0.81732177734375, 0.8638916015625, 0.91046142578125, 0.95703125, 1.00360107421875, 1.0501708984375, 1.09674072265625, 1.143310546875, 1.18988037109375, 1.2364501953125, 1.28302001953125, 1.32958984375, 1.37615966796875, 1.4227294921875, 1.46929931640625, 1.515869140625, 1.56243896484375, 1.6090087890625, 1.65557861328125, 1.7021484375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 9.0, 4.0, 10.0, 18.0, 14.0, 25.0, 25.0, 16.0, 26.0, 35.0, 25.0, 32.0, 36.0, 46.0, 58.0, 49.0, 54.0, 50.0, 46.0, 40.0, 39.0, 48.0, 35.0, 47.0, 28.0, 24.0, 21.0, 21.0, 19.0, 15.0, 16.0, 7.0, 14.0, 9.0, 4.0, 8.0, 4.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.88037109375, -0.851409912109375, -0.82244873046875, -0.793487548828125, -0.7645263671875, -0.735565185546875, -0.70660400390625, -0.677642822265625, -0.648681640625, -0.619720458984375, -0.59075927734375, -0.561798095703125, -0.5328369140625, -0.503875732421875, -0.47491455078125, -0.445953369140625, -0.4169921875, -0.388031005859375, -0.35906982421875, -0.330108642578125, -0.3011474609375, -0.272186279296875, -0.24322509765625, -0.214263916015625, -0.185302734375, -0.156341552734375, -0.12738037109375, -0.098419189453125, -0.0694580078125, -0.040496826171875, -0.01153564453125, 0.017425537109375, 0.04638671875, 0.075347900390625, 0.10430908203125, 0.133270263671875, 0.1622314453125, 0.191192626953125, 0.22015380859375, 0.249114990234375, 0.278076171875, 0.307037353515625, 0.33599853515625, 0.364959716796875, 0.3939208984375, 0.422882080078125, 0.45184326171875, 0.480804443359375, 0.509765625, 0.538726806640625, 0.56768798828125, 0.596649169921875, 0.6256103515625, 0.654571533203125, 0.68353271484375, 0.712493896484375, 0.741455078125, 0.770416259765625, 0.79937744140625, 0.828338623046875, 0.8572998046875, 0.886260986328125, 0.91522216796875, 0.944183349609375, 0.97314453125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 7.0, 7.0, 16.0, 22.0, 22.0, 27.0, 34.0, 50.0, 62.0, 67.0, 99.0, 180.0, 241.0, 325.0, 520.0, 772.0, 1332.0, 2632.0, 7424.0, 30248.0, 197422.0, 703709.0, 78959.0, 15120.0, 4343.0, 1936.0, 1029.0, 584.0, 384.0, 281.0, 191.0, 124.0, 98.0, 74.0, 63.0, 29.0, 34.0, 20.0, 17.0, 13.0, 12.0, 8.0, 4.0, 5.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6953125, -2.611785888671875, -2.52825927734375, -2.444732666015625, -2.3612060546875, -2.277679443359375, -2.19415283203125, -2.110626220703125, -2.027099609375, -1.943572998046875, -1.86004638671875, -1.776519775390625, -1.6929931640625, -1.609466552734375, -1.52593994140625, -1.442413330078125, -1.35888671875, -1.275360107421875, -1.19183349609375, -1.108306884765625, -1.0247802734375, -0.941253662109375, -0.85772705078125, -0.774200439453125, -0.690673828125, -0.607147216796875, -0.52362060546875, -0.440093994140625, -0.3565673828125, -0.273040771484375, -0.18951416015625, -0.105987548828125, -0.0224609375, 0.061065673828125, 0.14459228515625, 0.228118896484375, 0.3116455078125, 0.395172119140625, 0.47869873046875, 0.562225341796875, 0.645751953125, 0.729278564453125, 0.81280517578125, 0.896331787109375, 0.9798583984375, 1.063385009765625, 1.14691162109375, 1.230438232421875, 1.31396484375, 1.397491455078125, 1.48101806640625, 1.564544677734375, 1.6480712890625, 1.731597900390625, 1.81512451171875, 1.898651123046875, 1.982177734375, 2.065704345703125, 2.14923095703125, 2.232757568359375, 2.3162841796875, 2.399810791015625, 2.48333740234375, 2.566864013671875, 2.650390625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 6.0, 7.0, 9.0, 8.0, 8.0, 11.0, 18.0, 14.0, 14.0, 27.0, 24.0, 39.0, 31.0, 36.0, 55.0, 39.0, 61.0, 63.0, 56.0, 72.0, 63.0, 52.0, 42.0, 41.0, 29.0, 28.0, 25.0, 17.0, 20.0, 20.0, 18.0, 10.0, 10.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 0.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0234375, -3.902435302734375, -3.78143310546875, -3.660430908203125, -3.5394287109375, -3.418426513671875, -3.29742431640625, -3.176422119140625, -3.055419921875, -2.934417724609375, -2.81341552734375, -2.692413330078125, -2.5714111328125, -2.450408935546875, -2.32940673828125, -2.208404541015625, -2.08740234375, -1.966400146484375, -1.84539794921875, -1.724395751953125, -1.6033935546875, -1.482391357421875, -1.36138916015625, -1.240386962890625, -1.119384765625, -0.998382568359375, -0.87738037109375, -0.756378173828125, -0.6353759765625, -0.514373779296875, -0.39337158203125, -0.272369384765625, -0.1513671875, -0.030364990234375, 0.09063720703125, 0.211639404296875, 0.3326416015625, 0.453643798828125, 0.57464599609375, 0.695648193359375, 0.816650390625, 0.937652587890625, 1.05865478515625, 1.179656982421875, 1.3006591796875, 1.421661376953125, 1.54266357421875, 1.663665771484375, 1.78466796875, 1.905670166015625, 2.02667236328125, 2.147674560546875, 2.2686767578125, 2.389678955078125, 2.51068115234375, 2.631683349609375, 2.752685546875, 2.873687744140625, 2.99468994140625, 3.115692138671875, 3.2366943359375, 3.357696533203125, 3.47869873046875, 3.599700927734375, 3.720703125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 1.0, 10.0, 4.0, 13.0, 14.0, 21.0, 19.0, 29.0, 36.0, 51.0, 64.0, 115.0, 169.0, 289.0, 579.0, 1171.0, 3081.0, 10092.0, 46475.0, 672408.0, 267693.0, 33470.0, 7851.0, 2556.0, 1037.0, 493.0, 274.0, 183.0, 99.0, 59.0, 52.0, 35.0, 31.0, 20.0, 14.0, 8.0, 12.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8134765625, -0.7879791259765625, -0.762481689453125, -0.7369842529296875, -0.71148681640625, -0.6859893798828125, -0.660491943359375, -0.6349945068359375, -0.6094970703125, -0.5839996337890625, -0.558502197265625, -0.5330047607421875, -0.50750732421875, -0.4820098876953125, -0.456512451171875, -0.4310150146484375, -0.405517578125, -0.3800201416015625, -0.354522705078125, -0.3290252685546875, -0.30352783203125, -0.2780303955078125, -0.252532958984375, -0.2270355224609375, -0.2015380859375, -0.1760406494140625, -0.150543212890625, -0.1250457763671875, -0.09954833984375, -0.0740509033203125, -0.048553466796875, -0.0230560302734375, 0.00244140625, 0.0279388427734375, 0.053436279296875, 0.0789337158203125, 0.10443115234375, 0.1299285888671875, 0.155426025390625, 0.1809234619140625, 0.2064208984375, 0.2319183349609375, 0.257415771484375, 0.2829132080078125, 0.30841064453125, 0.3339080810546875, 0.359405517578125, 0.3849029541015625, 0.410400390625, 0.4358978271484375, 0.461395263671875, 0.4868927001953125, 0.51239013671875, 0.5378875732421875, 0.563385009765625, 0.5888824462890625, 0.6143798828125, 0.6398773193359375, 0.665374755859375, 0.6908721923828125, 0.71636962890625, 0.7418670654296875, 0.767364501953125, 0.7928619384765625, 0.818359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 3.0, 10.0, 2.0, 12.0, 13.0, 19.0, 24.0, 31.0, 37.0, 51.0, 56.0, 87.0, 121.0, 122.0, 94.0, 66.0, 54.0, 44.0, 27.0, 29.0, 20.0, 19.0, 11.0, 8.0, 6.0, 4.0, 5.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017559528350830078, -0.00016832910478115082, -0.00016106292605400085, -0.0001537967473268509, -0.00014653056859970093, -0.00013926438987255096, -0.000131998211145401, -0.00012473203241825104, -0.00011746585369110107, -0.00011019967496395111, -0.00010293349623680115, -9.566731750965118e-05, -8.840113878250122e-05, -8.113496005535126e-05, -7.38687813282013e-05, -6.660260260105133e-05, -5.933642387390137e-05, -5.2070245146751404e-05, -4.480406641960144e-05, -3.753788769245148e-05, -3.0271708965301514e-05, -2.300553023815155e-05, -1.5739351511001587e-05, -8.473172783851624e-06, -1.2069940567016602e-06, 6.059184670448303e-06, 1.3325363397598267e-05, 2.059154212474823e-05, 2.7857720851898193e-05, 3.512389957904816e-05, 4.239007830619812e-05, 4.9656257033348083e-05, 5.692243576049805e-05, 6.418861448764801e-05, 7.145479321479797e-05, 7.872097194194794e-05, 8.59871506690979e-05, 9.325332939624786e-05, 0.00010051950812339783, 0.00010778568685054779, 0.00011505186557769775, 0.00012231804430484772, 0.00012958422303199768, 0.00013685040175914764, 0.0001441165804862976, 0.00015138275921344757, 0.00015864893794059753, 0.0001659151166677475, 0.00017318129539489746, 0.00018044747412204742, 0.0001877136528491974, 0.00019497983157634735, 0.00020224601030349731, 0.00020951218903064728, 0.00021677836775779724, 0.0002240445464849472, 0.00023131072521209717, 0.00023857690393924713, 0.0002458430826663971, 0.00025310926139354706, 0.000260375440120697, 0.000267641618847847, 0.00027490779757499695, 0.0002821739763021469, 0.0002894401550292969]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 6.0, 8.0, 13.0, 31.0, 22.0, 39.0, 50.0, 75.0, 102.0, 179.0, 287.0, 437.0, 807.0, 1496.0, 3063.0, 8024.0, 26121.0, 115021.0, 684809.0, 155953.0, 34349.0, 10010.0, 3806.0, 1655.0, 863.0, 483.0, 270.0, 182.0, 124.0, 86.0, 60.0, 41.0, 20.0, 18.0, 9.0, 8.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.46044921875, -0.4424591064453125, -0.424468994140625, -0.4064788818359375, -0.38848876953125, -0.3704986572265625, -0.352508544921875, -0.3345184326171875, -0.3165283203125, -0.2985382080078125, -0.280548095703125, -0.2625579833984375, -0.24456787109375, -0.2265777587890625, -0.208587646484375, -0.1905975341796875, -0.172607421875, -0.1546173095703125, -0.136627197265625, -0.1186370849609375, -0.10064697265625, -0.0826568603515625, -0.064666748046875, -0.0466766357421875, -0.0286865234375, -0.0106964111328125, 0.007293701171875, 0.0252838134765625, 0.04327392578125, 0.0612640380859375, 0.079254150390625, 0.0972442626953125, 0.115234375, 0.1332244873046875, 0.151214599609375, 0.1692047119140625, 0.18719482421875, 0.2051849365234375, 0.223175048828125, 0.2411651611328125, 0.2591552734375, 0.2771453857421875, 0.295135498046875, 0.3131256103515625, 0.33111572265625, 0.3491058349609375, 0.367095947265625, 0.3850860595703125, 0.403076171875, 0.4210662841796875, 0.439056396484375, 0.4570465087890625, 0.47503662109375, 0.4930267333984375, 0.511016845703125, 0.5290069580078125, 0.5469970703125, 0.5649871826171875, 0.582977294921875, 0.6009674072265625, 0.61895751953125, 0.6369476318359375, 0.654937744140625, 0.6729278564453125, 0.69091796875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 7.0, 4.0, 7.0, 11.0, 20.0, 14.0, 27.0, 37.0, 55.0, 74.0, 103.0, 150.0, 127.0, 111.0, 72.0, 49.0, 35.0, 33.0, 25.0, 18.0, 11.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.609375, -0.5772705078125, -0.545166015625, -0.5130615234375, -0.48095703125, -0.4488525390625, -0.416748046875, -0.3846435546875, -0.3525390625, -0.3204345703125, -0.288330078125, -0.2562255859375, -0.22412109375, -0.1920166015625, -0.159912109375, -0.1278076171875, -0.095703125, -0.0635986328125, -0.031494140625, 0.0006103515625, 0.03271484375, 0.0648193359375, 0.096923828125, 0.1290283203125, 0.1611328125, 0.1932373046875, 0.225341796875, 0.2574462890625, 0.28955078125, 0.3216552734375, 0.353759765625, 0.3858642578125, 0.41796875, 0.4500732421875, 0.482177734375, 0.5142822265625, 0.54638671875, 0.5784912109375, 0.610595703125, 0.6427001953125, 0.6748046875, 0.7069091796875, 0.739013671875, 0.7711181640625, 0.80322265625, 0.8353271484375, 0.867431640625, 0.8995361328125, 0.931640625, 0.9637451171875, 0.995849609375, 1.0279541015625, 1.06005859375, 1.0921630859375, 1.124267578125, 1.1563720703125, 1.1884765625, 1.2205810546875, 1.252685546875, 1.2847900390625, 1.31689453125, 1.3489990234375, 1.381103515625, 1.4132080078125, 1.4453125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 7.0, 16.0, 46.0, 131.0, 433.0, 217.0, 87.0, 36.0, 14.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.34639358520508, -42.25325012207031, -41.16010284423828, -40.06695556640625, -38.973812103271484, -37.88066864013672, -36.78752136230469, -35.694374084472656, -34.60123062133789, -33.508087158203125, -32.414939880371094, -31.321794509887695, -30.228649139404297, -29.1355037689209, -28.0423583984375, -26.9492130279541, -25.856067657470703, -24.762922286987305, -23.669776916503906, -22.576631546020508, -21.48348617553711, -20.39034080505371, -19.297195434570312, -18.204050064086914, -17.110904693603516, -16.017759323120117, -14.924613952636719, -13.83146858215332, -12.738323211669922, -11.645177841186523, -10.552032470703125, -9.458887100219727, -8.365739822387695, -7.272594451904297, -6.179449081420898, -5.0863037109375, -3.9931583404541016, -2.900012969970703, -1.8068675994873047, -0.7137222290039062, 0.3794231414794922, 1.4725685119628906, 2.565713882446289, 3.6588592529296875, 4.752004623413086, 5.845149993896484, 6.938295364379883, 8.031440734863281, 9.12458610534668, 10.217731475830078, 11.310876846313477, 12.404022216796875, 13.497167587280273, 14.590312957763672, 15.68345832824707, 16.77660369873047, 17.869749069213867, 18.962894439697266, 20.056039810180664, 21.149185180664062, 22.24233055114746, 23.33547592163086, 24.428621292114258, 25.521766662597656, 26.614912033081055]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 10.0, 3.0, 9.0, 9.0, 13.0, 9.0, 16.0, 21.0, 15.0, 28.0, 19.0, 24.0, 24.0, 33.0, 39.0, 51.0, 131.0, 142.0, 69.0, 46.0, 36.0, 31.0, 32.0, 26.0, 23.0, 17.0, 28.0, 15.0, 14.0, 12.0, 10.0, 12.0, 11.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.147406578063965, -14.675943374633789, -14.204479217529297, -13.733016014099121, -13.261552810668945, -12.790088653564453, -12.318625450134277, -11.847162246704102, -11.37569808959961, -10.904234886169434, -10.432770729064941, -9.961307525634766, -9.48984432220459, -9.018381118774414, -8.546916961669922, -8.075453758239746, -7.60399055480957, -7.132526874542236, -6.6610636711120605, -6.189599990844727, -5.718136787414551, -5.246673107147217, -4.775209426879883, -4.303746223449707, -3.832282543182373, -3.360819101333618, -2.8893556594848633, -2.4178919792175293, -1.9464285373687744, -1.4749650955200195, -1.0035014152526855, -0.5320379734039307, -0.060573577880859375, 0.4108899235725403, 0.8823534250259399, 1.3538169860839844, 1.8252804279327393, 2.296743869781494, 2.768207550048828, 3.239670991897583, 3.711134433746338, 4.182598114013672, 4.654061317443848, 5.125524997711182, 5.596988677978516, 6.068451881408691, 6.539915561676025, 7.011379241943359, 7.482842445373535, 7.954306125640869, 8.425769805908203, 8.897233009338379, 9.368696212768555, 9.840160369873047, 10.311623573303223, 10.783086776733398, 11.25455093383789, 11.726014137268066, 12.197478294372559, 12.668941497802734, 13.14040470123291, 13.611867904663086, 14.083332061767578, 14.554795265197754, 15.02625846862793]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 9.0, 18.0, 18.0, 40.0, 78.0, 143.0, 293.0, 584.0, 1146.0, 2578.0, 6840.0, 25452.0, 150316.0, 1014254.0, 2308036.0, 580783.0, 78614.0, 16154.0, 4928.0, 1978.0, 949.0, 460.0, 242.0, 135.0, 88.0, 46.0, 31.0, 20.0, 10.0, 5.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9384765625, -1.8820343017578125, -1.825592041015625, -1.7691497802734375, -1.71270751953125, -1.6562652587890625, -1.599822998046875, -1.5433807373046875, -1.4869384765625, -1.4304962158203125, -1.374053955078125, -1.3176116943359375, -1.26116943359375, -1.2047271728515625, -1.148284912109375, -1.0918426513671875, -1.035400390625, -0.9789581298828125, -0.922515869140625, -0.8660736083984375, -0.80963134765625, -0.7531890869140625, -0.696746826171875, -0.6403045654296875, -0.5838623046875, -0.5274200439453125, -0.470977783203125, -0.4145355224609375, -0.35809326171875, -0.3016510009765625, -0.245208740234375, -0.1887664794921875, -0.13232421875, -0.0758819580078125, -0.019439697265625, 0.0370025634765625, 0.09344482421875, 0.1498870849609375, 0.206329345703125, 0.2627716064453125, 0.3192138671875, 0.3756561279296875, 0.432098388671875, 0.4885406494140625, 0.54498291015625, 0.6014251708984375, 0.657867431640625, 0.7143096923828125, 0.770751953125, 0.8271942138671875, 0.883636474609375, 0.9400787353515625, 0.99652099609375, 1.0529632568359375, 1.109405517578125, 1.1658477783203125, 1.2222900390625, 1.2787322998046875, 1.335174560546875, 1.3916168212890625, 1.44805908203125, 1.5045013427734375, 1.560943603515625, 1.6173858642578125, 1.673828125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 11.0, 12.0, 16.0, 16.0, 25.0, 19.0, 32.0, 29.0, 31.0, 42.0, 33.0, 49.0, 48.0, 57.0, 51.0, 62.0, 40.0, 35.0, 43.0, 55.0, 39.0, 39.0, 30.0, 29.0, 27.0, 22.0, 14.0, 12.0, 22.0, 8.0, 9.0, 8.0, 5.0, 4.0, 10.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9775390625, -0.9483795166015625, -0.919219970703125, -0.8900604248046875, -0.86090087890625, -0.8317413330078125, -0.802581787109375, -0.7734222412109375, -0.7442626953125, -0.7151031494140625, -0.685943603515625, -0.6567840576171875, -0.62762451171875, -0.5984649658203125, -0.569305419921875, -0.5401458740234375, -0.510986328125, -0.4818267822265625, -0.452667236328125, -0.4235076904296875, -0.39434814453125, -0.3651885986328125, -0.336029052734375, -0.3068695068359375, -0.2777099609375, -0.2485504150390625, -0.219390869140625, -0.1902313232421875, -0.16107177734375, -0.1319122314453125, -0.102752685546875, -0.0735931396484375, -0.04443359375, -0.0152740478515625, 0.013885498046875, 0.0430450439453125, 0.07220458984375, 0.1013641357421875, 0.130523681640625, 0.1596832275390625, 0.1888427734375, 0.2180023193359375, 0.247161865234375, 0.2763214111328125, 0.30548095703125, 0.3346405029296875, 0.363800048828125, 0.3929595947265625, 0.422119140625, 0.4512786865234375, 0.480438232421875, 0.5095977783203125, 0.53875732421875, 0.5679168701171875, 0.597076416015625, 0.6262359619140625, 0.6553955078125, 0.6845550537109375, 0.713714599609375, 0.7428741455078125, 0.77203369140625, 0.8011932373046875, 0.830352783203125, 0.8595123291015625, 0.888671875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 2.0, 5.0, 11.0, 6.0, 16.0, 18.0, 34.0, 60.0, 83.0, 131.0, 225.0, 427.0, 898.0, 2242.0, 9151.0, 261767.0, 3864006.0, 47211.0, 4972.0, 1550.0, 656.0, 307.0, 176.0, 99.0, 76.0, 48.0, 31.0, 23.0, 16.0, 12.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.65625, -5.49603271484375, -5.3358154296875, -5.17559814453125, -5.015380859375, -4.85516357421875, -4.6949462890625, -4.53472900390625, -4.37451171875, -4.21429443359375, -4.0540771484375, -3.89385986328125, -3.733642578125, -3.57342529296875, -3.4132080078125, -3.25299072265625, -3.0927734375, -2.93255615234375, -2.7723388671875, -2.61212158203125, -2.451904296875, -2.29168701171875, -2.1314697265625, -1.97125244140625, -1.81103515625, -1.65081787109375, -1.4906005859375, -1.33038330078125, -1.170166015625, -1.00994873046875, -0.8497314453125, -0.68951416015625, -0.529296875, -0.36907958984375, -0.2088623046875, -0.04864501953125, 0.111572265625, 0.27178955078125, 0.4320068359375, 0.59222412109375, 0.75244140625, 0.91265869140625, 1.0728759765625, 1.23309326171875, 1.393310546875, 1.55352783203125, 1.7137451171875, 1.87396240234375, 2.0341796875, 2.19439697265625, 2.3546142578125, 2.51483154296875, 2.675048828125, 2.83526611328125, 2.9954833984375, 3.15570068359375, 3.31591796875, 3.47613525390625, 3.6363525390625, 3.79656982421875, 3.956787109375, 4.11700439453125, 4.2772216796875, 4.43743896484375, 4.59765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 7.0, 13.0, 19.0, 24.0, 44.0, 60.0, 77.0, 90.0, 134.0, 200.0, 314.0, 462.0, 627.0, 555.0, 416.0, 315.0, 208.0, 150.0, 99.0, 65.0, 56.0, 43.0, 27.0, 16.0, 11.0, 8.0, 9.0, 8.0, 1.0, 0.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.671875, -2.581878662109375, -2.49188232421875, -2.401885986328125, -2.3118896484375, -2.221893310546875, -2.13189697265625, -2.041900634765625, -1.951904296875, -1.861907958984375, -1.77191162109375, -1.681915283203125, -1.5919189453125, -1.501922607421875, -1.41192626953125, -1.321929931640625, -1.23193359375, -1.141937255859375, -1.05194091796875, -0.961944580078125, -0.8719482421875, -0.781951904296875, -0.69195556640625, -0.601959228515625, -0.511962890625, -0.421966552734375, -0.33197021484375, -0.241973876953125, -0.1519775390625, -0.061981201171875, 0.02801513671875, 0.118011474609375, 0.2080078125, 0.298004150390625, 0.38800048828125, 0.477996826171875, 0.5679931640625, 0.657989501953125, 0.74798583984375, 0.837982177734375, 0.927978515625, 1.017974853515625, 1.10797119140625, 1.197967529296875, 1.2879638671875, 1.377960205078125, 1.46795654296875, 1.557952880859375, 1.64794921875, 1.737945556640625, 1.82794189453125, 1.917938232421875, 2.0079345703125, 2.097930908203125, 2.18792724609375, 2.277923583984375, 2.367919921875, 2.457916259765625, 2.54791259765625, 2.637908935546875, 2.7279052734375, 2.817901611328125, 2.90789794921875, 2.997894287109375, 3.087890625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 15.0, 18.0, 54.0, 183.0, 330.0, 225.0, 90.0, 37.0, 16.0, 6.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.00481414794922, -41.09550094604492, -39.18618392944336, -37.27687072753906, -35.367557525634766, -33.45824432373047, -31.548927307128906, -29.63961410522461, -27.73029899597168, -25.82098388671875, -23.911670684814453, -22.002355575561523, -20.093040466308594, -18.183727264404297, -16.274412155151367, -14.365097999572754, -12.45578384399414, -10.546469688415527, -8.637155532836914, -6.727840423583984, -4.818526268005371, -2.909212112426758, -0.9998970031738281, 0.9094171524047852, 2.8187313079833984, 4.728045463562012, 6.637360095977783, 8.546674728393555, 10.455988883972168, 12.365303039550781, 14.274618148803711, 16.18393325805664, 18.093246459960938, 20.002561569213867, 21.911874771118164, 23.821189880371094, 25.73050308227539, 27.63981819152832, 29.54913330078125, 31.458446502685547, 33.367759704589844, 35.27707290649414, 37.1863899230957, 39.095703125, 41.0050163269043, 42.914329528808594, 44.823646545410156, 46.73295974731445, 48.642276763916016, 50.55158996582031, 52.460906982421875, 54.37022018432617, 56.27953338623047, 58.18885040283203, 60.09816360473633, 62.007476806640625, 63.91679382324219, 65.82611083984375, 67.73542022705078, 69.64473724365234, 71.5540542602539, 73.46336364746094, 75.3726806640625, 77.28199768066406, 79.1913070678711]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 7.0, 11.0, 14.0, 8.0, 25.0, 21.0, 24.0, 24.0, 29.0, 30.0, 34.0, 35.0, 44.0, 35.0, 37.0, 50.0, 50.0, 69.0, 52.0, 60.0, 50.0, 42.0, 35.0, 29.0, 29.0, 30.0, 26.0, 15.0, 12.0, 17.0, 5.0, 5.0, 8.0, 9.0, 1.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.243824005126953, -17.69647216796875, -17.14912223815918, -16.601770401000977, -16.054420471191406, -15.507068634033203, -14.959717750549316, -14.41236686706543, -13.865015983581543, -13.317665100097656, -12.77031421661377, -12.222963333129883, -11.67561149597168, -11.12826156616211, -10.580909729003906, -10.03355884552002, -9.486207962036133, -8.938857078552246, -8.39150619506836, -7.8441548347473145, -7.296803951263428, -6.749453067779541, -6.202101707458496, -5.654750823974609, -5.107399940490723, -4.560049057006836, -4.012698173522949, -3.4653468132019043, -2.9179959297180176, -2.370645046234131, -1.823293924331665, -1.2759428024291992, -0.7285919189453125, -0.18124091625213623, 0.36611008644104004, 0.9134610891342163, 1.4608120918273926, 2.0081629753112793, 2.555514097213745, 3.102865219116211, 3.6502161026000977, 4.197566986083984, 4.744917869567871, 5.292269229888916, 5.839620113372803, 6.3869709968566895, 6.934322357177734, 7.481673240661621, 8.029024124145508, 8.576375007629395, 9.123725891113281, 9.671076774597168, 10.218427658081055, 10.765779495239258, 11.313130378723145, 11.860481262207031, 12.407832145690918, 12.955183029174805, 13.502533912658691, 14.049884796142578, 14.597236633300781, 15.144586563110352, 15.691938400268555, 16.239288330078125, 16.786640167236328]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 7.0, 13.0, 14.0, 25.0, 35.0, 45.0, 83.0, 128.0, 243.0, 401.0, 685.0, 1141.0, 2041.0, 3867.0, 7958.0, 17119.0, 43041.0, 120358.0, 459130.0, 261121.0, 76919.0, 29117.0, 12394.0, 5847.0, 2956.0, 1610.0, 881.0, 542.0, 284.0, 202.0, 120.0, 77.0, 54.0, 28.0, 19.0, 15.0, 9.0, 8.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.235809326171875, -1.19134521484375, -1.146881103515625, -1.1024169921875, -1.057952880859375, -1.01348876953125, -0.969024658203125, -0.924560546875, -0.880096435546875, -0.83563232421875, -0.791168212890625, -0.7467041015625, -0.702239990234375, -0.65777587890625, -0.613311767578125, -0.56884765625, -0.524383544921875, -0.47991943359375, -0.435455322265625, -0.3909912109375, -0.346527099609375, -0.30206298828125, -0.257598876953125, -0.213134765625, -0.168670654296875, -0.12420654296875, -0.079742431640625, -0.0352783203125, 0.009185791015625, 0.05364990234375, 0.098114013671875, 0.142578125, 0.187042236328125, 0.23150634765625, 0.275970458984375, 0.3204345703125, 0.364898681640625, 0.40936279296875, 0.453826904296875, 0.498291015625, 0.542755126953125, 0.58721923828125, 0.631683349609375, 0.6761474609375, 0.720611572265625, 0.76507568359375, 0.809539794921875, 0.85400390625, 0.898468017578125, 0.94293212890625, 0.987396240234375, 1.0318603515625, 1.076324462890625, 1.12078857421875, 1.165252685546875, 1.209716796875, 1.254180908203125, 1.29864501953125, 1.343109130859375, 1.3875732421875, 1.432037353515625, 1.47650146484375, 1.520965576171875, 1.5654296875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 13.0, 11.0, 11.0, 15.0, 16.0, 17.0, 14.0, 35.0, 24.0, 31.0, 41.0, 49.0, 39.0, 37.0, 45.0, 37.0, 51.0, 49.0, 43.0, 31.0, 52.0, 36.0, 36.0, 34.0, 30.0, 27.0, 28.0, 15.0, 22.0, 20.0, 22.0, 12.0, 11.0, 4.0, 6.0, 8.0, 2.0, 4.0, 6.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.037109375, -1.0050048828125, -0.972900390625, -0.9407958984375, -0.90869140625, -0.8765869140625, -0.844482421875, -0.8123779296875, -0.7802734375, -0.7481689453125, -0.716064453125, -0.6839599609375, -0.65185546875, -0.6197509765625, -0.587646484375, -0.5555419921875, -0.5234375, -0.4913330078125, -0.459228515625, -0.4271240234375, -0.39501953125, -0.3629150390625, -0.330810546875, -0.2987060546875, -0.2666015625, -0.2344970703125, -0.202392578125, -0.1702880859375, -0.13818359375, -0.1060791015625, -0.073974609375, -0.0418701171875, -0.009765625, 0.0223388671875, 0.054443359375, 0.0865478515625, 0.11865234375, 0.1507568359375, 0.182861328125, 0.2149658203125, 0.2470703125, 0.2791748046875, 0.311279296875, 0.3433837890625, 0.37548828125, 0.4075927734375, 0.439697265625, 0.4718017578125, 0.50390625, 0.5360107421875, 0.568115234375, 0.6002197265625, 0.63232421875, 0.6644287109375, 0.696533203125, 0.7286376953125, 0.7607421875, 0.7928466796875, 0.824951171875, 0.8570556640625, 0.88916015625, 0.9212646484375, 0.953369140625, 0.9854736328125, 1.017578125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 11.0, 15.0, 14.0, 22.0, 31.0, 38.0, 79.0, 134.0, 186.0, 364.0, 727.0, 2099.0, 10362.0, 129703.0, 872616.0, 26115.0, 3752.0, 1130.0, 457.0, 286.0, 149.0, 100.0, 66.0, 35.0, 21.0, 10.0, 10.0, 9.0, 8.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.56805419921875, -2.4661865234375, -2.36431884765625, -2.262451171875, -2.16058349609375, -2.0587158203125, -1.95684814453125, -1.85498046875, -1.75311279296875, -1.6512451171875, -1.54937744140625, -1.447509765625, -1.34564208984375, -1.2437744140625, -1.14190673828125, -1.0400390625, -0.93817138671875, -0.8363037109375, -0.73443603515625, -0.632568359375, -0.53070068359375, -0.4288330078125, -0.32696533203125, -0.22509765625, -0.12322998046875, -0.0213623046875, 0.08050537109375, 0.182373046875, 0.28424072265625, 0.3861083984375, 0.48797607421875, 0.58984375, 0.69171142578125, 0.7935791015625, 0.89544677734375, 0.997314453125, 1.09918212890625, 1.2010498046875, 1.30291748046875, 1.40478515625, 1.50665283203125, 1.6085205078125, 1.71038818359375, 1.812255859375, 1.91412353515625, 2.0159912109375, 2.11785888671875, 2.2197265625, 2.32159423828125, 2.4234619140625, 2.52532958984375, 2.627197265625, 2.72906494140625, 2.8309326171875, 2.93280029296875, 3.03466796875, 3.13653564453125, 3.2384033203125, 3.34027099609375, 3.442138671875, 3.54400634765625, 3.6458740234375, 3.74774169921875, 3.849609375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 7.0, 6.0, 7.0, 9.0, 6.0, 11.0, 15.0, 12.0, 16.0, 16.0, 32.0, 35.0, 31.0, 49.0, 51.0, 64.0, 70.0, 79.0, 68.0, 76.0, 61.0, 47.0, 37.0, 29.0, 27.0, 18.0, 13.0, 25.0, 19.0, 8.0, 7.0, 10.0, 9.0, 10.0, 5.0, 7.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.86328125, -4.722412109375, -4.58154296875, -4.440673828125, -4.2998046875, -4.158935546875, -4.01806640625, -3.877197265625, -3.736328125, -3.595458984375, -3.45458984375, -3.313720703125, -3.1728515625, -3.031982421875, -2.89111328125, -2.750244140625, -2.609375, -2.468505859375, -2.32763671875, -2.186767578125, -2.0458984375, -1.905029296875, -1.76416015625, -1.623291015625, -1.482421875, -1.341552734375, -1.20068359375, -1.059814453125, -0.9189453125, -0.778076171875, -0.63720703125, -0.496337890625, -0.35546875, -0.214599609375, -0.07373046875, 0.067138671875, 0.2080078125, 0.348876953125, 0.48974609375, 0.630615234375, 0.771484375, 0.912353515625, 1.05322265625, 1.194091796875, 1.3349609375, 1.475830078125, 1.61669921875, 1.757568359375, 1.8984375, 2.039306640625, 2.18017578125, 2.321044921875, 2.4619140625, 2.602783203125, 2.74365234375, 2.884521484375, 3.025390625, 3.166259765625, 3.30712890625, 3.447998046875, 3.5888671875, 3.729736328125, 3.87060546875, 4.011474609375, 4.15234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 5.0, 5.0, 8.0, 15.0, 28.0, 28.0, 47.0, 86.0, 102.0, 188.0, 533.0, 1312.0, 3944.0, 17327.0, 151828.0, 830024.0, 33461.0, 6369.0, 1856.0, 684.0, 299.0, 149.0, 76.0, 59.0, 35.0, 16.0, 16.0, 12.0, 6.0, 3.0, 1.0, 5.0, 4.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.60888671875, -0.5910720825195312, -0.5732574462890625, -0.5554428100585938, -0.537628173828125, -0.5198135375976562, -0.5019989013671875, -0.48418426513671875, -0.46636962890625, -0.44855499267578125, -0.4307403564453125, -0.41292572021484375, -0.395111083984375, -0.37729644775390625, -0.3594818115234375, -0.34166717529296875, -0.3238525390625, -0.30603790283203125, -0.2882232666015625, -0.27040863037109375, -0.252593994140625, -0.23477935791015625, -0.2169647216796875, -0.19915008544921875, -0.18133544921875, -0.16352081298828125, -0.1457061767578125, -0.12789154052734375, -0.110076904296875, -0.09226226806640625, -0.0744476318359375, -0.05663299560546875, -0.038818359375, -0.02100372314453125, -0.0031890869140625, 0.01462554931640625, 0.032440185546875, 0.05025482177734375, 0.0680694580078125, 0.08588409423828125, 0.10369873046875, 0.12151336669921875, 0.1393280029296875, 0.15714263916015625, 0.174957275390625, 0.19277191162109375, 0.2105865478515625, 0.22840118408203125, 0.2462158203125, 0.26403045654296875, 0.2818450927734375, 0.29965972900390625, 0.317474365234375, 0.33528900146484375, 0.3531036376953125, 0.37091827392578125, 0.38873291015625, 0.40654754638671875, 0.4243621826171875, 0.44217681884765625, 0.459991455078125, 0.47780609130859375, 0.4956207275390625, 0.5134353637695312, 0.53125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 12.0, 11.0, 14.0, 20.0, 12.0, 15.0, 26.0, 34.0, 35.0, 38.0, 65.0, 91.0, 106.0, 93.0, 95.0, 56.0, 45.0, 45.0, 36.0, 30.0, 18.0, 18.0, 17.0, 12.0, 14.0, 9.0, 10.0, 5.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001506805419921875, -0.00014637969434261322, -0.00014207884669303894, -0.00013777799904346466, -0.00013347715139389038, -0.0001291763037443161, -0.00012487545609474182, -0.00012057460844516754, -0.00011627376079559326, -0.00011197291314601898, -0.0001076720654964447, -0.00010337121784687042, -9.907037019729614e-05, -9.476952254772186e-05, -9.046867489814758e-05, -8.61678272485733e-05, -8.186697959899902e-05, -7.756613194942474e-05, -7.326528429985046e-05, -6.896443665027618e-05, -6.46635890007019e-05, -6.0362741351127625e-05, -5.6061893701553345e-05, -5.1761046051979065e-05, -4.7460198402404785e-05, -4.3159350752830505e-05, -3.8858503103256226e-05, -3.4557655453681946e-05, -3.0256807804107666e-05, -2.5955960154533386e-05, -2.1655112504959106e-05, -1.7354264855384827e-05, -1.3053417205810547e-05, -8.752569556236267e-06, -4.451721906661987e-06, -1.5087425708770752e-07, 4.149973392486572e-06, 8.450821042060852e-06, 1.2751668691635132e-05, 1.705251634120941e-05, 2.135336399078369e-05, 2.565421164035797e-05, 2.995505928993225e-05, 3.425590693950653e-05, 3.855675458908081e-05, 4.285760223865509e-05, 4.715844988822937e-05, 5.145929753780365e-05, 5.576014518737793e-05, 6.006099283695221e-05, 6.436184048652649e-05, 6.866268813610077e-05, 7.296353578567505e-05, 7.726438343524933e-05, 8.156523108482361e-05, 8.586607873439789e-05, 9.016692638397217e-05, 9.446777403354645e-05, 9.876862168312073e-05, 0.00010306946933269501, 0.00010737031698226929, 0.00011167116463184357, 0.00011597201228141785, 0.00012027285993099213, 0.0001245737075805664]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 12.0, 10.0, 10.0, 26.0, 22.0, 38.0, 62.0, 93.0, 145.0, 246.0, 472.0, 802.0, 1624.0, 3504.0, 8438.0, 25954.0, 103680.0, 773584.0, 91760.0, 23619.0, 7803.0, 3330.0, 1475.0, 767.0, 398.0, 235.0, 158.0, 76.0, 51.0, 45.0, 28.0, 17.0, 12.0, 8.0, 9.0, 9.0, 7.0, 4.0, 2.0, 8.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.32470703125, -0.31528472900390625, -0.3058624267578125, -0.29644012451171875, -0.287017822265625, -0.27759552001953125, -0.2681732177734375, -0.25875091552734375, -0.24932861328125, -0.23990631103515625, -0.2304840087890625, -0.22106170654296875, -0.211639404296875, -0.20221710205078125, -0.1927947998046875, -0.18337249755859375, -0.1739501953125, -0.16452789306640625, -0.1551055908203125, -0.14568328857421875, -0.136260986328125, -0.12683868408203125, -0.1174163818359375, -0.10799407958984375, -0.09857177734375, -0.08914947509765625, -0.0797271728515625, -0.07030487060546875, -0.060882568359375, -0.05146026611328125, -0.0420379638671875, -0.03261566162109375, -0.023193359375, -0.01377105712890625, -0.0043487548828125, 0.00507354736328125, 0.014495849609375, 0.02391815185546875, 0.0333404541015625, 0.04276275634765625, 0.05218505859375, 0.06160736083984375, 0.0710296630859375, 0.08045196533203125, 0.089874267578125, 0.09929656982421875, 0.1087188720703125, 0.11814117431640625, 0.1275634765625, 0.13698577880859375, 0.1464080810546875, 0.15583038330078125, 0.165252685546875, 0.17467498779296875, 0.1840972900390625, 0.19351959228515625, 0.20294189453125, 0.21236419677734375, 0.2217864990234375, 0.23120880126953125, 0.240631103515625, 0.25005340576171875, 0.2594757080078125, 0.26889801025390625, 0.2783203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 5.0, 5.0, 9.0, 18.0, 21.0, 29.0, 27.0, 57.0, 81.0, 95.0, 109.0, 134.0, 107.0, 93.0, 67.0, 41.0, 35.0, 20.0, 11.0, 7.0, 11.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.767578125, -0.7484512329101562, -0.7293243408203125, -0.7101974487304688, -0.691070556640625, -0.6719436645507812, -0.6528167724609375, -0.6336898803710938, -0.61456298828125, -0.5954360961914062, -0.5763092041015625, -0.5571823120117188, -0.538055419921875, -0.5189285278320312, -0.4998016357421875, -0.48067474365234375, -0.4615478515625, -0.44242095947265625, -0.4232940673828125, -0.40416717529296875, -0.385040283203125, -0.36591339111328125, -0.3467864990234375, -0.32765960693359375, -0.30853271484375, -0.28940582275390625, -0.2702789306640625, -0.25115203857421875, -0.232025146484375, -0.21289825439453125, -0.1937713623046875, -0.17464447021484375, -0.155517578125, -0.13639068603515625, -0.1172637939453125, -0.09813690185546875, -0.079010009765625, -0.05988311767578125, -0.0407562255859375, -0.02162933349609375, -0.00250244140625, 0.01662445068359375, 0.0357513427734375, 0.05487823486328125, 0.074005126953125, 0.09313201904296875, 0.1122589111328125, 0.13138580322265625, 0.1505126953125, 0.16963958740234375, 0.1887664794921875, 0.20789337158203125, 0.227020263671875, 0.24614715576171875, 0.2652740478515625, 0.28440093994140625, 0.30352783203125, 0.32265472412109375, 0.3417816162109375, 0.36090850830078125, 0.380035400390625, 0.39916229248046875, 0.4182891845703125, 0.43741607666015625, 0.45654296875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 18.0, 28.0, 37.0, 70.0, 240.0, 434.0, 82.0, 36.0, 28.0, 12.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.834199905395508, -18.084224700927734, -17.334247589111328, -16.584272384643555, -15.834297180175781, -15.084321022033691, -14.334344863891602, -13.584369659423828, -12.834393501281738, -12.084417343139648, -11.334442138671875, -10.584465980529785, -9.834489822387695, -9.084514617919922, -8.334538459777832, -7.5845627784729, -6.834587097167969, -6.084611415863037, -5.3346357345581055, -4.584659576416016, -3.834683895111084, -3.0847082138061523, -2.3347320556640625, -1.5847563743591309, -0.8347806930541992, -0.08480489253997803, 0.6651709079742432, 1.415146827697754, 2.1651225090026855, 2.915098190307617, 3.665074348449707, 4.415050029754639, 5.1650238037109375, 5.914999485015869, 6.664975166320801, 7.414951324462891, 8.164926528930664, 8.914902687072754, 9.664878845214844, 10.414854049682617, 11.164830207824707, 11.914806365966797, 12.66478157043457, 13.41475772857666, 14.16473388671875, 14.914709091186523, 15.664685249328613, 16.414661407470703, 17.164636611938477, 17.91461181640625, 18.664588928222656, 19.41456413269043, 20.164539337158203, 20.91451644897461, 21.664491653442383, 22.414466857910156, 23.164443969726562, 23.914419174194336, 24.664396286010742, 25.414371490478516, 26.16434669494629, 26.914321899414062, 27.66429901123047, 28.414274215698242, 29.164249420166016]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 8.0, 3.0, 5.0, 11.0, 5.0, 9.0, 18.0, 18.0, 27.0, 16.0, 25.0, 21.0, 31.0, 116.0, 292.0, 160.0, 45.0, 39.0, 34.0, 27.0, 27.0, 17.0, 17.0, 12.0, 9.0, 9.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.464738845825195, -21.924413681030273, -21.38408660888672, -20.843761444091797, -20.303434371948242, -19.76310920715332, -19.222782135009766, -18.682456970214844, -18.142131805419922, -17.601806640625, -17.061479568481445, -16.521154403686523, -15.980827331542969, -15.440502166748047, -14.900176048278809, -14.35984992980957, -13.819522857666016, -13.279196739196777, -12.738870620727539, -12.1985445022583, -11.658218383789062, -11.11789321899414, -10.577567100524902, -10.037240982055664, -9.496914863586426, -8.956588745117188, -8.41626262664795, -7.875936985015869, -7.335610866546631, -6.795284748077393, -6.2549591064453125, -5.714632987976074, -5.1743059158325195, -4.633979797363281, -4.093653678894043, -3.553328037261963, -3.0130019187927246, -2.4726758003234863, -1.9323499202728271, -1.392024040222168, -0.8516979217529297, -0.31137192249298096, 0.22895407676696777, 0.7692800760269165, 1.3096060752868652, 1.8499321937561035, 2.3902580738067627, 2.930583953857422, 3.47091007232666, 4.011236190795898, 4.551562309265137, 5.091887950897217, 5.632214069366455, 6.172540187835693, 6.712865829467773, 7.253191947937012, 7.79351806640625, 8.333844184875488, 8.874170303344727, 9.414496421813965, 9.954822540283203, 10.495147705078125, 11.035473823547363, 11.575799942016602, 12.11612606048584]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 4.0, 2.0, 7.0, 8.0, 11.0, 12.0, 20.0, 19.0, 29.0, 39.0, 40.0, 40.0, 72.0, 274.0, 127.0, 47.0, 51.0, 47.0, 34.0, 29.0, 19.0, 13.0, 14.0, 14.0, 13.0, 7.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1025390625, -1.057708740234375, -1.01287841796875, -0.968048095703125, -0.9232177734375, -0.878387451171875, -0.83355712890625, -0.788726806640625, -0.743896484375, -0.699066162109375, -0.65423583984375, -0.609405517578125, -0.5645751953125, -0.519744873046875, -0.47491455078125, -0.430084228515625, -0.38525390625, -0.340423583984375, -0.29559326171875, -0.250762939453125, -0.2059326171875, -0.161102294921875, -0.11627197265625, -0.071441650390625, -0.026611328125, 0.018218994140625, 0.06304931640625, 0.107879638671875, 0.1527099609375, 0.197540283203125, 0.24237060546875, 0.287200927734375, 0.33203125, 0.376861572265625, 0.42169189453125, 0.466522216796875, 0.5113525390625, 0.556182861328125, 0.60101318359375, 0.645843505859375, 0.690673828125, 0.735504150390625, 0.78033447265625, 0.825164794921875, 0.8699951171875, 0.914825439453125, 0.95965576171875, 1.004486083984375, 1.04931640625, 1.094146728515625, 1.13897705078125, 1.183807373046875, 1.2286376953125, 1.273468017578125, 1.31829833984375, 1.363128662109375, 1.407958984375, 1.452789306640625, 1.49761962890625, 1.542449951171875, 1.5872802734375, 1.632110595703125, 1.67694091796875, 1.721771240234375, 1.7666015625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 3.0, 1.0, 3.0, 5.0, 12.0, 12.0, 15.0, 20.0, 19.0, 45.0, 81.0, 259.0, 1169.0, 29845.0, 8353710.0, 2687.0, 387.0, 134.0, 50.0, 30.0, 23.0, 15.0, 26.0, 8.0, 5.0, 8.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0], "bins": [-29.955928802490234, -29.210172653198242, -28.46441650390625, -27.718660354614258, -26.972904205322266, -26.227148056030273, -25.48139190673828, -24.735633850097656, -23.989879608154297, -23.244123458862305, -22.498367309570312, -21.75261116027832, -21.006855010986328, -20.261098861694336, -19.515342712402344, -18.76958465576172, -18.023828506469727, -17.278072357177734, -16.532316207885742, -15.78656005859375, -15.040803909301758, -14.295047760009766, -13.549290657043457, -12.803534507751465, -12.057778358459473, -11.31202220916748, -10.566266059875488, -9.82050895690918, -9.074752807617188, -8.328996658325195, -7.583240509033203, -6.837484359741211, -6.091726303100586, -5.345970153808594, -4.600214004516602, -3.854457378387451, -3.108701229095459, -2.362945079803467, -1.6171884536743164, -0.8714323043823242, -0.12567615509033203, 0.6200801134109497, 1.3658363819122314, 2.1115927696228027, 2.857348918914795, 3.603105068206787, 4.3488616943359375, 5.09461784362793, 5.840373992919922, 6.586130142211914, 7.331886291503906, 8.077642440795898, 8.82339859008789, 9.569154739379883, 10.314911842346191, 11.060667991638184, 11.806424140930176, 12.552180290222168, 13.29793643951416, 14.043693542480469, 14.789449691772461, 15.535205841064453, 16.280961990356445, 17.026718139648438, 17.77247428894043]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 5.0, 5.0, 8.0, 6.0, 5.0, 2.0, 8.0, 4.0, 4.0, 4.0, 2.0, 7.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.23585319519043, -13.7855863571167, -13.335319519042969, -12.885052680969238, -12.434785842895508, -11.984519004821777, -11.534252166748047, -11.083986282348633, -10.633718490600586, -10.183451652526855, -9.733184814453125, -9.282917976379395, -8.832651138305664, -8.382384300231934, -7.932117938995361, -7.481851100921631, -7.031584739685059, -6.581317901611328, -6.131051063537598, -5.680784225463867, -5.230517387390137, -4.780250549316406, -4.329984188079834, -3.8797173500061035, -3.429450511932373, -2.9791836738586426, -2.528916835784912, -2.0786502361297607, -1.6283833980560303, -1.1781165599822998, -0.7278499603271484, -0.27758312225341797, 0.1726846694946289, 0.6229514479637146, 1.0732182264328003, 1.5234849452972412, 1.9737517833709717, 2.424018621444702, 2.8742852210998535, 3.324552059173584, 3.7748188972473145, 4.225085735321045, 4.675352573394775, 5.125618934631348, 5.575885772705078, 6.026152610778809, 6.476419448852539, 6.9266862869262695, 7.376953125, 7.8272199630737305, 8.277486801147461, 8.727753639221191, 9.178020477294922, 9.628287315368652, 10.078554153442383, 10.528820037841797, 10.979087829589844, 11.429354667663574, 11.879621505737305, 12.329888343811035, 12.780155181884766, 13.230422019958496, 13.680688858032227, 14.13095474243164, 14.581221580505371]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 8.0, 10.0, 16.0, 24.0, 30.0, 54.0, 69.0, 107.0, 189.0, 345.0, 683.0, 1546.0, 3718.0, 10273.0, 29742.0, 88722.0, 198867.0, 125304.0, 41718.0, 14002.0, 5082.0, 1888.0, 866.0, 396.0, 216.0, 110.0, 77.0, 73.0, 36.0, 25.0, 9.0, 19.0, 9.0, 9.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.42578125, -7.16680908203125, -6.9078369140625, -6.64886474609375, -6.389892578125, -6.13092041015625, -5.8719482421875, -5.61297607421875, -5.35400390625, -5.09503173828125, -4.8360595703125, -4.57708740234375, -4.318115234375, -4.05914306640625, -3.8001708984375, -3.54119873046875, -3.2822265625, -3.02325439453125, -2.7642822265625, -2.50531005859375, -2.246337890625, -1.98736572265625, -1.7283935546875, -1.46942138671875, -1.21044921875, -0.95147705078125, -0.6925048828125, -0.43353271484375, -0.174560546875, 0.08441162109375, 0.3433837890625, 0.60235595703125, 0.861328125, 1.12030029296875, 1.3792724609375, 1.63824462890625, 1.897216796875, 2.15618896484375, 2.4151611328125, 2.67413330078125, 2.93310546875, 3.19207763671875, 3.4510498046875, 3.71002197265625, 3.968994140625, 4.22796630859375, 4.4869384765625, 4.74591064453125, 5.0048828125, 5.26385498046875, 5.5228271484375, 5.78179931640625, 6.040771484375, 6.29974365234375, 6.5587158203125, 6.81768798828125, 7.07666015625, 7.33563232421875, 7.5946044921875, 7.85357666015625, 8.112548828125, 8.37152099609375, 8.6304931640625, 8.88946533203125, 9.1484375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 2.0, 7.0, 6.0, 4.0, 10.0, 13.0, 18.0, 15.0, 25.0, 30.0, 24.0, 45.0, 51.0, 57.0, 83.0, 70.0, 76.0, 55.0, 71.0, 61.0, 46.0, 38.0, 39.0, 34.0, 25.0, 21.0, 18.0, 23.0, 9.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.361328125, -1.321533203125, -1.28173828125, -1.241943359375, -1.2021484375, -1.162353515625, -1.12255859375, -1.082763671875, -1.04296875, -1.003173828125, -0.96337890625, -0.923583984375, -0.8837890625, -0.843994140625, -0.80419921875, -0.764404296875, -0.724609375, -0.684814453125, -0.64501953125, -0.605224609375, -0.5654296875, -0.525634765625, -0.48583984375, -0.446044921875, -0.40625, -0.366455078125, -0.32666015625, -0.286865234375, -0.2470703125, -0.207275390625, -0.16748046875, -0.127685546875, -0.087890625, -0.048095703125, -0.00830078125, 0.031494140625, 0.0712890625, 0.111083984375, 0.15087890625, 0.190673828125, 0.23046875, 0.270263671875, 0.31005859375, 0.349853515625, 0.3896484375, 0.429443359375, 0.46923828125, 0.509033203125, 0.548828125, 0.588623046875, 0.62841796875, 0.668212890625, 0.7080078125, 0.747802734375, 0.78759765625, 0.827392578125, 0.8671875, 0.906982421875, 0.94677734375, 0.986572265625, 1.0263671875, 1.066162109375, 1.10595703125, 1.145751953125, 1.185546875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 11.0, 20.0, 28.0, 63.0, 95.0, 96.0, 65.0, 46.0, 15.0, 14.0, 5.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.867976188659668, -7.524501800537109, -7.181026935577393, -6.837552070617676, -6.494077682495117, -6.150603294372559, -5.807128429412842, -5.463653564453125, -5.120179176330566, -4.776704788208008, -4.433229923248291, -4.089755058288574, -3.7462806701660156, -3.402806043624878, -3.0593314170837402, -2.7158567905426025, -2.372382164001465, -2.028907537460327, -1.6854329109191895, -1.3419582843780518, -0.9984836578369141, -0.6550090312957764, -0.31153440475463867, 0.03194022178649902, 0.3754148483276367, 0.7188894748687744, 1.062364101409912, 1.4058387279510498, 1.7493133544921875, 2.092787981033325, 2.436262607574463, 2.7797372341156006, 3.1232128143310547, 3.4666874408721924, 3.81016206741333, 4.153636932373047, 4.4971113204956055, 4.840585708618164, 5.184060573577881, 5.527535438537598, 5.871009826660156, 6.214484214782715, 6.557959079742432, 6.901433944702148, 7.244908332824707, 7.588382720947266, 7.931857585906982, 8.2753324508667, 8.618806838989258, 8.962281227111816, 9.305755615234375, 9.64923095703125, 9.992705345153809, 10.336179733276367, 10.679655075073242, 11.0231294631958, 11.36660385131836, 11.710078239440918, 12.053552627563477, 12.397027969360352, 12.74050235748291, 13.083976745605469, 13.427452087402344, 13.770926475524902, 14.114400863647461]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 9.0, 3.0, 8.0, 6.0, 12.0, 13.0, 42.0, 87.0, 92.0, 82.0, 48.0, 23.0, 10.0, 6.0, 6.0, 3.0, 4.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.573070526123047, -6.361219882965088, -6.149369239807129, -5.93751859664917, -5.725667953491211, -5.513817310333252, -5.301966667175293, -5.090116024017334, -4.878265380859375, -4.666414737701416, -4.454564094543457, -4.242713451385498, -4.030862808227539, -3.81901216506958, -3.607161521911621, -3.395310878753662, -3.1834604740142822, -2.9716098308563232, -2.7597591876983643, -2.5479085445404053, -2.3360579013824463, -2.1242074966430664, -1.9123567342758179, -1.7005060911178589, -1.4886554479599, -1.276804804801941, -1.064954161643982, -0.8531035780906677, -0.6412529349327087, -0.42940235137939453, -0.21755170822143555, -0.0057010650634765625, 0.20614957809448242, 0.4180002212524414, 0.6298508644104004, 0.8417014479637146, 1.0535521507263184, 1.2654026746749878, 1.4772533178329468, 1.6891039609909058, 1.9009546041488647, 2.112805128097534, 2.324655771255493, 2.536506414413452, 2.748357057571411, 2.96020770072937, 3.172058343887329, 3.383908987045288, 3.595759630203247, 3.807610273361206, 4.019460678100586, 4.231311321258545, 4.443161964416504, 4.655012607574463, 4.866863250732422, 5.078713893890381, 5.29056453704834, 5.502415180206299, 5.714265823364258, 5.926116466522217, 6.137967109680176, 6.349817752838135, 6.561668395996094, 6.773519039154053, 6.985369682312012]}, "eval/loss": 6.721965789794922, "eval/wer": 1.942317995118757, "eval/runtime": 950.7357, "eval/samples_per_second": 2.779, "eval/steps_per_second": 0.348} \ No newline at end of file +{"train/loss": 6.4588, "train/learning_rate": 1.8429334916864606e-05, "train/epoch": 8.41, "train/global_step": 7500, "_runtime": 50324, "_timestamp": 1646996092, "_step": 7504, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 123.0, 24.0, 5.0, 5.0, 6.0, 4.0, 30099.0, 141.0, 50.0, 13.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.59375, -56.720703125, -54.84765625, -52.974609375, -51.1015625, -49.228515625, -47.35546875, -45.482421875, -43.609375, -41.736328125, -39.86328125, -37.990234375, -36.1171875, -34.244140625, -32.37109375, -30.498046875, -28.625, -26.751953125, -24.87890625, -23.005859375, -21.1328125, -19.259765625, -17.38671875, -15.513671875, -13.640625, -11.767578125, -9.89453125, -8.021484375, -6.1484375, -4.275390625, -2.40234375, -0.529296875, 1.34375, 3.216796875, 5.08984375, 6.962890625, 8.8359375, 10.708984375, 12.58203125, 14.455078125, 16.328125, 18.201171875, 20.07421875, 21.947265625, 23.8203125, 25.693359375, 27.56640625, 29.439453125, 31.3125, 33.185546875, 35.05859375, 36.931640625, 38.8046875, 40.677734375, 42.55078125, 44.423828125, 46.296875, 48.169921875, 50.04296875, 51.916015625, 53.7890625, 55.662109375, 57.53515625, 59.408203125, 61.28125]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 11.0, 17.0, 24.0, 20.0, 73.0, 290.0, 383.0, 155.0, 30.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.78602600097656, -147.02088928222656, -144.2557373046875, -141.4906005859375, -138.72544860839844, -135.96031188964844, -133.19515991210938, -130.43002319335938, -127.66488647460938, -124.89974212646484, -122.13459777832031, -119.36946105957031, -116.60431671142578, -113.83917236328125, -111.07402801513672, -108.30888366699219, -105.54373931884766, -102.77859497070312, -100.0134506225586, -97.24830627441406, -94.48316955566406, -91.71802520751953, -88.952880859375, -86.18773651123047, -83.42259216308594, -80.6574478149414, -77.89230346679688, -75.12716674804688, -72.36202239990234, -69.59687805175781, -66.83173370361328, -64.06658935546875, -61.301448822021484, -58.53630447387695, -55.77116394042969, -53.006019592285156, -50.240875244140625, -47.47573471069336, -44.71059036254883, -41.94544982910156, -39.18030548095703, -36.4151611328125, -33.650020599365234, -30.884876251220703, -28.119733810424805, -25.354591369628906, -22.589447021484375, -19.824304580688477, -17.059162139892578, -14.29401969909668, -11.528876304626465, -8.76373291015625, -5.998590469360352, -3.233448028564453, -0.4683036804199219, 2.2968387603759766, 5.061981201171875, 7.827124118804932, 10.592267036437988, 13.357410430908203, 16.1225528717041, 18.8876953125, 21.65283966064453, 24.41798210144043, 27.183124542236328]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 11.0, 6.0, 10.0, 15.0, 14.0, 30.0, 32.0, 17.0, 30.0, 43.0, 46.0, 43.0, 53.0, 56.0, 53.0, 49.0, 45.0, 44.0, 48.0, 40.0, 31.0, 30.0, 33.0, 24.0, 31.0, 22.0, 18.0, 19.0, 15.0, 11.0, 14.0, 16.0, 6.0, 8.0, 6.0, 6.0, 5.0, 3.0, 8.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.109256744384766, -26.128297805786133, -25.147336959838867, -24.166378021240234, -23.1854190826416, -22.204458236694336, -21.223499298095703, -20.242538452148438, -19.261579513549805, -18.280620574951172, -17.299659729003906, -16.318700790405273, -15.337740898132324, -14.356781005859375, -13.375822067260742, -12.394862174987793, -11.41390323638916, -10.432943344116211, -9.451984405517578, -8.471024513244629, -7.49006462097168, -6.509105205535889, -5.528145790100098, -4.547185897827148, -3.5662264823913574, -2.5852668285369873, -1.6043072938919067, -0.6233477592468262, 0.35761189460754395, 1.338571548461914, 2.319530963897705, 3.3004908561706543, 4.281450271606445, 5.262409687042236, 6.2433695793151855, 7.224328994750977, 8.205288887023926, 9.186248779296875, 10.167207717895508, 11.148167610168457, 12.129127502441406, 13.110087394714355, 14.091046333312988, 15.072006225585938, 16.05296516418457, 17.033926010131836, 18.01488494873047, 18.995845794677734, 19.976802825927734, 20.957761764526367, 21.938722610473633, 22.919681549072266, 23.9006404876709, 24.881601333618164, 25.862560272216797, 26.843521118164062, 27.824480056762695, 28.805438995361328, 29.786399841308594, 30.767358779907227, 31.74831771850586, 32.729278564453125, 33.710235595703125, 34.69119644165039, 35.672157287597656]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 12.0, 10.0, 15.0, 24.0, 41.0, 59.0, 85.0, 147.0, 262.0, 431.0, 845.0, 1724.0, 3899.0, 9981.0, 28224.0, 82871.0, 222967.0, 408460.0, 185400.0, 65738.0, 22631.0, 8349.0, 3261.0, 1411.0, 702.0, 394.0, 225.0, 127.0, 75.0, 54.0, 33.0, 22.0, 15.0, 18.0, 5.0, 8.0, 5.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-65.375, -63.35693359375, -61.3388671875, -59.32080078125, -57.302734375, -55.28466796875, -53.2666015625, -51.24853515625, -49.23046875, -47.21240234375, -45.1943359375, -43.17626953125, -41.158203125, -39.14013671875, -37.1220703125, -35.10400390625, -33.0859375, -31.06787109375, -29.0498046875, -27.03173828125, -25.013671875, -22.99560546875, -20.9775390625, -18.95947265625, -16.94140625, -14.92333984375, -12.9052734375, -10.88720703125, -8.869140625, -6.85107421875, -4.8330078125, -2.81494140625, -0.796875, 1.22119140625, 3.2392578125, 5.25732421875, 7.275390625, 9.29345703125, 11.3115234375, 13.32958984375, 15.34765625, 17.36572265625, 19.3837890625, 21.40185546875, 23.419921875, 25.43798828125, 27.4560546875, 29.47412109375, 31.4921875, 33.51025390625, 35.5283203125, 37.54638671875, 39.564453125, 41.58251953125, 43.6005859375, 45.61865234375, 47.63671875, 49.65478515625, 51.6728515625, 53.69091796875, 55.708984375, 57.72705078125, 59.7451171875, 61.76318359375, 63.78125]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 6.0, 4.0, 8.0, 9.0, 7.0, 15.0, 19.0, 20.0, 21.0, 23.0, 24.0, 28.0, 36.0, 36.0, 40.0, 42.0, 48.0, 43.0, 53.0, 108.0, 51.0, 33.0, 51.0, 36.0, 22.0, 22.0, 30.0, 22.0, 19.0, 20.0, 22.0, 15.0, 11.0, 13.0, 11.0, 13.0, 4.0, 2.0, 6.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.390625, -16.8515625, -16.3125, -15.7734375, -15.234375, -14.6953125, -14.15625, -13.6171875, -13.078125, -12.5390625, -12.0, -11.4609375, -10.921875, -10.3828125, -9.84375, -9.3046875, -8.765625, -8.2265625, -7.6875, -7.1484375, -6.609375, -6.0703125, -5.53125, -4.9921875, -4.453125, -3.9140625, -3.375, -2.8359375, -2.296875, -1.7578125, -1.21875, -0.6796875, -0.140625, 0.3984375, 0.9375, 1.4765625, 2.015625, 2.5546875, 3.09375, 3.6328125, 4.171875, 4.7109375, 5.25, 5.7890625, 6.328125, 6.8671875, 7.40625, 7.9453125, 8.484375, 9.0234375, 9.5625, 10.1015625, 10.640625, 11.1796875, 11.71875, 12.2578125, 12.796875, 13.3359375, 13.875, 14.4140625, 14.953125, 15.4921875, 16.03125, 16.5703125, 17.109375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 5.0, 7.0, 8.0, 13.0, 14.0, 17.0, 32.0, 39.0, 57.0, 65.0, 88.0, 95.0, 113.0, 114.0, 76.0, 69.0, 50.0, 30.0, 38.0, 14.0, 15.0, 14.0, 8.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.2972412109375, -29.189777374267578, -28.082313537597656, -26.9748477935791, -25.86738395690918, -24.759920120239258, -23.652454376220703, -22.54499053955078, -21.43752670288086, -20.330062866210938, -19.222599029541016, -18.11513328552246, -17.00766944885254, -15.900205612182617, -14.792740821838379, -13.68527603149414, -12.577812194824219, -11.470348358154297, -10.362883567810059, -9.25541877746582, -8.147954940795898, -7.040490627288818, -5.933026313781738, -4.825562000274658, -3.718097686767578, -2.610633373260498, -1.503169059753418, -0.3957047462463379, 0.7117595672607422, 1.8192238807678223, 2.9266881942749023, 4.034152507781982, 5.141620635986328, 6.249084949493408, 7.356549263000488, 8.464014053344727, 9.571477890014648, 10.67894172668457, 11.786406517028809, 12.893871307373047, 14.001335144042969, 15.10879898071289, 16.216262817382812, 17.323728561401367, 18.43119239807129, 19.53865623474121, 20.646121978759766, 21.753585815429688, 22.86104965209961, 23.96851348876953, 25.075977325439453, 26.183443069458008, 27.29090690612793, 28.39837074279785, 29.505836486816406, 30.613300323486328, 31.72076416015625, 32.82822799682617, 33.935691833496094, 35.043155670166016, 36.15061950683594, 37.258087158203125, 38.36555099487305, 39.47301483154297, 40.58047866821289]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 6.0, 17.0, 17.0, 8.0, 19.0, 22.0, 29.0, 20.0, 25.0, 35.0, 37.0, 31.0, 39.0, 35.0, 62.0, 42.0, 40.0, 43.0, 59.0, 54.0, 49.0, 45.0, 43.0, 34.0, 32.0, 17.0, 25.0, 17.0, 16.0, 14.0, 17.0, 11.0, 7.0, 5.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.99042510986328, -20.20842742919922, -19.426427841186523, -18.64443016052246, -17.862430572509766, -17.080432891845703, -16.29843521118164, -15.516435623168945, -14.734436988830566, -13.952438354492188, -13.170439720153809, -12.38844108581543, -11.606443405151367, -10.824443817138672, -10.04244613647461, -9.26044750213623, -8.478448867797852, -7.696450233459473, -6.914451599121094, -6.132453441619873, -5.350454807281494, -4.568456172943115, -3.7864580154418945, -3.0044593811035156, -2.2224607467651367, -1.4404622316360474, -0.658463716506958, 0.1235346794128418, 0.9055333137512207, 1.6875319480895996, 2.4695301055908203, 3.251528739929199, 4.033529281616211, 4.81552791595459, 5.597526550292969, 6.3795247077941895, 7.161523342132568, 7.943521976470947, 8.725520133972168, 9.507518768310547, 10.289517402648926, 11.071516036987305, 11.853514671325684, 12.635513305664062, 13.417510986328125, 14.19951057434082, 14.981508255004883, 15.763506889343262, 16.54550552368164, 17.327503204345703, 18.1095027923584, 18.89150047302246, 19.673500061035156, 20.45549774169922, 21.23749542236328, 22.019495010375977, 22.801494598388672, 23.583492279052734, 24.36549186706543, 25.147489547729492, 25.929489135742188, 26.71148681640625, 27.493484497070312, 28.275484085083008, 29.05748176574707]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 6.0, 14.0, 11.0, 19.0, 29.0, 50.0, 56.0, 73.0, 130.0, 155.0, 232.0, 330.0, 493.0, 726.0, 1096.0, 1647.0, 2730.0, 4835.0, 9273.0, 20707.0, 68075.0, 1229408.0, 2705304.0, 99683.0, 24539.0, 10552.0, 5398.0, 3081.0, 1899.0, 1244.0, 789.0, 539.0, 358.0, 271.0, 158.0, 123.0, 77.0, 54.0, 24.0, 26.0, 26.0, 12.0, 13.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-27.0625, -26.21923828125, -25.3759765625, -24.53271484375, -23.689453125, -22.84619140625, -22.0029296875, -21.15966796875, -20.31640625, -19.47314453125, -18.6298828125, -17.78662109375, -16.943359375, -16.10009765625, -15.2568359375, -14.41357421875, -13.5703125, -12.72705078125, -11.8837890625, -11.04052734375, -10.197265625, -9.35400390625, -8.5107421875, -7.66748046875, -6.82421875, -5.98095703125, -5.1376953125, -4.29443359375, -3.451171875, -2.60791015625, -1.7646484375, -0.92138671875, -0.078125, 0.76513671875, 1.6083984375, 2.45166015625, 3.294921875, 4.13818359375, 4.9814453125, 5.82470703125, 6.66796875, 7.51123046875, 8.3544921875, 9.19775390625, 10.041015625, 10.88427734375, 11.7275390625, 12.57080078125, 13.4140625, 14.25732421875, 15.1005859375, 15.94384765625, 16.787109375, 17.63037109375, 18.4736328125, 19.31689453125, 20.16015625, 21.00341796875, 21.8466796875, 22.68994140625, 23.533203125, 24.37646484375, 25.2197265625, 26.06298828125, 26.90625]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 8.0, 6.0, 11.0, 14.0, 15.0, 16.0, 16.0, 24.0, 21.0, 25.0, 34.0, 29.0, 26.0, 26.0, 36.0, 42.0, 48.0, 38.0, 43.0, 42.0, 41.0, 48.0, 48.0, 47.0, 32.0, 27.0, 30.0, 24.0, 25.0, 28.0, 27.0, 16.0, 16.0, 15.0, 14.0, 8.0, 6.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.328125, -10.9105224609375, -10.492919921875, -10.0753173828125, -9.65771484375, -9.2401123046875, -8.822509765625, -8.4049072265625, -7.9873046875, -7.5697021484375, -7.152099609375, -6.7344970703125, -6.31689453125, -5.8992919921875, -5.481689453125, -5.0640869140625, -4.646484375, -4.2288818359375, -3.811279296875, -3.3936767578125, -2.97607421875, -2.5584716796875, -2.140869140625, -1.7232666015625, -1.3056640625, -0.8880615234375, -0.470458984375, -0.0528564453125, 0.36474609375, 0.7823486328125, 1.199951171875, 1.6175537109375, 2.03515625, 2.4527587890625, 2.870361328125, 3.2879638671875, 3.70556640625, 4.1231689453125, 4.540771484375, 4.9583740234375, 5.3759765625, 5.7935791015625, 6.211181640625, 6.6287841796875, 7.04638671875, 7.4639892578125, 7.881591796875, 8.2991943359375, 8.716796875, 9.1343994140625, 9.552001953125, 9.9696044921875, 10.38720703125, 10.8048095703125, 11.222412109375, 11.6400146484375, 12.0576171875, 12.4752197265625, 12.892822265625, 13.3104248046875, 13.72802734375, 14.1456298828125, 14.563232421875, 14.9808349609375, 15.3984375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 1.0, 3.0, 5.0, 8.0, 8.0, 16.0, 23.0, 21.0, 57.0, 123.0, 540.0, 11278.0, 4165395.0, 15809.0, 706.0, 144.0, 60.0, 30.0, 21.0, 12.0, 11.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.375, -181.958984375, -174.54296875, -167.126953125, -159.7109375, -152.294921875, -144.87890625, -137.462890625, -130.046875, -122.630859375, -115.21484375, -107.798828125, -100.3828125, -92.966796875, -85.55078125, -78.134765625, -70.71875, -63.302734375, -55.88671875, -48.470703125, -41.0546875, -33.638671875, -26.22265625, -18.806640625, -11.390625, -3.974609375, 3.44140625, 10.857421875, 18.2734375, 25.689453125, 33.10546875, 40.521484375, 47.9375, 55.353515625, 62.76953125, 70.185546875, 77.6015625, 85.017578125, 92.43359375, 99.849609375, 107.265625, 114.681640625, 122.09765625, 129.513671875, 136.9296875, 144.345703125, 151.76171875, 159.177734375, 166.59375, 174.009765625, 181.42578125, 188.841796875, 196.2578125, 203.673828125, 211.08984375, 218.505859375, 225.921875, 233.337890625, 240.75390625, 248.169921875, 255.5859375, 263.001953125, 270.41796875, 277.833984375, 285.25]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 5.0, 4.0, 5.0, 4.0, 7.0, 6.0, 15.0, 20.0, 25.0, 25.0, 54.0, 92.0, 280.0, 1041.0, 1738.0, 406.0, 155.0, 64.0, 51.0, 22.0, 20.0, 17.0, 13.0, 8.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.34375, -8.972900390625, -8.60205078125, -8.231201171875, -7.8603515625, -7.489501953125, -7.11865234375, -6.747802734375, -6.376953125, -6.006103515625, -5.63525390625, -5.264404296875, -4.8935546875, -4.522705078125, -4.15185546875, -3.781005859375, -3.41015625, -3.039306640625, -2.66845703125, -2.297607421875, -1.9267578125, -1.555908203125, -1.18505859375, -0.814208984375, -0.443359375, -0.072509765625, 0.29833984375, 0.669189453125, 1.0400390625, 1.410888671875, 1.78173828125, 2.152587890625, 2.5234375, 2.894287109375, 3.26513671875, 3.635986328125, 4.0068359375, 4.377685546875, 4.74853515625, 5.119384765625, 5.490234375, 5.861083984375, 6.23193359375, 6.602783203125, 6.9736328125, 7.344482421875, 7.71533203125, 8.086181640625, 8.45703125, 8.827880859375, 9.19873046875, 9.569580078125, 9.9404296875, 10.311279296875, 10.68212890625, 11.052978515625, 11.423828125, 11.794677734375, 12.16552734375, 12.536376953125, 12.9072265625, 13.278076171875, 13.64892578125, 14.019775390625, 14.390625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 1.0, 5.0, 4.0, 14.0, 14.0, 7.0, 12.0, 27.0, 27.0, 35.0, 39.0, 38.0, 58.0, 64.0, 68.0, 74.0, 77.0, 81.0, 56.0, 53.0, 38.0, 44.0, 33.0, 26.0, 22.0, 21.0, 16.0, 11.0, 7.0, 7.0, 5.0, 0.0, 3.0, 9.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.966155052185059, -14.511995315551758, -14.057835578918457, -13.60367488861084, -13.149515151977539, -12.695355415344238, -12.241195678710938, -11.78703498840332, -11.33287525177002, -10.878715515136719, -10.424555778503418, -9.9703950881958, -9.5162353515625, -9.0620756149292, -8.607915878295898, -8.153755187988281, -7.699595928192139, -7.245436191558838, -6.791275978088379, -6.337116241455078, -5.882956027984619, -5.428796291351318, -4.974636077880859, -4.520476341247559, -4.066316604614258, -3.612156629562378, -3.157996654510498, -2.7038369178771973, -2.2496767044067383, -1.7955169677734375, -1.3413569927215576, -0.8871970176696777, -0.43303680419921875, 0.021123141050338745, 0.47528308629989624, 0.9294430017471313, 1.3836029767990112, 1.8377628326416016, 2.2919228076934814, 2.7460827827453613, 3.200242757797241, 3.654402732849121, 4.108562469482422, 4.562722682952881, 5.016882419586182, 5.471042633056641, 5.925202369689941, 6.379362106323242, 6.833522319793701, 7.287682056427002, 7.741842269897461, 8.196002006530762, 8.650161743164062, 9.10432243347168, 9.55848217010498, 10.012641906738281, 10.466801643371582, 10.920961380004883, 11.375121116638184, 11.8292818069458, 12.283441543579102, 12.737601280212402, 13.191761016845703, 13.64592170715332, 14.100081443786621]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 7.0, 8.0, 8.0, 18.0, 11.0, 16.0, 12.0, 18.0, 24.0, 28.0, 35.0, 33.0, 34.0, 48.0, 50.0, 44.0, 49.0, 48.0, 65.0, 46.0, 45.0, 55.0, 47.0, 49.0, 23.0, 30.0, 30.0, 22.0, 21.0, 13.0, 14.0, 14.0, 5.0, 10.0, 7.0, 2.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.279983520507812, -11.805401802062988, -11.330820083618164, -10.856239318847656, -10.381657600402832, -9.907075881958008, -9.4324951171875, -8.957913398742676, -8.483331680297852, -8.008749961853027, -7.534168720245361, -7.059587478637695, -6.585005760192871, -6.110424041748047, -5.635842800140381, -5.161261558532715, -4.686679840087891, -4.212098121643066, -3.7375168800354004, -3.2629354000091553, -2.78835391998291, -2.313772439956665, -1.83919095993042, -1.3646094799041748, -0.8900279998779297, -0.41544651985168457, 0.05913496017456055, 0.5337164402008057, 1.0082979202270508, 1.482879400253296, 1.957460880279541, 2.432042360305786, 2.9066238403320312, 3.3812053203582764, 3.8557868003845215, 4.3303680419921875, 4.804949760437012, 5.279531478881836, 5.754112720489502, 6.228693962097168, 6.703275680541992, 7.177857398986816, 7.652438640594482, 8.127019882202148, 8.601601600646973, 9.076183319091797, 9.550764083862305, 10.025345802307129, 10.499927520751953, 10.974509239196777, 11.449090957641602, 11.92367172241211, 12.398253440856934, 12.872835159301758, 13.347415924072266, 13.82199764251709, 14.296579360961914, 14.771161079406738, 15.245742797851562, 15.72032356262207, 16.194904327392578, 16.66948699951172, 17.144067764282227, 17.618650436401367, 18.093231201171875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 11.0, 12.0, 13.0, 26.0, 39.0, 58.0, 91.0, 150.0, 240.0, 356.0, 621.0, 960.0, 1639.0, 2793.0, 4981.0, 9663.0, 20461.0, 44582.0, 102811.0, 242956.0, 333559.0, 156510.0, 66612.0, 29419.0, 14000.0, 6869.0, 3751.0, 2113.0, 1204.0, 830.0, 442.0, 289.0, 169.0, 125.0, 72.0, 36.0, 38.0, 22.0, 11.0, 9.0, 3.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.765625, -20.12158203125, -19.4775390625, -18.83349609375, -18.189453125, -17.54541015625, -16.9013671875, -16.25732421875, -15.61328125, -14.96923828125, -14.3251953125, -13.68115234375, -13.037109375, -12.39306640625, -11.7490234375, -11.10498046875, -10.4609375, -9.81689453125, -9.1728515625, -8.52880859375, -7.884765625, -7.24072265625, -6.5966796875, -5.95263671875, -5.30859375, -4.66455078125, -4.0205078125, -3.37646484375, -2.732421875, -2.08837890625, -1.4443359375, -0.80029296875, -0.15625, 0.48779296875, 1.1318359375, 1.77587890625, 2.419921875, 3.06396484375, 3.7080078125, 4.35205078125, 4.99609375, 5.64013671875, 6.2841796875, 6.92822265625, 7.572265625, 8.21630859375, 8.8603515625, 9.50439453125, 10.1484375, 10.79248046875, 11.4365234375, 12.08056640625, 12.724609375, 13.36865234375, 14.0126953125, 14.65673828125, 15.30078125, 15.94482421875, 16.5888671875, 17.23291015625, 17.876953125, 18.52099609375, 19.1650390625, 19.80908203125, 20.453125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 14.0, 8.0, 14.0, 10.0, 15.0, 13.0, 23.0, 29.0, 34.0, 30.0, 37.0, 40.0, 35.0, 60.0, 43.0, 51.0, 50.0, 41.0, 58.0, 55.0, 40.0, 40.0, 34.0, 34.0, 34.0, 33.0, 21.0, 25.0, 16.0, 17.0, 12.0, 5.0, 8.0, 9.0, 4.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.9130859375, -9.544921875, -9.1767578125, -8.80859375, -8.4404296875, -8.072265625, -7.7041015625, -7.3359375, -6.9677734375, -6.599609375, -6.2314453125, -5.86328125, -5.4951171875, -5.126953125, -4.7587890625, -4.390625, -4.0224609375, -3.654296875, -3.2861328125, -2.91796875, -2.5498046875, -2.181640625, -1.8134765625, -1.4453125, -1.0771484375, -0.708984375, -0.3408203125, 0.02734375, 0.3955078125, 0.763671875, 1.1318359375, 1.5, 1.8681640625, 2.236328125, 2.6044921875, 2.97265625, 3.3408203125, 3.708984375, 4.0771484375, 4.4453125, 4.8134765625, 5.181640625, 5.5498046875, 5.91796875, 6.2861328125, 6.654296875, 7.0224609375, 7.390625, 7.7587890625, 8.126953125, 8.4951171875, 8.86328125, 9.2314453125, 9.599609375, 9.9677734375, 10.3359375, 10.7041015625, 11.072265625, 11.4404296875, 11.80859375, 12.1767578125, 12.544921875, 12.9130859375, 13.28125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 5.0, 3.0, 8.0, 7.0, 12.0, 17.0, 19.0, 36.0, 47.0, 63.0, 74.0, 97.0, 150.0, 245.0, 343.0, 535.0, 934.0, 1527.0, 3360.0, 9270.0, 31511.0, 201680.0, 698369.0, 72423.0, 16589.0, 5571.0, 2415.0, 1182.0, 659.0, 447.0, 284.0, 172.0, 140.0, 98.0, 68.0, 42.0, 32.0, 32.0, 22.0, 17.0, 10.0, 4.0, 8.0, 2.0, 3.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.953125, -27.029296875, -26.10546875, -25.181640625, -24.2578125, -23.333984375, -22.41015625, -21.486328125, -20.5625, -19.638671875, -18.71484375, -17.791015625, -16.8671875, -15.943359375, -15.01953125, -14.095703125, -13.171875, -12.248046875, -11.32421875, -10.400390625, -9.4765625, -8.552734375, -7.62890625, -6.705078125, -5.78125, -4.857421875, -3.93359375, -3.009765625, -2.0859375, -1.162109375, -0.23828125, 0.685546875, 1.609375, 2.533203125, 3.45703125, 4.380859375, 5.3046875, 6.228515625, 7.15234375, 8.076171875, 9.0, 9.923828125, 10.84765625, 11.771484375, 12.6953125, 13.619140625, 14.54296875, 15.466796875, 16.390625, 17.314453125, 18.23828125, 19.162109375, 20.0859375, 21.009765625, 21.93359375, 22.857421875, 23.78125, 24.705078125, 25.62890625, 26.552734375, 27.4765625, 28.400390625, 29.32421875, 30.248046875, 31.171875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 7.0, 8.0, 14.0, 8.0, 18.0, 13.0, 17.0, 15.0, 13.0, 14.0, 31.0, 29.0, 22.0, 25.0, 30.0, 25.0, 38.0, 34.0, 30.0, 40.0, 50.0, 45.0, 42.0, 26.0, 38.0, 34.0, 40.0, 37.0, 29.0, 28.0, 22.0, 32.0, 24.0, 22.0, 15.0, 23.0, 15.0, 10.0, 7.0, 3.0, 5.0, 7.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.86328125, -5.666748046875, -5.47021484375, -5.273681640625, -5.0771484375, -4.880615234375, -4.68408203125, -4.487548828125, -4.291015625, -4.094482421875, -3.89794921875, -3.701416015625, -3.5048828125, -3.308349609375, -3.11181640625, -2.915283203125, -2.71875, -2.522216796875, -2.32568359375, -2.129150390625, -1.9326171875, -1.736083984375, -1.53955078125, -1.343017578125, -1.146484375, -0.949951171875, -0.75341796875, -0.556884765625, -0.3603515625, -0.163818359375, 0.03271484375, 0.229248046875, 0.42578125, 0.622314453125, 0.81884765625, 1.015380859375, 1.2119140625, 1.408447265625, 1.60498046875, 1.801513671875, 1.998046875, 2.194580078125, 2.39111328125, 2.587646484375, 2.7841796875, 2.980712890625, 3.17724609375, 3.373779296875, 3.5703125, 3.766845703125, 3.96337890625, 4.159912109375, 4.3564453125, 4.552978515625, 4.74951171875, 4.946044921875, 5.142578125, 5.339111328125, 5.53564453125, 5.732177734375, 5.9287109375, 6.125244140625, 6.32177734375, 6.518310546875, 6.71484375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 10.0, 7.0, 7.0, 8.0, 22.0, 27.0, 24.0, 40.0, 62.0, 97.0, 115.0, 198.0, 375.0, 635.0, 1067.0, 2334.0, 5534.0, 16475.0, 88689.0, 830597.0, 76749.0, 15334.0, 5254.0, 2262.0, 1057.0, 555.0, 362.0, 210.0, 146.0, 79.0, 53.0, 40.0, 29.0, 28.0, 17.0, 14.0, 11.0, 6.0, 6.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.140625, -21.458740234375, -20.77685546875, -20.094970703125, -19.4130859375, -18.731201171875, -18.04931640625, -17.367431640625, -16.685546875, -16.003662109375, -15.32177734375, -14.639892578125, -13.9580078125, -13.276123046875, -12.59423828125, -11.912353515625, -11.23046875, -10.548583984375, -9.86669921875, -9.184814453125, -8.5029296875, -7.821044921875, -7.13916015625, -6.457275390625, -5.775390625, -5.093505859375, -4.41162109375, -3.729736328125, -3.0478515625, -2.365966796875, -1.68408203125, -1.002197265625, -0.3203125, 0.361572265625, 1.04345703125, 1.725341796875, 2.4072265625, 3.089111328125, 3.77099609375, 4.452880859375, 5.134765625, 5.816650390625, 6.49853515625, 7.180419921875, 7.8623046875, 8.544189453125, 9.22607421875, 9.907958984375, 10.58984375, 11.271728515625, 11.95361328125, 12.635498046875, 13.3173828125, 13.999267578125, 14.68115234375, 15.363037109375, 16.044921875, 16.726806640625, 17.40869140625, 18.090576171875, 18.7724609375, 19.454345703125, 20.13623046875, 20.818115234375, 21.5]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 6.0, 6.0, 6.0, 13.0, 15.0, 12.0, 18.0, 29.0, 49.0, 62.0, 97.0, 107.0, 129.0, 132.0, 90.0, 66.0, 38.0, 33.0, 18.0, 20.0, 15.0, 9.0, 6.0, 7.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007810592651367188, -0.0007577985525131226, -0.0007345378398895264, -0.0007112771272659302, -0.000688016414642334, -0.0006647557020187378, -0.0006414949893951416, -0.0006182342767715454, -0.0005949735641479492, -0.000571712851524353, -0.0005484521389007568, -0.0005251914262771606, -0.0005019307136535645, -0.00047867000102996826, -0.00045540928840637207, -0.0004321485757827759, -0.0004088878631591797, -0.0003856271505355835, -0.0003623664379119873, -0.0003391057252883911, -0.0003158450126647949, -0.00029258430004119873, -0.00026932358741760254, -0.00024606287479400635, -0.00022280216217041016, -0.00019954144954681396, -0.00017628073692321777, -0.00015302002429962158, -0.0001297593116760254, -0.0001064985990524292, -8.323788642883301e-05, -5.9977173805236816e-05, -3.6716461181640625e-05, -1.3455748558044434e-05, 9.804964065551758e-06, 3.306567668914795e-05, 5.632638931274414e-05, 7.958710193634033e-05, 0.00010284781455993652, 0.00012610852718353271, 0.0001493692398071289, 0.0001726299524307251, 0.0001958906650543213, 0.00021915137767791748, 0.00024241209030151367, 0.00026567280292510986, 0.00028893351554870605, 0.00031219422817230225, 0.00033545494079589844, 0.00035871565341949463, 0.0003819763660430908, 0.000405237078666687, 0.0004284977912902832, 0.0004517585039138794, 0.0004750192165374756, 0.0004982799291610718, 0.000521540641784668, 0.0005448013544082642, 0.0005680620670318604, 0.0005913227796554565, 0.0006145834922790527, 0.0006378442049026489, 0.0006611049175262451, 0.0006843656301498413, 0.0007076263427734375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 5.0, 5.0, 15.0, 13.0, 17.0, 16.0, 23.0, 42.0, 50.0, 97.0, 622.0, 23149.0, 1009031.0, 14646.0, 489.0, 111.0, 44.0, 41.0, 22.0, 25.0, 15.0, 17.0, 9.0, 8.0, 5.0, 10.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.25, -57.66796875, -56.0859375, -54.50390625, -52.921875, -51.33984375, -49.7578125, -48.17578125, -46.59375, -45.01171875, -43.4296875, -41.84765625, -40.265625, -38.68359375, -37.1015625, -35.51953125, -33.9375, -32.35546875, -30.7734375, -29.19140625, -27.609375, -26.02734375, -24.4453125, -22.86328125, -21.28125, -19.69921875, -18.1171875, -16.53515625, -14.953125, -13.37109375, -11.7890625, -10.20703125, -8.625, -7.04296875, -5.4609375, -3.87890625, -2.296875, -0.71484375, 0.8671875, 2.44921875, 4.03125, 5.61328125, 7.1953125, 8.77734375, 10.359375, 11.94140625, 13.5234375, 15.10546875, 16.6875, 18.26953125, 19.8515625, 21.43359375, 23.015625, 24.59765625, 26.1796875, 27.76171875, 29.34375, 30.92578125, 32.5078125, 34.08984375, 35.671875, 37.25390625, 38.8359375, 40.41796875, 42.0]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 8.0, 10.0, 10.0, 17.0, 21.0, 19.0, 30.0, 30.0, 59.0, 71.0, 104.0, 147.0, 136.0, 68.0, 57.0, 54.0, 37.0, 24.0, 24.0, 17.0, 11.0, 9.0, 8.0, 8.0, 8.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.77734375, -2.70166015625, -2.6259765625, -2.55029296875, -2.474609375, -2.39892578125, -2.3232421875, -2.24755859375, -2.171875, -2.09619140625, -2.0205078125, -1.94482421875, -1.869140625, -1.79345703125, -1.7177734375, -1.64208984375, -1.56640625, -1.49072265625, -1.4150390625, -1.33935546875, -1.263671875, -1.18798828125, -1.1123046875, -1.03662109375, -0.9609375, -0.88525390625, -0.8095703125, -0.73388671875, -0.658203125, -0.58251953125, -0.5068359375, -0.43115234375, -0.35546875, -0.27978515625, -0.2041015625, -0.12841796875, -0.052734375, 0.02294921875, 0.0986328125, 0.17431640625, 0.25, 0.32568359375, 0.4013671875, 0.47705078125, 0.552734375, 0.62841796875, 0.7041015625, 0.77978515625, 0.85546875, 0.93115234375, 1.0068359375, 1.08251953125, 1.158203125, 1.23388671875, 1.3095703125, 1.38525390625, 1.4609375, 1.53662109375, 1.6123046875, 1.68798828125, 1.763671875, 1.83935546875, 1.9150390625, 1.99072265625, 2.06640625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 3.0, 2.0, 11.0, 9.0, 7.0, 10.0, 8.0, 11.0, 14.0, 20.0, 23.0, 23.0, 40.0, 39.0, 42.0, 47.0, 56.0, 49.0, 47.0, 57.0, 55.0, 60.0, 40.0, 43.0, 39.0, 29.0, 47.0, 25.0, 14.0, 23.0, 21.0, 18.0, 13.0, 12.0, 9.0, 8.0, 6.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.876824378967285, -9.562353134155273, -9.247881889343262, -8.933411598205566, -8.618940353393555, -8.304469108581543, -7.989997863769531, -7.675527095794678, -7.361056327819824, -7.0465850830078125, -6.732114315032959, -6.417643070220947, -6.103172302246094, -5.788701057434082, -5.47422981262207, -5.159759044647217, -4.845287799835205, -4.530816555023193, -4.21634578704834, -3.901874542236328, -3.5874037742614746, -3.272932529449463, -2.9584615230560303, -2.6439905166625977, -2.329519510269165, -2.0150485038757324, -1.7005774974822998, -1.3861063718795776, -1.071635365486145, -0.7571643590927124, -0.44269323348999023, -0.12822222709655762, 0.186248779296875, 0.5007197856903076, 0.815190851688385, 1.1296619176864624, 1.444132924079895, 1.7586039304733276, 2.07307505607605, 2.3875460624694824, 2.702017068862915, 3.0164880752563477, 3.3309590816497803, 3.645430088043213, 3.9599013328552246, 4.274372100830078, 4.58884334564209, 4.903314590454102, 5.217785358428955, 5.532256603240967, 5.84672737121582, 6.161198616027832, 6.4756693840026855, 6.790140628814697, 7.104611396789551, 7.4190826416015625, 7.733553886413574, 8.048025131225586, 8.362496376037598, 8.676966667175293, 8.991437911987305, 9.305909156799316, 9.620380401611328, 9.934850692749023, 10.249321937561035]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 10.0, 12.0, 9.0, 10.0, 16.0, 14.0, 10.0, 22.0, 32.0, 34.0, 24.0, 38.0, 38.0, 47.0, 52.0, 58.0, 48.0, 62.0, 40.0, 62.0, 42.0, 47.0, 41.0, 45.0, 34.0, 32.0, 31.0, 14.0, 15.0, 14.0, 9.0, 11.0, 13.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7036714553833, -9.322959899902344, -8.94224739074707, -8.561535835266113, -8.180824279785156, -7.800111770629883, -7.419400215148926, -7.0386881828308105, -6.657976150512695, -6.27726411819458, -5.896552085876465, -5.515840530395508, -5.135128498077393, -4.754416465759277, -4.37370491027832, -3.992992877960205, -3.61228084564209, -3.2315688133239746, -2.8508570194244385, -2.4701452255249023, -2.089433193206787, -1.7087212800979614, -1.3280093669891357, -0.9472975730895996, -0.5665855407714844, -0.1858736276626587, 0.194838285446167, 0.5755501985549927, 0.9562621116638184, 1.336974024772644, 1.7176859378814697, 2.098397731781006, 2.479109764099121, 2.8598217964172363, 3.2405335903167725, 3.6212453842163086, 4.001957416534424, 4.382669448852539, 4.763381004333496, 5.144093036651611, 5.524805068969727, 5.905517101287842, 6.286229133605957, 6.666940689086914, 7.047652721405029, 7.4283647537231445, 7.809076309204102, 8.189788818359375, 8.570500373840332, 8.951211929321289, 9.331924438476562, 9.71263599395752, 10.093347549438477, 10.47406005859375, 10.854771614074707, 11.235483169555664, 11.616195678710938, 11.996907234191895, 12.377619743347168, 12.758331298828125, 13.139043807983398, 13.519755363464355, 13.900466918945312, 14.281179428100586, 14.661890983581543]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 8.0, 10.0, 14.0, 20.0, 30.0, 57.0, 73.0, 88.0, 157.0, 255.0, 461.0, 838.0, 1653.0, 3435.0, 7406.0, 16347.0, 36645.0, 80306.0, 159395.0, 241209.0, 230051.0, 142031.0, 69645.0, 31768.0, 13968.0, 6402.0, 3033.0, 1465.0, 753.0, 402.0, 226.0, 134.0, 95.0, 59.0, 34.0, 30.0, 13.0, 8.0, 5.0, 7.0, 7.0, 1.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.359375, -13.82568359375, -13.2919921875, -12.75830078125, -12.224609375, -11.69091796875, -11.1572265625, -10.62353515625, -10.08984375, -9.55615234375, -9.0224609375, -8.48876953125, -7.955078125, -7.42138671875, -6.8876953125, -6.35400390625, -5.8203125, -5.28662109375, -4.7529296875, -4.21923828125, -3.685546875, -3.15185546875, -2.6181640625, -2.08447265625, -1.55078125, -1.01708984375, -0.4833984375, 0.05029296875, 0.583984375, 1.11767578125, 1.6513671875, 2.18505859375, 2.71875, 3.25244140625, 3.7861328125, 4.31982421875, 4.853515625, 5.38720703125, 5.9208984375, 6.45458984375, 6.98828125, 7.52197265625, 8.0556640625, 8.58935546875, 9.123046875, 9.65673828125, 10.1904296875, 10.72412109375, 11.2578125, 11.79150390625, 12.3251953125, 12.85888671875, 13.392578125, 13.92626953125, 14.4599609375, 14.99365234375, 15.52734375, 16.06103515625, 16.5947265625, 17.12841796875, 17.662109375, 18.19580078125, 18.7294921875, 19.26318359375, 19.796875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 10.0, 7.0, 9.0, 15.0, 10.0, 9.0, 18.0, 23.0, 22.0, 32.0, 39.0, 30.0, 53.0, 47.0, 46.0, 42.0, 45.0, 55.0, 57.0, 45.0, 61.0, 52.0, 43.0, 44.0, 29.0, 24.0, 18.0, 21.0, 20.0, 21.0, 13.0, 14.0, 8.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1875, -4.98333740234375, -4.7791748046875, -4.57501220703125, -4.370849609375, -4.16668701171875, -3.9625244140625, -3.75836181640625, -3.55419921875, -3.35003662109375, -3.1458740234375, -2.94171142578125, -2.737548828125, -2.53338623046875, -2.3292236328125, -2.12506103515625, -1.9208984375, -1.71673583984375, -1.5125732421875, -1.30841064453125, -1.104248046875, -0.90008544921875, -0.6959228515625, -0.49176025390625, -0.28759765625, -0.08343505859375, 0.1207275390625, 0.32489013671875, 0.529052734375, 0.73321533203125, 0.9373779296875, 1.14154052734375, 1.345703125, 1.54986572265625, 1.7540283203125, 1.95819091796875, 2.162353515625, 2.36651611328125, 2.5706787109375, 2.77484130859375, 2.97900390625, 3.18316650390625, 3.3873291015625, 3.59149169921875, 3.795654296875, 3.99981689453125, 4.2039794921875, 4.40814208984375, 4.6123046875, 4.81646728515625, 5.0206298828125, 5.22479248046875, 5.428955078125, 5.63311767578125, 5.8372802734375, 6.04144287109375, 6.24560546875, 6.44976806640625, 6.6539306640625, 6.85809326171875, 7.062255859375, 7.26641845703125, 7.4705810546875, 7.67474365234375, 7.87890625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 3.0, 5.0, 8.0, 6.0, 5.0, 13.0, 9.0, 11.0, 12.0, 16.0, 22.0, 16.0, 21.0, 22.0, 15.0, 31.0, 25.0, 38.0, 35.0, 39.0, 76.0, 713.0, 27784.0, 753059.0, 261005.0, 4916.0, 213.0, 53.0, 36.0, 31.0, 35.0, 29.0, 32.0, 25.0, 19.0, 21.0, 21.0, 10.0, 18.0, 14.0, 18.0, 19.0, 11.0, 4.0, 7.0, 7.0, 5.0, 8.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-80.0625, -77.6201171875, -75.177734375, -72.7353515625, -70.29296875, -67.8505859375, -65.408203125, -62.9658203125, -60.5234375, -58.0810546875, -55.638671875, -53.1962890625, -50.75390625, -48.3115234375, -45.869140625, -43.4267578125, -40.984375, -38.5419921875, -36.099609375, -33.6572265625, -31.21484375, -28.7724609375, -26.330078125, -23.8876953125, -21.4453125, -19.0029296875, -16.560546875, -14.1181640625, -11.67578125, -9.2333984375, -6.791015625, -4.3486328125, -1.90625, 0.5361328125, 2.978515625, 5.4208984375, 7.86328125, 10.3056640625, 12.748046875, 15.1904296875, 17.6328125, 20.0751953125, 22.517578125, 24.9599609375, 27.40234375, 29.8447265625, 32.287109375, 34.7294921875, 37.171875, 39.6142578125, 42.056640625, 44.4990234375, 46.94140625, 49.3837890625, 51.826171875, 54.2685546875, 56.7109375, 59.1533203125, 61.595703125, 64.0380859375, 66.48046875, 68.9228515625, 71.365234375, 73.8076171875, 76.25]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 9.0, 2.0, 6.0, 5.0, 10.0, 9.0, 15.0, 7.0, 10.0, 23.0, 18.0, 21.0, 23.0, 18.0, 24.0, 24.0, 30.0, 34.0, 46.0, 29.0, 33.0, 37.0, 35.0, 23.0, 36.0, 43.0, 39.0, 38.0, 29.0, 36.0, 24.0, 37.0, 22.0, 22.0, 22.0, 18.0, 20.0, 20.0, 12.0, 18.0, 18.0, 12.0, 6.0, 8.0, 8.0, 10.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0], "bins": [-6.015625, -5.841552734375, -5.66748046875, -5.493408203125, -5.3193359375, -5.145263671875, -4.97119140625, -4.797119140625, -4.623046875, -4.448974609375, -4.27490234375, -4.100830078125, -3.9267578125, -3.752685546875, -3.57861328125, -3.404541015625, -3.23046875, -3.056396484375, -2.88232421875, -2.708251953125, -2.5341796875, -2.360107421875, -2.18603515625, -2.011962890625, -1.837890625, -1.663818359375, -1.48974609375, -1.315673828125, -1.1416015625, -0.967529296875, -0.79345703125, -0.619384765625, -0.4453125, -0.271240234375, -0.09716796875, 0.076904296875, 0.2509765625, 0.425048828125, 0.59912109375, 0.773193359375, 0.947265625, 1.121337890625, 1.29541015625, 1.469482421875, 1.6435546875, 1.817626953125, 1.99169921875, 2.165771484375, 2.33984375, 2.513916015625, 2.68798828125, 2.862060546875, 3.0361328125, 3.210205078125, 3.38427734375, 3.558349609375, 3.732421875, 3.906494140625, 4.08056640625, 4.254638671875, 4.4287109375, 4.602783203125, 4.77685546875, 4.950927734375, 5.125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 6.0, 2.0, 2.0, 13.0, 8.0, 21.0, 22.0, 24.0, 41.0, 58.0, 93.0, 155.0, 208.0, 333.0, 547.0, 937.0, 1686.0, 2948.0, 6172.0, 14487.0, 40501.0, 142951.0, 564550.0, 190887.0, 49618.0, 17335.0, 7106.0, 3375.0, 1795.0, 1014.0, 590.0, 372.0, 225.0, 149.0, 94.0, 68.0, 51.0, 34.0, 11.0, 17.0, 15.0, 14.0, 8.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0], "bins": [-5.05859375, -4.912353515625, -4.76611328125, -4.619873046875, -4.4736328125, -4.327392578125, -4.18115234375, -4.034912109375, -3.888671875, -3.742431640625, -3.59619140625, -3.449951171875, -3.3037109375, -3.157470703125, -3.01123046875, -2.864990234375, -2.71875, -2.572509765625, -2.42626953125, -2.280029296875, -2.1337890625, -1.987548828125, -1.84130859375, -1.695068359375, -1.548828125, -1.402587890625, -1.25634765625, -1.110107421875, -0.9638671875, -0.817626953125, -0.67138671875, -0.525146484375, -0.37890625, -0.232666015625, -0.08642578125, 0.059814453125, 0.2060546875, 0.352294921875, 0.49853515625, 0.644775390625, 0.791015625, 0.937255859375, 1.08349609375, 1.229736328125, 1.3759765625, 1.522216796875, 1.66845703125, 1.814697265625, 1.9609375, 2.107177734375, 2.25341796875, 2.399658203125, 2.5458984375, 2.692138671875, 2.83837890625, 2.984619140625, 3.130859375, 3.277099609375, 3.42333984375, 3.569580078125, 3.7158203125, 3.862060546875, 4.00830078125, 4.154541015625, 4.30078125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 5.0, 13.0, 16.0, 30.0, 40.0, 63.0, 101.0, 125.0, 133.0, 126.0, 119.0, 64.0, 58.0, 29.0, 22.0, 10.0, 11.0, 10.0, 3.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.0008511543273925781, -0.0008321106433868408, -0.0008130669593811035, -0.0007940232753753662, -0.0007749795913696289, -0.0007559359073638916, -0.0007368922233581543, -0.000717848539352417, -0.0006988048553466797, -0.0006797611713409424, -0.0006607174873352051, -0.0006416738033294678, -0.0006226301193237305, -0.0006035864353179932, -0.0005845427513122559, -0.0005654990673065186, -0.0005464553833007812, -0.0005274116992950439, -0.0005083680152893066, -0.0004893243312835693, -0.00047028064727783203, -0.0004512369632720947, -0.0004321932792663574, -0.0004131495952606201, -0.0003941059112548828, -0.0003750622272491455, -0.0003560185432434082, -0.0003369748592376709, -0.0003179311752319336, -0.0002988874912261963, -0.000279843807220459, -0.0002608001232147217, -0.00024175643920898438, -0.00022271275520324707, -0.00020366907119750977, -0.00018462538719177246, -0.00016558170318603516, -0.00014653801918029785, -0.00012749433517456055, -0.00010845065116882324, -8.940696716308594e-05, -7.036328315734863e-05, -5.131959915161133e-05, -3.2275915145874023e-05, -1.3232231140136719e-05, 5.811452865600586e-06, 2.485513687133789e-05, 4.3898820877075195e-05, 6.29425048828125e-05, 8.19861888885498e-05, 0.00010102987289428711, 0.00012007355690002441, 0.00013911724090576172, 0.00015816092491149902, 0.00017720460891723633, 0.00019624829292297363, 0.00021529197692871094, 0.00023433566093444824, 0.00025337934494018555, 0.00027242302894592285, 0.00029146671295166016, 0.00031051039695739746, 0.00032955408096313477, 0.00034859776496887207, 0.0003676414489746094]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 8.0, 2.0, 7.0, 10.0, 12.0, 16.0, 18.0, 27.0, 38.0, 47.0, 84.0, 605.0, 40639.0, 1000544.0, 5973.0, 268.0, 64.0, 42.0, 23.0, 29.0, 13.0, 20.0, 11.0, 12.0, 9.0, 4.0, 1.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.8125, -25.013671875, -24.21484375, -23.416015625, -22.6171875, -21.818359375, -21.01953125, -20.220703125, -19.421875, -18.623046875, -17.82421875, -17.025390625, -16.2265625, -15.427734375, -14.62890625, -13.830078125, -13.03125, -12.232421875, -11.43359375, -10.634765625, -9.8359375, -9.037109375, -8.23828125, -7.439453125, -6.640625, -5.841796875, -5.04296875, -4.244140625, -3.4453125, -2.646484375, -1.84765625, -1.048828125, -0.25, 0.548828125, 1.34765625, 2.146484375, 2.9453125, 3.744140625, 4.54296875, 5.341796875, 6.140625, 6.939453125, 7.73828125, 8.537109375, 9.3359375, 10.134765625, 10.93359375, 11.732421875, 12.53125, 13.330078125, 14.12890625, 14.927734375, 15.7265625, 16.525390625, 17.32421875, 18.123046875, 18.921875, 19.720703125, 20.51953125, 21.318359375, 22.1171875, 22.916015625, 23.71484375, 24.513671875, 25.3125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 7.0, 7.0, 2.0, 11.0, 7.0, 16.0, 17.0, 20.0, 22.0, 40.0, 47.0, 54.0, 79.0, 127.0, 145.0, 97.0, 71.0, 52.0, 31.0, 32.0, 28.0, 16.0, 14.0, 14.0, 7.0, 12.0, 5.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.744140625, -1.691650390625, -1.63916015625, -1.586669921875, -1.5341796875, -1.481689453125, -1.42919921875, -1.376708984375, -1.32421875, -1.271728515625, -1.21923828125, -1.166748046875, -1.1142578125, -1.061767578125, -1.00927734375, -0.956787109375, -0.904296875, -0.851806640625, -0.79931640625, -0.746826171875, -0.6943359375, -0.641845703125, -0.58935546875, -0.536865234375, -0.484375, -0.431884765625, -0.37939453125, -0.326904296875, -0.2744140625, -0.221923828125, -0.16943359375, -0.116943359375, -0.064453125, -0.011962890625, 0.04052734375, 0.093017578125, 0.1455078125, 0.197998046875, 0.25048828125, 0.302978515625, 0.35546875, 0.407958984375, 0.46044921875, 0.512939453125, 0.5654296875, 0.617919921875, 0.67041015625, 0.722900390625, 0.775390625, 0.827880859375, 0.88037109375, 0.932861328125, 0.9853515625, 1.037841796875, 1.09033203125, 1.142822265625, 1.1953125, 1.247802734375, 1.30029296875, 1.352783203125, 1.4052734375, 1.457763671875, 1.51025390625, 1.562744140625, 1.615234375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 15.0, 16.0, 51.0, 110.0, 184.0, 179.0, 196.0, 115.0, 76.0, 40.0, 19.0, 5.0, 1.0, 3.0], "bins": [-42.20933151245117, -41.45339584350586, -40.69746017456055, -39.94152069091797, -39.185585021972656, -38.429649353027344, -37.67371368408203, -36.91777801513672, -36.161842346191406, -35.405906677246094, -34.64997100830078, -33.89403533935547, -33.13809585571289, -32.38216018676758, -31.626224517822266, -30.870288848876953, -30.114351272583008, -29.358415603637695, -28.60247802734375, -27.846542358398438, -27.090606689453125, -26.334671020507812, -25.578733444213867, -24.822797775268555, -24.06686019897461, -23.310924530029297, -22.55498695373535, -21.79905128479004, -21.043115615844727, -20.28717803955078, -19.53124237060547, -18.775306701660156, -18.019371032714844, -17.26343536376953, -16.507497787475586, -15.751562118530273, -14.995626449584961, -14.239689826965332, -13.483753204345703, -12.72781753540039, -11.971881866455078, -11.21594524383545, -10.460009574890137, -9.704072952270508, -8.948137283325195, -8.192200660705566, -7.4362640380859375, -6.680327892303467, -5.924391746520996, -5.168455600738525, -4.412519454956055, -3.656582832336426, -2.900646686553955, -2.1447105407714844, -1.3887739181518555, -0.6328377723693848, 0.12309837341308594, 0.8790346384048462, 1.6349709033966064, 2.3909072875976562, 3.146843433380127, 3.9027795791625977, 4.658716201782227, 5.414652347564697, 6.170588493347168]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 7.0, 13.0, 11.0, 8.0, 16.0, 14.0, 16.0, 18.0, 24.0, 34.0, 33.0, 39.0, 37.0, 44.0, 32.0, 35.0, 49.0, 44.0, 50.0, 71.0, 32.0, 45.0, 27.0, 26.0, 44.0, 28.0, 28.0, 32.0, 24.0, 32.0, 15.0, 14.0, 12.0, 9.0, 14.0, 4.0, 9.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.796786308288574, -9.47227954864502, -9.147773742675781, -8.823266983032227, -8.498760223388672, -8.174254417419434, -7.849747657775879, -7.525241374969482, -7.200735092163086, -6.8762288093566895, -6.551722526550293, -6.227215766906738, -5.902709484100342, -5.578203201293945, -5.253696441650391, -4.929190158843994, -4.604683876037598, -4.280177593231201, -3.9556710720062256, -3.63116455078125, -3.3066582679748535, -2.982151985168457, -2.6576454639434814, -2.333138942718506, -2.0086326599121094, -1.6841262578964233, -1.3596198558807373, -1.0351134538650513, -0.7106070518493652, -0.3861006498336792, -0.061594247817993164, 0.2629122734069824, 0.5874185562133789, 0.9119249582290649, 1.236431360244751, 1.560937762260437, 1.885444164276123, 2.2099504470825195, 2.534456968307495, 2.8589634895324707, 3.183469772338867, 3.5079760551452637, 3.8324825763702393, 4.156989097595215, 4.481495380401611, 4.806001663208008, 5.1305084228515625, 5.455014705657959, 5.7795209884643555, 6.104027271270752, 6.428533554077148, 6.753040313720703, 7.0775465965271, 7.402052879333496, 7.726559638977051, 8.051065444946289, 8.375572204589844, 8.700078964233398, 9.024584770202637, 9.349091529846191, 9.67359733581543, 9.998104095458984, 10.322610855102539, 10.647117614746094, 10.971623420715332]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 10.0, 10.0, 6.0, 11.0, 15.0, 15.0, 36.0, 51.0, 70.0, 113.0, 160.0, 311.0, 379.0, 669.0, 1119.0, 1858.0, 3159.0, 5648.0, 10391.0, 20645.0, 43949.0, 123154.0, 1322404.0, 2354990.0, 196447.0, 55253.0, 24968.0, 12549.0, 6667.0, 3780.0, 2161.0, 1306.0, 756.0, 477.0, 276.0, 182.0, 111.0, 75.0, 39.0, 33.0, 12.0, 6.0, 5.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.1484375, -14.740478515625, -14.33251953125, -13.924560546875, -13.5166015625, -13.108642578125, -12.70068359375, -12.292724609375, -11.884765625, -11.476806640625, -11.06884765625, -10.660888671875, -10.2529296875, -9.844970703125, -9.43701171875, -9.029052734375, -8.62109375, -8.213134765625, -7.80517578125, -7.397216796875, -6.9892578125, -6.581298828125, -6.17333984375, -5.765380859375, -5.357421875, -4.949462890625, -4.54150390625, -4.133544921875, -3.7255859375, -3.317626953125, -2.90966796875, -2.501708984375, -2.09375, -1.685791015625, -1.27783203125, -0.869873046875, -0.4619140625, -0.053955078125, 0.35400390625, 0.761962890625, 1.169921875, 1.577880859375, 1.98583984375, 2.393798828125, 2.8017578125, 3.209716796875, 3.61767578125, 4.025634765625, 4.43359375, 4.841552734375, 5.24951171875, 5.657470703125, 6.0654296875, 6.473388671875, 6.88134765625, 7.289306640625, 7.697265625, 8.105224609375, 8.51318359375, 8.921142578125, 9.3291015625, 9.737060546875, 10.14501953125, 10.552978515625, 10.9609375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 11.0, 8.0, 5.0, 11.0, 9.0, 13.0, 15.0, 18.0, 23.0, 16.0, 36.0, 32.0, 31.0, 43.0, 41.0, 34.0, 33.0, 52.0, 55.0, 39.0, 62.0, 41.0, 36.0, 47.0, 40.0, 33.0, 31.0, 31.0, 38.0, 22.0, 22.0, 16.0, 11.0, 6.0, 13.0, 8.0, 8.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96875, -5.7716064453125, -5.574462890625, -5.3773193359375, -5.18017578125, -4.9830322265625, -4.785888671875, -4.5887451171875, -4.3916015625, -4.1944580078125, -3.997314453125, -3.8001708984375, -3.60302734375, -3.4058837890625, -3.208740234375, -3.0115966796875, -2.814453125, -2.6173095703125, -2.420166015625, -2.2230224609375, -2.02587890625, -1.8287353515625, -1.631591796875, -1.4344482421875, -1.2373046875, -1.0401611328125, -0.843017578125, -0.6458740234375, -0.44873046875, -0.2515869140625, -0.054443359375, 0.1427001953125, 0.33984375, 0.5369873046875, 0.734130859375, 0.9312744140625, 1.12841796875, 1.3255615234375, 1.522705078125, 1.7198486328125, 1.9169921875, 2.1141357421875, 2.311279296875, 2.5084228515625, 2.70556640625, 2.9027099609375, 3.099853515625, 3.2969970703125, 3.494140625, 3.6912841796875, 3.888427734375, 4.0855712890625, 4.28271484375, 4.4798583984375, 4.677001953125, 4.8741455078125, 5.0712890625, 5.2684326171875, 5.465576171875, 5.6627197265625, 5.85986328125, 6.0570068359375, 6.254150390625, 6.4512939453125, 6.6484375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 11.0, 3.0, 8.0, 12.0, 18.0, 25.0, 27.0, 34.0, 32.0, 65.0, 76.0, 107.0, 159.0, 410.0, 8427.0, 4087088.0, 96181.0, 1003.0, 192.0, 93.0, 73.0, 62.0, 40.0, 21.0, 34.0, 15.0, 13.0, 8.0, 12.0, 12.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.6875, -96.97265625, -94.2578125, -91.54296875, -88.828125, -86.11328125, -83.3984375, -80.68359375, -77.96875, -75.25390625, -72.5390625, -69.82421875, -67.109375, -64.39453125, -61.6796875, -58.96484375, -56.25, -53.53515625, -50.8203125, -48.10546875, -45.390625, -42.67578125, -39.9609375, -37.24609375, -34.53125, -31.81640625, -29.1015625, -26.38671875, -23.671875, -20.95703125, -18.2421875, -15.52734375, -12.8125, -10.09765625, -7.3828125, -4.66796875, -1.953125, 0.76171875, 3.4765625, 6.19140625, 8.90625, 11.62109375, 14.3359375, 17.05078125, 19.765625, 22.48046875, 25.1953125, 27.91015625, 30.625, 33.33984375, 36.0546875, 38.76953125, 41.484375, 44.19921875, 46.9140625, 49.62890625, 52.34375, 55.05859375, 57.7734375, 60.48828125, 63.203125, 65.91796875, 68.6328125, 71.34765625, 74.0625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 2.0, 2.0, 7.0, 5.0, 10.0, 10.0, 19.0, 21.0, 26.0, 27.0, 38.0, 51.0, 62.0, 94.0, 116.0, 194.0, 392.0, 728.0, 914.0, 526.0, 311.0, 135.0, 88.0, 66.0, 55.0, 38.0, 29.0, 22.0, 20.0, 14.0, 6.0, 11.0, 10.0, 7.0, 7.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09765625, -3.97845458984375, -3.8592529296875, -3.74005126953125, -3.620849609375, -3.50164794921875, -3.3824462890625, -3.26324462890625, -3.14404296875, -3.02484130859375, -2.9056396484375, -2.78643798828125, -2.667236328125, -2.54803466796875, -2.4288330078125, -2.30963134765625, -2.1904296875, -2.07122802734375, -1.9520263671875, -1.83282470703125, -1.713623046875, -1.59442138671875, -1.4752197265625, -1.35601806640625, -1.23681640625, -1.11761474609375, -0.9984130859375, -0.87921142578125, -0.760009765625, -0.64080810546875, -0.5216064453125, -0.40240478515625, -0.283203125, -0.16400146484375, -0.0447998046875, 0.07440185546875, 0.193603515625, 0.31280517578125, 0.4320068359375, 0.55120849609375, 0.67041015625, 0.78961181640625, 0.9088134765625, 1.02801513671875, 1.147216796875, 1.26641845703125, 1.3856201171875, 1.50482177734375, 1.6240234375, 1.74322509765625, 1.8624267578125, 1.98162841796875, 2.100830078125, 2.22003173828125, 2.3392333984375, 2.45843505859375, 2.57763671875, 2.69683837890625, 2.8160400390625, 2.93524169921875, 3.054443359375, 3.17364501953125, 3.2928466796875, 3.41204833984375, 3.53125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 8.0, 46.0, 173.0, 366.0, 289.0, 95.0, 29.0, 11.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.152997016906738, -5.940060138702393, -4.727123260498047, -3.514186382293701, -2.3012495040893555, -1.0883126258850098, 0.12462425231933594, 1.3375616073608398, 2.5504980087280273, 3.763434886932373, 4.976371765136719, 6.1893086433410645, 7.40224552154541, 8.615182876586914, 9.828119277954102, 11.041056632995605, 12.253993034362793, 13.466930389404297, 14.679866790771484, 15.892803192138672, 17.10573959350586, 18.31867790222168, 19.531614303588867, 20.744552612304688, 21.957489013671875, 23.170425415039062, 24.38336181640625, 25.59630012512207, 26.809236526489258, 28.022172927856445, 29.235111236572266, 30.448047637939453, 31.660980224609375, 32.87391662597656, 34.08685302734375, 35.29978942871094, 36.512725830078125, 37.72566604614258, 38.938602447509766, 40.15153884887695, 41.36447525024414, 42.57741165161133, 43.790348052978516, 45.0032844543457, 46.216224670410156, 47.429161071777344, 48.64209747314453, 49.85503387451172, 51.067970275878906, 52.280906677246094, 53.49384307861328, 54.70677947998047, 55.919715881347656, 57.13265609741211, 58.3455924987793, 59.558528900146484, 60.77146530151367, 61.98440170288086, 63.19733810424805, 64.4102783203125, 65.62321472167969, 66.83615112304688, 68.04908752441406, 69.26202392578125, 70.47496032714844]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 9.0, 7.0, 3.0, 12.0, 12.0, 12.0, 12.0, 17.0, 24.0, 33.0, 32.0, 40.0, 54.0, 47.0, 44.0, 39.0, 58.0, 46.0, 52.0, 53.0, 35.0, 57.0, 42.0, 35.0, 32.0, 32.0, 33.0, 30.0, 27.0, 14.0, 15.0, 13.0, 14.0, 6.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.62014102935791, -9.318951606750488, -9.01776123046875, -8.716571807861328, -8.415382385253906, -8.114192962646484, -7.813003063201904, -7.511813163757324, -7.210623741149902, -6.9094343185424805, -6.6082444190979, -6.30705451965332, -6.005865097045898, -5.704675674438477, -5.4034857749938965, -5.102295875549316, -4.8011064529418945, -4.499917030334473, -4.198727130889893, -3.8975374698638916, -3.5963478088378906, -3.2951581478118896, -2.9939684867858887, -2.6927788257598877, -2.3915891647338867, -2.0903995037078857, -1.7892098426818848, -1.4880201816558838, -1.1868305206298828, -0.8856408596038818, -0.5844511985778809, -0.2832615375518799, 0.0179290771484375, 0.3191187381744385, 0.6203083992004395, 0.9214980602264404, 1.2226877212524414, 1.5238773822784424, 1.8250670433044434, 2.1262567043304443, 2.4274463653564453, 2.7286360263824463, 3.0298256874084473, 3.3310153484344482, 3.632205009460449, 3.93339467048645, 4.234584331512451, 4.535774230957031, 4.836963653564453, 5.138153076171875, 5.439342975616455, 5.740532875061035, 6.041722297668457, 6.342911720275879, 6.644101619720459, 6.945291519165039, 7.246480941772461, 7.547670364379883, 7.848860263824463, 8.150050163269043, 8.451239585876465, 8.752429008483887, 9.053619384765625, 9.354808807373047, 9.655998229980469]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 10.0, 6.0, 7.0, 17.0, 17.0, 23.0, 47.0, 50.0, 62.0, 80.0, 121.0, 189.0, 251.0, 437.0, 675.0, 1152.0, 2030.0, 3865.0, 7428.0, 15024.0, 30892.0, 67207.0, 155168.0, 339502.0, 236933.0, 99141.0, 44633.0, 20942.0, 10419.0, 5429.0, 2779.0, 1493.0, 915.0, 590.0, 300.0, 235.0, 142.0, 99.0, 70.0, 46.0, 32.0, 33.0, 29.0, 14.0, 10.0, 6.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.4140625, -12.046142578125, -11.67822265625, -11.310302734375, -10.9423828125, -10.574462890625, -10.20654296875, -9.838623046875, -9.470703125, -9.102783203125, -8.73486328125, -8.366943359375, -7.9990234375, -7.631103515625, -7.26318359375, -6.895263671875, -6.52734375, -6.159423828125, -5.79150390625, -5.423583984375, -5.0556640625, -4.687744140625, -4.31982421875, -3.951904296875, -3.583984375, -3.216064453125, -2.84814453125, -2.480224609375, -2.1123046875, -1.744384765625, -1.37646484375, -1.008544921875, -0.640625, -0.272705078125, 0.09521484375, 0.463134765625, 0.8310546875, 1.198974609375, 1.56689453125, 1.934814453125, 2.302734375, 2.670654296875, 3.03857421875, 3.406494140625, 3.7744140625, 4.142333984375, 4.51025390625, 4.878173828125, 5.24609375, 5.614013671875, 5.98193359375, 6.349853515625, 6.7177734375, 7.085693359375, 7.45361328125, 7.821533203125, 8.189453125, 8.557373046875, 8.92529296875, 9.293212890625, 9.6611328125, 10.029052734375, 10.39697265625, 10.764892578125, 11.1328125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 4.0, 6.0, 8.0, 8.0, 9.0, 4.0, 11.0, 20.0, 10.0, 27.0, 21.0, 35.0, 37.0, 41.0, 36.0, 38.0, 37.0, 44.0, 41.0, 46.0, 42.0, 40.0, 46.0, 53.0, 35.0, 36.0, 34.0, 33.0, 38.0, 28.0, 20.0, 17.0, 16.0, 15.0, 21.0, 16.0, 9.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4375, -7.22039794921875, -7.0032958984375, -6.78619384765625, -6.569091796875, -6.35198974609375, -6.1348876953125, -5.91778564453125, -5.70068359375, -5.48358154296875, -5.2664794921875, -5.04937744140625, -4.832275390625, -4.61517333984375, -4.3980712890625, -4.18096923828125, -3.9638671875, -3.74676513671875, -3.5296630859375, -3.31256103515625, -3.095458984375, -2.87835693359375, -2.6612548828125, -2.44415283203125, -2.22705078125, -2.00994873046875, -1.7928466796875, -1.57574462890625, -1.358642578125, -1.14154052734375, -0.9244384765625, -0.70733642578125, -0.490234375, -0.27313232421875, -0.0560302734375, 0.16107177734375, 0.378173828125, 0.59527587890625, 0.8123779296875, 1.02947998046875, 1.24658203125, 1.46368408203125, 1.6807861328125, 1.89788818359375, 2.114990234375, 2.33209228515625, 2.5491943359375, 2.76629638671875, 2.9833984375, 3.20050048828125, 3.4176025390625, 3.63470458984375, 3.851806640625, 4.06890869140625, 4.2860107421875, 4.50311279296875, 4.72021484375, 4.93731689453125, 5.1544189453125, 5.37152099609375, 5.588623046875, 5.80572509765625, 6.0228271484375, 6.23992919921875, 6.45703125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 9.0, 8.0, 11.0, 11.0, 12.0, 21.0, 29.0, 33.0, 47.0, 68.0, 115.0, 159.0, 283.0, 430.0, 734.0, 1324.0, 2637.0, 5703.0, 14457.0, 45079.0, 240578.0, 616291.0, 81513.0, 22563.0, 8418.0, 3689.0, 1804.0, 943.0, 586.0, 362.0, 217.0, 137.0, 63.0, 72.0, 40.0, 28.0, 17.0, 20.0, 11.0, 11.0, 4.0, 11.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9140625, -13.46826171875, -13.0224609375, -12.57666015625, -12.130859375, -11.68505859375, -11.2392578125, -10.79345703125, -10.34765625, -9.90185546875, -9.4560546875, -9.01025390625, -8.564453125, -8.11865234375, -7.6728515625, -7.22705078125, -6.78125, -6.33544921875, -5.8896484375, -5.44384765625, -4.998046875, -4.55224609375, -4.1064453125, -3.66064453125, -3.21484375, -2.76904296875, -2.3232421875, -1.87744140625, -1.431640625, -0.98583984375, -0.5400390625, -0.09423828125, 0.3515625, 0.79736328125, 1.2431640625, 1.68896484375, 2.134765625, 2.58056640625, 3.0263671875, 3.47216796875, 3.91796875, 4.36376953125, 4.8095703125, 5.25537109375, 5.701171875, 6.14697265625, 6.5927734375, 7.03857421875, 7.484375, 7.93017578125, 8.3759765625, 8.82177734375, 9.267578125, 9.71337890625, 10.1591796875, 10.60498046875, 11.05078125, 11.49658203125, 11.9423828125, 12.38818359375, 12.833984375, 13.27978515625, 13.7255859375, 14.17138671875, 14.6171875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 6.0, 9.0, 6.0, 10.0, 11.0, 16.0, 20.0, 24.0, 24.0, 37.0, 39.0, 29.0, 45.0, 40.0, 28.0, 47.0, 53.0, 55.0, 53.0, 57.0, 35.0, 49.0, 52.0, 38.0, 29.0, 41.0, 23.0, 23.0, 26.0, 18.0, 12.0, 8.0, 8.0, 13.0, 8.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.23828125, -6.06463623046875, -5.8909912109375, -5.71734619140625, -5.543701171875, -5.37005615234375, -5.1964111328125, -5.02276611328125, -4.84912109375, -4.67547607421875, -4.5018310546875, -4.32818603515625, -4.154541015625, -3.98089599609375, -3.8072509765625, -3.63360595703125, -3.4599609375, -3.28631591796875, -3.1126708984375, -2.93902587890625, -2.765380859375, -2.59173583984375, -2.4180908203125, -2.24444580078125, -2.07080078125, -1.89715576171875, -1.7235107421875, -1.54986572265625, -1.376220703125, -1.20257568359375, -1.0289306640625, -0.85528564453125, -0.681640625, -0.50799560546875, -0.3343505859375, -0.16070556640625, 0.012939453125, 0.18658447265625, 0.3602294921875, 0.53387451171875, 0.70751953125, 0.88116455078125, 1.0548095703125, 1.22845458984375, 1.402099609375, 1.57574462890625, 1.7493896484375, 1.92303466796875, 2.0966796875, 2.27032470703125, 2.4439697265625, 2.61761474609375, 2.791259765625, 2.96490478515625, 3.1385498046875, 3.31219482421875, 3.48583984375, 3.65948486328125, 3.8331298828125, 4.00677490234375, 4.180419921875, 4.35406494140625, 4.5277099609375, 4.70135498046875, 4.875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 9.0, 7.0, 9.0, 10.0, 18.0, 16.0, 23.0, 39.0, 52.0, 62.0, 82.0, 130.0, 165.0, 290.0, 391.0, 562.0, 927.0, 1457.0, 2344.0, 4564.0, 9069.0, 23680.0, 101806.0, 768021.0, 92838.0, 22288.0, 8739.0, 4235.0, 2402.0, 1391.0, 906.0, 611.0, 390.0, 275.0, 206.0, 127.0, 122.0, 87.0, 48.0, 42.0, 22.0, 24.0, 17.0, 14.0, 11.0, 10.0, 7.0, 6.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-14.2421875, -13.8167724609375, -13.391357421875, -12.9659423828125, -12.54052734375, -12.1151123046875, -11.689697265625, -11.2642822265625, -10.8388671875, -10.4134521484375, -9.988037109375, -9.5626220703125, -9.13720703125, -8.7117919921875, -8.286376953125, -7.8609619140625, -7.435546875, -7.0101318359375, -6.584716796875, -6.1593017578125, -5.73388671875, -5.3084716796875, -4.883056640625, -4.4576416015625, -4.0322265625, -3.6068115234375, -3.181396484375, -2.7559814453125, -2.33056640625, -1.9051513671875, -1.479736328125, -1.0543212890625, -0.62890625, -0.2034912109375, 0.221923828125, 0.6473388671875, 1.07275390625, 1.4981689453125, 1.923583984375, 2.3489990234375, 2.7744140625, 3.1998291015625, 3.625244140625, 4.0506591796875, 4.47607421875, 4.9014892578125, 5.326904296875, 5.7523193359375, 6.177734375, 6.6031494140625, 7.028564453125, 7.4539794921875, 7.87939453125, 8.3048095703125, 8.730224609375, 9.1556396484375, 9.5810546875, 10.0064697265625, 10.431884765625, 10.8572998046875, 11.28271484375, 11.7081298828125, 12.133544921875, 12.5589599609375, 12.984375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 7.0, 7.0, 6.0, 11.0, 15.0, 20.0, 21.0, 27.0, 34.0, 43.0, 48.0, 64.0, 85.0, 85.0, 111.0, 94.0, 70.0, 62.0, 41.0, 34.0, 14.0, 20.0, 13.0, 8.0, 11.0, 10.0, 5.0, 12.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00026917457580566406, -0.000260230153799057, -0.00025128573179244995, -0.0002423413097858429, -0.00023339688777923584, -0.00022445246577262878, -0.00021550804376602173, -0.00020656362175941467, -0.00019761919975280762, -0.00018867477774620056, -0.0001797303557395935, -0.00017078593373298645, -0.0001618415117263794, -0.00015289708971977234, -0.00014395266771316528, -0.00013500824570655823, -0.00012606382369995117, -0.00011711940169334412, -0.00010817497968673706, -9.923055768013e-05, -9.028613567352295e-05, -8.13417136669159e-05, -7.239729166030884e-05, -6.345286965370178e-05, -5.4508447647094727e-05, -4.556402564048767e-05, -3.6619603633880615e-05, -2.767518162727356e-05, -1.8730759620666504e-05, -9.786337614059448e-06, -8.419156074523926e-07, 8.102506399154663e-06, 1.704692840576172e-05, 2.5991350412368774e-05, 3.493577241897583e-05, 4.3880194425582886e-05, 5.282461643218994e-05, 6.1769038438797e-05, 7.071346044540405e-05, 7.965788245201111e-05, 8.860230445861816e-05, 9.754672646522522e-05, 0.00010649114847183228, 0.00011543557047843933, 0.0001243799924850464, 0.00013332441449165344, 0.0001422688364982605, 0.00015121325850486755, 0.0001601576805114746, 0.00016910210251808167, 0.00017804652452468872, 0.00018699094653129578, 0.00019593536853790283, 0.0002048797905445099, 0.00021382421255111694, 0.000222768634557724, 0.00023171305656433105, 0.0002406574785709381, 0.00024960190057754517, 0.0002585463225841522, 0.0002674907445907593, 0.00027643516659736633, 0.0002853795886039734, 0.00029432401061058044, 0.0003032684326171875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 5.0, 6.0, 8.0, 10.0, 15.0, 10.0, 20.0, 19.0, 30.0, 37.0, 32.0, 44.0, 188.0, 9659.0, 1010734.0, 27011.0, 386.0, 65.0, 30.0, 44.0, 29.0, 30.0, 23.0, 20.0, 14.0, 13.0, 6.0, 12.0, 8.0, 6.0, 10.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-54.40625, -52.7373046875, -51.068359375, -49.3994140625, -47.73046875, -46.0615234375, -44.392578125, -42.7236328125, -41.0546875, -39.3857421875, -37.716796875, -36.0478515625, -34.37890625, -32.7099609375, -31.041015625, -29.3720703125, -27.703125, -26.0341796875, -24.365234375, -22.6962890625, -21.02734375, -19.3583984375, -17.689453125, -16.0205078125, -14.3515625, -12.6826171875, -11.013671875, -9.3447265625, -7.67578125, -6.0068359375, -4.337890625, -2.6689453125, -1.0, 0.6689453125, 2.337890625, 4.0068359375, 5.67578125, 7.3447265625, 9.013671875, 10.6826171875, 12.3515625, 14.0205078125, 15.689453125, 17.3583984375, 19.02734375, 20.6962890625, 22.365234375, 24.0341796875, 25.703125, 27.3720703125, 29.041015625, 30.7099609375, 32.37890625, 34.0478515625, 35.716796875, 37.3857421875, 39.0546875, 40.7236328125, 42.392578125, 44.0615234375, 45.73046875, 47.3994140625, 49.068359375, 50.7373046875, 52.40625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 5.0, 1.0, 6.0, 1.0, 0.0, 3.0, 6.0, 7.0, 8.0, 8.0, 13.0, 11.0, 12.0, 13.0, 24.0, 27.0, 33.0, 37.0, 43.0, 70.0, 84.0, 125.0, 99.0, 83.0, 52.0, 31.0, 33.0, 31.0, 24.0, 22.0, 18.0, 13.0, 10.0, 18.0, 5.0, 6.0, 7.0, 8.0, 7.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.13671875, -2.070892333984375, -2.00506591796875, -1.939239501953125, -1.8734130859375, -1.807586669921875, -1.74176025390625, -1.675933837890625, -1.610107421875, -1.544281005859375, -1.47845458984375, -1.412628173828125, -1.3468017578125, -1.280975341796875, -1.21514892578125, -1.149322509765625, -1.08349609375, -1.017669677734375, -0.95184326171875, -0.886016845703125, -0.8201904296875, -0.754364013671875, -0.68853759765625, -0.622711181640625, -0.556884765625, -0.491058349609375, -0.42523193359375, -0.359405517578125, -0.2935791015625, -0.227752685546875, -0.16192626953125, -0.096099853515625, -0.0302734375, 0.035552978515625, 0.10137939453125, 0.167205810546875, 0.2330322265625, 0.298858642578125, 0.36468505859375, 0.430511474609375, 0.496337890625, 0.562164306640625, 0.62799072265625, 0.693817138671875, 0.7596435546875, 0.825469970703125, 0.89129638671875, 0.957122802734375, 1.02294921875, 1.088775634765625, 1.15460205078125, 1.220428466796875, 1.2862548828125, 1.352081298828125, 1.41790771484375, 1.483734130859375, 1.549560546875, 1.615386962890625, 1.68121337890625, 1.747039794921875, 1.8128662109375, 1.878692626953125, 1.94451904296875, 2.010345458984375, 2.076171875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 10.0, 20.0, 33.0, 67.0, 114.0, 171.0, 213.0, 149.0, 100.0, 53.0, 39.0, 17.0, 11.0, 12.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.236847877502441, -7.670434474945068, -7.104021072387695, -6.5376081466674805, -5.971194744110107, -5.404781341552734, -4.8383684158325195, -4.2719550132751465, -3.7055416107177734, -3.1391282081604004, -2.5727150440216064, -2.0063018798828125, -1.4398884773254395, -0.8734750747680664, -0.30706191062927246, 0.2593512535095215, 0.8257646560668945, 1.392177939414978, 1.9585912227630615, 2.5250043869018555, 3.0914177894592285, 3.6578311920166016, 4.224244117736816, 4.7906575202941895, 5.3570709228515625, 5.9234843254089355, 6.489897727966309, 7.056310653686523, 7.6227240562438965, 8.18913745880127, 8.755550384521484, 9.321964263916016, 9.888378143310547, 10.454791069030762, 11.021204948425293, 11.587617874145508, 12.154031753540039, 12.720444679260254, 13.286857604980469, 13.853271484375, 14.419684410095215, 14.98609733581543, 15.552511215209961, 16.118925094604492, 16.68533706665039, 17.251750946044922, 17.818164825439453, 18.38457679748535, 18.950990676879883, 19.517404556274414, 20.083816528320312, 20.650230407714844, 21.216644287109375, 21.783058166503906, 22.349470138549805, 22.915884017944336, 23.482295989990234, 24.048709869384766, 24.615121841430664, 25.181535720825195, 25.747949600219727, 26.314361572265625, 26.880775451660156, 27.447189331054688, 28.01360321044922]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 9.0, 11.0, 10.0, 11.0, 20.0, 16.0, 19.0, 27.0, 28.0, 45.0, 49.0, 49.0, 38.0, 50.0, 61.0, 48.0, 58.0, 50.0, 43.0, 43.0, 46.0, 37.0, 34.0, 32.0, 28.0, 25.0, 20.0, 24.0, 21.0, 9.0, 14.0, 5.0, 4.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.655970573425293, -8.387137413024902, -8.118305206298828, -7.8494720458984375, -7.580638885498047, -7.311805725097656, -7.042973041534424, -6.774140357971191, -6.505307197570801, -6.23647403717041, -5.967641353607178, -5.698808670043945, -5.429975509643555, -5.161142349243164, -4.892309665679932, -4.623476982116699, -4.354643821716309, -4.085810661315918, -3.8169779777526855, -3.548145055770874, -3.2793121337890625, -3.010479211807251, -2.7416462898254395, -2.472813367843628, -2.2039804458618164, -1.9351475238800049, -1.6663146018981934, -1.3974816799163818, -1.1286487579345703, -0.8598158359527588, -0.5909829139709473, -0.32214999198913574, -0.05331707000732422, 0.2155158519744873, 0.48434877395629883, 0.7531816959381104, 1.0220146179199219, 1.2908475399017334, 1.559680461883545, 1.8285133838653564, 2.097346305847168, 2.3661792278289795, 2.635012149810791, 2.9038450717926025, 3.172677993774414, 3.4415109157562256, 3.710343837738037, 3.9791767597198486, 4.24800968170166, 4.516842842102051, 4.785675525665283, 5.054508209228516, 5.323341369628906, 5.592174530029297, 5.861007213592529, 6.129839897155762, 6.398673057556152, 6.667506217956543, 6.936338901519775, 7.205171585083008, 7.474004745483398, 7.742837905883789, 8.01167106628418, 8.280503273010254, 8.549336433410645]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 7.0, 4.0, 11.0, 20.0, 31.0, 43.0, 45.0, 81.0, 102.0, 171.0, 223.0, 300.0, 468.0, 602.0, 866.0, 1249.0, 1985.0, 3525.0, 7869.0, 19316.0, 55051.0, 162074.0, 363804.0, 273368.0, 98031.0, 33811.0, 12554.0, 5280.0, 2598.0, 1572.0, 928.0, 706.0, 518.0, 379.0, 287.0, 195.0, 145.0, 109.0, 91.0, 42.0, 32.0, 22.0, 16.0, 9.0, 6.0, 6.0, 3.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.0625, -16.525390625, -15.98828125, -15.451171875, -14.9140625, -14.376953125, -13.83984375, -13.302734375, -12.765625, -12.228515625, -11.69140625, -11.154296875, -10.6171875, -10.080078125, -9.54296875, -9.005859375, -8.46875, -7.931640625, -7.39453125, -6.857421875, -6.3203125, -5.783203125, -5.24609375, -4.708984375, -4.171875, -3.634765625, -3.09765625, -2.560546875, -2.0234375, -1.486328125, -0.94921875, -0.412109375, 0.125, 0.662109375, 1.19921875, 1.736328125, 2.2734375, 2.810546875, 3.34765625, 3.884765625, 4.421875, 4.958984375, 5.49609375, 6.033203125, 6.5703125, 7.107421875, 7.64453125, 8.181640625, 8.71875, 9.255859375, 9.79296875, 10.330078125, 10.8671875, 11.404296875, 11.94140625, 12.478515625, 13.015625, 13.552734375, 14.08984375, 14.626953125, 15.1640625, 15.701171875, 16.23828125, 16.775390625, 17.3125]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 3.0, 9.0, 11.0, 10.0, 7.0, 9.0, 16.0, 19.0, 24.0, 27.0, 32.0, 33.0, 41.0, 54.0, 49.0, 44.0, 54.0, 55.0, 51.0, 50.0, 50.0, 48.0, 38.0, 40.0, 27.0, 32.0, 30.0, 24.0, 23.0, 23.0, 25.0, 12.0, 9.0, 10.0, 4.0, 7.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16015625, -5.9688720703125, -5.777587890625, -5.5863037109375, -5.39501953125, -5.2037353515625, -5.012451171875, -4.8211669921875, -4.6298828125, -4.4385986328125, -4.247314453125, -4.0560302734375, -3.86474609375, -3.6734619140625, -3.482177734375, -3.2908935546875, -3.099609375, -2.9083251953125, -2.717041015625, -2.5257568359375, -2.33447265625, -2.1431884765625, -1.951904296875, -1.7606201171875, -1.5693359375, -1.3780517578125, -1.186767578125, -0.9954833984375, -0.80419921875, -0.6129150390625, -0.421630859375, -0.2303466796875, -0.0390625, 0.1522216796875, 0.343505859375, 0.5347900390625, 0.72607421875, 0.9173583984375, 1.108642578125, 1.2999267578125, 1.4912109375, 1.6824951171875, 1.873779296875, 2.0650634765625, 2.25634765625, 2.4476318359375, 2.638916015625, 2.8302001953125, 3.021484375, 3.2127685546875, 3.404052734375, 3.5953369140625, 3.78662109375, 3.9779052734375, 4.169189453125, 4.3604736328125, 4.5517578125, 4.7430419921875, 4.934326171875, 5.1256103515625, 5.31689453125, 5.5081787109375, 5.699462890625, 5.8907470703125, 6.08203125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 4.0, 7.0, 15.0, 6.0, 19.0, 16.0, 37.0, 31.0, 43.0, 65.0, 71.0, 277.0, 4661.0, 989252.0, 52796.0, 832.0, 109.0, 57.0, 51.0, 45.0, 29.0, 28.0, 12.0, 14.0, 19.0, 12.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-139.0, -134.4765625, -129.953125, -125.4296875, -120.90625, -116.3828125, -111.859375, -107.3359375, -102.8125, -98.2890625, -93.765625, -89.2421875, -84.71875, -80.1953125, -75.671875, -71.1484375, -66.625, -62.1015625, -57.578125, -53.0546875, -48.53125, -44.0078125, -39.484375, -34.9609375, -30.4375, -25.9140625, -21.390625, -16.8671875, -12.34375, -7.8203125, -3.296875, 1.2265625, 5.75, 10.2734375, 14.796875, 19.3203125, 23.84375, 28.3671875, 32.890625, 37.4140625, 41.9375, 46.4609375, 50.984375, 55.5078125, 60.03125, 64.5546875, 69.078125, 73.6015625, 78.125, 82.6484375, 87.171875, 91.6953125, 96.21875, 100.7421875, 105.265625, 109.7890625, 114.3125, 118.8359375, 123.359375, 127.8828125, 132.40625, 136.9296875, 141.453125, 145.9765625, 150.5]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 5.0, 5.0, 7.0, 7.0, 8.0, 12.0, 14.0, 18.0, 30.0, 35.0, 43.0, 57.0, 69.0, 52.0, 64.0, 79.0, 88.0, 70.0, 55.0, 63.0, 50.0, 39.0, 31.0, 19.0, 19.0, 17.0, 14.0, 10.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.90625, -10.5506591796875, -10.195068359375, -9.8394775390625, -9.48388671875, -9.1282958984375, -8.772705078125, -8.4171142578125, -8.0615234375, -7.7059326171875, -7.350341796875, -6.9947509765625, -6.63916015625, -6.2835693359375, -5.927978515625, -5.5723876953125, -5.216796875, -4.8612060546875, -4.505615234375, -4.1500244140625, -3.79443359375, -3.4388427734375, -3.083251953125, -2.7276611328125, -2.3720703125, -2.0164794921875, -1.660888671875, -1.3052978515625, -0.94970703125, -0.5941162109375, -0.238525390625, 0.1170654296875, 0.47265625, 0.8282470703125, 1.183837890625, 1.5394287109375, 1.89501953125, 2.2506103515625, 2.606201171875, 2.9617919921875, 3.3173828125, 3.6729736328125, 4.028564453125, 4.3841552734375, 4.73974609375, 5.0953369140625, 5.450927734375, 5.8065185546875, 6.162109375, 6.5177001953125, 6.873291015625, 7.2288818359375, 7.58447265625, 7.9400634765625, 8.295654296875, 8.6512451171875, 9.0068359375, 9.3624267578125, 9.718017578125, 10.0736083984375, 10.42919921875, 10.7847900390625, 11.140380859375, 11.4959716796875, 11.8515625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 5.0, 11.0, 13.0, 23.0, 33.0, 50.0, 73.0, 140.0, 232.0, 525.0, 1168.0, 2690.0, 7504.0, 36187.0, 771970.0, 201046.0, 18276.0, 4868.0, 1983.0, 847.0, 405.0, 213.0, 114.0, 62.0, 37.0, 32.0, 15.0, 7.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.69140625, -7.39349365234375, -7.0955810546875, -6.79766845703125, -6.499755859375, -6.20184326171875, -5.9039306640625, -5.60601806640625, -5.30810546875, -5.01019287109375, -4.7122802734375, -4.41436767578125, -4.116455078125, -3.81854248046875, -3.5206298828125, -3.22271728515625, -2.9248046875, -2.62689208984375, -2.3289794921875, -2.03106689453125, -1.733154296875, -1.43524169921875, -1.1373291015625, -0.83941650390625, -0.54150390625, -0.24359130859375, 0.0543212890625, 0.35223388671875, 0.650146484375, 0.94805908203125, 1.2459716796875, 1.54388427734375, 1.841796875, 2.13970947265625, 2.4376220703125, 2.73553466796875, 3.033447265625, 3.33135986328125, 3.6292724609375, 3.92718505859375, 4.22509765625, 4.52301025390625, 4.8209228515625, 5.11883544921875, 5.416748046875, 5.71466064453125, 6.0125732421875, 6.31048583984375, 6.6083984375, 6.90631103515625, 7.2042236328125, 7.50213623046875, 7.800048828125, 8.09796142578125, 8.3958740234375, 8.69378662109375, 8.99169921875, 9.28961181640625, 9.5875244140625, 9.88543701171875, 10.183349609375, 10.48126220703125, 10.7791748046875, 11.07708740234375, 11.375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 1.0, 4.0, 4.0, 11.0, 7.0, 14.0, 25.0, 32.0, 44.0, 55.0, 94.0, 148.0, 192.0, 116.0, 73.0, 39.0, 30.0, 26.0, 16.0, 17.0, 13.0, 6.0, 9.0, 8.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003459453582763672, -0.0003351867198944092, -0.00032442808151245117, -0.00031366944313049316, -0.00030291080474853516, -0.00029215216636657715, -0.00028139352798461914, -0.00027063488960266113, -0.0002598762512207031, -0.0002491176128387451, -0.0002383589744567871, -0.0002276003360748291, -0.0002168416976928711, -0.00020608305931091309, -0.00019532442092895508, -0.00018456578254699707, -0.00017380714416503906, -0.00016304850578308105, -0.00015228986740112305, -0.00014153122901916504, -0.00013077259063720703, -0.00012001395225524902, -0.00010925531387329102, -9.849667549133301e-05, -8.7738037109375e-05, -7.697939872741699e-05, -6.622076034545898e-05, -5.5462121963500977e-05, -4.470348358154297e-05, -3.394484519958496e-05, -2.3186206817626953e-05, -1.2427568435668945e-05, -1.6689300537109375e-06, 9.08970832824707e-06, 1.9848346710205078e-05, 3.0606985092163086e-05, 4.1365623474121094e-05, 5.21242618560791e-05, 6.288290023803711e-05, 7.364153861999512e-05, 8.440017700195312e-05, 9.515881538391113e-05, 0.00010591745376586914, 0.00011667609214782715, 0.00012743473052978516, 0.00013819336891174316, 0.00014895200729370117, 0.00015971064567565918, 0.0001704692840576172, 0.0001812279224395752, 0.0001919865608215332, 0.0002027451992034912, 0.00021350383758544922, 0.00022426247596740723, 0.00023502111434936523, 0.00024577975273132324, 0.00025653839111328125, 0.00026729702949523926, 0.00027805566787719727, 0.0002888143062591553, 0.0002995729446411133, 0.0003103315830230713, 0.0003210902214050293, 0.0003318488597869873, 0.0003426074981689453]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 3.0, 7.0, 10.0, 12.0, 16.0, 21.0, 18.0, 53.0, 51.0, 149.0, 8284.0, 1038951.0, 734.0, 75.0, 47.0, 34.0, 27.0, 18.0, 12.0, 8.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.3125, -51.552734375, -49.79296875, -48.033203125, -46.2734375, -44.513671875, -42.75390625, -40.994140625, -39.234375, -37.474609375, -35.71484375, -33.955078125, -32.1953125, -30.435546875, -28.67578125, -26.916015625, -25.15625, -23.396484375, -21.63671875, -19.876953125, -18.1171875, -16.357421875, -14.59765625, -12.837890625, -11.078125, -9.318359375, -7.55859375, -5.798828125, -4.0390625, -2.279296875, -0.51953125, 1.240234375, 3.0, 4.759765625, 6.51953125, 8.279296875, 10.0390625, 11.798828125, 13.55859375, 15.318359375, 17.078125, 18.837890625, 20.59765625, 22.357421875, 24.1171875, 25.876953125, 27.63671875, 29.396484375, 31.15625, 32.916015625, 34.67578125, 36.435546875, 38.1953125, 39.955078125, 41.71484375, 43.474609375, 45.234375, 46.994140625, 48.75390625, 50.513671875, 52.2734375, 54.033203125, 55.79296875, 57.552734375, 59.3125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 3.0, 7.0, 10.0, 12.0, 18.0, 18.0, 23.0, 48.0, 46.0, 85.0, 141.0, 235.0, 111.0, 71.0, 48.0, 35.0, 28.0, 20.0, 9.0, 12.0, 2.0, 5.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.43359375, -3.320281982421875, -3.20697021484375, -3.093658447265625, -2.9803466796875, -2.867034912109375, -2.75372314453125, -2.640411376953125, -2.527099609375, -2.413787841796875, -2.30047607421875, -2.187164306640625, -2.0738525390625, -1.960540771484375, -1.84722900390625, -1.733917236328125, -1.62060546875, -1.507293701171875, -1.39398193359375, -1.280670166015625, -1.1673583984375, -1.054046630859375, -0.94073486328125, -0.827423095703125, -0.714111328125, -0.600799560546875, -0.48748779296875, -0.374176025390625, -0.2608642578125, -0.147552490234375, -0.03424072265625, 0.079071044921875, 0.1923828125, 0.305694580078125, 0.41900634765625, 0.532318115234375, 0.6456298828125, 0.758941650390625, 0.87225341796875, 0.985565185546875, 1.098876953125, 1.212188720703125, 1.32550048828125, 1.438812255859375, 1.5521240234375, 1.665435791015625, 1.77874755859375, 1.892059326171875, 2.00537109375, 2.118682861328125, 2.23199462890625, 2.345306396484375, 2.4586181640625, 2.571929931640625, 2.68524169921875, 2.798553466796875, 2.911865234375, 3.025177001953125, 3.13848876953125, 3.251800537109375, 3.3651123046875, 3.478424072265625, 3.59173583984375, 3.705047607421875, 3.818359375]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 163.0, 786.0, 64.0], "bins": [-167.507080078125, -164.82371520996094, -162.14035034179688, -159.45697021484375, -156.7736053466797, -154.09024047851562, -151.40687561035156, -148.7235107421875, -146.04014587402344, -143.35678100585938, -140.6734161376953, -137.99005126953125, -135.30667114257812, -132.62330627441406, -129.93994140625, -127.25657653808594, -124.57319641113281, -121.88983154296875, -119.20645904541016, -116.5230941772461, -113.83972930908203, -111.15635681152344, -108.47299194335938, -105.78962707519531, -103.10626220703125, -100.42289733886719, -97.7395248413086, -95.05615997314453, -92.37279510498047, -89.68942260742188, -87.00605773925781, -84.32269287109375, -81.63932037353516, -78.9559555053711, -76.2725830078125, -73.58921813964844, -70.90585327148438, -68.22248077392578, -65.53911590576172, -62.85574722290039, -60.17238235473633, -57.489013671875, -54.80564880371094, -52.12228012084961, -49.43891143798828, -46.75554656982422, -44.07217788696289, -41.38880920410156, -38.7054443359375, -36.02207565307617, -33.33871078491211, -30.65534210205078, -27.971973419189453, -25.288606643676758, -22.605239868164062, -19.921871185302734, -17.23850440979004, -14.555136680603027, -11.871768951416016, -9.18840217590332, -6.505034446716309, -3.821666717529297, -1.1382999420166016, 1.5450687408447266, 4.22843599319458]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 15.0, 18.0, 25.0, 36.0, 62.0, 78.0, 57.0, 98.0, 88.0, 93.0, 79.0, 87.0, 86.0, 60.0, 42.0, 32.0, 13.0, 22.0, 10.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.20122718811035, -16.676685333251953, -16.152143478393555, -15.62760066986084, -15.103058815002441, -14.578516960144043, -14.053974151611328, -13.52943229675293, -13.004890441894531, -12.480348587036133, -11.955806732177734, -11.43126392364502, -10.906722068786621, -10.382180213928223, -9.857637405395508, -9.33309555053711, -8.808553695678711, -8.284011840820312, -7.759469509124756, -7.234927177429199, -6.710385322570801, -6.185843467712402, -5.661301136016846, -5.136758804321289, -4.612216949462891, -4.087675094604492, -3.5631327629089355, -3.038590669631958, -2.5140485763549805, -1.989506483078003, -1.4649643898010254, -0.9404222965240479, -0.4158802032470703, 0.10866189002990723, 0.6332039833068848, 1.1577460765838623, 1.6822881698608398, 2.2068302631378174, 2.731372356414795, 3.2559144496917725, 3.78045654296875, 4.304998397827148, 4.829540729522705, 5.354083061218262, 5.87862491607666, 6.403166770935059, 6.927709102630615, 7.452251434326172, 7.97679328918457, 8.501335144042969, 9.025876998901367, 9.550419807434082, 10.07496166229248, 10.599503517150879, 11.124046325683594, 11.648588180541992, 12.17313003540039, 12.697671890258789, 13.222213745117188, 13.746756553649902, 14.2712984085083, 14.7958402633667, 15.320383071899414, 15.844924926757812, 16.36946678161621]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 0.0, 4.0, 6.0, 3.0, 2.0, 10.0, 17.0, 19.0, 27.0, 22.0, 39.0, 58.0, 83.0, 91.0, 149.0, 252.0, 321.0, 430.0, 603.0, 880.0, 1190.0, 1791.0, 2566.0, 3983.0, 6264.0, 10499.0, 21431.0, 83950.0, 730436.0, 2363999.0, 821678.0, 91093.0, 21882.0, 11204.0, 6575.0, 4088.0, 2800.0, 1865.0, 1261.0, 826.0, 578.0, 425.0, 275.0, 162.0, 161.0, 97.0, 68.0, 40.0, 25.0, 18.0, 17.0, 6.0, 7.0, 6.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0], "bins": [-7.35546875, -7.1361083984375, -6.916748046875, -6.6973876953125, -6.47802734375, -6.2586669921875, -6.039306640625, -5.8199462890625, -5.6005859375, -5.3812255859375, -5.161865234375, -4.9425048828125, -4.72314453125, -4.5037841796875, -4.284423828125, -4.0650634765625, -3.845703125, -3.6263427734375, -3.406982421875, -3.1876220703125, -2.96826171875, -2.7489013671875, -2.529541015625, -2.3101806640625, -2.0908203125, -1.8714599609375, -1.652099609375, -1.4327392578125, -1.21337890625, -0.9940185546875, -0.774658203125, -0.5552978515625, -0.3359375, -0.1165771484375, 0.102783203125, 0.3221435546875, 0.54150390625, 0.7608642578125, 0.980224609375, 1.1995849609375, 1.4189453125, 1.6383056640625, 1.857666015625, 2.0770263671875, 2.29638671875, 2.5157470703125, 2.735107421875, 2.9544677734375, 3.173828125, 3.3931884765625, 3.612548828125, 3.8319091796875, 4.05126953125, 4.2706298828125, 4.489990234375, 4.7093505859375, 4.9287109375, 5.1480712890625, 5.367431640625, 5.5867919921875, 5.80615234375, 6.0255126953125, 6.244873046875, 6.4642333984375, 6.68359375]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 7.0, 6.0, 11.0, 16.0, 16.0, 14.0, 22.0, 34.0, 37.0, 40.0, 26.0, 41.0, 38.0, 42.0, 48.0, 42.0, 50.0, 48.0, 52.0, 35.0, 38.0, 36.0, 39.0, 37.0, 39.0, 28.0, 24.0, 30.0, 21.0, 14.0, 12.0, 9.0, 8.0, 11.0, 11.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.54156494140625, -4.3800048828125, -4.21844482421875, -4.056884765625, -3.89532470703125, -3.7337646484375, -3.57220458984375, -3.41064453125, -3.24908447265625, -3.0875244140625, -2.92596435546875, -2.764404296875, -2.60284423828125, -2.4412841796875, -2.27972412109375, -2.1181640625, -1.95660400390625, -1.7950439453125, -1.63348388671875, -1.471923828125, -1.31036376953125, -1.1488037109375, -0.98724365234375, -0.82568359375, -0.66412353515625, -0.5025634765625, -0.34100341796875, -0.179443359375, -0.01788330078125, 0.1436767578125, 0.30523681640625, 0.466796875, 0.62835693359375, 0.7899169921875, 0.95147705078125, 1.113037109375, 1.27459716796875, 1.4361572265625, 1.59771728515625, 1.75927734375, 1.92083740234375, 2.0823974609375, 2.24395751953125, 2.405517578125, 2.56707763671875, 2.7286376953125, 2.89019775390625, 3.0517578125, 3.21331787109375, 3.3748779296875, 3.53643798828125, 3.697998046875, 3.85955810546875, 4.0211181640625, 4.18267822265625, 4.34423828125, 4.50579833984375, 4.6673583984375, 4.82891845703125, 4.990478515625, 5.15203857421875, 5.3135986328125, 5.47515869140625, 5.63671875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 3.0, 6.0, 5.0, 6.0, 8.0, 12.0, 12.0, 18.0, 20.0, 21.0, 51.0, 69.0, 121.0, 210.0, 527.0, 5778.0, 4162607.0, 23233.0, 816.0, 311.0, 171.0, 78.0, 49.0, 41.0, 25.0, 22.0, 14.0, 8.0, 7.0, 7.0, 2.0, 6.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-69.25, -67.40966796875, -65.5693359375, -63.72900390625, -61.888671875, -60.04833984375, -58.2080078125, -56.36767578125, -54.52734375, -52.68701171875, -50.8466796875, -49.00634765625, -47.166015625, -45.32568359375, -43.4853515625, -41.64501953125, -39.8046875, -37.96435546875, -36.1240234375, -34.28369140625, -32.443359375, -30.60302734375, -28.7626953125, -26.92236328125, -25.08203125, -23.24169921875, -21.4013671875, -19.56103515625, -17.720703125, -15.88037109375, -14.0400390625, -12.19970703125, -10.359375, -8.51904296875, -6.6787109375, -4.83837890625, -2.998046875, -1.15771484375, 0.6826171875, 2.52294921875, 4.36328125, 6.20361328125, 8.0439453125, 9.88427734375, 11.724609375, 13.56494140625, 15.4052734375, 17.24560546875, 19.0859375, 20.92626953125, 22.7666015625, 24.60693359375, 26.447265625, 28.28759765625, 30.1279296875, 31.96826171875, 33.80859375, 35.64892578125, 37.4892578125, 39.32958984375, 41.169921875, 43.01025390625, 44.8505859375, 46.69091796875, 48.53125]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 9.0, 6.0, 9.0, 11.0, 12.0, 18.0, 23.0, 23.0, 60.0, 77.0, 136.0, 255.0, 418.0, 693.0, 787.0, 603.0, 388.0, 206.0, 92.0, 61.0, 46.0, 35.0, 20.0, 14.0, 19.0, 8.0, 5.0, 7.0, 3.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.68359375, -2.609375, -2.53515625, -2.4609375, -2.38671875, -2.3125, -2.23828125, -2.1640625, -2.08984375, -2.015625, -1.94140625, -1.8671875, -1.79296875, -1.71875, -1.64453125, -1.5703125, -1.49609375, -1.421875, -1.34765625, -1.2734375, -1.19921875, -1.125, -1.05078125, -0.9765625, -0.90234375, -0.828125, -0.75390625, -0.6796875, -0.60546875, -0.53125, -0.45703125, -0.3828125, -0.30859375, -0.234375, -0.16015625, -0.0859375, -0.01171875, 0.0625, 0.13671875, 0.2109375, 0.28515625, 0.359375, 0.43359375, 0.5078125, 0.58203125, 0.65625, 0.73046875, 0.8046875, 0.87890625, 0.953125, 1.02734375, 1.1015625, 1.17578125, 1.25, 1.32421875, 1.3984375, 1.47265625, 1.546875, 1.62109375, 1.6953125, 1.76953125, 1.84375, 1.91796875, 1.9921875, 2.06640625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 3.0, 19.0, 137.0, 498.0, 322.0, 33.0, 9.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.020809173583984, -3.991067886352539, -2.961326837539673, -1.9315857887268066, -0.9018445014953613, 0.12789678573608398, 1.157637596130371, 2.1873788833618164, 3.2171201705932617, 4.246861457824707, 5.276602745056152, 6.3063435554504395, 7.336084842681885, 8.365825653076172, 9.395566940307617, 10.425308227539062, 11.455049514770508, 12.484790802001953, 13.514532089233398, 14.544273376464844, 15.574014663696289, 16.603755950927734, 17.633495330810547, 18.663238525390625, 19.692977905273438, 20.722719192504883, 21.752460479736328, 22.782201766967773, 23.81194305419922, 24.841684341430664, 25.87142562866211, 26.901165008544922, 27.930908203125, 28.960649490356445, 29.99039077758789, 31.020132064819336, 32.04987335205078, 33.079612731933594, 34.10935592651367, 35.139095306396484, 36.16883850097656, 37.198577880859375, 38.22832107543945, 39.258060455322266, 40.287803649902344, 41.317543029785156, 42.347286224365234, 43.37702560424805, 44.406768798828125, 45.43650817871094, 46.466251373291016, 47.49599075317383, 48.525733947753906, 49.55547332763672, 50.5852165222168, 51.61495590209961, 52.64469528198242, 53.674434661865234, 54.70417785644531, 55.733917236328125, 56.7636604309082, 57.793399810791016, 58.823143005371094, 59.852882385253906, 60.882625579833984]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 5.0, 4.0, 1.0, 9.0, 12.0, 11.0, 13.0, 14.0, 22.0, 18.0, 20.0, 17.0, 29.0, 28.0, 29.0, 28.0, 35.0, 27.0, 45.0, 39.0, 42.0, 40.0, 24.0, 46.0, 39.0, 42.0, 29.0, 33.0, 34.0, 25.0, 21.0, 25.0, 22.0, 31.0, 23.0, 16.0, 23.0, 13.0, 16.0, 14.0, 7.0, 6.0, 9.0, 6.0, 6.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-4.865946292877197, -4.717266082763672, -4.568586349487305, -4.419906139373779, -4.271225929260254, -4.122546195983887, -3.9738659858703613, -3.825185775756836, -3.6765058040618896, -3.5278258323669434, -3.379145622253418, -3.2304656505584717, -3.0817856788635254, -2.93310546875, -2.7844254970550537, -2.6357455253601074, -2.487065315246582, -2.3383853435516357, -2.1897051334381104, -2.041025161743164, -1.8923450708389282, -1.7436649799346924, -1.594985008239746, -1.4463049173355103, -1.2976248264312744, -1.1489447355270386, -1.0002646446228027, -0.8515846729278564, -0.7029045820236206, -0.5542244911193848, -0.4055444598197937, -0.25686442852020264, -0.108184814453125, 0.04049524664878845, 0.1891753077507019, 0.33785536885261536, 0.4865354299545288, 0.6352155208587646, 0.7838955521583557, 0.9325755834579468, 1.0812556743621826, 1.2299357652664185, 1.3786158561706543, 1.5272958278656006, 1.6759759187698364, 1.8246560096740723, 1.9733359813690186, 2.122015953063965, 2.2706961631774902, 2.4193761348724365, 2.568056344985962, 2.716736316680908, 2.8654165267944336, 3.01409649848938, 3.162776470184326, 3.3114566802978516, 3.460136651992798, 3.608816623687744, 3.7574968338012695, 3.906176805496216, 4.054856777191162, 4.2035369873046875, 4.352217197418213, 4.50089693069458, 4.6495771408081055]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 7.0, 4.0, 5.0, 7.0, 13.0, 17.0, 32.0, 34.0, 41.0, 74.0, 100.0, 129.0, 170.0, 217.0, 358.0, 503.0, 806.0, 1104.0, 1707.0, 2733.0, 4378.0, 7210.0, 12742.0, 23665.0, 48926.0, 116928.0, 307013.0, 301179.0, 114757.0, 48145.0, 23342.0, 12587.0, 7320.0, 4346.0, 2652.0, 1712.0, 1151.0, 759.0, 491.0, 348.0, 252.0, 192.0, 123.0, 74.0, 59.0, 41.0, 27.0, 32.0, 10.0, 15.0, 4.0, 7.0, 10.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.1484375, -7.885498046875, -7.62255859375, -7.359619140625, -7.0966796875, -6.833740234375, -6.57080078125, -6.307861328125, -6.044921875, -5.781982421875, -5.51904296875, -5.256103515625, -4.9931640625, -4.730224609375, -4.46728515625, -4.204345703125, -3.94140625, -3.678466796875, -3.41552734375, -3.152587890625, -2.8896484375, -2.626708984375, -2.36376953125, -2.100830078125, -1.837890625, -1.574951171875, -1.31201171875, -1.049072265625, -0.7861328125, -0.523193359375, -0.26025390625, 0.002685546875, 0.265625, 0.528564453125, 0.79150390625, 1.054443359375, 1.3173828125, 1.580322265625, 1.84326171875, 2.106201171875, 2.369140625, 2.632080078125, 2.89501953125, 3.157958984375, 3.4208984375, 3.683837890625, 3.94677734375, 4.209716796875, 4.47265625, 4.735595703125, 4.99853515625, 5.261474609375, 5.5244140625, 5.787353515625, 6.05029296875, 6.313232421875, 6.576171875, 6.839111328125, 7.10205078125, 7.364990234375, 7.6279296875, 7.890869140625, 8.15380859375, 8.416748046875, 8.6796875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 9.0, 11.0, 20.0, 15.0, 22.0, 24.0, 25.0, 18.0, 28.0, 35.0, 32.0, 36.0, 36.0, 43.0, 32.0, 38.0, 42.0, 52.0, 35.0, 41.0, 34.0, 30.0, 40.0, 39.0, 25.0, 31.0, 23.0, 22.0, 21.0, 28.0, 21.0, 15.0, 12.0, 13.0, 13.0, 4.0, 1.0, 9.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-3.5390625, -3.433013916015625, -3.32696533203125, -3.220916748046875, -3.1148681640625, -3.008819580078125, -2.90277099609375, -2.796722412109375, -2.690673828125, -2.584625244140625, -2.47857666015625, -2.372528076171875, -2.2664794921875, -2.160430908203125, -2.05438232421875, -1.948333740234375, -1.84228515625, -1.736236572265625, -1.63018798828125, -1.524139404296875, -1.4180908203125, -1.312042236328125, -1.20599365234375, -1.099945068359375, -0.993896484375, -0.887847900390625, -0.78179931640625, -0.675750732421875, -0.5697021484375, -0.463653564453125, -0.35760498046875, -0.251556396484375, -0.1455078125, -0.039459228515625, 0.06658935546875, 0.172637939453125, 0.2786865234375, 0.384735107421875, 0.49078369140625, 0.596832275390625, 0.702880859375, 0.808929443359375, 0.91497802734375, 1.021026611328125, 1.1270751953125, 1.233123779296875, 1.33917236328125, 1.445220947265625, 1.55126953125, 1.657318115234375, 1.76336669921875, 1.869415283203125, 1.9754638671875, 2.081512451171875, 2.18756103515625, 2.293609619140625, 2.399658203125, 2.505706787109375, 2.61175537109375, 2.717803955078125, 2.8238525390625, 2.929901123046875, 3.03594970703125, 3.141998291015625, 3.248046875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 5.0, 8.0, 10.0, 10.0, 16.0, 18.0, 23.0, 27.0, 64.0, 86.0, 88.0, 135.0, 183.0, 250.0, 344.0, 493.0, 717.0, 1068.0, 1516.0, 2483.0, 4025.0, 6992.0, 13286.0, 29216.0, 81478.0, 415863.0, 357435.0, 74058.0, 27413.0, 12745.0, 6844.0, 3955.0, 2475.0, 1565.0, 1120.0, 750.0, 522.0, 341.0, 247.0, 163.0, 152.0, 87.0, 73.0, 56.0, 39.0, 32.0, 19.0, 19.0, 14.0, 16.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0], "bins": [-6.62890625, -6.4337158203125, -6.238525390625, -6.0433349609375, -5.84814453125, -5.6529541015625, -5.457763671875, -5.2625732421875, -5.0673828125, -4.8721923828125, -4.677001953125, -4.4818115234375, -4.28662109375, -4.0914306640625, -3.896240234375, -3.7010498046875, -3.505859375, -3.3106689453125, -3.115478515625, -2.9202880859375, -2.72509765625, -2.5299072265625, -2.334716796875, -2.1395263671875, -1.9443359375, -1.7491455078125, -1.553955078125, -1.3587646484375, -1.16357421875, -0.9683837890625, -0.773193359375, -0.5780029296875, -0.3828125, -0.1876220703125, 0.007568359375, 0.2027587890625, 0.39794921875, 0.5931396484375, 0.788330078125, 0.9835205078125, 1.1787109375, 1.3739013671875, 1.569091796875, 1.7642822265625, 1.95947265625, 2.1546630859375, 2.349853515625, 2.5450439453125, 2.740234375, 2.9354248046875, 3.130615234375, 3.3258056640625, 3.52099609375, 3.7161865234375, 3.911376953125, 4.1065673828125, 4.3017578125, 4.4969482421875, 4.692138671875, 4.8873291015625, 5.08251953125, 5.2777099609375, 5.472900390625, 5.6680908203125, 5.86328125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 5.0, 6.0, 9.0, 10.0, 13.0, 15.0, 13.0, 22.0, 22.0, 33.0, 29.0, 35.0, 27.0, 30.0, 34.0, 45.0, 33.0, 47.0, 41.0, 60.0, 40.0, 45.0, 32.0, 25.0, 36.0, 35.0, 30.0, 27.0, 23.0, 28.0, 21.0, 21.0, 10.0, 21.0, 13.0, 11.0, 10.0, 5.0, 8.0, 6.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.39453125, -2.318450927734375, -2.24237060546875, -2.166290283203125, -2.0902099609375, -2.014129638671875, -1.93804931640625, -1.861968994140625, -1.785888671875, -1.709808349609375, -1.63372802734375, -1.557647705078125, -1.4815673828125, -1.405487060546875, -1.32940673828125, -1.253326416015625, -1.17724609375, -1.101165771484375, -1.02508544921875, -0.949005126953125, -0.8729248046875, -0.796844482421875, -0.72076416015625, -0.644683837890625, -0.568603515625, -0.492523193359375, -0.41644287109375, -0.340362548828125, -0.2642822265625, -0.188201904296875, -0.11212158203125, -0.036041259765625, 0.0400390625, 0.116119384765625, 0.19219970703125, 0.268280029296875, 0.3443603515625, 0.420440673828125, 0.49652099609375, 0.572601318359375, 0.648681640625, 0.724761962890625, 0.80084228515625, 0.876922607421875, 0.9530029296875, 1.029083251953125, 1.10516357421875, 1.181243896484375, 1.25732421875, 1.333404541015625, 1.40948486328125, 1.485565185546875, 1.5616455078125, 1.637725830078125, 1.71380615234375, 1.789886474609375, 1.865966796875, 1.942047119140625, 2.01812744140625, 2.094207763671875, 2.1702880859375, 2.246368408203125, 2.32244873046875, 2.398529052734375, 2.474609375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 3.0, 4.0, 5.0, 1.0, 7.0, 14.0, 18.0, 24.0, 33.0, 45.0, 43.0, 75.0, 105.0, 153.0, 230.0, 357.0, 610.0, 1162.0, 2407.0, 5542.0, 17898.0, 133113.0, 842099.0, 29620.0, 8125.0, 3268.0, 1393.0, 799.0, 450.0, 317.0, 195.0, 124.0, 77.0, 53.0, 51.0, 37.0, 24.0, 17.0, 10.0, 18.0, 7.0, 4.0, 4.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.9453125, -11.573974609375, -11.20263671875, -10.831298828125, -10.4599609375, -10.088623046875, -9.71728515625, -9.345947265625, -8.974609375, -8.603271484375, -8.23193359375, -7.860595703125, -7.4892578125, -7.117919921875, -6.74658203125, -6.375244140625, -6.00390625, -5.632568359375, -5.26123046875, -4.889892578125, -4.5185546875, -4.147216796875, -3.77587890625, -3.404541015625, -3.033203125, -2.661865234375, -2.29052734375, -1.919189453125, -1.5478515625, -1.176513671875, -0.80517578125, -0.433837890625, -0.0625, 0.308837890625, 0.68017578125, 1.051513671875, 1.4228515625, 1.794189453125, 2.16552734375, 2.536865234375, 2.908203125, 3.279541015625, 3.65087890625, 4.022216796875, 4.3935546875, 4.764892578125, 5.13623046875, 5.507568359375, 5.87890625, 6.250244140625, 6.62158203125, 6.992919921875, 7.3642578125, 7.735595703125, 8.10693359375, 8.478271484375, 8.849609375, 9.220947265625, 9.59228515625, 9.963623046875, 10.3349609375, 10.706298828125, 11.07763671875, 11.448974609375, 11.8203125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 8.0, 6.0, 7.0, 13.0, 14.0, 21.0, 37.0, 51.0, 70.0, 114.0, 175.0, 172.0, 97.0, 63.0, 50.0, 23.0, 24.0, 15.0, 10.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012922286987304688, -0.00012274086475372314, -0.00011625885963439941, -0.00010977685451507568, -0.00010329484939575195, -9.681284427642822e-05, -9.033083915710449e-05, -8.384883403778076e-05, -7.736682891845703e-05, -7.08848237991333e-05, -6.440281867980957e-05, -5.792081356048584e-05, -5.143880844116211e-05, -4.495680332183838e-05, -3.847479820251465e-05, -3.199279308319092e-05, -2.5510787963867188e-05, -1.9028782844543457e-05, -1.2546777725219727e-05, -6.064772605895996e-06, 4.172325134277344e-07, 6.899237632751465e-06, 1.3381242752075195e-05, 1.9863247871398926e-05, 2.6345252990722656e-05, 3.282725811004639e-05, 3.930926322937012e-05, 4.579126834869385e-05, 5.227327346801758e-05, 5.875527858734131e-05, 6.523728370666504e-05, 7.171928882598877e-05, 7.82012939453125e-05, 8.468329906463623e-05, 9.116530418395996e-05, 9.764730930328369e-05, 0.00010412931442260742, 0.00011061131954193115, 0.00011709332466125488, 0.0001235753297805786, 0.00013005733489990234, 0.00013653934001922607, 0.0001430213451385498, 0.00014950335025787354, 0.00015598535537719727, 0.000162467360496521, 0.00016894936561584473, 0.00017543137073516846, 0.0001819133758544922, 0.00018839538097381592, 0.00019487738609313965, 0.00020135939121246338, 0.0002078413963317871, 0.00021432340145111084, 0.00022080540657043457, 0.0002272874116897583, 0.00023376941680908203, 0.00024025142192840576, 0.0002467334270477295, 0.0002532154321670532, 0.00025969743728637695, 0.0002661794424057007, 0.0002726614475250244, 0.00027914345264434814, 0.0002856254577636719]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 9.0, 12.0, 20.0, 158.0, 8748.0, 1038796.0, 685.0, 56.0, 16.0, 8.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-359.75, -350.09375, -340.4375, -330.78125, -321.125, -311.46875, -301.8125, -292.15625, -282.5, -272.84375, -263.1875, -253.53125, -243.875, -234.21875, -224.5625, -214.90625, -205.25, -195.59375, -185.9375, -176.28125, -166.625, -156.96875, -147.3125, -137.65625, -128.0, -118.34375, -108.6875, -99.03125, -89.375, -79.71875, -70.0625, -60.40625, -50.75, -41.09375, -31.4375, -21.78125, -12.125, -2.46875, 7.1875, 16.84375, 26.5, 36.15625, 45.8125, 55.46875, 65.125, 74.78125, 84.4375, 94.09375, 103.75, 113.40625, 123.0625, 132.71875, 142.375, 152.03125, 161.6875, 171.34375, 181.0, 190.65625, 200.3125, 209.96875, 219.625, 229.28125, 238.9375, 248.59375, 258.25]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 1.0, 2.0, 4.0, 5.0, 6.0, 11.0, 11.0, 19.0, 56.0, 153.0, 578.0, 63.0, 31.0, 17.0, 7.0, 5.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.0, -9.73126220703125, -9.4625244140625, -9.19378662109375, -8.925048828125, -8.65631103515625, -8.3875732421875, -8.11883544921875, -7.85009765625, -7.58135986328125, -7.3126220703125, -7.04388427734375, -6.775146484375, -6.50640869140625, -6.2376708984375, -5.96893310546875, -5.7001953125, -5.43145751953125, -5.1627197265625, -4.89398193359375, -4.625244140625, -4.35650634765625, -4.0877685546875, -3.81903076171875, -3.55029296875, -3.28155517578125, -3.0128173828125, -2.74407958984375, -2.475341796875, -2.20660400390625, -1.9378662109375, -1.66912841796875, -1.400390625, -1.13165283203125, -0.8629150390625, -0.59417724609375, -0.325439453125, -0.05670166015625, 0.2120361328125, 0.48077392578125, 0.74951171875, 1.01824951171875, 1.2869873046875, 1.55572509765625, 1.824462890625, 2.09320068359375, 2.3619384765625, 2.63067626953125, 2.8994140625, 3.16815185546875, 3.4368896484375, 3.70562744140625, 3.974365234375, 4.24310302734375, 4.5118408203125, 4.78057861328125, 5.04931640625, 5.31805419921875, 5.5867919921875, 5.85552978515625, 6.124267578125, 6.39300537109375, 6.6617431640625, 6.93048095703125, 7.19921875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 17.0, 28.0, 93.0, 220.0, 327.0, 163.0, 72.0, 36.0, 21.0, 13.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-28.747377395629883, -28.16642189025879, -27.585466384887695, -27.00450897216797, -26.423553466796875, -25.84259796142578, -25.261642456054688, -24.680686950683594, -24.0997314453125, -23.518775939941406, -22.937820434570312, -22.356863021850586, -21.775907516479492, -21.1949520111084, -20.613996505737305, -20.03304100036621, -19.452083587646484, -18.87112808227539, -18.290172576904297, -17.70921516418457, -17.128259658813477, -16.547304153442383, -15.966348648071289, -15.385393142700195, -14.804436683654785, -14.223481178283691, -13.642524719238281, -13.061569213867188, -12.480613708496094, -11.899657249450684, -11.31870174407959, -10.73774528503418, -10.156789779663086, -9.575834274291992, -8.994877815246582, -8.413922309875488, -7.832966327667236, -7.252010345458984, -6.671054840087891, -6.090098857879639, -5.509142875671387, -4.928186893463135, -4.347230911254883, -3.766275405883789, -3.185319423675537, -2.604363441467285, -2.0234076976776123, -1.4424519538879395, -0.8614959716796875, -0.2805401086807251, 0.3004157543182373, 0.8813716173171997, 1.462327480316162, 2.043283462524414, 2.624239206314087, 3.2051949501037598, 3.7861509323120117, 4.367106914520264, 4.948062896728516, 5.529018402099609, 6.109974384307861, 6.690930366516113, 7.271885871887207, 7.852841854095459, 8.433797836303711]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 4.0, 16.0, 11.0, 18.0, 15.0, 8.0, 15.0, 20.0, 16.0, 25.0, 26.0, 25.0, 33.0, 34.0, 34.0, 25.0, 35.0, 32.0, 35.0, 26.0, 41.0, 36.0, 35.0, 30.0, 42.0, 46.0, 24.0, 25.0, 32.0, 28.0, 22.0, 23.0, 20.0, 23.0, 17.0, 9.0, 17.0, 7.0, 13.0, 8.0, 7.0, 9.0, 7.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 2.0, 4.0], "bins": [-4.086501121520996, -3.9649012088775635, -3.843301296234131, -3.7217013835906982, -3.6001014709472656, -3.478501558303833, -3.3569016456604004, -3.235301971435547, -3.113701820373535, -2.9921019077301025, -2.87050199508667, -2.7489020824432373, -2.6273021697998047, -2.505702257156372, -2.3841023445129395, -2.262502670288086, -2.1409027576446533, -2.0193028450012207, -1.897702932357788, -1.7761030197143555, -1.6545031070709229, -1.5329031944274902, -1.4113034009933472, -1.2897034883499146, -1.168103575706482, -1.0465036630630493, -0.9249037504196167, -0.8033038973808289, -0.6817039847373962, -0.5601040720939636, -0.4385042190551758, -0.31690430641174316, -0.19530439376831055, -0.07370449602603912, 0.0478954017162323, 0.16949528455734253, 0.29109519720077515, 0.41269510984420776, 0.5342949628829956, 0.6558948755264282, 0.7774947881698608, 0.8990947008132935, 1.020694613456726, 1.1422944068908691, 1.2638943195343018, 1.3854942321777344, 1.507094144821167, 1.6286940574645996, 1.7502939701080322, 1.8718938827514648, 1.9934937953948975, 2.11509370803833, 2.2366936206817627, 2.3582935333251953, 2.479893207550049, 2.6014933586120605, 2.723093032836914, 2.8446929454803467, 2.9662928581237793, 3.087892770767212, 3.2094926834106445, 3.331092596054077, 3.4526925086975098, 3.5742921829223633, 3.695892333984375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 10.0, 9.0, 16.0, 13.0, 21.0, 34.0, 28.0, 45.0, 116.0, 335.0, 1318.0, 5306.0, 27995.0, 198650.0, 660390.0, 129365.0, 19327.0, 4034.0, 940.0, 271.0, 110.0, 57.0, 36.0, 25.0, 12.0, 21.0, 10.0, 13.0, 9.0, 4.0, 4.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0], "bins": [-31.875, -31.06591796875, -30.2568359375, -29.44775390625, -28.638671875, -27.82958984375, -27.0205078125, -26.21142578125, -25.40234375, -24.59326171875, -23.7841796875, -22.97509765625, -22.166015625, -21.35693359375, -20.5478515625, -19.73876953125, -18.9296875, -18.12060546875, -17.3115234375, -16.50244140625, -15.693359375, -14.88427734375, -14.0751953125, -13.26611328125, -12.45703125, -11.64794921875, -10.8388671875, -10.02978515625, -9.220703125, -8.41162109375, -7.6025390625, -6.79345703125, -5.984375, -5.17529296875, -4.3662109375, -3.55712890625, -2.748046875, -1.93896484375, -1.1298828125, -0.32080078125, 0.48828125, 1.29736328125, 2.1064453125, 2.91552734375, 3.724609375, 4.53369140625, 5.3427734375, 6.15185546875, 6.9609375, 7.77001953125, 8.5791015625, 9.38818359375, 10.197265625, 11.00634765625, 11.8154296875, 12.62451171875, 13.43359375, 14.24267578125, 15.0517578125, 15.86083984375, 16.669921875, 17.47900390625, 18.2880859375, 19.09716796875, 19.90625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 5.0, 4.0, 3.0, 3.0, 9.0, 10.0, 12.0, 14.0, 16.0, 21.0, 25.0, 35.0, 26.0, 39.0, 48.0, 43.0, 38.0, 50.0, 47.0, 30.0, 45.0, 46.0, 49.0, 49.0, 32.0, 41.0, 32.0, 37.0, 41.0, 27.0, 25.0, 21.0, 20.0, 9.0, 8.0, 14.0, 6.0, 5.0, 4.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.8984375, -6.695556640625, -6.49267578125, -6.289794921875, -6.0869140625, -5.884033203125, -5.68115234375, -5.478271484375, -5.275390625, -5.072509765625, -4.86962890625, -4.666748046875, -4.4638671875, -4.260986328125, -4.05810546875, -3.855224609375, -3.65234375, -3.449462890625, -3.24658203125, -3.043701171875, -2.8408203125, -2.637939453125, -2.43505859375, -2.232177734375, -2.029296875, -1.826416015625, -1.62353515625, -1.420654296875, -1.2177734375, -1.014892578125, -0.81201171875, -0.609130859375, -0.40625, -0.203369140625, -0.00048828125, 0.202392578125, 0.4052734375, 0.608154296875, 0.81103515625, 1.013916015625, 1.216796875, 1.419677734375, 1.62255859375, 1.825439453125, 2.0283203125, 2.231201171875, 2.43408203125, 2.636962890625, 2.83984375, 3.042724609375, 3.24560546875, 3.448486328125, 3.6513671875, 3.854248046875, 4.05712890625, 4.260009765625, 4.462890625, 4.665771484375, 4.86865234375, 5.071533203125, 5.2744140625, 5.477294921875, 5.68017578125, 5.883056640625, 6.0859375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 8.0, 4.0, 13.0, 11.0, 22.0, 15.0, 19.0, 23.0, 28.0, 31.0, 34.0, 50.0, 36.0, 54.0, 235.0, 9851.0, 981028.0, 56097.0, 568.0, 63.0, 48.0, 37.0, 29.0, 32.0, 35.0, 23.0, 19.0, 22.0, 21.0, 20.0, 12.0, 10.0, 4.0, 6.0, 6.0, 10.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.0, -72.4716796875, -69.943359375, -67.4150390625, -64.88671875, -62.3583984375, -59.830078125, -57.3017578125, -54.7734375, -52.2451171875, -49.716796875, -47.1884765625, -44.66015625, -42.1318359375, -39.603515625, -37.0751953125, -34.546875, -32.0185546875, -29.490234375, -26.9619140625, -24.43359375, -21.9052734375, -19.376953125, -16.8486328125, -14.3203125, -11.7919921875, -9.263671875, -6.7353515625, -4.20703125, -1.6787109375, 0.849609375, 3.3779296875, 5.90625, 8.4345703125, 10.962890625, 13.4912109375, 16.01953125, 18.5478515625, 21.076171875, 23.6044921875, 26.1328125, 28.6611328125, 31.189453125, 33.7177734375, 36.24609375, 38.7744140625, 41.302734375, 43.8310546875, 46.359375, 48.8876953125, 51.416015625, 53.9443359375, 56.47265625, 59.0009765625, 61.529296875, 64.0576171875, 66.5859375, 69.1142578125, 71.642578125, 74.1708984375, 76.69921875, 79.2275390625, 81.755859375, 84.2841796875, 86.8125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 4.0, 10.0, 11.0, 10.0, 21.0, 15.0, 17.0, 17.0, 35.0, 31.0, 30.0, 48.0, 44.0, 41.0, 46.0, 54.0, 60.0, 62.0, 45.0, 38.0, 42.0, 44.0, 31.0, 27.0, 33.0, 25.0, 21.0, 21.0, 22.0, 18.0, 16.0, 9.0, 4.0, 6.0, 7.0, 9.0, 5.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.45703125, -7.20721435546875, -6.9573974609375, -6.70758056640625, -6.457763671875, -6.20794677734375, -5.9581298828125, -5.70831298828125, -5.45849609375, -5.20867919921875, -4.9588623046875, -4.70904541015625, -4.459228515625, -4.20941162109375, -3.9595947265625, -3.70977783203125, -3.4599609375, -3.21014404296875, -2.9603271484375, -2.71051025390625, -2.460693359375, -2.21087646484375, -1.9610595703125, -1.71124267578125, -1.46142578125, -1.21160888671875, -0.9617919921875, -0.71197509765625, -0.462158203125, -0.21234130859375, 0.0374755859375, 0.28729248046875, 0.537109375, 0.78692626953125, 1.0367431640625, 1.28656005859375, 1.536376953125, 1.78619384765625, 2.0360107421875, 2.28582763671875, 2.53564453125, 2.78546142578125, 3.0352783203125, 3.28509521484375, 3.534912109375, 3.78472900390625, 4.0345458984375, 4.28436279296875, 4.5341796875, 4.78399658203125, 5.0338134765625, 5.28363037109375, 5.533447265625, 5.78326416015625, 6.0330810546875, 6.28289794921875, 6.53271484375, 6.78253173828125, 7.0323486328125, 7.28216552734375, 7.531982421875, 7.78179931640625, 8.0316162109375, 8.28143310546875, 8.53125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 10.0, 19.0, 31.0, 69.0, 98.0, 201.0, 390.0, 753.0, 1323.0, 2499.0, 5202.0, 13055.0, 47002.0, 802300.0, 136877.0, 23475.0, 7975.0, 3484.0, 1655.0, 933.0, 506.0, 277.0, 160.0, 98.0, 57.0, 30.0, 18.0, 10.0, 5.0, 6.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5908203125, -1.5422515869140625, -1.493682861328125, -1.4451141357421875, -1.39654541015625, -1.3479766845703125, -1.299407958984375, -1.2508392333984375, -1.2022705078125, -1.1537017822265625, -1.105133056640625, -1.0565643310546875, -1.00799560546875, -0.9594268798828125, -0.910858154296875, -0.8622894287109375, -0.813720703125, -0.7651519775390625, -0.716583251953125, -0.6680145263671875, -0.61944580078125, -0.5708770751953125, -0.522308349609375, -0.4737396240234375, -0.4251708984375, -0.3766021728515625, -0.328033447265625, -0.2794647216796875, -0.23089599609375, -0.1823272705078125, -0.133758544921875, -0.0851898193359375, -0.03662109375, 0.0119476318359375, 0.060516357421875, 0.1090850830078125, 0.15765380859375, 0.2062225341796875, 0.254791259765625, 0.3033599853515625, 0.3519287109375, 0.4004974365234375, 0.449066162109375, 0.4976348876953125, 0.54620361328125, 0.5947723388671875, 0.643341064453125, 0.6919097900390625, 0.740478515625, 0.7890472412109375, 0.837615966796875, 0.8861846923828125, 0.93475341796875, 0.9833221435546875, 1.031890869140625, 1.0804595947265625, 1.1290283203125, 1.1775970458984375, 1.226165771484375, 1.2747344970703125, 1.32330322265625, 1.3718719482421875, 1.420440673828125, 1.4690093994140625, 1.517578125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 1.0, 7.0, 5.0, 5.0, 10.0, 20.0, 21.0, 36.0, 49.0, 86.0, 138.0, 195.0, 156.0, 103.0, 39.0, 36.0, 21.0, 22.0, 10.0, 6.0, 10.0, 7.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.882450103759766e-05, -9.526684880256653e-05, -9.17091965675354e-05, -8.815154433250427e-05, -8.459389209747314e-05, -8.103623986244202e-05, -7.747858762741089e-05, -7.392093539237976e-05, -7.036328315734863e-05, -6.68056309223175e-05, -6.324797868728638e-05, -5.969032645225525e-05, -5.613267421722412e-05, -5.257502198219299e-05, -4.9017369747161865e-05, -4.545971751213074e-05, -4.190206527709961e-05, -3.834441304206848e-05, -3.4786760807037354e-05, -3.1229108572006226e-05, -2.7671456336975098e-05, -2.411380410194397e-05, -2.0556151866912842e-05, -1.6998499631881714e-05, -1.3440847396850586e-05, -9.883195161819458e-06, -6.32554292678833e-06, -2.767890691757202e-06, 7.897615432739258e-07, 4.347413778305054e-06, 7.905066013336182e-06, 1.146271824836731e-05, 1.5020370483398438e-05, 1.8578022718429565e-05, 2.2135674953460693e-05, 2.569332718849182e-05, 2.925097942352295e-05, 3.280863165855408e-05, 3.6366283893585205e-05, 3.992393612861633e-05, 4.348158836364746e-05, 4.703924059867859e-05, 5.059689283370972e-05, 5.4154545068740845e-05, 5.771219730377197e-05, 6.12698495388031e-05, 6.482750177383423e-05, 6.838515400886536e-05, 7.194280624389648e-05, 7.550045847892761e-05, 7.905811071395874e-05, 8.261576294898987e-05, 8.6173415184021e-05, 8.973106741905212e-05, 9.328871965408325e-05, 9.684637188911438e-05, 0.00010040402412414551, 0.00010396167635917664, 0.00010751932859420776, 0.00011107698082923889, 0.00011463463306427002, 0.00011819228529930115, 0.00012174993753433228, 0.0001253075897693634, 0.00012886524200439453]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 7.0, 18.0, 155.0, 9371.0, 1036354.0, 2527.0, 58.0, 13.0, 9.0, 7.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.234375, -10.88720703125, -10.5400390625, -10.19287109375, -9.845703125, -9.49853515625, -9.1513671875, -8.80419921875, -8.45703125, -8.10986328125, -7.7626953125, -7.41552734375, -7.068359375, -6.72119140625, -6.3740234375, -6.02685546875, -5.6796875, -5.33251953125, -4.9853515625, -4.63818359375, -4.291015625, -3.94384765625, -3.5966796875, -3.24951171875, -2.90234375, -2.55517578125, -2.2080078125, -1.86083984375, -1.513671875, -1.16650390625, -0.8193359375, -0.47216796875, -0.125, 0.22216796875, 0.5693359375, 0.91650390625, 1.263671875, 1.61083984375, 1.9580078125, 2.30517578125, 2.65234375, 2.99951171875, 3.3466796875, 3.69384765625, 4.041015625, 4.38818359375, 4.7353515625, 5.08251953125, 5.4296875, 5.77685546875, 6.1240234375, 6.47119140625, 6.818359375, 7.16552734375, 7.5126953125, 7.85986328125, 8.20703125, 8.55419921875, 8.9013671875, 9.24853515625, 9.595703125, 9.94287109375, 10.2900390625, 10.63720703125, 10.984375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 7.0, 17.0, 25.0, 52.0, 138.0, 572.0, 92.0, 32.0, 20.0, 7.0, 11.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9814453125, -0.9511184692382812, -0.9207916259765625, -0.8904647827148438, -0.860137939453125, -0.8298110961914062, -0.7994842529296875, -0.7691574096679688, -0.73883056640625, -0.7085037231445312, -0.6781768798828125, -0.6478500366210938, -0.617523193359375, -0.5871963500976562, -0.5568695068359375, -0.5265426635742188, -0.4962158203125, -0.46588897705078125, -0.4355621337890625, -0.40523529052734375, -0.374908447265625, -0.34458160400390625, -0.3142547607421875, -0.28392791748046875, -0.25360107421875, -0.22327423095703125, -0.1929473876953125, -0.16262054443359375, -0.132293701171875, -0.10196685791015625, -0.0716400146484375, -0.04131317138671875, -0.010986328125, 0.01934051513671875, 0.0496673583984375, 0.07999420166015625, 0.110321044921875, 0.14064788818359375, 0.1709747314453125, 0.20130157470703125, 0.23162841796875, 0.26195526123046875, 0.2922821044921875, 0.32260894775390625, 0.352935791015625, 0.38326263427734375, 0.4135894775390625, 0.44391632080078125, 0.4742431640625, 0.5045700073242188, 0.5348968505859375, 0.5652236938476562, 0.595550537109375, 0.6258773803710938, 0.6562042236328125, 0.6865310668945312, 0.71685791015625, 0.7471847534179688, 0.7775115966796875, 0.8078384399414062, 0.838165283203125, 0.8684921264648438, 0.8988189697265625, 0.9291458129882812, 0.95947265625]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 232.0, 787.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-226.2407684326172, -221.5326385498047, -216.8245086669922, -212.11636352539062, -207.40823364257812, -202.70010375976562, -197.99197387695312, -193.28384399414062, -188.57571411132812, -183.86758422851562, -179.15945434570312, -174.45132446289062, -169.74317932128906, -165.03504943847656, -160.32691955566406, -155.61878967285156, -150.91064453125, -146.2025146484375, -141.494384765625, -136.7862548828125, -132.07810974121094, -127.36997985839844, -122.66184997558594, -117.95372009277344, -113.24559020996094, -108.53746032714844, -103.8293228149414, -99.1211929321289, -94.4130630493164, -89.70492553710938, -84.99679565429688, -80.28866577148438, -75.58053588867188, -70.87240600585938, -66.16426849365234, -61.456138610839844, -56.748008728027344, -52.03987503051758, -47.33174133300781, -42.62361145019531, -37.91547775268555, -33.20734405517578, -28.49921417236328, -23.791080474853516, -19.082948684692383, -14.37481689453125, -9.666683197021484, -4.958553314208984, -0.25041961669921875, 4.457712650299072, 9.165844917297363, 13.873977661132812, 18.582109451293945, 23.290241241455078, 27.998374938964844, 32.706504821777344, 37.41463851928711, 42.122772216796875, 46.830902099609375, 51.53903579711914, 56.247169494628906, 60.955299377441406, 65.66343688964844, 70.37156677246094, 75.07969665527344]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 8.0, 16.0, 18.0, 16.0, 20.0, 21.0, 32.0, 28.0, 38.0, 41.0, 46.0, 52.0, 41.0, 57.0, 47.0, 59.0, 55.0, 53.0, 37.0, 53.0, 51.0, 34.0, 34.0, 33.0, 26.0, 13.0, 16.0, 16.0, 10.0, 3.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.655713081359863, -12.338146209716797, -12.020580291748047, -11.703014373779297, -11.38544750213623, -11.067880630493164, -10.750314712524414, -10.432748794555664, -10.115181922912598, -9.797615051269531, -9.480049133300781, -9.162483215332031, -8.844916343688965, -8.527349472045898, -8.209783554077148, -7.89221715927124, -7.574650764465332, -7.257084369659424, -6.939517974853516, -6.621951580047607, -6.304385185241699, -5.986818790435791, -5.669252395629883, -5.351686000823975, -5.034119606018066, -4.716553211212158, -4.39898681640625, -4.081420421600342, -3.7638540267944336, -3.4462876319885254, -3.128721237182617, -2.811154842376709, -2.4935879707336426, -2.1760215759277344, -1.8584551811218262, -1.540888786315918, -1.2233223915100098, -0.9057559967041016, -0.5881896018981934, -0.27062320709228516, 0.04694318771362305, 0.36450958251953125, 0.6820759773254395, 0.9996423721313477, 1.3172087669372559, 1.634775161743164, 1.9523415565490723, 2.2699079513549805, 2.5874743461608887, 2.905040740966797, 3.222607135772705, 3.5401735305786133, 3.8577399253845215, 4.17530632019043, 4.492872714996338, 4.810439109802246, 5.128005504608154, 5.4455718994140625, 5.763138294219971, 6.080704689025879, 6.398271083831787, 6.715837478637695, 7.0334038734436035, 7.350970268249512, 7.66853666305542]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 11.0, 13.0, 22.0, 24.0, 44.0, 54.0, 64.0, 84.0, 141.0, 144.0, 195.0, 317.0, 400.0, 756.0, 1890.0, 6611.0, 51675.0, 3703715.0, 408828.0, 13105.0, 3227.0, 1090.0, 575.0, 322.0, 262.0, 191.0, 129.0, 106.0, 87.0, 46.0, 46.0, 20.0, 22.0, 22.0, 8.0, 8.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1796875, -12.7506103515625, -12.321533203125, -11.8924560546875, -11.46337890625, -11.0343017578125, -10.605224609375, -10.1761474609375, -9.7470703125, -9.3179931640625, -8.888916015625, -8.4598388671875, -8.03076171875, -7.6016845703125, -7.172607421875, -6.7435302734375, -6.314453125, -5.8853759765625, -5.456298828125, -5.0272216796875, -4.59814453125, -4.1690673828125, -3.739990234375, -3.3109130859375, -2.8818359375, -2.4527587890625, -2.023681640625, -1.5946044921875, -1.16552734375, -0.7364501953125, -0.307373046875, 0.1217041015625, 0.55078125, 0.9798583984375, 1.408935546875, 1.8380126953125, 2.26708984375, 2.6961669921875, 3.125244140625, 3.5543212890625, 3.9833984375, 4.4124755859375, 4.841552734375, 5.2706298828125, 5.69970703125, 6.1287841796875, 6.557861328125, 6.9869384765625, 7.416015625, 7.8450927734375, 8.274169921875, 8.7032470703125, 9.13232421875, 9.5614013671875, 9.990478515625, 10.4195556640625, 10.8486328125, 11.2777099609375, 11.706787109375, 12.1358642578125, 12.56494140625, 12.9940185546875, 13.423095703125, 13.8521728515625, 14.28125]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 3.0, 4.0, 4.0, 10.0, 9.0, 7.0, 19.0, 15.0, 18.0, 19.0, 21.0, 22.0, 25.0, 27.0, 51.0, 49.0, 37.0, 46.0, 46.0, 46.0, 54.0, 56.0, 48.0, 49.0, 41.0, 38.0, 44.0, 34.0, 28.0, 31.0, 25.0, 15.0, 11.0, 6.0, 13.0, 8.0, 8.0, 8.0, 6.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.129058837890625, -3.02569580078125, -2.922332763671875, -2.8189697265625, -2.715606689453125, -2.61224365234375, -2.508880615234375, -2.405517578125, -2.302154541015625, -2.19879150390625, -2.095428466796875, -1.9920654296875, -1.888702392578125, -1.78533935546875, -1.681976318359375, -1.57861328125, -1.475250244140625, -1.37188720703125, -1.268524169921875, -1.1651611328125, -1.061798095703125, -0.95843505859375, -0.855072021484375, -0.751708984375, -0.648345947265625, -0.54498291015625, -0.441619873046875, -0.3382568359375, -0.234893798828125, -0.13153076171875, -0.028167724609375, 0.0751953125, 0.178558349609375, 0.28192138671875, 0.385284423828125, 0.4886474609375, 0.592010498046875, 0.69537353515625, 0.798736572265625, 0.902099609375, 1.005462646484375, 1.10882568359375, 1.212188720703125, 1.3155517578125, 1.418914794921875, 1.52227783203125, 1.625640869140625, 1.72900390625, 1.832366943359375, 1.93572998046875, 2.039093017578125, 2.1424560546875, 2.245819091796875, 2.34918212890625, 2.452545166015625, 2.555908203125, 2.659271240234375, 2.76263427734375, 2.865997314453125, 2.9693603515625, 3.072723388671875, 3.17608642578125, 3.279449462890625, 3.3828125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 13.0, 6.0, 24.0, 32.0, 64.0, 293.0, 2227.0, 4182762.0, 8064.0, 578.0, 110.0, 39.0, 14.0, 11.0, 12.0, 12.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-78.5, -75.853515625, -73.20703125, -70.560546875, -67.9140625, -65.267578125, -62.62109375, -59.974609375, -57.328125, -54.681640625, -52.03515625, -49.388671875, -46.7421875, -44.095703125, -41.44921875, -38.802734375, -36.15625, -33.509765625, -30.86328125, -28.216796875, -25.5703125, -22.923828125, -20.27734375, -17.630859375, -14.984375, -12.337890625, -9.69140625, -7.044921875, -4.3984375, -1.751953125, 0.89453125, 3.541015625, 6.1875, 8.833984375, 11.48046875, 14.126953125, 16.7734375, 19.419921875, 22.06640625, 24.712890625, 27.359375, 30.005859375, 32.65234375, 35.298828125, 37.9453125, 40.591796875, 43.23828125, 45.884765625, 48.53125, 51.177734375, 53.82421875, 56.470703125, 59.1171875, 61.763671875, 64.41015625, 67.056640625, 69.703125, 72.349609375, 74.99609375, 77.642578125, 80.2890625, 82.935546875, 85.58203125, 88.228515625, 90.875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 11.0, 9.0, 14.0, 20.0, 38.0, 95.0, 464.0, 1830.0, 1129.0, 292.0, 73.0, 31.0, 23.0, 11.0, 11.0, 8.0, 12.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.572265625, -3.459930419921875, -3.34759521484375, -3.235260009765625, -3.1229248046875, -3.010589599609375, -2.89825439453125, -2.785919189453125, -2.673583984375, -2.561248779296875, -2.44891357421875, -2.336578369140625, -2.2242431640625, -2.111907958984375, -1.99957275390625, -1.887237548828125, -1.77490234375, -1.662567138671875, -1.55023193359375, -1.437896728515625, -1.3255615234375, -1.213226318359375, -1.10089111328125, -0.988555908203125, -0.876220703125, -0.763885498046875, -0.65155029296875, -0.539215087890625, -0.4268798828125, -0.314544677734375, -0.20220947265625, -0.089874267578125, 0.0224609375, 0.134796142578125, 0.24713134765625, 0.359466552734375, 0.4718017578125, 0.584136962890625, 0.69647216796875, 0.808807373046875, 0.921142578125, 1.033477783203125, 1.14581298828125, 1.258148193359375, 1.3704833984375, 1.482818603515625, 1.59515380859375, 1.707489013671875, 1.81982421875, 1.932159423828125, 2.04449462890625, 2.156829833984375, 2.2691650390625, 2.381500244140625, 2.49383544921875, 2.606170654296875, 2.718505859375, 2.830841064453125, 2.94317626953125, 3.055511474609375, 3.1678466796875, 3.280181884765625, 3.39251708984375, 3.504852294921875, 3.6171875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 331.0, 663.0, 23.0, 3.0], "bins": [-102.6961669921875, -101.0140609741211, -99.33196258544922, -97.64985656738281, -95.96775817871094, -94.28565216064453, -92.60354614257812, -90.92144775390625, -89.23934173583984, -87.55723571777344, -85.87513732910156, -84.19303131103516, -82.51093292236328, -80.82882690429688, -79.146728515625, -77.4646224975586, -75.78251647949219, -74.10041046142578, -72.4183120727539, -70.7362060546875, -69.05410766601562, -67.37200164794922, -65.68989562988281, -64.00779724121094, -62.32569885253906, -60.64359664916992, -58.96149444580078, -57.279388427734375, -55.597286224365234, -53.915184020996094, -52.23308181762695, -50.55097961425781, -48.868873596191406, -47.186771392822266, -45.504669189453125, -43.82256317138672, -42.14046096801758, -40.45835876464844, -38.7762565612793, -37.094154357910156, -35.412052154541016, -33.729949951171875, -32.047847747802734, -30.36574363708496, -28.683639526367188, -27.001537322998047, -25.319435119628906, -23.637332916259766, -21.955228805541992, -20.27312660217285, -18.591022491455078, -16.908920288085938, -15.22681713104248, -13.544713973999023, -11.862611770629883, -10.180508613586426, -8.498405456542969, -6.816302299499512, -5.134199619293213, -3.452096939086914, -1.769993782043457, -0.087890625, 1.5942115783691406, 3.2763147354125977, 4.958418369293213]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 8.0, 8.0, 9.0, 11.0, 15.0, 17.0, 13.0, 26.0, 17.0, 25.0, 39.0, 38.0, 38.0, 33.0, 34.0, 44.0, 40.0, 49.0, 55.0, 43.0, 54.0, 39.0, 36.0, 31.0, 36.0, 38.0, 29.0, 38.0, 17.0, 16.0, 12.0, 16.0, 11.0, 11.0, 11.0, 10.0, 5.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3235228061676025, -3.217550039291382, -3.111577272415161, -3.0056045055389404, -2.8996317386627197, -2.793658971786499, -2.6876862049102783, -2.5817134380340576, -2.475740671157837, -2.369767904281616, -2.2637951374053955, -2.157822370529175, -2.051849603652954, -1.9458768367767334, -1.8399040699005127, -1.733931303024292, -1.6279585361480713, -1.5219857692718506, -1.4160130023956299, -1.3100402355194092, -1.2040674686431885, -1.0980947017669678, -0.9921219348907471, -0.8861491680145264, -0.7801764011383057, -0.674203634262085, -0.5682308673858643, -0.46225810050964355, -0.35628533363342285, -0.25031256675720215, -0.14433979988098145, -0.03836703300476074, 0.06760549545288086, 0.17357826232910156, 0.27955102920532227, 0.38552379608154297, 0.49149656295776367, 0.5974693298339844, 0.7034420967102051, 0.8094148635864258, 0.9153876304626465, 1.0213603973388672, 1.127333164215088, 1.2333059310913086, 1.3392786979675293, 1.44525146484375, 1.5512242317199707, 1.6571969985961914, 1.763169765472412, 1.8691425323486328, 1.9751152992248535, 2.081088066101074, 2.187060832977295, 2.2930335998535156, 2.3990063667297363, 2.504979133605957, 2.6109519004821777, 2.7169246673583984, 2.822897434234619, 2.92887020111084, 3.0348429679870605, 3.1408157348632812, 3.246788501739502, 3.3527612686157227, 3.4587340354919434]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 7.0, 4.0, 3.0, 13.0, 28.0, 29.0, 43.0, 54.0, 91.0, 140.0, 200.0, 309.0, 465.0, 784.0, 1280.0, 1892.0, 3201.0, 5228.0, 8618.0, 14814.0, 25768.0, 46772.0, 90920.0, 223484.0, 354708.0, 127863.0, 61722.0, 33305.0, 18798.0, 10862.0, 6536.0, 3999.0, 2500.0, 1495.0, 932.0, 590.0, 393.0, 227.0, 155.0, 92.0, 83.0, 46.0, 33.0, 19.0, 21.0, 15.0, 8.0, 3.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.08984375, -5.894775390625, -5.69970703125, -5.504638671875, -5.3095703125, -5.114501953125, -4.91943359375, -4.724365234375, -4.529296875, -4.334228515625, -4.13916015625, -3.944091796875, -3.7490234375, -3.553955078125, -3.35888671875, -3.163818359375, -2.96875, -2.773681640625, -2.57861328125, -2.383544921875, -2.1884765625, -1.993408203125, -1.79833984375, -1.603271484375, -1.408203125, -1.213134765625, -1.01806640625, -0.822998046875, -0.6279296875, -0.432861328125, -0.23779296875, -0.042724609375, 0.15234375, 0.347412109375, 0.54248046875, 0.737548828125, 0.9326171875, 1.127685546875, 1.32275390625, 1.517822265625, 1.712890625, 1.907958984375, 2.10302734375, 2.298095703125, 2.4931640625, 2.688232421875, 2.88330078125, 3.078369140625, 3.2734375, 3.468505859375, 3.66357421875, 3.858642578125, 4.0537109375, 4.248779296875, 4.44384765625, 4.638916015625, 4.833984375, 5.029052734375, 5.22412109375, 5.419189453125, 5.6142578125, 5.809326171875, 6.00439453125, 6.199462890625, 6.39453125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 1.0, 4.0, 9.0, 7.0, 12.0, 9.0, 10.0, 10.0, 20.0, 22.0, 28.0, 22.0, 39.0, 35.0, 32.0, 42.0, 41.0, 55.0, 49.0, 42.0, 48.0, 58.0, 43.0, 54.0, 29.0, 45.0, 27.0, 44.0, 28.0, 24.0, 14.0, 12.0, 18.0, 16.0, 15.0, 10.0, 6.0, 8.0, 3.0, 10.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.01171875, -1.950897216796875, -1.89007568359375, -1.829254150390625, -1.7684326171875, -1.707611083984375, -1.64678955078125, -1.585968017578125, -1.525146484375, -1.464324951171875, -1.40350341796875, -1.342681884765625, -1.2818603515625, -1.221038818359375, -1.16021728515625, -1.099395751953125, -1.03857421875, -0.977752685546875, -0.91693115234375, -0.856109619140625, -0.7952880859375, -0.734466552734375, -0.67364501953125, -0.612823486328125, -0.552001953125, -0.491180419921875, -0.43035888671875, -0.369537353515625, -0.3087158203125, -0.247894287109375, -0.18707275390625, -0.126251220703125, -0.0654296875, -0.004608154296875, 0.05621337890625, 0.117034912109375, 0.1778564453125, 0.238677978515625, 0.29949951171875, 0.360321044921875, 0.421142578125, 0.481964111328125, 0.54278564453125, 0.603607177734375, 0.6644287109375, 0.725250244140625, 0.78607177734375, 0.846893310546875, 0.90771484375, 0.968536376953125, 1.02935791015625, 1.090179443359375, 1.1510009765625, 1.211822509765625, 1.27264404296875, 1.333465576171875, 1.394287109375, 1.455108642578125, 1.51593017578125, 1.576751708984375, 1.6375732421875, 1.698394775390625, 1.75921630859375, 1.820037841796875, 1.880859375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 8.0, 16.0, 15.0, 24.0, 27.0, 37.0, 55.0, 70.0, 92.0, 104.0, 178.0, 230.0, 301.0, 434.0, 545.0, 854.0, 1340.0, 1781.0, 2737.0, 4411.0, 7544.0, 12714.0, 25407.0, 61360.0, 437262.0, 372620.0, 60196.0, 24959.0, 12484.0, 7380.0, 4372.0, 2777.0, 1834.0, 1288.0, 909.0, 591.0, 424.0, 310.0, 223.0, 171.0, 121.0, 89.0, 56.0, 43.0, 40.0, 27.0, 24.0, 20.0, 12.0, 13.0, 6.0, 9.0, 0.0, 5.0, 0.0, 0.0, 2.0], "bins": [-6.53125, -6.32708740234375, -6.1229248046875, -5.91876220703125, -5.714599609375, -5.51043701171875, -5.3062744140625, -5.10211181640625, -4.89794921875, -4.69378662109375, -4.4896240234375, -4.28546142578125, -4.081298828125, -3.87713623046875, -3.6729736328125, -3.46881103515625, -3.2646484375, -3.06048583984375, -2.8563232421875, -2.65216064453125, -2.447998046875, -2.24383544921875, -2.0396728515625, -1.83551025390625, -1.63134765625, -1.42718505859375, -1.2230224609375, -1.01885986328125, -0.814697265625, -0.61053466796875, -0.4063720703125, -0.20220947265625, 0.001953125, 0.20611572265625, 0.4102783203125, 0.61444091796875, 0.818603515625, 1.02276611328125, 1.2269287109375, 1.43109130859375, 1.63525390625, 1.83941650390625, 2.0435791015625, 2.24774169921875, 2.451904296875, 2.65606689453125, 2.8602294921875, 3.06439208984375, 3.2685546875, 3.47271728515625, 3.6768798828125, 3.88104248046875, 4.085205078125, 4.28936767578125, 4.4935302734375, 4.69769287109375, 4.90185546875, 5.10601806640625, 5.3101806640625, 5.51434326171875, 5.718505859375, 5.92266845703125, 6.1268310546875, 6.33099365234375, 6.53515625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 5.0, 2.0, 5.0, 4.0, 4.0, 6.0, 6.0, 10.0, 13.0, 19.0, 12.0, 20.0, 19.0, 29.0, 15.0, 35.0, 44.0, 42.0, 39.0, 50.0, 38.0, 47.0, 32.0, 44.0, 39.0, 46.0, 45.0, 42.0, 30.0, 28.0, 33.0, 34.0, 32.0, 26.0, 19.0, 14.0, 15.0, 12.0, 13.0, 9.0, 6.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.184967041015625, -1.14239501953125, -1.099822998046875, -1.0572509765625, -1.014678955078125, -0.97210693359375, -0.929534912109375, -0.886962890625, -0.844390869140625, -0.80181884765625, -0.759246826171875, -0.7166748046875, -0.674102783203125, -0.63153076171875, -0.588958740234375, -0.54638671875, -0.503814697265625, -0.46124267578125, -0.418670654296875, -0.3760986328125, -0.333526611328125, -0.29095458984375, -0.248382568359375, -0.205810546875, -0.163238525390625, -0.12066650390625, -0.078094482421875, -0.0355224609375, 0.007049560546875, 0.04962158203125, 0.092193603515625, 0.134765625, 0.177337646484375, 0.21990966796875, 0.262481689453125, 0.3050537109375, 0.347625732421875, 0.39019775390625, 0.432769775390625, 0.475341796875, 0.517913818359375, 0.56048583984375, 0.603057861328125, 0.6456298828125, 0.688201904296875, 0.73077392578125, 0.773345947265625, 0.81591796875, 0.858489990234375, 0.90106201171875, 0.943634033203125, 0.9862060546875, 1.028778076171875, 1.07135009765625, 1.113922119140625, 1.156494140625, 1.199066162109375, 1.24163818359375, 1.284210205078125, 1.3267822265625, 1.369354248046875, 1.41192626953125, 1.454498291015625, 1.4970703125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 2.0, 2.0, 6.0, 8.0, 8.0, 12.0, 18.0, 17.0, 26.0, 22.0, 27.0, 58.0, 72.0, 84.0, 123.0, 180.0, 285.0, 411.0, 649.0, 1238.0, 2396.0, 6353.0, 993213.0, 34260.0, 4289.0, 1907.0, 1049.0, 584.0, 374.0, 233.0, 161.0, 121.0, 87.0, 69.0, 49.0, 31.0, 35.0, 19.0, 20.0, 13.0, 7.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-6.08203125, -5.89678955078125, -5.7115478515625, -5.52630615234375, -5.341064453125, -5.15582275390625, -4.9705810546875, -4.78533935546875, -4.60009765625, -4.41485595703125, -4.2296142578125, -4.04437255859375, -3.859130859375, -3.67388916015625, -3.4886474609375, -3.30340576171875, -3.1181640625, -2.93292236328125, -2.7476806640625, -2.56243896484375, -2.377197265625, -2.19195556640625, -2.0067138671875, -1.82147216796875, -1.63623046875, -1.45098876953125, -1.2657470703125, -1.08050537109375, -0.895263671875, -0.71002197265625, -0.5247802734375, -0.33953857421875, -0.154296875, 0.03094482421875, 0.2161865234375, 0.40142822265625, 0.586669921875, 0.77191162109375, 0.9571533203125, 1.14239501953125, 1.32763671875, 1.51287841796875, 1.6981201171875, 1.88336181640625, 2.068603515625, 2.25384521484375, 2.4390869140625, 2.62432861328125, 2.8095703125, 2.99481201171875, 3.1800537109375, 3.36529541015625, 3.550537109375, 3.73577880859375, 3.9210205078125, 4.10626220703125, 4.29150390625, 4.47674560546875, 4.6619873046875, 4.84722900390625, 5.032470703125, 5.21771240234375, 5.4029541015625, 5.58819580078125, 5.7734375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 10.0, 17.0, 17.0, 23.0, 41.0, 40.0, 74.0, 146.0, 219.0, 150.0, 82.0, 52.0, 32.0, 19.0, 13.0, 13.0, 11.0, 3.0, 5.0, 3.0, 6.0, 1.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0127506256103516e-05, -4.767719656229019e-05, -4.522688686847687e-05, -4.2776577174663544e-05, -4.032626748085022e-05, -3.7875957787036896e-05, -3.542564809322357e-05, -3.297533839941025e-05, -3.0525028705596924e-05, -2.80747190117836e-05, -2.5624409317970276e-05, -2.3174099624156952e-05, -2.0723789930343628e-05, -1.8273480236530304e-05, -1.582317054271698e-05, -1.3372860848903656e-05, -1.0922551155090332e-05, -8.472241461277008e-06, -6.021931767463684e-06, -3.57162207365036e-06, -1.1213123798370361e-06, 1.3289973139762878e-06, 3.779307007789612e-06, 6.229616701602936e-06, 8.67992639541626e-06, 1.1130236089229584e-05, 1.3580545783042908e-05, 1.603085547685623e-05, 1.8481165170669556e-05, 2.093147486448288e-05, 2.3381784558296204e-05, 2.5832094252109528e-05, 2.828240394592285e-05, 3.0732713639736176e-05, 3.31830233335495e-05, 3.5633333027362823e-05, 3.808364272117615e-05, 4.053395241498947e-05, 4.2984262108802795e-05, 4.543457180261612e-05, 4.788488149642944e-05, 5.033519119024277e-05, 5.278550088405609e-05, 5.5235810577869415e-05, 5.768612027168274e-05, 6.013642996549606e-05, 6.258673965930939e-05, 6.503704935312271e-05, 6.748735904693604e-05, 6.993766874074936e-05, 7.238797843456268e-05, 7.483828812837601e-05, 7.728859782218933e-05, 7.973890751600266e-05, 8.218921720981598e-05, 8.46395269036293e-05, 8.708983659744263e-05, 8.954014629125595e-05, 9.199045598506927e-05, 9.44407656788826e-05, 9.689107537269592e-05, 9.934138506650925e-05, 0.00010179169476032257, 0.0001042420044541359, 0.00010669231414794922]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 11.0, 9.0, 24.0, 104.0, 1968.0, 1043076.0, 3156.0, 123.0, 23.0, 8.0, 8.0, 8.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.625, -111.208984375, -107.79296875, -104.376953125, -100.9609375, -97.544921875, -94.12890625, -90.712890625, -87.296875, -83.880859375, -80.46484375, -77.048828125, -73.6328125, -70.216796875, -66.80078125, -63.384765625, -59.96875, -56.552734375, -53.13671875, -49.720703125, -46.3046875, -42.888671875, -39.47265625, -36.056640625, -32.640625, -29.224609375, -25.80859375, -22.392578125, -18.9765625, -15.560546875, -12.14453125, -8.728515625, -5.3125, -1.896484375, 1.51953125, 4.935546875, 8.3515625, 11.767578125, 15.18359375, 18.599609375, 22.015625, 25.431640625, 28.84765625, 32.263671875, 35.6796875, 39.095703125, 42.51171875, 45.927734375, 49.34375, 52.759765625, 56.17578125, 59.591796875, 63.0078125, 66.423828125, 69.83984375, 73.255859375, 76.671875, 80.087890625, 83.50390625, 86.919921875, 90.3359375, 93.751953125, 97.16796875, 100.583984375, 104.0]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 961.0, 3.0, 4.0, 2.0, 5.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51953125, -4.38446044921875, -4.2493896484375, -4.11431884765625, -3.979248046875, -3.84417724609375, -3.7091064453125, -3.57403564453125, -3.43896484375, -3.30389404296875, -3.1688232421875, -3.03375244140625, -2.898681640625, -2.76361083984375, -2.6285400390625, -2.49346923828125, -2.3583984375, -2.22332763671875, -2.0882568359375, -1.95318603515625, -1.818115234375, -1.68304443359375, -1.5479736328125, -1.41290283203125, -1.27783203125, -1.14276123046875, -1.0076904296875, -0.87261962890625, -0.737548828125, -0.60247802734375, -0.4674072265625, -0.33233642578125, -0.197265625, -0.06219482421875, 0.0728759765625, 0.20794677734375, 0.343017578125, 0.47808837890625, 0.6131591796875, 0.74822998046875, 0.88330078125, 1.01837158203125, 1.1534423828125, 1.28851318359375, 1.423583984375, 1.55865478515625, 1.6937255859375, 1.82879638671875, 1.9638671875, 2.09893798828125, 2.2340087890625, 2.36907958984375, 2.504150390625, 2.63922119140625, 2.7742919921875, 2.90936279296875, 3.04443359375, 3.17950439453125, 3.3145751953125, 3.44964599609375, 3.584716796875, 3.71978759765625, 3.8548583984375, 3.98992919921875, 4.125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 688.0, 284.0, 34.0, 6.0, 1.0, 1.0], "bins": [-59.8785400390625, -58.86000061035156, -57.841461181640625, -56.82292175292969, -55.80438232421875, -54.78584289550781, -53.767303466796875, -52.74876403808594, -51.730224609375, -50.71168518066406, -49.693145751953125, -48.67460632324219, -47.65606689453125, -46.63752746582031, -45.618988037109375, -44.60044860839844, -43.581905364990234, -42.5633659362793, -41.54482650756836, -40.52628707885742, -39.507747650146484, -38.48920822143555, -37.47066879272461, -36.452125549316406, -35.43358612060547, -34.41504669189453, -33.396507263183594, -32.377967834472656, -31.35942840576172, -30.34088897705078, -29.32234764099121, -28.303808212280273, -27.285266876220703, -26.266727447509766, -25.248188018798828, -24.22964859008789, -23.211109161376953, -22.192569732666016, -21.174028396606445, -20.155488967895508, -19.136951446533203, -18.118412017822266, -17.099872589111328, -16.08133316040039, -15.062792778015137, -14.0442533493042, -13.025712966918945, -12.007173538208008, -10.988633155822754, -9.970093727111816, -8.951553344726562, -7.933013916015625, -6.9144744873046875, -5.89593505859375, -4.877395153045654, -3.8588552474975586, -2.840315818786621, -1.8217761516571045, -0.8032364845275879, 0.2153031826019287, 1.2338428497314453, 2.252382278442383, 3.2709221839904785, 4.289462089538574, 5.308001518249512]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 12.0, 5.0, 14.0, 28.0, 12.0, 21.0, 29.0, 40.0, 31.0, 40.0, 48.0, 41.0, 49.0, 66.0, 59.0, 49.0, 53.0, 46.0, 51.0, 46.0, 43.0, 39.0, 28.0, 32.0, 17.0, 22.0, 12.0, 10.0, 8.0, 12.0, 7.0, 6.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5236878395080566, -2.4469056129455566, -2.3701233863830566, -2.2933411598205566, -2.2165589332580566, -2.1397767066955566, -2.0629944801330566, -1.986212134361267, -1.909429907798767, -1.832647681236267, -1.755865454673767, -1.679083228111267, -1.6023008823394775, -1.5255186557769775, -1.4487364292144775, -1.3719542026519775, -1.2951719760894775, -1.2183897495269775, -1.1416075229644775, -1.0648252964019775, -0.9880430102348328, -0.9112607836723328, -0.834478497505188, -0.757696270942688, -0.680914044380188, -0.604131817817688, -0.527349591255188, -0.4505673050880432, -0.3737850785255432, -0.2970028519630432, -0.22022059559822083, -0.14343833923339844, -0.06665635108947754, 0.010125890374183655, 0.08690813183784485, 0.16369037330150604, 0.24047261476516724, 0.31725484132766724, 0.3940370976924896, 0.470819354057312, 0.547601580619812, 0.624383807182312, 0.701166033744812, 0.7779483199119568, 0.8547305464744568, 0.9315127730369568, 1.0082950592041016, 1.0850772857666016, 1.1618595123291016, 1.2386417388916016, 1.3154239654541016, 1.3922061920166016, 1.4689884185791016, 1.5457706451416016, 1.6225529909133911, 1.6993352174758911, 1.7761174440383911, 1.8528996706008911, 1.9296818971633911, 2.0064642429351807, 2.0832464694976807, 2.1600286960601807, 2.2368109226226807, 2.3135931491851807, 2.3903753757476807]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 7.0, 7.0, 17.0, 18.0, 11.0, 19.0, 32.0, 34.0, 69.0, 47.0, 73.0, 179.0, 644.0, 4099.0, 41985.0, 810478.0, 176058.0, 12478.0, 1497.0, 314.0, 126.0, 77.0, 65.0, 45.0, 32.0, 29.0, 21.0, 17.0, 17.0, 13.0, 9.0, 6.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0625, -12.6234130859375, -12.184326171875, -11.7452392578125, -11.30615234375, -10.8670654296875, -10.427978515625, -9.9888916015625, -9.5498046875, -9.1107177734375, -8.671630859375, -8.2325439453125, -7.79345703125, -7.3543701171875, -6.915283203125, -6.4761962890625, -6.037109375, -5.5980224609375, -5.158935546875, -4.7198486328125, -4.28076171875, -3.8416748046875, -3.402587890625, -2.9635009765625, -2.5244140625, -2.0853271484375, -1.646240234375, -1.2071533203125, -0.76806640625, -0.3289794921875, 0.110107421875, 0.5491943359375, 0.98828125, 1.4273681640625, 1.866455078125, 2.3055419921875, 2.74462890625, 3.1837158203125, 3.622802734375, 4.0618896484375, 4.5009765625, 4.9400634765625, 5.379150390625, 5.8182373046875, 6.25732421875, 6.6964111328125, 7.135498046875, 7.5745849609375, 8.013671875, 8.4527587890625, 8.891845703125, 9.3309326171875, 9.77001953125, 10.2091064453125, 10.648193359375, 11.0872802734375, 11.5263671875, 11.9654541015625, 12.404541015625, 12.8436279296875, 13.28271484375, 13.7218017578125, 14.160888671875, 14.5999755859375, 15.0390625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 18.0, 23.0, 48.0, 51.0, 93.0, 100.0, 130.0, 122.0, 118.0, 97.0, 83.0, 55.0, 33.0, 22.0, 8.0, 9.0], "bins": [-7.25390625, -7.1226043701171875, -6.991302490234375, -6.8600006103515625, -6.72869873046875, -6.5973968505859375, -6.466094970703125, -6.3347930908203125, -6.2034912109375, -6.0721893310546875, -5.940887451171875, -5.8095855712890625, -5.67828369140625, -5.5469818115234375, -5.415679931640625, -5.2843780517578125, -5.153076171875, -5.0217742919921875, -4.890472412109375, -4.7591705322265625, -4.62786865234375, -4.4965667724609375, -4.365264892578125, -4.2339630126953125, -4.1026611328125, -3.9713592529296875, -3.840057373046875, -3.7087554931640625, -3.57745361328125, -3.4461517333984375, -3.314849853515625, -3.1835479736328125, -3.05224609375, -2.9209442138671875, -2.789642333984375, -2.6583404541015625, -2.52703857421875, -2.3957366943359375, -2.264434814453125, -2.1331329345703125, -2.0018310546875, -1.8705291748046875, -1.739227294921875, -1.6079254150390625, -1.47662353515625, -1.3453216552734375, -1.214019775390625, -1.0827178955078125, -0.951416015625, -0.8201141357421875, -0.688812255859375, -0.5575103759765625, -0.42620849609375, -0.2949066162109375, -0.163604736328125, -0.0323028564453125, 0.0989990234375, 0.2303009033203125, 0.361602783203125, 0.4929046630859375, 0.62420654296875, 0.7555084228515625, 0.886810302734375, 1.0181121826171875, 1.1494140625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 7.0, 14.0, 15.0, 15.0, 8.0, 15.0, 14.0, 12.0, 33.0, 29.0, 23.0, 30.0, 30.0, 42.0, 56.0, 142.0, 787.0, 13488.0, 787172.0, 239756.0, 5919.0, 437.0, 121.0, 58.0, 49.0, 39.0, 28.0, 22.0, 26.0, 28.0, 23.0, 9.0, 13.0, 13.0, 14.0, 8.0, 14.0, 10.0, 6.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.09375, -15.572509765625, -15.05126953125, -14.530029296875, -14.0087890625, -13.487548828125, -12.96630859375, -12.445068359375, -11.923828125, -11.402587890625, -10.88134765625, -10.360107421875, -9.8388671875, -9.317626953125, -8.79638671875, -8.275146484375, -7.75390625, -7.232666015625, -6.71142578125, -6.190185546875, -5.6689453125, -5.147705078125, -4.62646484375, -4.105224609375, -3.583984375, -3.062744140625, -2.54150390625, -2.020263671875, -1.4990234375, -0.977783203125, -0.45654296875, 0.064697265625, 0.5859375, 1.107177734375, 1.62841796875, 2.149658203125, 2.6708984375, 3.192138671875, 3.71337890625, 4.234619140625, 4.755859375, 5.277099609375, 5.79833984375, 6.319580078125, 6.8408203125, 7.362060546875, 7.88330078125, 8.404541015625, 8.92578125, 9.447021484375, 9.96826171875, 10.489501953125, 11.0107421875, 11.531982421875, 12.05322265625, 12.574462890625, 13.095703125, 13.616943359375, 14.13818359375, 14.659423828125, 15.1806640625, 15.701904296875, 16.22314453125, 16.744384765625, 17.265625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 0.0, 10.0, 9.0, 10.0, 10.0, 16.0, 13.0, 14.0, 26.0, 20.0, 28.0, 24.0, 30.0, 29.0, 33.0, 38.0, 41.0, 45.0, 33.0, 44.0, 47.0, 37.0, 50.0, 37.0, 43.0, 39.0, 42.0, 28.0, 27.0, 27.0, 29.0, 19.0, 13.0, 13.0, 13.0, 10.0, 6.0, 14.0, 10.0, 4.0, 10.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.73046875, -1.6729278564453125, -1.615386962890625, -1.5578460693359375, -1.50030517578125, -1.4427642822265625, -1.385223388671875, -1.3276824951171875, -1.2701416015625, -1.2126007080078125, -1.155059814453125, -1.0975189208984375, -1.03997802734375, -0.9824371337890625, -0.924896240234375, -0.8673553466796875, -0.809814453125, -0.7522735595703125, -0.694732666015625, -0.6371917724609375, -0.57965087890625, -0.5221099853515625, -0.464569091796875, -0.4070281982421875, -0.3494873046875, -0.2919464111328125, -0.234405517578125, -0.1768646240234375, -0.11932373046875, -0.0617828369140625, -0.004241943359375, 0.0532989501953125, 0.11083984375, 0.1683807373046875, 0.225921630859375, 0.2834625244140625, 0.34100341796875, 0.3985443115234375, 0.456085205078125, 0.5136260986328125, 0.5711669921875, 0.6287078857421875, 0.686248779296875, 0.7437896728515625, 0.80133056640625, 0.8588714599609375, 0.916412353515625, 0.9739532470703125, 1.031494140625, 1.0890350341796875, 1.146575927734375, 1.2041168212890625, 1.26165771484375, 1.3191986083984375, 1.376739501953125, 1.4342803955078125, 1.4918212890625, 1.5493621826171875, 1.606903076171875, 1.6644439697265625, 1.72198486328125, 1.7795257568359375, 1.837066650390625, 1.8946075439453125, 1.9521484375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 10.0, 7.0, 12.0, 13.0, 24.0, 38.0, 67.0, 244.0, 1106.0, 8792.0, 770719.0, 259550.0, 6621.0, 950.0, 209.0, 63.0, 32.0, 22.0, 15.0, 11.0, 7.0, 4.0, 4.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.361083984375, -0.35131072998046875, -0.3415374755859375, -0.33176422119140625, -0.321990966796875, -0.31221771240234375, -0.3024444580078125, -0.29267120361328125, -0.28289794921875, -0.27312469482421875, -0.2633514404296875, -0.25357818603515625, -0.243804931640625, -0.23403167724609375, -0.2242584228515625, -0.21448516845703125, -0.2047119140625, -0.19493865966796875, -0.1851654052734375, -0.17539215087890625, -0.165618896484375, -0.15584564208984375, -0.1460723876953125, -0.13629913330078125, -0.12652587890625, -0.11675262451171875, -0.1069793701171875, -0.09720611572265625, -0.087432861328125, -0.07765960693359375, -0.0678863525390625, -0.05811309814453125, -0.04833984375, -0.03856658935546875, -0.0287933349609375, -0.01902008056640625, -0.009246826171875, 0.00052642822265625, 0.0102996826171875, 0.02007293701171875, 0.02984619140625, 0.03961944580078125, 0.0493927001953125, 0.05916595458984375, 0.068939208984375, 0.07871246337890625, 0.0884857177734375, 0.09825897216796875, 0.1080322265625, 0.11780548095703125, 0.1275787353515625, 0.13735198974609375, 0.147125244140625, 0.15689849853515625, 0.1666717529296875, 0.17644500732421875, 0.18621826171875, 0.19599151611328125, 0.2057647705078125, 0.21553802490234375, 0.225311279296875, 0.23508453369140625, 0.2448577880859375, 0.25463104248046875, 0.264404296875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 7.0, 8.0, 12.0, 11.0, 22.0, 23.0, 31.0, 35.0, 58.0, 113.0, 204.0, 189.0, 89.0, 51.0, 41.0, 28.0, 25.0, 15.0, 11.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.962350845336914e-05, -2.8631649911403656e-05, -2.763979136943817e-05, -2.6647932827472687e-05, -2.5656074285507202e-05, -2.4664215743541718e-05, -2.3672357201576233e-05, -2.2680498659610748e-05, -2.1688640117645264e-05, -2.069678157567978e-05, -1.9704923033714294e-05, -1.871306449174881e-05, -1.7721205949783325e-05, -1.672934740781784e-05, -1.5737488865852356e-05, -1.4745630323886871e-05, -1.3753771781921387e-05, -1.2761913239955902e-05, -1.1770054697990417e-05, -1.0778196156024933e-05, -9.786337614059448e-06, -8.794479072093964e-06, -7.802620530128479e-06, -6.810761988162994e-06, -5.81890344619751e-06, -4.827044904232025e-06, -3.8351863622665405e-06, -2.843327820301056e-06, -1.8514692783355713e-06, -8.596107363700867e-07, 1.3224780559539795e-07, 1.1241063475608826e-06, 2.115964889526367e-06, 3.107823431491852e-06, 4.0996819734573364e-06, 5.091540515422821e-06, 6.083399057388306e-06, 7.07525759935379e-06, 8.067116141319275e-06, 9.05897468328476e-06, 1.0050833225250244e-05, 1.1042691767215729e-05, 1.2034550309181213e-05, 1.3026408851146698e-05, 1.4018267393112183e-05, 1.5010125935077667e-05, 1.6001984477043152e-05, 1.6993843019008636e-05, 1.798570156097412e-05, 1.8977560102939606e-05, 1.996941864490509e-05, 2.0961277186870575e-05, 2.195313572883606e-05, 2.2944994270801544e-05, 2.393685281276703e-05, 2.4928711354732513e-05, 2.5920569896697998e-05, 2.6912428438663483e-05, 2.7904286980628967e-05, 2.8896145522594452e-05, 2.9888004064559937e-05, 3.087986260652542e-05, 3.1871721148490906e-05, 3.286357969045639e-05, 3.3855438232421875e-05]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 3.0, 3.0, 6.0, 2.0, 7.0, 6.0, 6.0, 10.0, 18.0, 25.0, 46.0, 76.0, 206.0, 1642.0, 45716.0, 993558.0, 6419.0, 553.0, 122.0, 47.0, 22.0, 14.0, 10.0, 8.0, 6.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.37109375, -0.3608512878417969, -0.35060882568359375, -0.3403663635253906, -0.3301239013671875, -0.3198814392089844, -0.30963897705078125, -0.2993965148925781, -0.289154052734375, -0.2789115905761719, -0.26866912841796875, -0.2584266662597656, -0.2481842041015625, -0.23794174194335938, -0.22769927978515625, -0.21745681762695312, -0.20721435546875, -0.19697189331054688, -0.18672943115234375, -0.17648696899414062, -0.1662445068359375, -0.15600204467773438, -0.14575958251953125, -0.13551712036132812, -0.125274658203125, -0.11503219604492188, -0.10478973388671875, -0.09454727172851562, -0.0843048095703125, -0.07406234741210938, -0.06381988525390625, -0.053577423095703125, -0.0433349609375, -0.033092498779296875, -0.02285003662109375, -0.012607574462890625, -0.0023651123046875, 0.007877349853515625, 0.01811981201171875, 0.028362274169921875, 0.038604736328125, 0.048847198486328125, 0.05908966064453125, 0.06933212280273438, 0.0795745849609375, 0.08981704711914062, 0.10005950927734375, 0.11030197143554688, 0.12054443359375, 0.13078689575195312, 0.14102935791015625, 0.15127182006835938, 0.1615142822265625, 0.17175674438476562, 0.18199920654296875, 0.19224166870117188, 0.202484130859375, 0.21272659301757812, 0.22296905517578125, 0.23321151733398438, 0.2434539794921875, 0.2536964416503906, 0.26393890380859375, 0.2741813659667969, 0.284423828125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 0.0, 5.0, 2.0, 5.0, 8.0, 6.0, 9.0, 9.0, 25.0, 26.0, 56.0, 74.0, 147.0, 189.0, 190.0, 102.0, 45.0, 25.0, 18.0, 11.0, 9.0, 7.0, 5.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.048614501953125, -0.0472569465637207, -0.045899391174316406, -0.04454183578491211, -0.04318428039550781, -0.041826725006103516, -0.04046916961669922, -0.03911161422729492, -0.037754058837890625, -0.03639650344848633, -0.03503894805908203, -0.033681392669677734, -0.03232383728027344, -0.03096628189086914, -0.029608726501464844, -0.028251171112060547, -0.02689361572265625, -0.025536060333251953, -0.024178504943847656, -0.02282094955444336, -0.021463394165039062, -0.020105838775634766, -0.01874828338623047, -0.017390727996826172, -0.016033172607421875, -0.014675617218017578, -0.013318061828613281, -0.011960506439208984, -0.010602951049804688, -0.00924539566040039, -0.007887840270996094, -0.006530284881591797, -0.0051727294921875, -0.003815174102783203, -0.0024576187133789062, -0.0011000633239746094, 0.0002574920654296875, 0.0016150474548339844, 0.0029726028442382812, 0.004330158233642578, 0.005687713623046875, 0.007045269012451172, 0.008402824401855469, 0.009760379791259766, 0.011117935180664062, 0.01247549057006836, 0.013833045959472656, 0.015190601348876953, 0.01654815673828125, 0.017905712127685547, 0.019263267517089844, 0.02062082290649414, 0.021978378295898438, 0.023335933685302734, 0.02469348907470703, 0.026051044464111328, 0.027408599853515625, 0.028766155242919922, 0.03012371063232422, 0.031481266021728516, 0.03283882141113281, 0.03419637680053711, 0.035553932189941406, 0.0369114875793457, 0.03826904296875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 32.0, 578.0, 344.0, 42.0, 13.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.795896530151367, -23.370182037353516, -22.944467544555664, -22.518753051757812, -22.09303855895996, -21.66732406616211, -21.241609573364258, -20.815895080566406, -20.390178680419922, -19.96446418762207, -19.53874969482422, -19.113035202026367, -18.687320709228516, -18.261606216430664, -17.835891723632812, -17.410175323486328, -16.98446273803711, -16.558748245239258, -16.133033752441406, -15.707319259643555, -15.281604766845703, -14.855890274047852, -14.430174827575684, -14.004460334777832, -13.57874584197998, -13.153031349182129, -12.727316856384277, -12.301602363586426, -11.875886917114258, -11.450172424316406, -11.024457931518555, -10.598743438720703, -10.173028945922852, -9.747314453125, -9.321599960327148, -8.895885467529297, -8.470170974731445, -8.044456481933594, -7.618741035461426, -7.193026542663574, -6.7673115730285645, -6.341597080230713, -5.915882110595703, -5.490167617797852, -5.064453125, -4.638738632202148, -4.213024139404297, -3.787309169769287, -3.3615946769714355, -2.935880184173584, -2.5101654529571533, -2.0844507217407227, -1.658736228942871, -1.2330217361450195, -0.8073070049285889, -0.3815922737121582, 0.04412221908569336, 0.4698368310928345, 0.8955514430999756, 1.3212660551071167, 1.7469806671142578, 2.1726951599121094, 2.59840989112854, 3.0241246223449707, 3.4498391151428223]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 6.0, 14.0, 17.0, 10.0, 14.0, 27.0, 40.0, 32.0, 58.0, 53.0, 59.0, 53.0, 51.0, 64.0, 61.0, 51.0, 52.0, 57.0, 61.0, 28.0, 38.0, 30.0, 30.0, 25.0, 12.0, 11.0, 7.0, 8.0, 5.0, 7.0, 2.0, 7.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.418497562408447, -4.313572406768799, -4.20864725112915, -4.103722095489502, -3.9987969398498535, -3.893871784210205, -3.7889466285705566, -3.684021472930908, -3.5790963172912598, -3.4741711616516113, -3.369246006011963, -3.2643208503723145, -3.159395694732666, -3.0544705390930176, -2.949545383453369, -2.8446202278137207, -2.739694833755493, -2.6347696781158447, -2.5298445224761963, -2.424919366836548, -2.3199942111968994, -2.215069055557251, -2.1101436614990234, -2.005218505859375, -1.9002934694290161, -1.7953683137893677, -1.6904431581497192, -1.5855178833007812, -1.4805927276611328, -1.3756675720214844, -1.270742416381836, -1.1658172607421875, -1.060892105102539, -0.9559669494628906, -0.8510417938232422, -0.746116578578949, -0.6411914229393005, -0.5362662672996521, -0.4313410520553589, -0.32641589641571045, -0.221490740776062, -0.11656557023525238, -0.011640399694442749, 0.09328478574752808, 0.1982099413871765, 0.30313509702682495, 0.40806031227111816, 0.5129854679107666, 0.617910623550415, 0.7228357791900635, 0.8277609348297119, 0.9326861500740051, 1.0376112461090088, 1.1425364017486572, 1.2474616765975952, 1.3523868322372437, 1.457311987876892, 1.5622371435165405, 1.667162299156189, 1.772087574005127, 1.8770127296447754, 1.9819378852844238, 2.0868630409240723, 2.1917881965637207, 2.296713352203369]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 6.0, 7.0, 9.0, 16.0, 18.0, 26.0, 36.0, 48.0, 61.0, 109.0, 145.0, 278.0, 536.0, 1347.0, 3669.0, 3791680.0, 390196.0, 3450.0, 1293.0, 582.0, 272.0, 172.0, 82.0, 44.0, 50.0, 30.0, 18.0, 15.0, 11.0, 13.0, 10.0, 13.0, 7.0, 3.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.734375, -15.3087158203125, -14.883056640625, -14.4573974609375, -14.03173828125, -13.6060791015625, -13.180419921875, -12.7547607421875, -12.3291015625, -11.9034423828125, -11.477783203125, -11.0521240234375, -10.62646484375, -10.2008056640625, -9.775146484375, -9.3494873046875, -8.923828125, -8.4981689453125, -8.072509765625, -7.6468505859375, -7.22119140625, -6.7955322265625, -6.369873046875, -5.9442138671875, -5.5185546875, -5.0928955078125, -4.667236328125, -4.2415771484375, -3.81591796875, -3.3902587890625, -2.964599609375, -2.5389404296875, -2.11328125, -1.6876220703125, -1.261962890625, -0.8363037109375, -0.41064453125, 0.0150146484375, 0.440673828125, 0.8663330078125, 1.2919921875, 1.7176513671875, 2.143310546875, 2.5689697265625, 2.99462890625, 3.4202880859375, 3.845947265625, 4.2716064453125, 4.697265625, 5.1229248046875, 5.548583984375, 5.9742431640625, 6.39990234375, 6.8255615234375, 7.251220703125, 7.6768798828125, 8.1025390625, 8.5281982421875, 8.953857421875, 9.3795166015625, 9.80517578125, 10.2308349609375, 10.656494140625, 11.0821533203125, 11.5078125]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 5.0, 7.0, 10.0, 14.0, 17.0, 23.0, 26.0, 26.0, 37.0, 54.0, 34.0, 45.0, 31.0, 46.0, 61.0, 43.0, 38.0, 57.0, 55.0, 37.0, 40.0, 45.0, 36.0, 26.0, 32.0, 24.0, 19.0, 16.0, 13.0, 11.0, 11.0, 15.0, 5.0, 8.0, 4.0, 2.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.90966796875, -0.8843154907226562, -0.8589630126953125, -0.8336105346679688, -0.808258056640625, -0.7829055786132812, -0.7575531005859375, -0.7322006225585938, -0.70684814453125, -0.6814956665039062, -0.6561431884765625, -0.6307907104492188, -0.605438232421875, -0.5800857543945312, -0.5547332763671875, -0.5293807983398438, -0.5040283203125, -0.47867584228515625, -0.4533233642578125, -0.42797088623046875, -0.402618408203125, -0.37726593017578125, -0.3519134521484375, -0.32656097412109375, -0.30120849609375, -0.27585601806640625, -0.2505035400390625, -0.22515106201171875, -0.199798583984375, -0.17444610595703125, -0.1490936279296875, -0.12374114990234375, -0.098388671875, -0.07303619384765625, -0.0476837158203125, -0.02233123779296875, 0.003021240234375, 0.02837371826171875, 0.0537261962890625, 0.07907867431640625, 0.10443115234375, 0.12978363037109375, 0.1551361083984375, 0.18048858642578125, 0.205841064453125, 0.23119354248046875, 0.2565460205078125, 0.28189849853515625, 0.3072509765625, 0.33260345458984375, 0.3579559326171875, 0.38330841064453125, 0.408660888671875, 0.43401336669921875, 0.4593658447265625, 0.48471832275390625, 0.51007080078125, 0.5354232788085938, 0.5607757568359375, 0.5861282348632812, 0.611480712890625, 0.6368331909179688, 0.6621856689453125, 0.6875381469726562, 0.712890625]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 12.0, 12.0, 26.0, 31.0, 81.0, 283.0, 1799.0, 326908.0, 3862405.0, 2227.0, 308.0, 96.0, 35.0, 20.0, 16.0, 11.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.109375, -16.75323486328125, -16.3970947265625, -16.04095458984375, -15.684814453125, -15.32867431640625, -14.9725341796875, -14.61639404296875, -14.26025390625, -13.90411376953125, -13.5479736328125, -13.19183349609375, -12.835693359375, -12.47955322265625, -12.1234130859375, -11.76727294921875, -11.4111328125, -11.05499267578125, -10.6988525390625, -10.34271240234375, -9.986572265625, -9.63043212890625, -9.2742919921875, -8.91815185546875, -8.56201171875, -8.20587158203125, -7.8497314453125, -7.49359130859375, -7.137451171875, -6.78131103515625, -6.4251708984375, -6.06903076171875, -5.712890625, -5.35675048828125, -5.0006103515625, -4.64447021484375, -4.288330078125, -3.93218994140625, -3.5760498046875, -3.21990966796875, -2.86376953125, -2.50762939453125, -2.1514892578125, -1.79534912109375, -1.439208984375, -1.08306884765625, -0.7269287109375, -0.37078857421875, -0.0146484375, 0.34149169921875, 0.6976318359375, 1.05377197265625, 1.409912109375, 1.76605224609375, 2.1221923828125, 2.47833251953125, 2.83447265625, 3.19061279296875, 3.5467529296875, 3.90289306640625, 4.259033203125, 4.61517333984375, 4.9713134765625, 5.32745361328125, 5.68359375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 8.0, 10.0, 40.0, 173.0, 615.0, 2594.0, 439.0, 116.0, 36.0, 9.0, 9.0, 6.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.337890625, -0.31842041015625, -0.2989501953125, -0.27947998046875, -0.260009765625, -0.24053955078125, -0.2210693359375, -0.20159912109375, -0.18212890625, -0.16265869140625, -0.1431884765625, -0.12371826171875, -0.104248046875, -0.08477783203125, -0.0653076171875, -0.04583740234375, -0.0263671875, -0.00689697265625, 0.0125732421875, 0.03204345703125, 0.051513671875, 0.07098388671875, 0.0904541015625, 0.10992431640625, 0.12939453125, 0.14886474609375, 0.1683349609375, 0.18780517578125, 0.207275390625, 0.22674560546875, 0.2462158203125, 0.26568603515625, 0.28515625, 0.30462646484375, 0.3240966796875, 0.34356689453125, 0.363037109375, 0.38250732421875, 0.4019775390625, 0.42144775390625, 0.44091796875, 0.46038818359375, 0.4798583984375, 0.49932861328125, 0.518798828125, 0.53826904296875, 0.5577392578125, 0.57720947265625, 0.5966796875, 0.61614990234375, 0.6356201171875, 0.65509033203125, 0.674560546875, 0.69403076171875, 0.7135009765625, 0.73297119140625, 0.75244140625, 0.77191162109375, 0.7913818359375, 0.81085205078125, 0.830322265625, 0.84979248046875, 0.8692626953125, 0.88873291015625, 0.908203125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 13.0, 44.0, 162.0, 580.0, 139.0, 40.0, 27.0, 4.0, 4.0, 0.0, 0.0, 1.0], "bins": [-9.706134796142578, -9.531092643737793, -9.356050491333008, -9.181008338928223, -9.005966186523438, -8.830924034118652, -8.655881881713867, -8.480838775634766, -8.305797576904297, -8.130755424499512, -7.955713272094727, -7.780671119689941, -7.605628967285156, -7.430586338043213, -7.255544185638428, -7.080502033233643, -6.905459403991699, -6.730417251586914, -6.555375099182129, -6.380332946777344, -6.205290794372559, -6.030248165130615, -5.85520601272583, -5.680163860321045, -5.50512170791626, -5.330079555511475, -5.1550374031066895, -4.979995250701904, -4.804952621459961, -4.629910469055176, -4.454868316650391, -4.2798261642456055, -4.104783535003662, -3.929741382598877, -3.754699230194092, -3.5796568393707275, -3.4046146869659424, -3.2295725345611572, -3.054530143737793, -2.879487991333008, -2.7044458389282227, -2.5294036865234375, -2.3543615341186523, -2.179319143295288, -2.004276990890503, -1.8292348384857178, -1.654192566871643, -1.4791502952575684, -1.3041082620620728, -1.129065990447998, -0.9540238380432129, -0.778981626033783, -0.603939414024353, -0.4288972020149231, -0.25385499000549316, -0.07881271839141846, 0.0962294340133667, 0.27127164602279663, 0.44631385803222656, 0.6213560700416565, 0.7963982820510864, 0.9714404940605164, 1.1464827060699463, 1.321524977684021, 1.4965671300888062]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 5.0, 3.0, 5.0, 6.0, 10.0, 23.0, 28.0, 42.0, 37.0, 55.0, 66.0, 52.0, 76.0, 78.0, 83.0, 78.0, 60.0, 48.0, 54.0, 37.0, 46.0, 29.0, 20.0, 21.0, 16.0, 10.0, 6.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.677977204322815, -1.6391839981079102, -1.6003907918930054, -1.5615975856781006, -1.5228043794631958, -1.484011173248291, -1.4452180862426758, -1.406424880027771, -1.3676316738128662, -1.3288384675979614, -1.2900452613830566, -1.2512520551681519, -1.212458848953247, -1.1736657619476318, -1.1348724365234375, -1.0960793495178223, -1.057286024093628, -1.0184928178787231, -0.9796996116638184, -0.9409064054489136, -0.9021132588386536, -0.8633200526237488, -0.824526846408844, -0.785733699798584, -0.7469404935836792, -0.7081472873687744, -0.6693540811538696, -0.6305608749389648, -0.5917677283287048, -0.5529745221138, -0.5141813158988953, -0.47538813948631287, -0.43659496307373047, -0.3978017568588257, -0.3590085804462433, -0.3202153742313385, -0.2814221978187561, -0.24262899160385132, -0.20383578538894653, -0.16504260897636414, -0.12624940276145935, -0.08745621144771576, -0.04866301268339157, -0.009869813919067383, 0.02892337739467621, 0.0677165687084198, 0.10650977492332458, 0.14530295133590698, 0.18409615755081177, 0.22288934886455536, 0.26168254017829895, 0.30047574639320374, 0.33926892280578613, 0.3780621290206909, 0.4168553352355957, 0.4556485116481781, 0.4944417178630829, 0.5332348942756653, 0.5720281004905701, 0.6108213067054749, 0.6496145129203796, 0.6884076595306396, 0.7272008657455444, 0.7659940719604492, 0.804787278175354]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 2.0, 5.0, 3.0, 13.0, 11.0, 12.0, 10.0, 18.0, 34.0, 81.0, 126.0, 230.0, 468.0, 1040.0, 2435.0, 6645.0, 20585.0, 86728.0, 676380.0, 199260.0, 37009.0, 10677.0, 3908.0, 1514.0, 640.0, 323.0, 156.0, 85.0, 43.0, 31.0, 18.0, 15.0, 6.0, 7.0, 1.0, 3.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.83984375, -3.71484375, -3.58984375, -3.46484375, -3.33984375, -3.21484375, -3.08984375, -2.96484375, -2.83984375, -2.71484375, -2.58984375, -2.46484375, -2.33984375, -2.21484375, -2.08984375, -1.96484375, -1.83984375, -1.71484375, -1.58984375, -1.46484375, -1.33984375, -1.21484375, -1.08984375, -0.96484375, -0.83984375, -0.71484375, -0.58984375, -0.46484375, -0.33984375, -0.21484375, -0.08984375, 0.03515625, 0.16015625, 0.28515625, 0.41015625, 0.53515625, 0.66015625, 0.78515625, 0.91015625, 1.03515625, 1.16015625, 1.28515625, 1.41015625, 1.53515625, 1.66015625, 1.78515625, 1.91015625, 2.03515625, 2.16015625, 2.28515625, 2.41015625, 2.53515625, 2.66015625, 2.78515625, 2.91015625, 3.03515625, 3.16015625, 3.28515625, 3.41015625, 3.53515625, 3.66015625, 3.78515625, 3.91015625, 4.03515625, 4.16015625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 8.0, 14.0, 8.0, 21.0, 45.0, 47.0, 54.0, 69.0, 83.0, 94.0, 94.0, 97.0, 71.0, 67.0, 53.0, 49.0, 43.0, 33.0, 17.0, 18.0, 7.0, 8.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2451171875, -1.2178497314453125, -1.190582275390625, -1.1633148193359375, -1.13604736328125, -1.1087799072265625, -1.081512451171875, -1.0542449951171875, -1.0269775390625, -0.9997100830078125, -0.972442626953125, -0.9451751708984375, -0.91790771484375, -0.8906402587890625, -0.863372802734375, -0.8361053466796875, -0.808837890625, -0.7815704345703125, -0.754302978515625, -0.7270355224609375, -0.69976806640625, -0.6725006103515625, -0.645233154296875, -0.6179656982421875, -0.5906982421875, -0.5634307861328125, -0.536163330078125, -0.5088958740234375, -0.48162841796875, -0.4543609619140625, -0.427093505859375, -0.3998260498046875, -0.37255859375, -0.3452911376953125, -0.318023681640625, -0.2907562255859375, -0.26348876953125, -0.2362213134765625, -0.208953857421875, -0.1816864013671875, -0.1544189453125, -0.1271514892578125, -0.099884033203125, -0.0726165771484375, -0.04534912109375, -0.0180816650390625, 0.009185791015625, 0.0364532470703125, 0.063720703125, 0.0909881591796875, 0.118255615234375, 0.1455230712890625, 0.17279052734375, 0.2000579833984375, 0.227325439453125, 0.2545928955078125, 0.2818603515625, 0.3091278076171875, 0.336395263671875, 0.3636627197265625, 0.39093017578125, 0.4181976318359375, 0.445465087890625, 0.4727325439453125, 0.5]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 3.0, 8.0, 6.0, 16.0, 9.0, 30.0, 61.0, 91.0, 93.0, 168.0, 217.0, 350.0, 467.0, 768.0, 1206.0, 1959.0, 3177.0, 5472.0, 10104.0, 19994.0, 49073.0, 238580.0, 605057.0, 60824.0, 23453.0, 11638.0, 6127.0, 3528.0, 2196.0, 1341.0, 824.0, 575.0, 345.0, 244.0, 166.0, 146.0, 78.0, 53.0, 34.0, 34.0, 13.0, 6.0, 9.0, 9.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7490234375, -1.69091796875, -1.6328125, -1.57470703125, -1.5166015625, -1.45849609375, -1.400390625, -1.34228515625, -1.2841796875, -1.22607421875, -1.16796875, -1.10986328125, -1.0517578125, -0.99365234375, -0.935546875, -0.87744140625, -0.8193359375, -0.76123046875, -0.703125, -0.64501953125, -0.5869140625, -0.52880859375, -0.470703125, -0.41259765625, -0.3544921875, -0.29638671875, -0.23828125, -0.18017578125, -0.1220703125, -0.06396484375, -0.005859375, 0.05224609375, 0.1103515625, 0.16845703125, 0.2265625, 0.28466796875, 0.3427734375, 0.40087890625, 0.458984375, 0.51708984375, 0.5751953125, 0.63330078125, 0.69140625, 0.74951171875, 0.8076171875, 0.86572265625, 0.923828125, 0.98193359375, 1.0400390625, 1.09814453125, 1.15625, 1.21435546875, 1.2724609375, 1.33056640625, 1.388671875, 1.44677734375, 1.5048828125, 1.56298828125, 1.62109375, 1.67919921875, 1.7373046875, 1.79541015625, 1.853515625, 1.91162109375, 1.9697265625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 20.0, 5.0, 12.0, 19.0, 25.0, 26.0, 17.0, 34.0, 26.0, 37.0, 40.0, 48.0, 44.0, 50.0, 42.0, 54.0, 49.0, 35.0, 48.0, 51.0, 41.0, 54.0, 37.0, 31.0, 18.0, 22.0, 18.0, 18.0, 17.0, 14.0, 6.0, 14.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.336669921875, -0.3259239196777344, -0.31517791748046875, -0.3044319152832031, -0.2936859130859375, -0.2829399108886719, -0.27219390869140625, -0.2614479064941406, -0.250701904296875, -0.23995590209960938, -0.22920989990234375, -0.21846389770507812, -0.2077178955078125, -0.19697189331054688, -0.18622589111328125, -0.17547988891601562, -0.16473388671875, -0.15398788452148438, -0.14324188232421875, -0.13249588012695312, -0.1217498779296875, -0.11100387573242188, -0.10025787353515625, -0.08951187133789062, -0.078765869140625, -0.06801986694335938, -0.05727386474609375, -0.046527862548828125, -0.0357818603515625, -0.025035858154296875, -0.01428985595703125, -0.003543853759765625, 0.0072021484375, 0.017948150634765625, 0.02869415283203125, 0.039440155029296875, 0.0501861572265625, 0.060932159423828125, 0.07167816162109375, 0.08242416381835938, 0.093170166015625, 0.10391616821289062, 0.11466217041015625, 0.12540817260742188, 0.1361541748046875, 0.14690017700195312, 0.15764617919921875, 0.16839218139648438, 0.17913818359375, 0.18988418579101562, 0.20063018798828125, 0.21137619018554688, 0.2221221923828125, 0.23286819458007812, 0.24361419677734375, 0.2543601989746094, 0.265106201171875, 0.2758522033691406, 0.28659820556640625, 0.2973442077636719, 0.3080902099609375, 0.3188362121582031, 0.32958221435546875, 0.3403282165527344, 0.35107421875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 7.0, 17.0, 28.0, 29.0, 35.0, 67.0, 82.0, 109.0, 190.0, 280.0, 491.0, 755.0, 1160.0, 2043.0, 4120.0, 10007.0, 53684.0, 910466.0, 46324.0, 9604.0, 3902.0, 2020.0, 1118.0, 692.0, 450.0, 309.0, 165.0, 143.0, 59.0, 63.0, 37.0, 35.0, 14.0, 5.0, 14.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2076416015625, -0.20082664489746094, -0.19401168823242188, -0.1871967315673828, -0.18038177490234375, -0.1735668182373047, -0.16675186157226562, -0.15993690490722656, -0.1531219482421875, -0.14630699157714844, -0.13949203491210938, -0.1326770782470703, -0.12586212158203125, -0.11904716491699219, -0.11223220825195312, -0.10541725158691406, -0.098602294921875, -0.09178733825683594, -0.08497238159179688, -0.07815742492675781, -0.07134246826171875, -0.06452751159667969, -0.057712554931640625, -0.05089759826660156, -0.0440826416015625, -0.03726768493652344, -0.030452728271484375, -0.023637771606445312, -0.01682281494140625, -0.010007858276367188, -0.003192901611328125, 0.0036220550537109375, 0.01043701171875, 0.017251968383789062, 0.024066925048828125, 0.030881881713867188, 0.03769683837890625, 0.04451179504394531, 0.051326751708984375, 0.05814170837402344, 0.0649566650390625, 0.07177162170410156, 0.07858657836914062, 0.08540153503417969, 0.09221649169921875, 0.09903144836425781, 0.10584640502929688, 0.11266136169433594, 0.119476318359375, 0.12629127502441406, 0.13310623168945312, 0.1399211883544922, 0.14673614501953125, 0.1535511016845703, 0.16036605834960938, 0.16718101501464844, 0.1739959716796875, 0.18081092834472656, 0.18762588500976562, 0.1944408416748047, 0.20125579833984375, 0.2080707550048828, 0.21488571166992188, 0.22170066833496094, 0.228515625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 1.0, 4.0, 6.0, 2.0, 3.0, 6.0, 14.0, 6.0, 12.0, 12.0, 16.0, 18.0, 31.0, 55.0, 75.0, 105.0, 137.0, 149.0, 104.0, 74.0, 42.0, 31.0, 14.0, 20.0, 17.0, 11.0, 12.0, 8.0, 5.0, 6.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.3942203521728516e-05, -5.244184285402298e-05, -5.0941482186317444e-05, -4.944112151861191e-05, -4.794076085090637e-05, -4.6440400183200836e-05, -4.49400395154953e-05, -4.3439678847789764e-05, -4.193931818008423e-05, -4.043895751237869e-05, -3.893859684467316e-05, -3.743823617696762e-05, -3.5937875509262085e-05, -3.443751484155655e-05, -3.293715417385101e-05, -3.143679350614548e-05, -2.993643283843994e-05, -2.8436072170734406e-05, -2.693571150302887e-05, -2.5435350835323334e-05, -2.3934990167617798e-05, -2.2434629499912262e-05, -2.0934268832206726e-05, -1.943390816450119e-05, -1.7933547496795654e-05, -1.643318682909012e-05, -1.4932826161384583e-05, -1.3432465493679047e-05, -1.193210482597351e-05, -1.0431744158267975e-05, -8.931383490562439e-06, -7.431022822856903e-06, -5.930662155151367e-06, -4.430301487445831e-06, -2.9299408197402954e-06, -1.4295801520347595e-06, 7.078051567077637e-08, 1.5711411833763123e-06, 3.071501851081848e-06, 4.571862518787384e-06, 6.07222318649292e-06, 7.572583854198456e-06, 9.072944521903992e-06, 1.0573305189609528e-05, 1.2073665857315063e-05, 1.35740265250206e-05, 1.5074387192726135e-05, 1.657474786043167e-05, 1.8075108528137207e-05, 1.9575469195842743e-05, 2.107582986354828e-05, 2.2576190531253815e-05, 2.407655119895935e-05, 2.5576911866664886e-05, 2.7077272534370422e-05, 2.8577633202075958e-05, 3.0077993869781494e-05, 3.157835453748703e-05, 3.3078715205192566e-05, 3.45790758728981e-05, 3.607943654060364e-05, 3.7579797208309174e-05, 3.908015787601471e-05, 4.0580518543720245e-05, 4.208087921142578e-05]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 5.0, 3.0, 4.0, 4.0, 9.0, 7.0, 6.0, 5.0, 6.0, 13.0, 23.0, 45.0, 68.0, 262.0, 2237.0, 44103.0, 996565.0, 4439.0, 471.0, 105.0, 46.0, 29.0, 12.0, 6.0, 8.0, 10.0, 5.0, 4.0, 6.0, 4.0, 8.0, 5.0, 6.0, 2.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83447265625, -0.80584716796875, -0.7772216796875, -0.74859619140625, -0.719970703125, -0.69134521484375, -0.6627197265625, -0.63409423828125, -0.60546875, -0.57684326171875, -0.5482177734375, -0.51959228515625, -0.490966796875, -0.46234130859375, -0.4337158203125, -0.40509033203125, -0.37646484375, -0.34783935546875, -0.3192138671875, -0.29058837890625, -0.261962890625, -0.23333740234375, -0.2047119140625, -0.17608642578125, -0.1474609375, -0.11883544921875, -0.0902099609375, -0.06158447265625, -0.032958984375, -0.00433349609375, 0.0242919921875, 0.05291748046875, 0.08154296875, 0.11016845703125, 0.1387939453125, 0.16741943359375, 0.196044921875, 0.22467041015625, 0.2532958984375, 0.28192138671875, 0.310546875, 0.33917236328125, 0.3677978515625, 0.39642333984375, 0.425048828125, 0.45367431640625, 0.4822998046875, 0.51092529296875, 0.53955078125, 0.56817626953125, 0.5968017578125, 0.62542724609375, 0.654052734375, 0.68267822265625, 0.7113037109375, 0.73992919921875, 0.7685546875, 0.79718017578125, 0.8258056640625, 0.85443115234375, 0.883056640625, 0.91168212890625, 0.9403076171875, 0.96893310546875, 0.99755859375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 12.0, 10.0, 16.0, 46.0, 95.0, 174.0, 275.0, 179.0, 86.0, 35.0, 16.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037933349609375, -0.036550045013427734, -0.03516674041748047, -0.0337834358215332, -0.03240013122558594, -0.031016826629638672, -0.029633522033691406, -0.02825021743774414, -0.026866912841796875, -0.02548360824584961, -0.024100303649902344, -0.022716999053955078, -0.021333694458007812, -0.019950389862060547, -0.01856708526611328, -0.017183780670166016, -0.01580047607421875, -0.014417171478271484, -0.013033866882324219, -0.011650562286376953, -0.010267257690429688, -0.008883953094482422, -0.007500648498535156, -0.006117343902587891, -0.004734039306640625, -0.0033507347106933594, -0.0019674301147460938, -0.0005841255187988281, 0.0007991790771484375, 0.002182483673095703, 0.0035657882690429688, 0.004949092864990234, 0.0063323974609375, 0.007715702056884766, 0.009099006652832031, 0.010482311248779297, 0.011865615844726562, 0.013248920440673828, 0.014632225036621094, 0.01601552963256836, 0.017398834228515625, 0.01878213882446289, 0.020165443420410156, 0.021548748016357422, 0.022932052612304688, 0.024315357208251953, 0.02569866180419922, 0.027081966400146484, 0.02846527099609375, 0.029848575592041016, 0.03123188018798828, 0.03261518478393555, 0.03399848937988281, 0.03538179397583008, 0.036765098571777344, 0.03814840316772461, 0.039531707763671875, 0.04091501235961914, 0.042298316955566406, 0.04368162155151367, 0.04506492614746094, 0.0464482307434082, 0.04783153533935547, 0.049214839935302734, 0.05059814453125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 88.0, 689.0, 166.0, 41.0, 11.0, 7.0, 3.0, 4.0], "bins": [-7.631683826446533, -7.499127388000488, -7.366571426391602, -7.234015464782715, -7.10145902633667, -6.968902587890625, -6.836346626281738, -6.703790664672852, -6.571234226226807, -6.438677787780762, -6.306121826171875, -6.173565864562988, -6.041009426116943, -5.908452987670898, -5.775897026062012, -5.643341064453125, -5.51078462600708, -5.378228187561035, -5.245672225952148, -5.113116264343262, -4.980559825897217, -4.848003387451172, -4.715447425842285, -4.582891464233398, -4.4503350257873535, -4.317778587341309, -4.185222625732422, -4.052666664123535, -3.9201102256774902, -3.7875540256500244, -3.6549978256225586, -3.5224416255950928, -3.389885425567627, -3.257329225540161, -3.1247730255126953, -2.9922168254852295, -2.8596606254577637, -2.727104425430298, -2.594548225402832, -2.461992025375366, -2.3294358253479004, -2.1968796253204346, -2.0643234252929688, -1.931767225265503, -1.799211025238037, -1.6666548252105713, -1.5340986251831055, -1.4015424251556396, -1.2689861059188843, -1.1364299058914185, -1.0038737058639526, -0.8713175058364868, -0.738761305809021, -0.6062051057815552, -0.47364890575408936, -0.34109270572662354, -0.20853650569915771, -0.0759803056716919, 0.056575894355773926, 0.18913209438323975, 0.32168829441070557, 0.4542444944381714, 0.5868006944656372, 0.719356894493103, 0.8519130945205688]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 6.0, 5.0, 6.0, 11.0, 22.0, 33.0, 43.0, 44.0, 63.0, 57.0, 61.0, 78.0, 82.0, 90.0, 63.0, 58.0, 61.0, 42.0, 36.0, 45.0, 28.0, 13.0, 20.0, 14.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9789393544197083, -0.9566117525100708, -0.9342841506004333, -0.9119565486907959, -0.8896290063858032, -0.8673014044761658, -0.8449738025665283, -0.8226462006568909, -0.8003185987472534, -0.777990996837616, -0.7556633949279785, -0.7333358526229858, -0.7110082507133484, -0.6886806488037109, -0.6663530468940735, -0.644025444984436, -0.6216979026794434, -0.5993703007698059, -0.5770426988601685, -0.5547151565551758, -0.5323875546455383, -0.5100599527359009, -0.4877323508262634, -0.465404748916626, -0.4430771768093109, -0.42074957489967346, -0.3984220027923584, -0.37609440088272095, -0.3537667989730835, -0.33143922686576843, -0.309111624956131, -0.2867840528488159, -0.2644563913345337, -0.24212880432605743, -0.21980121731758118, -0.19747361540794373, -0.17514602839946747, -0.1528184413909912, -0.13049083948135376, -0.1081632524728775, -0.08583566546440125, -0.06350807845592499, -0.041180483996868134, -0.01885288953781128, 0.003474697470664978, 0.025802284479141235, 0.048129886388778687, 0.07045747339725494, 0.0927850604057312, 0.11511264741420746, 0.13744023442268372, 0.15976783633232117, 0.18209542334079742, 0.20442301034927368, 0.22675061225891113, 0.2490781992673874, 0.27140578627586365, 0.2937333881855011, 0.31606096029281616, 0.3383885622024536, 0.36071616411209106, 0.38304373621940613, 0.4053713381290436, 0.42769891023635864, 0.4500265121459961]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 11.0, 16.0, 13.0, 12.0, 26.0, 39.0, 73.0, 116.0, 241.0, 506.0, 1235.0, 3097.0, 8907.0, 28945.0, 116182.0, 639524.0, 188063.0, 42224.0, 12282.0, 4124.0, 1579.0, 648.0, 284.0, 131.0, 74.0, 45.0, 31.0, 22.0, 15.0, 14.0, 14.0, 12.0, 9.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.705078125, -1.643402099609375, -1.58172607421875, -1.520050048828125, -1.4583740234375, -1.396697998046875, -1.33502197265625, -1.273345947265625, -1.211669921875, -1.149993896484375, -1.08831787109375, -1.026641845703125, -0.9649658203125, -0.903289794921875, -0.84161376953125, -0.779937744140625, -0.71826171875, -0.656585693359375, -0.59490966796875, -0.533233642578125, -0.4715576171875, -0.409881591796875, -0.34820556640625, -0.286529541015625, -0.224853515625, -0.163177490234375, -0.10150146484375, -0.039825439453125, 0.0218505859375, 0.083526611328125, 0.14520263671875, 0.206878662109375, 0.2685546875, 0.330230712890625, 0.39190673828125, 0.453582763671875, 0.5152587890625, 0.576934814453125, 0.63861083984375, 0.700286865234375, 0.761962890625, 0.823638916015625, 0.88531494140625, 0.946990966796875, 1.0086669921875, 1.070343017578125, 1.13201904296875, 1.193695068359375, 1.25537109375, 1.317047119140625, 1.37872314453125, 1.440399169921875, 1.5020751953125, 1.563751220703125, 1.62542724609375, 1.687103271484375, 1.748779296875, 1.810455322265625, 1.87213134765625, 1.933807373046875, 1.9954833984375, 2.057159423828125, 2.11883544921875, 2.180511474609375, 2.2421875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 2.0, 5.0, 11.0, 13.0, 28.0, 38.0, 55.0, 53.0, 65.0, 73.0, 90.0, 97.0, 88.0, 69.0, 70.0, 69.0, 48.0, 35.0, 26.0, 24.0, 14.0, 12.0, 7.0, 6.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.384521484375, -0.3759136199951172, -0.3673057556152344, -0.35869789123535156, -0.35009002685546875, -0.34148216247558594, -0.3328742980957031, -0.3242664337158203, -0.3156585693359375, -0.3070507049560547, -0.2984428405761719, -0.28983497619628906, -0.28122711181640625, -0.27261924743652344, -0.2640113830566406, -0.2554035186767578, -0.246795654296875, -0.2381877899169922, -0.22957992553710938, -0.22097206115722656, -0.21236419677734375, -0.20375633239746094, -0.19514846801757812, -0.1865406036376953, -0.1779327392578125, -0.1693248748779297, -0.16071701049804688, -0.15210914611816406, -0.14350128173828125, -0.13489341735839844, -0.12628555297851562, -0.11767768859863281, -0.10906982421875, -0.10046195983886719, -0.09185409545898438, -0.08324623107910156, -0.07463836669921875, -0.06603050231933594, -0.057422637939453125, -0.04881477355957031, -0.0402069091796875, -0.03159904479980469, -0.022991180419921875, -0.014383316040039062, -0.00577545166015625, 0.0028324127197265625, 0.011440277099609375, 0.020048141479492188, 0.028656005859375, 0.03726387023925781, 0.045871734619140625, 0.05447959899902344, 0.06308746337890625, 0.07169532775878906, 0.08030319213867188, 0.08891105651855469, 0.0975189208984375, 0.10612678527832031, 0.11473464965820312, 0.12334251403808594, 0.13195037841796875, 0.14055824279785156, 0.14916610717773438, 0.1577739715576172, 0.1663818359375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 15.0, 13.0, 19.0, 25.0, 44.0, 67.0, 112.0, 163.0, 226.0, 331.0, 494.0, 771.0, 1166.0, 1862.0, 2843.0, 4580.0, 7342.0, 11721.0, 19032.0, 31428.0, 52845.0, 95930.0, 221796.0, 309235.0, 123523.0, 64781.0, 37969.0, 22600.0, 13957.0, 8615.0, 5428.0, 3393.0, 2171.0, 1460.0, 836.0, 599.0, 393.0, 239.0, 170.0, 113.0, 70.0, 58.0, 43.0, 30.0, 14.0, 7.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.40478515625, -0.39258575439453125, -0.3803863525390625, -0.36818695068359375, -0.355987548828125, -0.34378814697265625, -0.3315887451171875, -0.31938934326171875, -0.30718994140625, -0.29499053955078125, -0.2827911376953125, -0.27059173583984375, -0.258392333984375, -0.24619293212890625, -0.2339935302734375, -0.22179412841796875, -0.2095947265625, -0.19739532470703125, -0.1851959228515625, -0.17299652099609375, -0.160797119140625, -0.14859771728515625, -0.1363983154296875, -0.12419891357421875, -0.11199951171875, -0.09980010986328125, -0.0876007080078125, -0.07540130615234375, -0.063201904296875, -0.05100250244140625, -0.0388031005859375, -0.02660369873046875, -0.014404296875, -0.00220489501953125, 0.0099945068359375, 0.02219390869140625, 0.034393310546875, 0.04659271240234375, 0.0587921142578125, 0.07099151611328125, 0.08319091796875, 0.09539031982421875, 0.1075897216796875, 0.11978912353515625, 0.131988525390625, 0.14418792724609375, 0.1563873291015625, 0.16858673095703125, 0.1807861328125, 0.19298553466796875, 0.2051849365234375, 0.21738433837890625, 0.229583740234375, 0.24178314208984375, 0.2539825439453125, 0.26618194580078125, 0.27838134765625, 0.29058074951171875, 0.3027801513671875, 0.31497955322265625, 0.327178955078125, 0.33937835693359375, 0.3515777587890625, 0.36377716064453125, 0.3759765625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 3.0, 8.0, 16.0, 14.0, 14.0, 21.0, 22.0, 24.0, 30.0, 25.0, 31.0, 40.0, 41.0, 24.0, 31.0, 30.0, 46.0, 54.0, 46.0, 35.0, 58.0, 40.0, 40.0, 42.0, 33.0, 24.0, 26.0, 21.0, 26.0, 21.0, 18.0, 21.0, 14.0, 8.0, 7.0, 13.0, 3.0, 7.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1392822265625, -0.13517093658447266, -0.1310596466064453, -0.12694835662841797, -0.12283706665039062, -0.11872577667236328, -0.11461448669433594, -0.1105031967163086, -0.10639190673828125, -0.1022806167602539, -0.09816932678222656, -0.09405803680419922, -0.08994674682617188, -0.08583545684814453, -0.08172416687011719, -0.07761287689208984, -0.0735015869140625, -0.06939029693603516, -0.06527900695800781, -0.06116771697998047, -0.057056427001953125, -0.05294513702392578, -0.04883384704589844, -0.044722557067871094, -0.04061126708984375, -0.036499977111816406, -0.03238868713378906, -0.02827739715576172, -0.024166107177734375, -0.02005481719970703, -0.015943527221679688, -0.011832237243652344, -0.007720947265625, -0.0036096572875976562, 0.0005016326904296875, 0.004612922668457031, 0.008724212646484375, 0.012835502624511719, 0.016946792602539062, 0.021058082580566406, 0.02516937255859375, 0.029280662536621094, 0.03339195251464844, 0.03750324249267578, 0.041614532470703125, 0.04572582244873047, 0.04983711242675781, 0.053948402404785156, 0.0580596923828125, 0.062170982360839844, 0.06628227233886719, 0.07039356231689453, 0.07450485229492188, 0.07861614227294922, 0.08272743225097656, 0.0868387222290039, 0.09095001220703125, 0.0950613021850586, 0.09917259216308594, 0.10328388214111328, 0.10739517211914062, 0.11150646209716797, 0.11561775207519531, 0.11972904205322266, 0.12384033203125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 11.0, 11.0, 15.0, 22.0, 29.0, 43.0, 67.0, 94.0, 155.0, 237.0, 409.0, 638.0, 1095.0, 2118.0, 4167.0, 9454.0, 24753.0, 101184.0, 711283.0, 141378.0, 30477.0, 10700.0, 4725.0, 2333.0, 1214.0, 669.0, 467.0, 276.0, 163.0, 131.0, 94.0, 43.0, 33.0, 20.0, 9.0, 15.0, 5.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.021820068359375, -0.021170377731323242, -0.020520687103271484, -0.019870996475219727, -0.01922130584716797, -0.01857161521911621, -0.017921924591064453, -0.017272233963012695, -0.016622543334960938, -0.01597285270690918, -0.015323162078857422, -0.014673471450805664, -0.014023780822753906, -0.013374090194702148, -0.01272439956665039, -0.012074708938598633, -0.011425018310546875, -0.010775327682495117, -0.01012563705444336, -0.009475946426391602, -0.008826255798339844, -0.008176565170288086, -0.007526874542236328, -0.00687718391418457, -0.0062274932861328125, -0.005577802658081055, -0.004928112030029297, -0.004278421401977539, -0.0036287307739257812, -0.0029790401458740234, -0.0023293495178222656, -0.0016796588897705078, -0.00102996826171875, -0.0003802776336669922, 0.0002694129943847656, 0.0009191036224365234, 0.0015687942504882812, 0.002218484878540039, 0.002868175506591797, 0.0035178661346435547, 0.0041675567626953125, 0.00481724739074707, 0.005466938018798828, 0.006116628646850586, 0.006766319274902344, 0.0074160099029541016, 0.00806570053100586, 0.008715391159057617, 0.009365081787109375, 0.010014772415161133, 0.01066446304321289, 0.011314153671264648, 0.011963844299316406, 0.012613534927368164, 0.013263225555419922, 0.01391291618347168, 0.014562606811523438, 0.015212297439575195, 0.015861988067626953, 0.01651167869567871, 0.01716136932373047, 0.017811059951782227, 0.018460750579833984, 0.019110441207885742, 0.0197601318359375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 12.0, 8.0, 9.0, 20.0, 25.0, 23.0, 43.0, 95.0, 165.0, 217.0, 137.0, 70.0, 37.0, 31.0, 18.0, 12.0, 11.0, 14.0, 8.0, 10.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9848346710205078e-05, -1.9234605133533478e-05, -1.8620863556861877e-05, -1.8007121980190277e-05, -1.7393380403518677e-05, -1.6779638826847076e-05, -1.6165897250175476e-05, -1.5552155673503876e-05, -1.4938414096832275e-05, -1.4324672520160675e-05, -1.3710930943489075e-05, -1.3097189366817474e-05, -1.2483447790145874e-05, -1.1869706213474274e-05, -1.1255964636802673e-05, -1.0642223060131073e-05, -1.0028481483459473e-05, -9.414739906787872e-06, -8.800998330116272e-06, -8.187256753444672e-06, -7.573515176773071e-06, -6.959773600101471e-06, -6.346032023429871e-06, -5.73229044675827e-06, -5.11854887008667e-06, -4.50480729341507e-06, -3.891065716743469e-06, -3.277324140071869e-06, -2.6635825634002686e-06, -2.0498409867286682e-06, -1.4360994100570679e-06, -8.223578333854675e-07, -2.086162567138672e-07, 4.0512531995773315e-07, 1.0188668966293335e-06, 1.6326084733009338e-06, 2.246350049972534e-06, 2.8600916266441345e-06, 3.473833203315735e-06, 4.087574779987335e-06, 4.7013163566589355e-06, 5.315057933330536e-06, 5.928799510002136e-06, 6.5425410866737366e-06, 7.156282663345337e-06, 7.770024240016937e-06, 8.383765816688538e-06, 8.997507393360138e-06, 9.611248970031738e-06, 1.0224990546703339e-05, 1.0838732123374939e-05, 1.145247370004654e-05, 1.206621527671814e-05, 1.267995685338974e-05, 1.329369843006134e-05, 1.390744000673294e-05, 1.4521181583404541e-05, 1.5134923160076141e-05, 1.5748664736747742e-05, 1.6362406313419342e-05, 1.6976147890090942e-05, 1.7589889466762543e-05, 1.8203631043434143e-05, 1.8817372620105743e-05, 1.9431114196777344e-05]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 7.0, 7.0, 8.0, 14.0, 21.0, 38.0, 62.0, 63.0, 128.0, 156.0, 277.0, 434.0, 733.0, 1134.0, 1956.0, 3312.0, 5630.0, 10247.0, 18650.0, 35713.0, 73590.0, 186263.0, 414785.0, 158216.0, 65826.0, 32077.0, 16951.0, 9238.0, 5277.0, 3015.0, 1833.0, 1032.0, 692.0, 421.0, 259.0, 162.0, 106.0, 79.0, 49.0, 35.0, 19.0, 14.0, 14.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00614166259765625, -0.005952239036560059, -0.005762815475463867, -0.005573391914367676, -0.005383968353271484, -0.005194544792175293, -0.0050051212310791016, -0.00481569766998291, -0.004626274108886719, -0.004436850547790527, -0.004247426986694336, -0.0040580034255981445, -0.003868579864501953, -0.0036791563034057617, -0.0034897327423095703, -0.003300309181213379, -0.0031108856201171875, -0.002921462059020996, -0.0027320384979248047, -0.0025426149368286133, -0.002353191375732422, -0.0021637678146362305, -0.001974344253540039, -0.0017849206924438477, -0.0015954971313476562, -0.0014060735702514648, -0.0012166500091552734, -0.001027226448059082, -0.0008378028869628906, -0.0006483793258666992, -0.0004589557647705078, -0.0002695322036743164, -8.0108642578125e-05, 0.0001093149185180664, 0.0002987384796142578, 0.0004881620407104492, 0.0006775856018066406, 0.000867009162902832, 0.0010564327239990234, 0.0012458562850952148, 0.0014352798461914062, 0.0016247034072875977, 0.001814126968383789, 0.0020035505294799805, 0.002192974090576172, 0.0023823976516723633, 0.0025718212127685547, 0.002761244773864746, 0.0029506683349609375, 0.003140091896057129, 0.0033295154571533203, 0.0035189390182495117, 0.003708362579345703, 0.0038977861404418945, 0.004087209701538086, 0.004276633262634277, 0.004466056823730469, 0.00465548038482666, 0.0048449039459228516, 0.005034327507019043, 0.005223751068115234, 0.005413174629211426, 0.005602598190307617, 0.005792021751403809, 0.0059814453125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 9.0, 7.0, 6.0, 12.0, 18.0, 15.0, 25.0, 22.0, 33.0, 28.0, 48.0, 45.0, 55.0, 47.0, 59.0, 54.0, 60.0, 59.0, 53.0, 60.0, 50.0, 37.0, 36.0, 24.0, 19.0, 26.0, 23.0, 16.0, 19.0, 8.0, 7.0, 2.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001781463623046875, -0.0017209053039550781, -0.0016603469848632812, -0.0015997886657714844, -0.0015392303466796875, -0.0014786720275878906, -0.0014181137084960938, -0.0013575553894042969, -0.0012969970703125, -0.0012364387512207031, -0.0011758804321289062, -0.0011153221130371094, -0.0010547637939453125, -0.0009942054748535156, -0.0009336471557617188, -0.0008730888366699219, -0.000812530517578125, -0.0007519721984863281, -0.0006914138793945312, -0.0006308555603027344, -0.0005702972412109375, -0.0005097389221191406, -0.00044918060302734375, -0.0003886222839355469, -0.00032806396484375, -0.0002675056457519531, -0.00020694732666015625, -0.00014638900756835938, -8.58306884765625e-05, -2.5272369384765625e-05, 3.528594970703125e-05, 9.584426879882812e-05, 0.000156402587890625, 0.00021696090698242188, 0.00027751922607421875, 0.0003380775451660156, 0.0003986358642578125, 0.0004591941833496094, 0.0005197525024414062, 0.0005803108215332031, 0.000640869140625, 0.0007014274597167969, 0.0007619857788085938, 0.0008225440979003906, 0.0008831024169921875, 0.0009436607360839844, 0.0010042190551757812, 0.0010647773742675781, 0.001125335693359375, 0.0011858940124511719, 0.0012464523315429688, 0.0013070106506347656, 0.0013675689697265625, 0.0014281272888183594, 0.0014886856079101562, 0.0015492439270019531, 0.00160980224609375, 0.0016703605651855469, 0.0017309188842773438, 0.0017914772033691406, 0.0018520355224609375, 0.0019125938415527344, 0.0019731521606445312, 0.002033710479736328, 0.002094268798828125]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 16.0, 33.0, 63.0, 165.0, 415.0, 177.0, 60.0, 32.0, 15.0, 9.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3488658666610718, -1.317858099937439, -1.2868503332138062, -1.2558425664901733, -1.224834680557251, -1.1938269138336182, -1.1628191471099854, -1.1318113803863525, -1.1008036136627197, -1.069795846939087, -1.038788080215454, -1.0077803134918213, -0.9767724871635437, -0.9457647204399109, -0.9147568941116333, -0.8837491273880005, -0.8527413606643677, -0.8217335939407349, -0.790725827217102, -0.7597180008888245, -0.7287102341651917, -0.6977024674415588, -0.6666946411132812, -0.6356868743896484, -0.6046791076660156, -0.5736713409423828, -0.54266357421875, -0.5116557478904724, -0.4806479811668396, -0.4496402144432068, -0.4186324179172516, -0.3876246213912964, -0.3566168546676636, -0.32560908794403076, -0.29460129141807556, -0.26359349489212036, -0.23258572816848755, -0.20157794654369354, -0.17057016491889954, -0.13956238329410553, -0.10855460166931152, -0.07754682004451752, -0.04653903841972351, -0.015531256794929504, 0.015476524829864502, 0.04648430645465851, 0.07749208807945251, 0.10849986970424652, 0.13950765132904053, 0.17051543295383453, 0.20152321457862854, 0.23253099620342255, 0.26353877782821655, 0.29454654455184937, 0.32555434107780457, 0.35656213760375977, 0.3875699043273926, 0.4185776710510254, 0.4495854675769806, 0.4805932641029358, 0.5116010308265686, 0.5426087975502014, 0.573616623878479, 0.6046243906021118, 0.6356321573257446]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 10.0, 19.0, 18.0, 25.0, 47.0, 58.0, 65.0, 68.0, 71.0, 104.0, 80.0, 74.0, 72.0, 76.0, 49.0, 44.0, 34.0, 34.0, 19.0, 15.0, 9.0, 1.0, 7.0, 2.0, 3.0], "bins": [-0.6070731282234192, -0.5946942567825317, -0.5823153853416443, -0.5699365139007568, -0.5575577020645142, -0.5451788306236267, -0.5327999591827393, -0.5204210877418518, -0.5080422163009644, -0.4956633448600769, -0.48328450322151184, -0.4709056317806244, -0.45852676033973694, -0.4461479187011719, -0.4337690472602844, -0.421390175819397, -0.4090113639831543, -0.39663249254226685, -0.3842536509037018, -0.37187477946281433, -0.3594959080219269, -0.3471170663833618, -0.33473819494247437, -0.3223593235015869, -0.30998045206069946, -0.297601580619812, -0.28522273898124695, -0.2728438675403595, -0.26046499609947205, -0.24808615446090698, -0.23570728302001953, -0.22332842648029327, -0.21094955503940582, -0.19857069849967957, -0.18619182705879211, -0.17381297051906586, -0.1614341139793396, -0.14905524253845215, -0.1366763859987259, -0.12429752945899963, -0.11191866546869278, -0.09953980147838593, -0.08716094493865967, -0.07478208094835281, -0.06240322068333626, -0.0500243604183197, -0.03764549642801285, -0.02526663988828659, -0.012887775897979736, -0.0005089147016406059, 0.011869946494698524, 0.02424880862236023, 0.036627668887376785, 0.04900652915239334, 0.061385393142700195, 0.07376424968242645, 0.0861431136727333, 0.09852197766304016, 0.11090083420276642, 0.12327969819307327, 0.13565856218338013, 0.14803741872310638, 0.16041627526283264, 0.1727951467037201, 0.18517400324344635]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 9.0, 8.0, 11.0, 22.0, 20.0, 61.0, 84.0, 155.0, 289.0, 569.0, 1314.0, 99589.0, 4088442.0, 2148.0, 732.0, 345.0, 211.0, 93.0, 66.0, 45.0, 24.0, 10.0, 16.0, 7.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.8935546875, -1.851593017578125, -1.80963134765625, -1.767669677734375, -1.7257080078125, -1.683746337890625, -1.64178466796875, -1.599822998046875, -1.557861328125, -1.515899658203125, -1.47393798828125, -1.431976318359375, -1.3900146484375, -1.348052978515625, -1.30609130859375, -1.264129638671875, -1.22216796875, -1.180206298828125, -1.13824462890625, -1.096282958984375, -1.0543212890625, -1.012359619140625, -0.97039794921875, -0.928436279296875, -0.886474609375, -0.844512939453125, -0.80255126953125, -0.760589599609375, -0.7186279296875, -0.676666259765625, -0.63470458984375, -0.592742919921875, -0.55078125, -0.508819580078125, -0.46685791015625, -0.424896240234375, -0.3829345703125, -0.340972900390625, -0.29901123046875, -0.257049560546875, -0.215087890625, -0.173126220703125, -0.13116455078125, -0.089202880859375, -0.0472412109375, -0.005279541015625, 0.03668212890625, 0.078643798828125, 0.12060546875, 0.162567138671875, 0.20452880859375, 0.246490478515625, 0.2884521484375, 0.330413818359375, 0.37237548828125, 0.414337158203125, 0.456298828125, 0.498260498046875, 0.54022216796875, 0.582183837890625, 0.6241455078125, 0.666107177734375, 0.70806884765625, 0.750030517578125, 0.7919921875]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 11.0, 7.0, 8.0, 17.0, 19.0, 28.0, 36.0, 51.0, 59.0, 63.0, 58.0, 90.0, 86.0, 72.0, 67.0, 53.0, 70.0, 46.0, 40.0, 37.0, 26.0, 25.0, 12.0, 10.0, 3.0, 11.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.370849609375, -0.3625526428222656, -0.35425567626953125, -0.3459587097167969, -0.3376617431640625, -0.3293647766113281, -0.32106781005859375, -0.3127708435058594, -0.304473876953125, -0.2961769104003906, -0.28787994384765625, -0.2795829772949219, -0.2712860107421875, -0.2629890441894531, -0.25469207763671875, -0.24639511108398438, -0.23809814453125, -0.22980117797851562, -0.22150421142578125, -0.21320724487304688, -0.2049102783203125, -0.19661331176757812, -0.18831634521484375, -0.18001937866210938, -0.171722412109375, -0.16342544555664062, -0.15512847900390625, -0.14683151245117188, -0.1385345458984375, -0.13023757934570312, -0.12194061279296875, -0.11364364624023438, -0.1053466796875, -0.09704971313476562, -0.08875274658203125, -0.08045578002929688, -0.0721588134765625, -0.06386184692382812, -0.05556488037109375, -0.047267913818359375, -0.038970947265625, -0.030673980712890625, -0.02237701416015625, -0.014080047607421875, -0.0057830810546875, 0.002513885498046875, 0.01081085205078125, 0.019107818603515625, 0.02740478515625, 0.035701751708984375, 0.04399871826171875, 0.052295684814453125, 0.0605926513671875, 0.06888961791992188, 0.07718658447265625, 0.08548355102539062, 0.093780517578125, 0.10207748413085938, 0.11037445068359375, 0.11867141723632812, 0.1269683837890625, 0.13526535034179688, 0.14356231689453125, 0.15185928344726562, 0.16015625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 6.0, 5.0, 8.0, 11.0, 19.0, 34.0, 34.0, 62.0, 97.0, 196.0, 324.0, 568.0, 1190.0, 2766.0, 12917.0, 4003853.0, 162525.0, 5802.0, 1910.0, 863.0, 450.0, 228.0, 135.0, 88.0, 56.0, 42.0, 29.0, 27.0, 15.0, 7.0, 7.0, 2.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75830078125, -0.7382431030273438, -0.7181854248046875, -0.6981277465820312, -0.678070068359375, -0.6580123901367188, -0.6379547119140625, -0.6178970336914062, -0.59783935546875, -0.5777816772460938, -0.5577239990234375, -0.5376663208007812, -0.517608642578125, -0.49755096435546875, -0.4774932861328125, -0.45743560791015625, -0.4373779296875, -0.41732025146484375, -0.3972625732421875, -0.37720489501953125, -0.357147216796875, -0.33708953857421875, -0.3170318603515625, -0.29697418212890625, -0.27691650390625, -0.25685882568359375, -0.2368011474609375, -0.21674346923828125, -0.196685791015625, -0.17662811279296875, -0.1565704345703125, -0.13651275634765625, -0.116455078125, -0.09639739990234375, -0.0763397216796875, -0.05628204345703125, -0.036224365234375, -0.01616668701171875, 0.0038909912109375, 0.02394866943359375, 0.04400634765625, 0.06406402587890625, 0.0841217041015625, 0.10417938232421875, 0.124237060546875, 0.14429473876953125, 0.1643524169921875, 0.18441009521484375, 0.2044677734375, 0.22452545166015625, 0.2445831298828125, 0.26464080810546875, 0.284698486328125, 0.30475616455078125, 0.3248138427734375, 0.34487152099609375, 0.36492919921875, 0.38498687744140625, 0.4050445556640625, 0.42510223388671875, 0.445159912109375, 0.46521759033203125, 0.4852752685546875, 0.5053329467773438, 0.525390625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 2.0, 3.0, 5.0, 17.0, 53.0, 180.0, 2069.0, 1500.0, 170.0, 52.0, 14.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0908203125, -0.08718681335449219, -0.08355331420898438, -0.07991981506347656, -0.07628631591796875, -0.07265281677246094, -0.06901931762695312, -0.06538581848144531, -0.0617523193359375, -0.05811882019042969, -0.054485321044921875, -0.05085182189941406, -0.04721832275390625, -0.04358482360839844, -0.039951324462890625, -0.03631782531738281, -0.032684326171875, -0.029050827026367188, -0.025417327880859375, -0.021783828735351562, -0.01815032958984375, -0.014516830444335938, -0.010883331298828125, -0.0072498321533203125, -0.0036163330078125, 1.71661376953125e-05, 0.003650665283203125, 0.0072841644287109375, 0.01091766357421875, 0.014551162719726562, 0.018184661865234375, 0.021818161010742188, 0.02545166015625, 0.029085159301757812, 0.032718658447265625, 0.03635215759277344, 0.03998565673828125, 0.04361915588378906, 0.047252655029296875, 0.05088615417480469, 0.0545196533203125, 0.05815315246582031, 0.061786651611328125, 0.06542015075683594, 0.06905364990234375, 0.07268714904785156, 0.07632064819335938, 0.07995414733886719, 0.083587646484375, 0.08722114562988281, 0.09085464477539062, 0.09448814392089844, 0.09812164306640625, 0.10175514221191406, 0.10538864135742188, 0.10902214050292969, 0.1126556396484375, 0.11628913879394531, 0.11992263793945312, 0.12355613708496094, 0.12718963623046875, 0.13082313537597656, 0.13445663452148438, 0.1380901336669922, 0.1417236328125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 21.0, 29.0, 70.0, 124.0, 359.0, 251.0, 69.0, 32.0, 17.0, 19.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0357717275619507, -1.0136076211929321, -0.9914435744285583, -0.9692795276641846, -0.947115421295166, -0.9249513745307922, -0.9027873277664185, -0.8806232213973999, -0.8584591150283813, -0.8362950682640076, -0.814130961894989, -0.7919669151306152, -0.7698028087615967, -0.7476387619972229, -0.7254747152328491, -0.7033106088638306, -0.6811465620994568, -0.658982515335083, -0.6368184089660645, -0.6146543622016907, -0.5924902558326721, -0.5703262090682983, -0.5481621026992798, -0.525998055934906, -0.5038340091705322, -0.48166993260383606, -0.4595058560371399, -0.4373418092727661, -0.41517770290374756, -0.3930136561393738, -0.3708495795726776, -0.34868550300598145, -0.3265213668346405, -0.30435729026794434, -0.28219321370124817, -0.260029137134552, -0.23786507546901703, -0.21570099890232086, -0.1935369372367859, -0.17137286067008972, -0.14920878410339355, -0.1270447075366974, -0.10488063842058182, -0.08271656930446625, -0.06055249273777008, -0.038388416171073914, -0.01622435450553894, 0.0059397220611572266, 0.028103798627853394, 0.05026787146925926, 0.07243194431066513, 0.0945960134267807, 0.11676008999347687, 0.13892416656017303, 0.161088228225708, 0.18325230479240417, 0.20541638135910034, 0.2275804579257965, 0.24974453449249268, 0.27190858125686646, 0.294072687625885, 0.3162367343902588, 0.33840081095695496, 0.3605648875236511, 0.3827289640903473]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 9.0, 7.0, 15.0, 16.0, 23.0, 36.0, 47.0, 62.0, 73.0, 96.0, 79.0, 75.0, 82.0, 71.0, 67.0, 75.0, 58.0, 33.0, 22.0, 31.0, 14.0, 9.0, 7.0, 5.0, 2.0, 1.0], "bins": [-0.4561707377433777, -0.446965754032135, -0.43776077032089233, -0.42855575680732727, -0.4193507730960846, -0.4101457893848419, -0.40094080567359924, -0.39173582196235657, -0.3825308084487915, -0.37332582473754883, -0.36412084102630615, -0.3549158275127411, -0.3457108438014984, -0.33650586009025574, -0.32730087637901306, -0.3180958926677704, -0.3088909089565277, -0.29968592524528503, -0.29048094153404236, -0.2812759280204773, -0.2720709443092346, -0.26286596059799194, -0.25366097688674927, -0.2444559931755066, -0.23525099456310272, -0.22604601085186005, -0.21684101223945618, -0.2076360285282135, -0.19843104481697083, -0.18922604620456696, -0.18002106249332428, -0.1708160638809204, -0.16161110997200012, -0.15240612626075745, -0.14320112764835358, -0.1339961439371109, -0.12479115277528763, -0.11558616161346436, -0.10638117790222168, -0.09717618674039841, -0.08797119557857513, -0.07876620441675186, -0.06956121325492859, -0.06035622954368591, -0.05115123838186264, -0.04194624722003937, -0.03274125978350639, -0.02353627234697342, -0.014331281185150146, -0.005126291885972023, 0.0040786974132061005, 0.013283686712384224, 0.022488676011562347, 0.03169366717338562, 0.040898654609918594, 0.05010364204645157, 0.05930863320827484, 0.06851362437009811, 0.07771861553192139, 0.08692359924316406, 0.09612859040498734, 0.10533358156681061, 0.11453856527805328, 0.12374355643987656, 0.13294854760169983]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 9.0, 7.0, 3.0, 8.0, 25.0, 30.0, 34.0, 74.0, 161.0, 294.0, 655.0, 1681.0, 5076.0, 18239.0, 88974.0, 689015.0, 198882.0, 32748.0, 8266.0, 2619.0, 904.0, 421.0, 169.0, 106.0, 53.0, 33.0, 25.0, 15.0, 8.0, 9.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79833984375, -0.7684402465820312, -0.7385406494140625, -0.7086410522460938, -0.678741455078125, -0.6488418579101562, -0.6189422607421875, -0.5890426635742188, -0.55914306640625, -0.5292434692382812, -0.4993438720703125, -0.46944427490234375, -0.439544677734375, -0.40964508056640625, -0.3797454833984375, -0.34984588623046875, -0.3199462890625, -0.29004669189453125, -0.2601470947265625, -0.23024749755859375, -0.200347900390625, -0.17044830322265625, -0.1405487060546875, -0.11064910888671875, -0.08074951171875, -0.05084991455078125, -0.0209503173828125, 0.00894927978515625, 0.038848876953125, 0.06874847412109375, 0.0986480712890625, 0.12854766845703125, 0.158447265625, 0.18834686279296875, 0.2182464599609375, 0.24814605712890625, 0.278045654296875, 0.30794525146484375, 0.3378448486328125, 0.36774444580078125, 0.39764404296875, 0.42754364013671875, 0.4574432373046875, 0.48734283447265625, 0.517242431640625, 0.5471420288085938, 0.5770416259765625, 0.6069412231445312, 0.6368408203125, 0.6667404174804688, 0.6966400146484375, 0.7265396118164062, 0.756439208984375, 0.7863388061523438, 0.8162384033203125, 0.8461380004882812, 0.87603759765625, 0.9059371948242188, 0.9358367919921875, 0.9657363891601562, 0.995635986328125, 1.0255355834960938, 1.0554351806640625, 1.0853347778320312, 1.115234375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 5.0, 5.0, 6.0, 23.0, 9.0, 20.0, 40.0, 45.0, 56.0, 69.0, 78.0, 77.0, 79.0, 79.0, 74.0, 57.0, 64.0, 48.0, 54.0, 21.0, 35.0, 20.0, 16.0, 9.0, 9.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2353515625, -0.23022842407226562, -0.22510528564453125, -0.21998214721679688, -0.2148590087890625, -0.20973587036132812, -0.20461273193359375, -0.19948959350585938, -0.194366455078125, -0.18924331665039062, -0.18412017822265625, -0.17899703979492188, -0.1738739013671875, -0.16875076293945312, -0.16362762451171875, -0.15850448608398438, -0.15338134765625, -0.14825820922851562, -0.14313507080078125, -0.13801193237304688, -0.1328887939453125, -0.12776565551757812, -0.12264251708984375, -0.11751937866210938, -0.112396240234375, -0.10727310180664062, -0.10214996337890625, -0.09702682495117188, -0.0919036865234375, -0.08678054809570312, -0.08165740966796875, -0.07653427124023438, -0.0714111328125, -0.06628799438476562, -0.06116485595703125, -0.056041717529296875, -0.0509185791015625, -0.045795440673828125, -0.04067230224609375, -0.035549163818359375, -0.030426025390625, -0.025302886962890625, -0.02017974853515625, -0.015056610107421875, -0.0099334716796875, -0.004810333251953125, 0.00031280517578125, 0.005435943603515625, 0.01055908203125, 0.015682220458984375, 0.02080535888671875, 0.025928497314453125, 0.0310516357421875, 0.036174774169921875, 0.04129791259765625, 0.046421051025390625, 0.051544189453125, 0.056667327880859375, 0.06179046630859375, 0.06691360473632812, 0.0720367431640625, 0.07715988159179688, 0.08228302001953125, 0.08740615844726562, 0.092529296875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 13.0, 9.0, 12.0, 15.0, 24.0, 29.0, 46.0, 66.0, 70.0, 93.0, 126.0, 150.0, 222.0, 345.0, 431.0, 617.0, 766.0, 1096.0, 1658.0, 2462.0, 3605.0, 5551.0, 9152.0, 15673.0, 30613.0, 75087.0, 621548.0, 174533.0, 48200.0, 22159.0, 12403.0, 7162.0, 4604.0, 3109.0, 1948.0, 1369.0, 953.0, 711.0, 510.0, 356.0, 276.0, 204.0, 155.0, 101.0, 68.0, 57.0, 47.0, 48.0, 39.0, 25.0, 17.0, 15.0, 5.0, 4.0, 1.0, 1.0, 4.0, 2.0], "bins": [-0.293212890625, -0.2842674255371094, -0.27532196044921875, -0.2663764953613281, -0.2574310302734375, -0.24848556518554688, -0.23954010009765625, -0.23059463500976562, -0.221649169921875, -0.21270370483398438, -0.20375823974609375, -0.19481277465820312, -0.1858673095703125, -0.17692184448242188, -0.16797637939453125, -0.15903091430664062, -0.15008544921875, -0.14113998413085938, -0.13219451904296875, -0.12324905395507812, -0.1143035888671875, -0.10535812377929688, -0.09641265869140625, -0.08746719360351562, -0.078521728515625, -0.06957626342773438, -0.06063079833984375, -0.051685333251953125, -0.0427398681640625, -0.033794403076171875, -0.02484893798828125, -0.015903472900390625, -0.0069580078125, 0.001987457275390625, 0.01093292236328125, 0.019878387451171875, 0.0288238525390625, 0.037769317626953125, 0.04671478271484375, 0.055660247802734375, 0.064605712890625, 0.07355117797851562, 0.08249664306640625, 0.09144210815429688, 0.1003875732421875, 0.10933303833007812, 0.11827850341796875, 0.12722396850585938, 0.13616943359375, 0.14511489868164062, 0.15406036376953125, 0.16300582885742188, 0.1719512939453125, 0.18089675903320312, 0.18984222412109375, 0.19878768920898438, 0.207733154296875, 0.21667861938476562, 0.22562408447265625, 0.23456954956054688, 0.2435150146484375, 0.2524604797363281, 0.26140594482421875, 0.2703514099121094, 0.279296875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 4.0, 3.0, 4.0, 8.0, 7.0, 8.0, 9.0, 15.0, 18.0, 16.0, 24.0, 16.0, 22.0, 16.0, 26.0, 34.0, 35.0, 31.0, 28.0, 41.0, 42.0, 37.0, 40.0, 43.0, 46.0, 32.0, 31.0, 34.0, 41.0, 27.0, 31.0, 29.0, 27.0, 27.0, 17.0, 16.0, 14.0, 15.0, 18.0, 6.0, 16.0, 10.0, 8.0, 3.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.0572509765625, -0.05553722381591797, -0.05382347106933594, -0.052109718322753906, -0.050395965576171875, -0.048682212829589844, -0.04696846008300781, -0.04525470733642578, -0.04354095458984375, -0.04182720184326172, -0.04011344909667969, -0.038399696350097656, -0.036685943603515625, -0.034972190856933594, -0.03325843811035156, -0.03154468536376953, -0.0298309326171875, -0.02811717987060547, -0.026403427124023438, -0.024689674377441406, -0.022975921630859375, -0.021262168884277344, -0.019548416137695312, -0.01783466339111328, -0.01612091064453125, -0.014407157897949219, -0.012693405151367188, -0.010979652404785156, -0.009265899658203125, -0.007552146911621094, -0.0058383941650390625, -0.004124641418457031, -0.002410888671875, -0.0006971359252929688, 0.0010166168212890625, 0.0027303695678710938, 0.004444122314453125, 0.006157875061035156, 0.007871627807617188, 0.009585380554199219, 0.01129913330078125, 0.013012886047363281, 0.014726638793945312, 0.016440391540527344, 0.018154144287109375, 0.019867897033691406, 0.021581649780273438, 0.02329540252685547, 0.0250091552734375, 0.02672290802001953, 0.028436660766601562, 0.030150413513183594, 0.031864166259765625, 0.033577919006347656, 0.03529167175292969, 0.03700542449951172, 0.03871917724609375, 0.04043292999267578, 0.04214668273925781, 0.043860435485839844, 0.045574188232421875, 0.047287940979003906, 0.04900169372558594, 0.05071544647216797, 0.05242919921875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 5.0, 3.0, 10.0, 8.0, 24.0, 24.0, 38.0, 37.0, 45.0, 59.0, 63.0, 74.0, 89.0, 122.0, 170.0, 255.0, 309.0, 399.0, 469.0, 615.0, 945.0, 1414.0, 2737.0, 8340.0, 886529.0, 131955.0, 6595.0, 2421.0, 1278.0, 845.0, 616.0, 467.0, 341.0, 270.0, 209.0, 168.0, 132.0, 100.0, 88.0, 64.0, 60.0, 40.0, 28.0, 30.0, 15.0, 26.0, 6.0, 8.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.12103271484375, -0.11746501922607422, -0.11389732360839844, -0.11032962799072266, -0.10676193237304688, -0.1031942367553711, -0.09962654113769531, -0.09605884552001953, -0.09249114990234375, -0.08892345428466797, -0.08535575866699219, -0.0817880630493164, -0.07822036743164062, -0.07465267181396484, -0.07108497619628906, -0.06751728057861328, -0.0639495849609375, -0.06038188934326172, -0.05681419372558594, -0.053246498107910156, -0.049678802490234375, -0.046111106872558594, -0.04254341125488281, -0.03897571563720703, -0.03540802001953125, -0.03184032440185547, -0.028272628784179688, -0.024704933166503906, -0.021137237548828125, -0.017569541931152344, -0.014001846313476562, -0.010434150695800781, -0.006866455078125, -0.0032987594604492188, 0.0002689361572265625, 0.0038366317749023438, 0.007404327392578125, 0.010972023010253906, 0.014539718627929688, 0.01810741424560547, 0.02167510986328125, 0.02524280548095703, 0.028810501098632812, 0.032378196716308594, 0.035945892333984375, 0.039513587951660156, 0.04308128356933594, 0.04664897918701172, 0.0502166748046875, 0.05378437042236328, 0.05735206604003906, 0.060919761657714844, 0.06448745727539062, 0.0680551528930664, 0.07162284851074219, 0.07519054412841797, 0.07875823974609375, 0.08232593536376953, 0.08589363098144531, 0.0894613265991211, 0.09302902221679688, 0.09659671783447266, 0.10016441345214844, 0.10373210906982422, 0.1072998046875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 5.0, 2.0, 7.0, 10.0, 17.0, 21.0, 56.0, 62.0, 85.0, 158.0, 181.0, 123.0, 80.0, 48.0, 35.0, 16.0, 14.0, 11.0, 4.0, 6.0, 3.0, 1.0, 6.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.045797348022461e-05, -2.9344111680984497e-05, -2.8230249881744385e-05, -2.7116388082504272e-05, -2.600252628326416e-05, -2.4888664484024048e-05, -2.3774802684783936e-05, -2.2660940885543823e-05, -2.154707908630371e-05, -2.04332172870636e-05, -1.9319355487823486e-05, -1.8205493688583374e-05, -1.7091631889343262e-05, -1.597777009010315e-05, -1.4863908290863037e-05, -1.3750046491622925e-05, -1.2636184692382812e-05, -1.15223228931427e-05, -1.0408461093902588e-05, -9.294599294662476e-06, -8.180737495422363e-06, -7.066875696182251e-06, -5.953013896942139e-06, -4.839152097702026e-06, -3.725290298461914e-06, -2.6114284992218018e-06, -1.4975666999816895e-06, -3.8370490074157715e-07, 7.301568984985352e-07, 1.8440186977386475e-06, 2.9578804969787598e-06, 4.071742296218872e-06, 5.185604095458984e-06, 6.299465894699097e-06, 7.413327693939209e-06, 8.527189493179321e-06, 9.641051292419434e-06, 1.0754913091659546e-05, 1.1868774890899658e-05, 1.298263669013977e-05, 1.4096498489379883e-05, 1.5210360288619995e-05, 1.6324222087860107e-05, 1.743808388710022e-05, 1.8551945686340332e-05, 1.9665807485580444e-05, 2.0779669284820557e-05, 2.189353108406067e-05, 2.300739288330078e-05, 2.4121254682540894e-05, 2.5235116481781006e-05, 2.6348978281021118e-05, 2.746284008026123e-05, 2.8576701879501343e-05, 2.9690563678741455e-05, 3.080442547798157e-05, 3.191828727722168e-05, 3.303214907646179e-05, 3.4146010875701904e-05, 3.5259872674942017e-05, 3.637373447418213e-05, 3.748759627342224e-05, 3.8601458072662354e-05, 3.9715319871902466e-05, 4.082918167114258e-05]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 12.0, 24.0, 40.0, 90.0, 178.0, 429.0, 943.0, 2391.0, 7205.0, 899725.0, 128198.0, 5831.0, 2010.0, 810.0, 351.0, 170.0, 65.0, 36.0, 19.0, 5.0, 10.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08935546875, -0.08646488189697266, -0.08357429504394531, -0.08068370819091797, -0.07779312133789062, -0.07490253448486328, -0.07201194763183594, -0.0691213607788086, -0.06623077392578125, -0.0633401870727539, -0.06044960021972656, -0.05755901336669922, -0.054668426513671875, -0.05177783966064453, -0.04888725280761719, -0.045996665954589844, -0.0431060791015625, -0.040215492248535156, -0.03732490539550781, -0.03443431854248047, -0.031543731689453125, -0.02865314483642578, -0.025762557983398438, -0.022871971130371094, -0.01998138427734375, -0.017090797424316406, -0.014200210571289062, -0.011309623718261719, -0.008419036865234375, -0.005528450012207031, -0.0026378631591796875, 0.00025272369384765625, 0.003143310546875, 0.006033897399902344, 0.008924484252929688, 0.011815071105957031, 0.014705657958984375, 0.01759624481201172, 0.020486831665039062, 0.023377418518066406, 0.02626800537109375, 0.029158592224121094, 0.03204917907714844, 0.03493976593017578, 0.037830352783203125, 0.04072093963623047, 0.04361152648925781, 0.046502113342285156, 0.0493927001953125, 0.052283287048339844, 0.05517387390136719, 0.05806446075439453, 0.060955047607421875, 0.06384563446044922, 0.06673622131347656, 0.0696268081665039, 0.07251739501953125, 0.0754079818725586, 0.07829856872558594, 0.08118915557861328, 0.08407974243164062, 0.08697032928466797, 0.08986091613769531, 0.09275150299072266, 0.09564208984375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 11.0, 22.0, 53.0, 257.0, 435.0, 131.0, 35.0, 17.0, 7.0, 6.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010894775390625, -0.010567545890808105, -0.010240316390991211, -0.009913086891174316, -0.009585857391357422, -0.009258627891540527, -0.008931398391723633, -0.008604168891906738, -0.008276939392089844, -0.00794970989227295, -0.007622480392456055, -0.00729525089263916, -0.006968021392822266, -0.006640791893005371, -0.0063135623931884766, -0.005986332893371582, -0.0056591033935546875, -0.005331873893737793, -0.0050046443939208984, -0.004677414894104004, -0.004350185394287109, -0.004022955894470215, -0.0036957263946533203, -0.0033684968948364258, -0.0030412673950195312, -0.0027140378952026367, -0.002386808395385742, -0.0020595788955688477, -0.0017323493957519531, -0.0014051198959350586, -0.001077890396118164, -0.0007506608963012695, -0.000423431396484375, -9.620189666748047e-05, 0.00023102760314941406, 0.0005582571029663086, 0.0008854866027832031, 0.0012127161026000977, 0.0015399456024169922, 0.0018671751022338867, 0.0021944046020507812, 0.0025216341018676758, 0.0028488636016845703, 0.003176093101501465, 0.0035033226013183594, 0.003830552101135254, 0.0041577816009521484, 0.004485011100769043, 0.0048122406005859375, 0.005139470100402832, 0.0054666996002197266, 0.005793929100036621, 0.006121158599853516, 0.00644838809967041, 0.006775617599487305, 0.007102847099304199, 0.007430076599121094, 0.007757306098937988, 0.008084535598754883, 0.008411765098571777, 0.008738994598388672, 0.009066224098205566, 0.009393453598022461, 0.009720683097839355, 0.01004791259765625]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 13.0, 17.0, 36.0, 87.0, 170.0, 332.0, 163.0, 73.0, 50.0, 17.0, 17.0, 10.0, 12.0, 8.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5186271071434021, -0.5076634287834167, -0.4966997504234314, -0.48573607206344604, -0.4747723937034607, -0.46380871534347534, -0.45284503698349, -0.44188135862350464, -0.4309176802635193, -0.41995400190353394, -0.4089903235435486, -0.39802664518356323, -0.3870629668235779, -0.37609928846359253, -0.3651356101036072, -0.3541719317436218, -0.3432082235813141, -0.33224454522132874, -0.3212808668613434, -0.31031718850135803, -0.2993535101413727, -0.28838983178138733, -0.2774261236190796, -0.26646244525909424, -0.2554987668991089, -0.24453508853912354, -0.23357141017913818, -0.22260773181915283, -0.21164405345916748, -0.20068037509918213, -0.18971668183803558, -0.17875300347805023, -0.16778935492038727, -0.15682567656040192, -0.14586199820041656, -0.13489830493927002, -0.12393463402986526, -0.11297095566987991, -0.10200726985931396, -0.09104359149932861, -0.08007991313934326, -0.06911623477935791, -0.05815255269408226, -0.04718887060880661, -0.03622519224882126, -0.025261513888835907, -0.014297828078269958, -0.003334149718284607, 0.007629528641700745, 0.018593208864331245, 0.029556889086961746, 0.040520571172237396, 0.05148424953222275, 0.0624479278922081, 0.07341161370277405, 0.0843752920627594, 0.09533897042274475, 0.1063026487827301, 0.11726632714271545, 0.1282300055027008, 0.13919368386268616, 0.1501573622226715, 0.16112105548381805, 0.1720847338438034, 0.18304841220378876]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 9.0, 5.0, 18.0, 14.0, 26.0, 37.0, 49.0, 63.0, 73.0, 98.0, 81.0, 79.0, 86.0, 65.0, 76.0, 74.0, 57.0, 22.0, 29.0, 19.0, 14.0, 11.0, 4.0, 5.0, 1.0, 1.0], "bins": [-0.27401041984558105, -0.2684665322303772, -0.26292264461517334, -0.2573787569999695, -0.2518348693847656, -0.24629098176956177, -0.2407470941543579, -0.23520320653915405, -0.2296593189239502, -0.22411543130874634, -0.21857154369354248, -0.21302765607833862, -0.20748376846313477, -0.2019398808479309, -0.19639599323272705, -0.1908521056175232, -0.18530820310115814, -0.17976431548595428, -0.17422042787075043, -0.16867654025554657, -0.1631326526403427, -0.15758876502513885, -0.1520448625087738, -0.14650097489356995, -0.1409570872783661, -0.13541319966316223, -0.12986931204795837, -0.12432542443275452, -0.11878153681755066, -0.1132376492023468, -0.10769375413656235, -0.10214986652135849, -0.09660599380731583, -0.09106210619211197, -0.08551821857690811, -0.07997432351112366, -0.0744304358959198, -0.06888654828071594, -0.06334266066551208, -0.05779877305030823, -0.05225488543510437, -0.04671099781990051, -0.041167110204696655, -0.0356232188642025, -0.030079331248998642, -0.024535443633794785, -0.01899155229330063, -0.013447664678096771, -0.007903777062892914, -0.0023598885163664818, 0.0031840000301599503, 0.008727889508008957, 0.014271777123212814, 0.019815664738416672, 0.025359556078910828, 0.030903443694114685, 0.03644733130931854, 0.0419912189245224, 0.04753510653972626, 0.05307899788022041, 0.05862288549542427, 0.06416676938533783, 0.06971066445112228, 0.07525455206632614, 0.08079843968153]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 6.0, 7.0, 11.0, 10.0, 16.0, 16.0, 22.0, 21.0, 25.0, 29.0, 34.0, 50.0, 39.0, 104.0, 550.0, 6144.0, 97180.0, 870664.0, 68241.0, 4534.0, 411.0, 112.0, 46.0, 34.0, 47.0, 28.0, 27.0, 21.0, 26.0, 17.0, 15.0, 12.0, 17.0, 9.0, 6.0, 3.0, 4.0, 7.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.884765625, -0.85980224609375, -0.8348388671875, -0.80987548828125, -0.784912109375, -0.75994873046875, -0.7349853515625, -0.71002197265625, -0.68505859375, -0.66009521484375, -0.6351318359375, -0.61016845703125, -0.585205078125, -0.56024169921875, -0.5352783203125, -0.51031494140625, -0.4853515625, -0.46038818359375, -0.4354248046875, -0.41046142578125, -0.385498046875, -0.36053466796875, -0.3355712890625, -0.31060791015625, -0.28564453125, -0.26068115234375, -0.2357177734375, -0.21075439453125, -0.185791015625, -0.16082763671875, -0.1358642578125, -0.11090087890625, -0.0859375, -0.06097412109375, -0.0360107421875, -0.01104736328125, 0.013916015625, 0.03887939453125, 0.0638427734375, 0.08880615234375, 0.11376953125, 0.13873291015625, 0.1636962890625, 0.18865966796875, 0.213623046875, 0.23858642578125, 0.2635498046875, 0.28851318359375, 0.3134765625, 0.33843994140625, 0.3634033203125, 0.38836669921875, 0.413330078125, 0.43829345703125, 0.4632568359375, 0.48822021484375, 0.51318359375, 0.53814697265625, 0.5631103515625, 0.58807373046875, 0.613037109375, 0.63800048828125, 0.6629638671875, 0.68792724609375, 0.712890625]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 19.0, 37.0, 53.0, 97.0, 125.0, 162.0, 135.0, 144.0, 101.0, 64.0, 38.0, 27.0, 9.0, 1.0, 1.0], "bins": [-0.217529296875, -0.2135782241821289, -0.2096271514892578, -0.20567607879638672, -0.20172500610351562, -0.19777393341064453, -0.19382286071777344, -0.18987178802490234, -0.18592071533203125, -0.18196964263916016, -0.17801856994628906, -0.17406749725341797, -0.17011642456054688, -0.16616535186767578, -0.1622142791748047, -0.1582632064819336, -0.1543121337890625, -0.1503610610961914, -0.1464099884033203, -0.14245891571044922, -0.13850784301757812, -0.13455677032470703, -0.13060569763183594, -0.12665462493896484, -0.12270355224609375, -0.11875247955322266, -0.11480140686035156, -0.11085033416748047, -0.10689926147460938, -0.10294818878173828, -0.09899711608886719, -0.0950460433959961, -0.091094970703125, -0.0871438980102539, -0.08319282531738281, -0.07924175262451172, -0.07529067993164062, -0.07133960723876953, -0.06738853454589844, -0.06343746185302734, -0.05948638916015625, -0.055535316467285156, -0.05158424377441406, -0.04763317108154297, -0.043682098388671875, -0.03973102569580078, -0.03577995300292969, -0.031828880310058594, -0.0278778076171875, -0.023926734924316406, -0.019975662231445312, -0.01602458953857422, -0.012073516845703125, -0.008122444152832031, -0.0041713714599609375, -0.00022029876708984375, 0.00373077392578125, 0.007681846618652344, 0.011632919311523438, 0.015583992004394531, 0.019535064697265625, 0.02348613739013672, 0.027437210083007812, 0.031388282775878906, 0.03533935546875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 4.0, 7.0, 13.0, 19.0, 26.0, 34.0, 56.0, 70.0, 96.0, 148.0, 242.0, 357.0, 527.0, 741.0, 1100.0, 1726.0, 2752.0, 4405.0, 7027.0, 12108.0, 20440.0, 36454.0, 66849.0, 140856.0, 320173.0, 220619.0, 95465.0, 48519.0, 27028.0, 15607.0, 9432.0, 5654.0, 3567.0, 2302.0, 1448.0, 878.0, 596.0, 381.0, 271.0, 175.0, 128.0, 75.0, 70.0, 43.0, 23.0, 14.0, 10.0, 8.0, 5.0, 5.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.11212158203125, -0.10869789123535156, -0.10527420043945312, -0.10185050964355469, -0.09842681884765625, -0.09500312805175781, -0.09157943725585938, -0.08815574645996094, -0.0847320556640625, -0.08130836486816406, -0.07788467407226562, -0.07446098327636719, -0.07103729248046875, -0.06761360168457031, -0.06418991088867188, -0.06076622009277344, -0.057342529296875, -0.05391883850097656, -0.050495147705078125, -0.04707145690917969, -0.04364776611328125, -0.04022407531738281, -0.036800384521484375, -0.03337669372558594, -0.0299530029296875, -0.026529312133789062, -0.023105621337890625, -0.019681930541992188, -0.01625823974609375, -0.012834548950195312, -0.009410858154296875, -0.0059871673583984375, -0.0025634765625, 0.0008602142333984375, 0.004283905029296875, 0.0077075958251953125, 0.01113128662109375, 0.014554977416992188, 0.017978668212890625, 0.021402359008789062, 0.0248260498046875, 0.028249740600585938, 0.031673431396484375, 0.03509712219238281, 0.03852081298828125, 0.04194450378417969, 0.045368194580078125, 0.04879188537597656, 0.052215576171875, 0.05563926696777344, 0.059062957763671875, 0.06248664855957031, 0.06591033935546875, 0.06933403015136719, 0.07275772094726562, 0.07618141174316406, 0.0796051025390625, 0.08302879333496094, 0.08645248413085938, 0.08987617492675781, 0.09329986572265625, 0.09672355651855469, 0.10014724731445312, 0.10357093811035156, 0.10699462890625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 7.0, 5.0, 6.0, 6.0, 7.0, 10.0, 12.0, 22.0, 15.0, 19.0, 28.0, 44.0, 30.0, 33.0, 46.0, 40.0, 44.0, 35.0, 32.0, 34.0, 47.0, 60.0, 57.0, 33.0, 43.0, 31.0, 31.0, 33.0, 26.0, 27.0, 22.0, 18.0, 23.0, 14.0, 13.0, 14.0, 5.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.040191650390625, -0.03906679153442383, -0.037941932678222656, -0.036817073822021484, -0.03569221496582031, -0.03456735610961914, -0.03344249725341797, -0.0323176383972168, -0.031192779541015625, -0.030067920684814453, -0.02894306182861328, -0.02781820297241211, -0.026693344116210938, -0.025568485260009766, -0.024443626403808594, -0.023318767547607422, -0.02219390869140625, -0.021069049835205078, -0.019944190979003906, -0.018819332122802734, -0.017694473266601562, -0.01656961441040039, -0.015444755554199219, -0.014319896697998047, -0.013195037841796875, -0.012070178985595703, -0.010945320129394531, -0.00982046127319336, -0.008695602416992188, -0.007570743560791016, -0.006445884704589844, -0.005321025848388672, -0.0041961669921875, -0.003071308135986328, -0.0019464492797851562, -0.0008215904235839844, 0.0003032684326171875, 0.0014281272888183594, 0.0025529861450195312, 0.003677845001220703, 0.004802703857421875, 0.005927562713623047, 0.007052421569824219, 0.00817728042602539, 0.009302139282226562, 0.010426998138427734, 0.011551856994628906, 0.012676715850830078, 0.01380157470703125, 0.014926433563232422, 0.016051292419433594, 0.017176151275634766, 0.018301010131835938, 0.01942586898803711, 0.02055072784423828, 0.021675586700439453, 0.022800445556640625, 0.023925304412841797, 0.02505016326904297, 0.02617502212524414, 0.027299880981445312, 0.028424739837646484, 0.029549598693847656, 0.030674457550048828, 0.03179931640625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 9.0, 9.0, 17.0, 12.0, 32.0, 38.0, 56.0, 89.0, 141.0, 203.0, 401.0, 733.0, 1319.0, 2936.0, 7404.0, 23503.0, 137931.0, 772232.0, 74674.0, 16222.0, 5629.0, 2344.0, 1116.0, 603.0, 332.0, 208.0, 130.0, 80.0, 40.0, 29.0, 29.0, 14.0, 18.0, 4.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005558013916015625, -0.005338847637176514, -0.005119681358337402, -0.004900515079498291, -0.00468134880065918, -0.004462182521820068, -0.004243016242980957, -0.004023849964141846, -0.0038046836853027344, -0.003585517406463623, -0.0033663511276245117, -0.0031471848487854004, -0.002928018569946289, -0.0027088522911071777, -0.0024896860122680664, -0.002270519733428955, -0.0020513534545898438, -0.0018321871757507324, -0.001613020896911621, -0.0013938546180725098, -0.0011746883392333984, -0.0009555220603942871, -0.0007363557815551758, -0.0005171895027160645, -0.0002980232238769531, -7.88569450378418e-05, 0.00014030933380126953, 0.00035947561264038086, 0.0005786418914794922, 0.0007978081703186035, 0.0010169744491577148, 0.0012361407279968262, 0.0014553070068359375, 0.0016744732856750488, 0.0018936395645141602, 0.0021128058433532715, 0.002331972122192383, 0.002551138401031494, 0.0027703046798706055, 0.002989470958709717, 0.003208637237548828, 0.0034278035163879395, 0.0036469697952270508, 0.003866136074066162, 0.0040853023529052734, 0.004304468631744385, 0.004523634910583496, 0.004742801189422607, 0.004961967468261719, 0.00518113374710083, 0.005400300025939941, 0.005619466304779053, 0.005838632583618164, 0.006057798862457275, 0.006276965141296387, 0.006496131420135498, 0.006715297698974609, 0.006934463977813721, 0.007153630256652832, 0.007372796535491943, 0.007591962814331055, 0.007811129093170166, 0.008030295372009277, 0.008249461650848389, 0.0084686279296875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 7.0, 7.0, 6.0, 9.0, 4.0, 20.0, 35.0, 34.0, 36.0, 54.0, 65.0, 79.0, 114.0, 134.0, 100.0, 72.0, 69.0, 40.0, 34.0, 25.0, 16.0, 9.0, 10.0, 5.0, 7.0, 7.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4722347259521484e-05, -1.4219433069229126e-05, -1.3716518878936768e-05, -1.321360468864441e-05, -1.271069049835205e-05, -1.2207776308059692e-05, -1.1704862117767334e-05, -1.1201947927474976e-05, -1.0699033737182617e-05, -1.0196119546890259e-05, -9.6932053565979e-06, -9.190291166305542e-06, -8.687376976013184e-06, -8.184462785720825e-06, -7.681548595428467e-06, -7.178634405136108e-06, -6.67572021484375e-06, -6.172806024551392e-06, -5.669891834259033e-06, -5.166977643966675e-06, -4.664063453674316e-06, -4.161149263381958e-06, -3.6582350730895996e-06, -3.155320882797241e-06, -2.652406692504883e-06, -2.1494925022125244e-06, -1.646578311920166e-06, -1.1436641216278076e-06, -6.407499313354492e-07, -1.3783574104309082e-07, 3.650784492492676e-07, 8.67992639541626e-07, 1.3709068298339844e-06, 1.8738210201263428e-06, 2.376735210418701e-06, 2.8796494007110596e-06, 3.382563591003418e-06, 3.885477781295776e-06, 4.388391971588135e-06, 4.891306161880493e-06, 5.3942203521728516e-06, 5.89713454246521e-06, 6.400048732757568e-06, 6.902962923049927e-06, 7.405877113342285e-06, 7.908791303634644e-06, 8.411705493927002e-06, 8.91461968421936e-06, 9.417533874511719e-06, 9.920448064804077e-06, 1.0423362255096436e-05, 1.0926276445388794e-05, 1.1429190635681152e-05, 1.193210482597351e-05, 1.2435019016265869e-05, 1.2937933206558228e-05, 1.3440847396850586e-05, 1.3943761587142944e-05, 1.4446675777435303e-05, 1.4949589967727661e-05, 1.545250415802002e-05, 1.5955418348312378e-05, 1.6458332538604736e-05, 1.6961246728897095e-05, 1.7464160919189453e-05]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 9.0, 3.0, 12.0, 13.0, 19.0, 33.0, 25.0, 58.0, 71.0, 98.0, 155.0, 228.0, 344.0, 556.0, 794.0, 1330.0, 2163.0, 3628.0, 6360.0, 11519.0, 21338.0, 42046.0, 94374.0, 284217.0, 359759.0, 115349.0, 48964.0, 24468.0, 12831.0, 7082.0, 4055.0, 2462.0, 1478.0, 929.0, 593.0, 416.0, 230.0, 189.0, 106.0, 69.0, 55.0, 36.0, 30.0, 23.0, 11.0, 6.0, 9.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013589859008789062, -0.001315295696258545, -0.0012716054916381836, -0.0012279152870178223, -0.001184225082397461, -0.0011405348777770996, -0.0010968446731567383, -0.001053154468536377, -0.0010094642639160156, -0.0009657740592956543, -0.000922083854675293, -0.0008783936500549316, -0.0008347034454345703, -0.000791013240814209, -0.0007473230361938477, -0.0007036328315734863, -0.000659942626953125, -0.0006162524223327637, -0.0005725622177124023, -0.000528872013092041, -0.0004851818084716797, -0.00044149160385131836, -0.00039780139923095703, -0.0003541111946105957, -0.0003104209899902344, -0.00026673078536987305, -0.00022304058074951172, -0.0001793503761291504, -0.00013566017150878906, -9.196996688842773e-05, -4.8279762268066406e-05, -4.589557647705078e-06, 3.910064697265625e-05, 8.279085159301758e-05, 0.0001264810562133789, 0.00017017126083374023, 0.00021386146545410156, 0.0002575516700744629, 0.0003012418746948242, 0.00034493207931518555, 0.0003886222839355469, 0.0004323124885559082, 0.00047600269317626953, 0.0005196928977966309, 0.0005633831024169922, 0.0006070733070373535, 0.0006507635116577148, 0.0006944537162780762, 0.0007381439208984375, 0.0007818341255187988, 0.0008255243301391602, 0.0008692145347595215, 0.0009129047393798828, 0.0009565949440002441, 0.0010002851486206055, 0.0010439753532409668, 0.0010876655578613281, 0.0011313557624816895, 0.0011750459671020508, 0.0012187361717224121, 0.0012624263763427734, 0.0013061165809631348, 0.001349806785583496, 0.0013934969902038574, 0.0014371871948242188]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 4.0, 2.0, 3.0, 8.0, 11.0, 11.0, 19.0, 21.0, 35.0, 28.0, 25.0, 40.0, 41.0, 54.0, 73.0, 64.0, 71.0, 73.0, 62.0, 58.0, 51.0, 45.0, 29.0, 35.0, 31.0, 16.0, 21.0, 12.0, 11.0, 15.0, 10.0, 9.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00048613548278808594, -0.0004713200032711029, -0.0004565045237541199, -0.00044168904423713684, -0.0004268735647201538, -0.0004120580852031708, -0.00039724260568618774, -0.0003824271261692047, -0.0003676116466522217, -0.00035279616713523865, -0.0003379806876182556, -0.0003231652081012726, -0.00030834972858428955, -0.0002935342490673065, -0.0002787187695503235, -0.00026390329003334045, -0.0002490878105163574, -0.0002342723309993744, -0.00021945685148239136, -0.00020464137196540833, -0.0001898258924484253, -0.00017501041293144226, -0.00016019493341445923, -0.0001453794538974762, -0.00013056397438049316, -0.00011574849486351013, -0.0001009330153465271, -8.611753582954407e-05, -7.130205631256104e-05, -5.6486576795578e-05, -4.167109727859497e-05, -2.685561776161194e-05, -1.2040138244628906e-05, 2.775341272354126e-06, 1.7590820789337158e-05, 3.240630030632019e-05, 4.722177982330322e-05, 6.203725934028625e-05, 7.685273885726929e-05, 9.166821837425232e-05, 0.00010648369789123535, 0.00012129917740821838, 0.00013611465692520142, 0.00015093013644218445, 0.00016574561595916748, 0.0001805610954761505, 0.00019537657499313354, 0.00021019205451011658, 0.0002250075340270996, 0.00023982301354408264, 0.0002546384930610657, 0.0002694539725780487, 0.00028426945209503174, 0.00029908493161201477, 0.0003139004111289978, 0.00032871589064598083, 0.00034353137016296387, 0.0003583468496799469, 0.00037316232919692993, 0.00038797780871391296, 0.000402793288230896, 0.00041760876774787903, 0.00043242424726486206, 0.0004472397267818451, 0.0004620552062988281]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 12.0, 17.0, 24.0, 40.0, 89.0, 191.0, 309.0, 141.0, 61.0, 46.0, 22.0, 18.0, 12.0, 10.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2535037398338318, -0.2477933019399643, -0.2420828491449356, -0.23637241125106812, -0.23066197335720062, -0.22495152056217194, -0.21924108266830444, -0.21353062987327576, -0.20782019197940826, -0.20210975408554077, -0.19639930129051208, -0.1906888633966446, -0.1849784255027771, -0.1792679727077484, -0.17355753481388092, -0.16784709692001343, -0.16213664412498474, -0.15642620623111725, -0.15071575343608856, -0.14500531554222107, -0.13929487764835358, -0.1335844248533249, -0.1278739869594574, -0.12216354161500931, -0.11645311117172241, -0.11074266582727432, -0.10503222793340683, -0.09932178258895874, -0.09361133724451065, -0.08790089190006256, -0.08219045400619507, -0.07648000866174698, -0.07076955586671829, -0.0650591105222702, -0.05934866890311241, -0.05363822728395462, -0.04792778193950653, -0.04221734032034874, -0.03650689870119095, -0.03079645335674286, -0.025086011737585068, -0.019375568255782127, -0.013665125705301762, -0.007954683154821396, -0.0022442396730184555, 0.003466203808784485, 0.009176645427942276, 0.014887090772390366, 0.020597532391548157, 0.026307975873351097, 0.03201841935515404, 0.03772886097431183, 0.04343930631875992, 0.04914974793791771, 0.0548601895570755, 0.06057063490152359, 0.06628108024597168, 0.07199152559041977, 0.07770196348428726, 0.08341240882873535, 0.08912285417318344, 0.09483329951763153, 0.10054373741149902, 0.10625418275594711, 0.1119646206498146]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 7.0, 9.0, 15.0, 18.0, 28.0, 35.0, 48.0, 56.0, 70.0, 65.0, 81.0, 90.0, 91.0, 81.0, 78.0, 55.0, 48.0, 45.0, 39.0, 18.0, 15.0, 6.0, 10.0, 2.0, 3.0, 1.0], "bins": [-0.1661202311515808, -0.1627594381570816, -0.1593986451625824, -0.1560378521680832, -0.15267705917358398, -0.14931626617908478, -0.14595547318458557, -0.14259468019008636, -0.13923388719558716, -0.13587309420108795, -0.13251230120658875, -0.12915150821208954, -0.12579071521759033, -0.12242992222309113, -0.11906912922859192, -0.11570834368467331, -0.1123475581407547, -0.1089867651462555, -0.10562597215175629, -0.10226517915725708, -0.09890438616275787, -0.09554359316825867, -0.09218280017375946, -0.08882201462984085, -0.08546121418476105, -0.08210042119026184, -0.07873962819576263, -0.07537883520126343, -0.07201804220676422, -0.06865724921226501, -0.06529645621776581, -0.0619356706738472, -0.05857488140463829, -0.055214088410139084, -0.05185329541563988, -0.04849250614643097, -0.04513171315193176, -0.041770920157432556, -0.03841012716293335, -0.03504933416843414, -0.031688541173934937, -0.02832774817943573, -0.024966957047581673, -0.021606164053082466, -0.01824537292122841, -0.014884579926729202, -0.011523786932229996, -0.008162995800375938, -0.004802204668521881, -0.0014414123725146055, 0.00191937992349267, 0.005280172452330589, 0.008640964515507221, 0.012001756578683853, 0.01536254957318306, 0.018723340705037117, 0.022084133699536324, 0.02544492669403553, 0.028805717825889587, 0.032166510820388794, 0.035527303814888, 0.03888809680938721, 0.042248889803886414, 0.04560967907309532, 0.04897047206759453]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 11.0, 16.0, 26.0, 42.0, 46.0, 77.0, 112.0, 174.0, 300.0, 476.0, 1157.0, 3961463.0, 227915.0, 1174.0, 520.0, 269.0, 170.0, 115.0, 69.0, 59.0, 27.0, 25.0, 14.0, 4.0, 9.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.34228515625, -0.3346710205078125, -0.327056884765625, -0.3194427490234375, -0.31182861328125, -0.3042144775390625, -0.296600341796875, -0.2889862060546875, -0.2813720703125, -0.2737579345703125, -0.266143798828125, -0.2585296630859375, -0.25091552734375, -0.2433013916015625, -0.235687255859375, -0.2280731201171875, -0.220458984375, -0.2128448486328125, -0.205230712890625, -0.1976165771484375, -0.19000244140625, -0.1823883056640625, -0.174774169921875, -0.1671600341796875, -0.1595458984375, -0.1519317626953125, -0.144317626953125, -0.1367034912109375, -0.12908935546875, -0.1214752197265625, -0.113861083984375, -0.1062469482421875, -0.0986328125, -0.0910186767578125, -0.083404541015625, -0.0757904052734375, -0.06817626953125, -0.0605621337890625, -0.052947998046875, -0.0453338623046875, -0.0377197265625, -0.0301055908203125, -0.022491455078125, -0.0148773193359375, -0.00726318359375, 0.0003509521484375, 0.007965087890625, 0.0155792236328125, 0.023193359375, 0.0308074951171875, 0.038421630859375, 0.0460357666015625, 0.05364990234375, 0.0612640380859375, 0.068878173828125, 0.0764923095703125, 0.0841064453125, 0.0917205810546875, 0.099334716796875, 0.1069488525390625, 0.11456298828125, 0.1221771240234375, 0.129791259765625, 0.1374053955078125, 0.14501953125]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 13.0, 6.0, 17.0, 23.0, 27.0, 38.0, 47.0, 71.0, 70.0, 68.0, 87.0, 78.0, 91.0, 71.0, 68.0, 60.0, 50.0, 32.0, 34.0, 20.0, 16.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.12548828125, -0.12283563613891602, -0.12018299102783203, -0.11753034591674805, -0.11487770080566406, -0.11222505569458008, -0.1095724105834961, -0.10691976547241211, -0.10426712036132812, -0.10161447525024414, -0.09896183013916016, -0.09630918502807617, -0.09365653991699219, -0.0910038948059082, -0.08835124969482422, -0.08569860458374023, -0.08304595947265625, -0.08039331436157227, -0.07774066925048828, -0.0750880241394043, -0.07243537902832031, -0.06978273391723633, -0.06713008880615234, -0.06447744369506836, -0.061824798583984375, -0.05917215347290039, -0.056519508361816406, -0.05386686325073242, -0.05121421813964844, -0.04856157302856445, -0.04590892791748047, -0.043256282806396484, -0.0406036376953125, -0.037950992584228516, -0.03529834747314453, -0.03264570236206055, -0.029993057250976562, -0.027340412139892578, -0.024687767028808594, -0.02203512191772461, -0.019382476806640625, -0.01672983169555664, -0.014077186584472656, -0.011424541473388672, -0.008771896362304688, -0.006119251251220703, -0.0034666061401367188, -0.0008139610290527344, 0.00183868408203125, 0.004491329193115234, 0.007143974304199219, 0.009796619415283203, 0.012449264526367188, 0.015101909637451172, 0.017754554748535156, 0.02040719985961914, 0.023059844970703125, 0.02571249008178711, 0.028365135192871094, 0.031017780303955078, 0.03367042541503906, 0.03632307052612305, 0.03897571563720703, 0.041628360748291016, 0.044281005859375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 12.0, 7.0, 17.0, 33.0, 37.0, 74.0, 115.0, 214.0, 517.0, 1009.0, 2659.0, 22154.0, 4144028.0, 18850.0, 2559.0, 991.0, 481.0, 226.0, 131.0, 67.0, 33.0, 17.0, 21.0, 16.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2047119140625, -0.19859695434570312, -0.19248199462890625, -0.18636703491210938, -0.1802520751953125, -0.17413711547851562, -0.16802215576171875, -0.16190719604492188, -0.155792236328125, -0.14967727661132812, -0.14356231689453125, -0.13744735717773438, -0.1313323974609375, -0.12521743774414062, -0.11910247802734375, -0.11298751831054688, -0.10687255859375, -0.10075759887695312, -0.09464263916015625, -0.08852767944335938, -0.0824127197265625, -0.07629776000976562, -0.07018280029296875, -0.06406784057617188, -0.057952880859375, -0.051837921142578125, -0.04572296142578125, -0.039608001708984375, -0.0334930419921875, -0.027378082275390625, -0.02126312255859375, -0.015148162841796875, -0.009033203125, -0.002918243408203125, 0.00319671630859375, 0.009311676025390625, 0.0154266357421875, 0.021541595458984375, 0.02765655517578125, 0.033771514892578125, 0.039886474609375, 0.046001434326171875, 0.05211639404296875, 0.058231353759765625, 0.0643463134765625, 0.07046127319335938, 0.07657623291015625, 0.08269119262695312, 0.08880615234375, 0.09492111206054688, 0.10103607177734375, 0.10715103149414062, 0.1132659912109375, 0.11938095092773438, 0.12549591064453125, 0.13161087036132812, 0.137725830078125, 0.14384078979492188, 0.14995574951171875, 0.15607070922851562, 0.1621856689453125, 0.16830062866210938, 0.17441558837890625, 0.18053054809570312, 0.1866455078125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 10.0, 34.0, 117.0, 2953.0, 756.0, 128.0, 43.0, 14.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0244140625, -0.02350759506225586, -0.02260112762451172, -0.021694660186767578, -0.020788192749023438, -0.019881725311279297, -0.018975257873535156, -0.018068790435791016, -0.017162322998046875, -0.016255855560302734, -0.015349388122558594, -0.014442920684814453, -0.013536453247070312, -0.012629985809326172, -0.011723518371582031, -0.01081705093383789, -0.00991058349609375, -0.00900411605834961, -0.008097648620605469, -0.007191181182861328, -0.0062847137451171875, -0.005378246307373047, -0.004471778869628906, -0.0035653114318847656, -0.002658843994140625, -0.0017523765563964844, -0.0008459091186523438, 6.0558319091796875e-05, 0.0009670257568359375, 0.0018734931945800781, 0.0027799606323242188, 0.0036864280700683594, 0.0045928955078125, 0.005499362945556641, 0.006405830383300781, 0.007312297821044922, 0.008218765258789062, 0.009125232696533203, 0.010031700134277344, 0.010938167572021484, 0.011844635009765625, 0.012751102447509766, 0.013657569885253906, 0.014564037322998047, 0.015470504760742188, 0.016376972198486328, 0.01728343963623047, 0.01818990707397461, 0.01909637451171875, 0.02000284194946289, 0.02090930938720703, 0.021815776824951172, 0.022722244262695312, 0.023628711700439453, 0.024535179138183594, 0.025441646575927734, 0.026348114013671875, 0.027254581451416016, 0.028161048889160156, 0.029067516326904297, 0.029973983764648438, 0.030880451202392578, 0.03178691864013672, 0.03269338607788086, 0.033599853515625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 4.0, 5.0, 21.0, 16.0, 24.0, 37.0, 60.0, 116.0, 204.0, 212.0, 110.0, 63.0, 39.0, 28.0, 21.0, 13.0, 10.0, 9.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13338971138000488, -0.12979339063167572, -0.12619705498218536, -0.1226007267832756, -0.11900439858436584, -0.11540807783603668, -0.11181174963712692, -0.10821542143821716, -0.1046190932393074, -0.10102276504039764, -0.09742643684148788, -0.09383010864257812, -0.09023378789424896, -0.0866374522447586, -0.08304113149642944, -0.07944480329751968, -0.07584847509860992, -0.07225214689970016, -0.0686558187007904, -0.06505949050188065, -0.061463166028261185, -0.057866837829351425, -0.054270513355731964, -0.050674185156822205, -0.047077856957912445, -0.043481528759002686, -0.039885200560092926, -0.036288876086473465, -0.032692547887563705, -0.029096219688653946, -0.025499893352389336, -0.021903567016124725, -0.018307238817214966, -0.014710911549627781, -0.011114584282040596, -0.007518257014453411, -0.003921929746866226, -0.0003256015479564667, 0.0032707247883081436, 0.006867051124572754, 0.010463379323482513, 0.014059706591069698, 0.017656033858656883, 0.021252360194921494, 0.024848688393831253, 0.028445016592741013, 0.032041341066360474, 0.03563766926527023, 0.03923399746417999, 0.04283032566308975, 0.04642665386199951, 0.05002297833561897, 0.05361930653452873, 0.05721563473343849, 0.06081195920705795, 0.06440828740596771, 0.06800461560487747, 0.07160094380378723, 0.07519727200269699, 0.07879360020160675, 0.08238992094993591, 0.08598625659942627, 0.08958257734775543, 0.09317890554666519, 0.09677523374557495]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 10.0, 10.0, 17.0, 16.0, 25.0, 30.0, 36.0, 37.0, 48.0, 47.0, 48.0, 55.0, 63.0, 58.0, 63.0, 71.0, 55.0, 55.0, 43.0, 35.0, 41.0, 36.0, 19.0, 26.0, 18.0, 14.0, 6.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.08962471783161163, -0.08761554956436157, -0.08560637384653091, -0.08359720557928085, -0.0815880298614502, -0.07957886159420013, -0.07756969332695007, -0.07556051760911942, -0.07355134934186935, -0.0715421810746193, -0.06953300535678864, -0.06752383708953857, -0.06551466882228851, -0.06350549310445786, -0.061496324837207794, -0.059487152844667435, -0.057477980852127075, -0.055468808859586716, -0.053459636867046356, -0.051450468599796295, -0.049441296607255936, -0.047432124614715576, -0.045422956347465515, -0.043413784354925156, -0.041404612362384796, -0.03939544036984444, -0.03738626837730408, -0.035377100110054016, -0.03336792811751366, -0.0313587561249733, -0.029349585995078087, -0.027340415865182877, -0.025331247597932816, -0.023322075605392456, -0.021312905475497246, -0.019303735345602036, -0.017294563353061676, -0.015285392291843891, -0.013276221230626106, -0.011267050169408321, -0.009257879108190536, -0.007248708046972752, -0.005239536985754967, -0.003230365924537182, -0.001221194863319397, 0.0007879761978983879, 0.002797147259116173, 0.004806318320333958, 0.0068154893815517426, 0.008824660442769527, 0.010833831503987312, 0.012843002565205097, 0.014852173626422882, 0.01686134561896324, 0.018870515748858452, 0.020879685878753662, 0.02288885787129402, 0.02489802986383438, 0.02690719999372959, 0.0289163701236248, 0.03092554211616516, 0.03293471410870552, 0.03494388610124588, 0.03695305436849594, 0.0389622263610363]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 4.0, 3.0, 7.0, 4.0, 7.0, 9.0, 14.0, 18.0, 18.0, 17.0, 50.0, 66.0, 168.0, 428.0, 924.0, 2295.0, 5797.0, 16182.0, 48893.0, 186495.0, 599467.0, 129817.0, 37284.0, 12573.0, 4742.0, 1762.0, 790.0, 359.0, 143.0, 58.0, 38.0, 22.0, 21.0, 13.0, 17.0, 8.0, 12.0, 7.0, 3.0, 2.0, 2.0, 5.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.219482421875, -0.21309852600097656, -0.20671463012695312, -0.2003307342529297, -0.19394683837890625, -0.1875629425048828, -0.18117904663085938, -0.17479515075683594, -0.1684112548828125, -0.16202735900878906, -0.15564346313476562, -0.1492595672607422, -0.14287567138671875, -0.1364917755126953, -0.13010787963867188, -0.12372398376464844, -0.117340087890625, -0.11095619201660156, -0.10457229614257812, -0.09818840026855469, -0.09180450439453125, -0.08542060852050781, -0.07903671264648438, -0.07265281677246094, -0.0662689208984375, -0.05988502502441406, -0.053501129150390625, -0.04711723327636719, -0.04073333740234375, -0.03434944152832031, -0.027965545654296875, -0.021581649780273438, -0.01519775390625, -0.008813858032226562, -0.002429962158203125, 0.0039539337158203125, 0.01033782958984375, 0.016721725463867188, 0.023105621337890625, 0.029489517211914062, 0.0358734130859375, 0.04225730895996094, 0.048641204833984375, 0.05502510070800781, 0.06140899658203125, 0.06779289245605469, 0.07417678833007812, 0.08056068420410156, 0.086944580078125, 0.09332847595214844, 0.09971237182617188, 0.10609626770019531, 0.11248016357421875, 0.11886405944824219, 0.12524795532226562, 0.13163185119628906, 0.1380157470703125, 0.14439964294433594, 0.15078353881835938, 0.1571674346923828, 0.16355133056640625, 0.1699352264404297, 0.17631912231445312, 0.18270301818847656, 0.1890869140625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 10.0, 12.0, 15.0, 14.0, 29.0, 36.0, 35.0, 45.0, 66.0, 54.0, 65.0, 65.0, 72.0, 79.0, 80.0, 46.0, 67.0, 53.0, 27.0, 41.0, 21.0, 25.0, 20.0, 5.0, 8.0, 5.0, 7.0, 2.0, 2.0], "bins": [-0.08526611328125, -0.08347153663635254, -0.08167695999145508, -0.07988238334655762, -0.07808780670166016, -0.0762932300567627, -0.07449865341186523, -0.07270407676696777, -0.07090950012207031, -0.06911492347717285, -0.06732034683227539, -0.06552577018737793, -0.06373119354248047, -0.06193661689758301, -0.06014204025268555, -0.058347463607788086, -0.056552886962890625, -0.054758310317993164, -0.0529637336730957, -0.05116915702819824, -0.04937458038330078, -0.04758000373840332, -0.04578542709350586, -0.0439908504486084, -0.04219627380371094, -0.04040169715881348, -0.038607120513916016, -0.036812543869018555, -0.035017967224121094, -0.03322339057922363, -0.03142881393432617, -0.02963423728942871, -0.02783966064453125, -0.02604508399963379, -0.024250507354736328, -0.022455930709838867, -0.020661354064941406, -0.018866777420043945, -0.017072200775146484, -0.015277624130249023, -0.013483047485351562, -0.011688470840454102, -0.00989389419555664, -0.00809931755065918, -0.006304740905761719, -0.004510164260864258, -0.002715587615966797, -0.0009210109710693359, 0.000873565673828125, 0.002668142318725586, 0.004462718963623047, 0.006257295608520508, 0.008051872253417969, 0.00984644889831543, 0.01164102554321289, 0.013435602188110352, 0.015230178833007812, 0.017024755477905273, 0.018819332122802734, 0.020613908767700195, 0.022408485412597656, 0.024203062057495117, 0.025997638702392578, 0.02779221534729004, 0.0295867919921875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 7.0, 7.0, 6.0, 10.0, 14.0, 15.0, 18.0, 43.0, 51.0, 77.0, 71.0, 93.0, 144.0, 213.0, 266.0, 400.0, 565.0, 771.0, 1015.0, 1551.0, 2220.0, 3409.0, 5339.0, 8339.0, 14657.0, 27021.0, 63127.0, 536648.0, 265694.0, 55129.0, 24977.0, 13382.0, 7894.0, 5003.0, 3263.0, 2080.0, 1334.0, 1049.0, 739.0, 524.0, 369.0, 252.0, 203.0, 147.0, 108.0, 88.0, 62.0, 38.0, 40.0, 23.0, 21.0, 11.0, 14.0, 14.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.11065673828125, -0.10707950592041016, -0.10350227355957031, -0.09992504119873047, -0.09634780883789062, -0.09277057647705078, -0.08919334411621094, -0.0856161117553711, -0.08203887939453125, -0.0784616470336914, -0.07488441467285156, -0.07130718231201172, -0.06772994995117188, -0.06415271759033203, -0.06057548522949219, -0.056998252868652344, -0.0534210205078125, -0.049843788146972656, -0.04626655578613281, -0.04268932342529297, -0.039112091064453125, -0.03553485870361328, -0.03195762634277344, -0.028380393981933594, -0.02480316162109375, -0.021225929260253906, -0.017648696899414062, -0.014071464538574219, -0.010494232177734375, -0.006916999816894531, -0.0033397674560546875, 0.00023746490478515625, 0.003814697265625, 0.007391929626464844, 0.010969161987304688, 0.014546394348144531, 0.018123626708984375, 0.02170085906982422, 0.025278091430664062, 0.028855323791503906, 0.03243255615234375, 0.036009788513183594, 0.03958702087402344, 0.04316425323486328, 0.046741485595703125, 0.05031871795654297, 0.05389595031738281, 0.057473182678222656, 0.0610504150390625, 0.06462764739990234, 0.06820487976074219, 0.07178211212158203, 0.07535934448242188, 0.07893657684326172, 0.08251380920410156, 0.0860910415649414, 0.08966827392578125, 0.0932455062866211, 0.09682273864746094, 0.10039997100830078, 0.10397720336914062, 0.10755443572998047, 0.11113166809082031, 0.11470890045166016, 0.1182861328125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 5.0, 6.0, 13.0, 6.0, 16.0, 18.0, 19.0, 22.0, 25.0, 24.0, 21.0, 27.0, 30.0, 32.0, 40.0, 33.0, 41.0, 42.0, 39.0, 47.0, 44.0, 45.0, 40.0, 28.0, 20.0, 31.0, 40.0, 25.0, 31.0, 24.0, 20.0, 22.0, 25.0, 17.0, 8.0, 6.0, 16.0, 10.0, 6.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.021484375, -0.020787477493286133, -0.020090579986572266, -0.0193936824798584, -0.01869678497314453, -0.017999887466430664, -0.017302989959716797, -0.01660609245300293, -0.015909194946289062, -0.015212297439575195, -0.014515399932861328, -0.013818502426147461, -0.013121604919433594, -0.012424707412719727, -0.01172780990600586, -0.011030912399291992, -0.010334014892578125, -0.009637117385864258, -0.00894021987915039, -0.008243322372436523, -0.007546424865722656, -0.006849527359008789, -0.006152629852294922, -0.005455732345581055, -0.0047588348388671875, -0.00406193733215332, -0.003365039825439453, -0.002668142318725586, -0.0019712448120117188, -0.0012743473052978516, -0.0005774497985839844, 0.00011944770812988281, 0.00081634521484375, 0.0015132427215576172, 0.0022101402282714844, 0.0029070377349853516, 0.0036039352416992188, 0.004300832748413086, 0.004997730255126953, 0.00569462776184082, 0.0063915252685546875, 0.007088422775268555, 0.007785320281982422, 0.008482217788696289, 0.009179115295410156, 0.009876012802124023, 0.01057291030883789, 0.011269807815551758, 0.011966705322265625, 0.012663602828979492, 0.01336050033569336, 0.014057397842407227, 0.014754295349121094, 0.015451192855834961, 0.016148090362548828, 0.016844987869262695, 0.017541885375976562, 0.01823878288269043, 0.018935680389404297, 0.019632577896118164, 0.02032947540283203, 0.0210263729095459, 0.021723270416259766, 0.022420167922973633, 0.0231170654296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 8.0, 5.0, 5.0, 5.0, 15.0, 16.0, 21.0, 34.0, 34.0, 54.0, 71.0, 108.0, 128.0, 200.0, 315.0, 505.0, 815.0, 1339.0, 2773.0, 8266.0, 979964.0, 42765.0, 5787.0, 2201.0, 1090.0, 659.0, 432.0, 279.0, 193.0, 132.0, 80.0, 70.0, 47.0, 42.0, 24.0, 21.0, 13.0, 10.0, 5.0, 11.0, 2.0, 5.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.037750244140625, -0.036635398864746094, -0.03552055358886719, -0.03440570831298828, -0.033290863037109375, -0.03217601776123047, -0.031061172485351562, -0.029946327209472656, -0.02883148193359375, -0.027716636657714844, -0.026601791381835938, -0.02548694610595703, -0.024372100830078125, -0.02325725555419922, -0.022142410278320312, -0.021027565002441406, -0.0199127197265625, -0.018797874450683594, -0.017683029174804688, -0.01656818389892578, -0.015453338623046875, -0.014338493347167969, -0.013223648071289062, -0.012108802795410156, -0.01099395751953125, -0.009879112243652344, -0.008764266967773438, -0.007649421691894531, -0.006534576416015625, -0.005419731140136719, -0.0043048858642578125, -0.0031900405883789062, -0.0020751953125, -0.0009603500366210938, 0.0001544952392578125, 0.0012693405151367188, 0.002384185791015625, 0.0034990310668945312, 0.0046138763427734375, 0.005728721618652344, 0.00684356689453125, 0.007958412170410156, 0.009073257446289062, 0.010188102722167969, 0.011302947998046875, 0.012417793273925781, 0.013532638549804688, 0.014647483825683594, 0.0157623291015625, 0.016877174377441406, 0.017992019653320312, 0.01910686492919922, 0.020221710205078125, 0.02133655548095703, 0.022451400756835938, 0.023566246032714844, 0.02468109130859375, 0.025795936584472656, 0.026910781860351562, 0.02802562713623047, 0.029140472412109375, 0.03025531768798828, 0.03137016296386719, 0.032485008239746094, 0.033599853515625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 13.0, 16.0, 33.0, 48.0, 53.0, 66.0, 68.0, 86.0, 109.0, 95.0, 63.0, 83.0, 53.0, 65.0, 47.0, 19.0, 21.0, 13.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6570091247558594e-05, -1.5951693058013916e-05, -1.5333294868469238e-05, -1.471489667892456e-05, -1.4096498489379883e-05, -1.3478100299835205e-05, -1.2859702110290527e-05, -1.224130392074585e-05, -1.1622905731201172e-05, -1.1004507541656494e-05, -1.0386109352111816e-05, -9.767711162567139e-06, -9.149312973022461e-06, -8.530914783477783e-06, -7.912516593933105e-06, -7.294118404388428e-06, -6.67572021484375e-06, -6.057322025299072e-06, -5.4389238357543945e-06, -4.820525646209717e-06, -4.202127456665039e-06, -3.5837292671203613e-06, -2.9653310775756836e-06, -2.346932888031006e-06, -1.7285346984863281e-06, -1.1101365089416504e-06, -4.917383193969727e-07, 1.2665987014770508e-07, 7.450580596923828e-07, 1.3634562492370605e-06, 1.9818544387817383e-06, 2.600252628326416e-06, 3.2186508178710938e-06, 3.8370490074157715e-06, 4.455447196960449e-06, 5.073845386505127e-06, 5.692243576049805e-06, 6.310641765594482e-06, 6.92903995513916e-06, 7.547438144683838e-06, 8.165836334228516e-06, 8.784234523773193e-06, 9.402632713317871e-06, 1.0021030902862549e-05, 1.0639429092407227e-05, 1.1257827281951904e-05, 1.1876225471496582e-05, 1.249462366104126e-05, 1.3113021850585938e-05, 1.3731420040130615e-05, 1.4349818229675293e-05, 1.496821641921997e-05, 1.558661460876465e-05, 1.6205012798309326e-05, 1.6823410987854004e-05, 1.744180917739868e-05, 1.806020736694336e-05, 1.8678605556488037e-05, 1.9297003746032715e-05, 1.9915401935577393e-05, 2.053380012512207e-05, 2.1152198314666748e-05, 2.1770596504211426e-05, 2.2388994693756104e-05, 2.300739288330078e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 5.0, 3.0, 12.0, 17.0, 35.0, 69.0, 188.0, 554.0, 2088.0, 11324.0, 1024117.0, 7822.0, 1557.0, 482.0, 157.0, 79.0, 25.0, 9.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.049835205078125, -0.04787397384643555, -0.045912742614746094, -0.04395151138305664, -0.04199028015136719, -0.040029048919677734, -0.03806781768798828, -0.03610658645629883, -0.034145355224609375, -0.03218412399291992, -0.03022289276123047, -0.028261661529541016, -0.026300430297851562, -0.02433919906616211, -0.022377967834472656, -0.020416736602783203, -0.01845550537109375, -0.016494274139404297, -0.014533042907714844, -0.01257181167602539, -0.010610580444335938, -0.008649349212646484, -0.006688117980957031, -0.004726886749267578, -0.002765655517578125, -0.0008044242858886719, 0.0011568069458007812, 0.0031180381774902344, 0.0050792694091796875, 0.007040500640869141, 0.009001731872558594, 0.010962963104248047, 0.0129241943359375, 0.014885425567626953, 0.016846656799316406, 0.01880788803100586, 0.020769119262695312, 0.022730350494384766, 0.02469158172607422, 0.026652812957763672, 0.028614044189453125, 0.030575275421142578, 0.03253650665283203, 0.034497737884521484, 0.03645896911621094, 0.03842020034790039, 0.040381431579589844, 0.0423426628112793, 0.04430389404296875, 0.0462651252746582, 0.048226356506347656, 0.05018758773803711, 0.05214881896972656, 0.054110050201416016, 0.05607128143310547, 0.05803251266479492, 0.059993743896484375, 0.06195497512817383, 0.06391620635986328, 0.06587743759155273, 0.06783866882324219, 0.06979990005493164, 0.0717611312866211, 0.07372236251831055, 0.07568359375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 6.0, 3.0, 5.0, 24.0, 699.0, 214.0, 5.0, 12.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00522613525390625, -0.005087733268737793, -0.004949331283569336, -0.004810929298400879, -0.004672527313232422, -0.004534125328063965, -0.004395723342895508, -0.004257321357727051, -0.004118919372558594, -0.003980517387390137, -0.0038421154022216797, -0.0037037134170532227, -0.0035653114318847656, -0.0034269094467163086, -0.0032885074615478516, -0.0031501054763793945, -0.0030117034912109375, -0.0028733015060424805, -0.0027348995208740234, -0.0025964975357055664, -0.0024580955505371094, -0.0023196935653686523, -0.0021812915802001953, -0.0020428895950317383, -0.0019044876098632812, -0.0017660856246948242, -0.0016276836395263672, -0.0014892816543579102, -0.0013508796691894531, -0.001212477684020996, -0.001074075698852539, -0.000935673713684082, -0.000797271728515625, -0.000658869743347168, -0.0005204677581787109, -0.0003820657730102539, -0.00024366378784179688, -0.00010526180267333984, 3.314018249511719e-05, 0.00017154216766357422, 0.00030994415283203125, 0.0004483461380004883, 0.0005867481231689453, 0.0007251501083374023, 0.0008635520935058594, 0.0010019540786743164, 0.0011403560638427734, 0.0012787580490112305, 0.0014171600341796875, 0.0015555620193481445, 0.0016939640045166016, 0.0018323659896850586, 0.0019707679748535156, 0.0021091699600219727, 0.0022475719451904297, 0.0023859739303588867, 0.0025243759155273438, 0.0026627779006958008, 0.002801179885864258, 0.002939581871032715, 0.003077983856201172, 0.003216385841369629, 0.003354787826538086, 0.003493189811706543, 0.003631591796875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 6.0, 11.0, 18.0, 14.0, 39.0, 65.0, 80.0, 140.0, 162.0, 117.0, 88.0, 58.0, 37.0, 38.0, 29.0, 18.0, 19.0, 5.0, 13.0, 11.0, 11.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043036915361881256, -0.04110652208328247, -0.039176128804683685, -0.0372457355260849, -0.035315338522195816, -0.03338494524359703, -0.031454551964998245, -0.02952415868639946, -0.027593763545155525, -0.02566337026655674, -0.023732975125312805, -0.02180258184671402, -0.019872188568115234, -0.0179417934268713, -0.016011400148272514, -0.014081005938351154, -0.012150611728429794, -0.010220217518508434, -0.008289823308587074, -0.006359430029988289, -0.004429035820066929, -0.002498641610145569, -0.0005682483315467834, 0.0013621458783745766, 0.0032925400882959366, 0.005222934298217297, 0.007153328042477369, 0.009083721786737442, 0.011014115996658802, 0.012944510206580162, 0.014874903485178947, 0.016805298626422882, 0.018735691905021667, 0.020666085183620453, 0.022596480324864388, 0.024526873603463173, 0.026457268744707108, 0.028387662023305893, 0.03031805530190468, 0.032248448580503464, 0.03417884558439255, 0.03610923886299133, 0.03803963214159012, 0.039970025420188904, 0.04190042242407799, 0.04383081570267677, 0.04576120898127556, 0.047691602259874344, 0.04962199553847313, 0.051552388817071915, 0.0534827820956707, 0.055413179099559784, 0.05734357237815857, 0.059273965656757355, 0.06120435893535614, 0.06313475221395493, 0.06506514549255371, 0.0669955387711525, 0.06892593204975128, 0.07085632532835007, 0.07278671860694885, 0.07471711933612823, 0.07664750516414642, 0.0785779058933258, 0.08050829917192459]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 2.0, 11.0, 7.0, 14.0, 17.0, 21.0, 28.0, 33.0, 30.0, 43.0, 47.0, 53.0, 48.0, 49.0, 62.0, 58.0, 62.0, 68.0, 60.0, 44.0, 52.0, 26.0, 43.0, 32.0, 15.0, 24.0, 25.0, 8.0, 8.0, 6.0, 5.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.06612101197242737, -0.06462913751602173, -0.06313726305961609, -0.06164538860321045, -0.06015351787209511, -0.05866164341568947, -0.05716976895928383, -0.05567789450287819, -0.05418602004647255, -0.05269414559006691, -0.05120227113366127, -0.04971040040254593, -0.04821852594614029, -0.04672665148973465, -0.04523477703332901, -0.04374290257692337, -0.04225102812051773, -0.04075915366411209, -0.03926727920770645, -0.03777540475130081, -0.03628353402018547, -0.03479165956377983, -0.03329978510737419, -0.03180791065096855, -0.03031603991985321, -0.02882416546344757, -0.02733229286968708, -0.02584041841328144, -0.0243485439568758, -0.02285667136311531, -0.02136479690670967, -0.01987292245030403, -0.018381046131253242, -0.016889171674847603, -0.015397298149764538, -0.013905424624681473, -0.012413550168275833, -0.010921676643192768, -0.009429803118109703, -0.007937928661704063, -0.006446055136620998, -0.004954181145876646, -0.0034623073879629374, -0.0019704336300492287, -0.00047855963930487633, 0.001013314351439476, 0.002505187876522541, 0.003997062332928181, 0.005488935858011246, 0.006980809848755598, 0.00847268383949995, 0.009964557364583015, 0.011456431820988655, 0.01294830534607172, 0.014440178871154785, 0.015932053327560425, 0.017423927783966064, 0.018915802240371704, 0.020407674834132195, 0.021899549290537834, 0.023391423746943474, 0.024883296340703964, 0.026375170797109604, 0.027867045253515244, 0.029358917847275734]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 8.0, 6.0, 8.0, 14.0, 23.0, 27.0, 39.0, 93.0, 162.0, 341.0, 884.0, 2191.0, 5864.0, 17632.0, 61120.0, 303508.0, 516769.0, 99550.0, 26603.0, 8482.0, 3051.0, 1182.0, 482.0, 218.0, 100.0, 72.0, 37.0, 22.0, 16.0, 11.0, 10.0, 7.0, 7.0, 4.0, 1.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1004638671875, -0.09630775451660156, -0.09215164184570312, -0.08799552917480469, -0.08383941650390625, -0.07968330383300781, -0.07552719116210938, -0.07137107849121094, -0.0672149658203125, -0.06305885314941406, -0.058902740478515625, -0.05474662780761719, -0.05059051513671875, -0.04643440246582031, -0.042278289794921875, -0.03812217712402344, -0.033966064453125, -0.029809951782226562, -0.025653839111328125, -0.021497726440429688, -0.01734161376953125, -0.013185501098632812, -0.009029388427734375, -0.0048732757568359375, -0.0007171630859375, 0.0034389495849609375, 0.007595062255859375, 0.011751174926757812, 0.01590728759765625, 0.020063400268554688, 0.024219512939453125, 0.028375625610351562, 0.03253173828125, 0.03668785095214844, 0.040843963623046875, 0.04500007629394531, 0.04915618896484375, 0.05331230163574219, 0.057468414306640625, 0.06162452697753906, 0.0657806396484375, 0.06993675231933594, 0.07409286499023438, 0.07824897766113281, 0.08240509033203125, 0.08656120300292969, 0.09071731567382812, 0.09487342834472656, 0.099029541015625, 0.10318565368652344, 0.10734176635742188, 0.11149787902832031, 0.11565399169921875, 0.11981010437011719, 0.12396621704101562, 0.12812232971191406, 0.1322784423828125, 0.13643455505371094, 0.14059066772460938, 0.1447467803955078, 0.14890289306640625, 0.1530590057373047, 0.15721511840820312, 0.16137123107910156, 0.16552734375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 4.0, 9.0, 10.0, 20.0, 19.0, 23.0, 24.0, 25.0, 46.0, 41.0, 48.0, 78.0, 71.0, 67.0, 74.0, 69.0, 66.0, 55.0, 49.0, 42.0, 41.0, 32.0, 22.0, 23.0, 16.0, 10.0, 12.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.04205322265625, -0.04112076759338379, -0.04018831253051758, -0.03925585746765137, -0.038323402404785156, -0.037390947341918945, -0.036458492279052734, -0.03552603721618652, -0.03459358215332031, -0.0336611270904541, -0.03272867202758789, -0.03179621696472168, -0.03086376190185547, -0.029931306838989258, -0.028998851776123047, -0.028066396713256836, -0.027133941650390625, -0.026201486587524414, -0.025269031524658203, -0.024336576461791992, -0.02340412139892578, -0.02247166633605957, -0.02153921127319336, -0.02060675621032715, -0.019674301147460938, -0.018741846084594727, -0.017809391021728516, -0.016876935958862305, -0.015944480895996094, -0.015012025833129883, -0.014079570770263672, -0.013147115707397461, -0.01221466064453125, -0.011282205581665039, -0.010349750518798828, -0.009417295455932617, -0.008484840393066406, -0.007552385330200195, -0.006619930267333984, -0.0056874752044677734, -0.0047550201416015625, -0.0038225650787353516, -0.0028901100158691406, -0.0019576549530029297, -0.0010251998901367188, -9.274482727050781e-05, 0.0008397102355957031, 0.001772165298461914, 0.002704620361328125, 0.003637075424194336, 0.004569530487060547, 0.005501985549926758, 0.006434440612792969, 0.00736689567565918, 0.00829935073852539, 0.009231805801391602, 0.010164260864257812, 0.011096715927124023, 0.012029170989990234, 0.012961626052856445, 0.013894081115722656, 0.014826536178588867, 0.015758991241455078, 0.01669144630432129, 0.0176239013671875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 11.0, 10.0, 14.0, 12.0, 11.0, 36.0, 58.0, 80.0, 135.0, 176.0, 238.0, 424.0, 679.0, 1112.0, 1690.0, 2960.0, 4816.0, 8449.0, 14645.0, 25766.0, 46453.0, 89694.0, 213444.0, 335583.0, 147456.0, 68284.0, 36672.0, 20683.0, 11938.0, 6790.0, 3955.0, 2442.0, 1444.0, 880.0, 519.0, 361.0, 222.0, 121.0, 106.0, 60.0, 43.0, 30.0, 16.0, 10.0, 12.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0567626953125, -0.055108070373535156, -0.05345344543457031, -0.05179882049560547, -0.050144195556640625, -0.04848957061767578, -0.04683494567871094, -0.045180320739746094, -0.04352569580078125, -0.041871070861816406, -0.04021644592285156, -0.03856182098388672, -0.036907196044921875, -0.03525257110595703, -0.03359794616699219, -0.031943321228027344, -0.0302886962890625, -0.028634071350097656, -0.026979446411132812, -0.02532482147216797, -0.023670196533203125, -0.02201557159423828, -0.020360946655273438, -0.018706321716308594, -0.01705169677734375, -0.015397071838378906, -0.013742446899414062, -0.012087821960449219, -0.010433197021484375, -0.008778572082519531, -0.0071239471435546875, -0.005469322204589844, -0.003814697265625, -0.0021600723266601562, -0.0005054473876953125, 0.0011491775512695312, 0.002803802490234375, 0.004458427429199219, 0.0061130523681640625, 0.007767677307128906, 0.00942230224609375, 0.011076927185058594, 0.012731552124023438, 0.014386177062988281, 0.016040802001953125, 0.01769542694091797, 0.019350051879882812, 0.021004676818847656, 0.0226593017578125, 0.024313926696777344, 0.025968551635742188, 0.02762317657470703, 0.029277801513671875, 0.03093242645263672, 0.03258705139160156, 0.034241676330566406, 0.03589630126953125, 0.037550926208496094, 0.03920555114746094, 0.04086017608642578, 0.042514801025390625, 0.04416942596435547, 0.04582405090332031, 0.047478675842285156, 0.04913330078125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 13.0, 8.0, 16.0, 14.0, 14.0, 13.0, 11.0, 20.0, 28.0, 35.0, 36.0, 25.0, 27.0, 38.0, 35.0, 34.0, 39.0, 32.0, 55.0, 45.0, 44.0, 38.0, 50.0, 34.0, 34.0, 31.0, 21.0, 23.0, 27.0, 31.0, 17.0, 20.0, 17.0, 10.0, 14.0, 12.0, 7.0, 3.0, 4.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01415252685546875, -0.013658881187438965, -0.01316523551940918, -0.012671589851379395, -0.01217794418334961, -0.011684298515319824, -0.011190652847290039, -0.010697007179260254, -0.010203361511230469, -0.009709715843200684, -0.009216070175170898, -0.008722424507141113, -0.008228778839111328, -0.007735133171081543, -0.007241487503051758, -0.006747841835021973, -0.0062541961669921875, -0.005760550498962402, -0.005266904830932617, -0.004773259162902832, -0.004279613494873047, -0.0037859678268432617, -0.0032923221588134766, -0.0027986764907836914, -0.0023050308227539062, -0.001811385154724121, -0.001317739486694336, -0.0008240938186645508, -0.0003304481506347656, 0.00016319751739501953, 0.0006568431854248047, 0.0011504888534545898, 0.001644134521484375, 0.00213778018951416, 0.0026314258575439453, 0.0031250715255737305, 0.0036187171936035156, 0.004112362861633301, 0.004606008529663086, 0.005099654197692871, 0.005593299865722656, 0.006086945533752441, 0.0065805912017822266, 0.007074236869812012, 0.007567882537841797, 0.008061528205871582, 0.008555173873901367, 0.009048819541931152, 0.009542465209960938, 0.010036110877990723, 0.010529756546020508, 0.011023402214050293, 0.011517047882080078, 0.012010693550109863, 0.012504339218139648, 0.012997984886169434, 0.013491630554199219, 0.013985276222229004, 0.014478921890258789, 0.014972567558288574, 0.01546621322631836, 0.015959858894348145, 0.01645350456237793, 0.016947150230407715, 0.0174407958984375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 2.0, 17.0, 10.0, 35.0, 30.0, 47.0, 73.0, 116.0, 205.0, 351.0, 680.0, 1423.0, 3222.0, 9443.0, 38695.0, 514002.0, 429122.0, 36037.0, 9008.0, 3121.0, 1370.0, 646.0, 330.0, 202.0, 86.0, 85.0, 58.0, 18.0, 31.0, 20.0, 8.0, 10.0, 12.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002605438232421875, -0.002528756856918335, -0.002452075481414795, -0.002375394105911255, -0.002298712730407715, -0.002222031354904175, -0.0021453499794006348, -0.0020686686038970947, -0.0019919872283935547, -0.0019153058528900146, -0.0018386244773864746, -0.0017619431018829346, -0.0016852617263793945, -0.0016085803508758545, -0.0015318989753723145, -0.0014552175998687744, -0.0013785362243652344, -0.0013018548488616943, -0.0012251734733581543, -0.0011484920978546143, -0.0010718107223510742, -0.0009951293468475342, -0.0009184479713439941, -0.0008417665958404541, -0.0007650852203369141, -0.000688403844833374, -0.000611722469329834, -0.0005350410938262939, -0.0004583597183227539, -0.00038167834281921387, -0.00030499696731567383, -0.0002283155918121338, -0.00015163421630859375, -7.495284080505371e-05, 1.7285346984863281e-06, 7.840991020202637e-05, 0.0001550912857055664, 0.00023177266120910645, 0.0003084540367126465, 0.0003851354122161865, 0.00046181678771972656, 0.0005384981632232666, 0.0006151795387268066, 0.0006918609142303467, 0.0007685422897338867, 0.0008452236652374268, 0.0009219050407409668, 0.0009985864162445068, 0.0010752677917480469, 0.001151949167251587, 0.001228630542755127, 0.001305311918258667, 0.001381993293762207, 0.001458674669265747, 0.0015353560447692871, 0.0016120374202728271, 0.0016887187957763672, 0.0017654001712799072, 0.0018420815467834473, 0.0019187629222869873, 0.0019954442977905273, 0.0020721256732940674, 0.0021488070487976074, 0.0022254884243011475, 0.0023021697998046875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 9.0, 5.0, 14.0, 15.0, 21.0, 36.0, 59.0, 75.0, 111.0, 142.0, 120.0, 111.0, 64.0, 53.0, 33.0, 23.0, 14.0, 20.0, 7.0, 10.0, 7.0, 6.0, 6.0, 4.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.811981201171875e-05, -1.7568469047546387e-05, -1.7017126083374023e-05, -1.646578311920166e-05, -1.5914440155029297e-05, -1.5363097190856934e-05, -1.481175422668457e-05, -1.4260411262512207e-05, -1.3709068298339844e-05, -1.315772533416748e-05, -1.2606382369995117e-05, -1.2055039405822754e-05, -1.150369644165039e-05, -1.0952353477478027e-05, -1.0401010513305664e-05, -9.8496675491333e-06, -9.298324584960938e-06, -8.746981620788574e-06, -8.195638656616211e-06, -7.644295692443848e-06, -7.092952728271484e-06, -6.541609764099121e-06, -5.990266799926758e-06, -5.4389238357543945e-06, -4.887580871582031e-06, -4.336237907409668e-06, -3.7848949432373047e-06, -3.2335519790649414e-06, -2.682209014892578e-06, -2.130866050720215e-06, -1.5795230865478516e-06, -1.0281801223754883e-06, -4.76837158203125e-07, 7.450580596923828e-08, 6.258487701416016e-07, 1.1771917343139648e-06, 1.7285346984863281e-06, 2.2798776626586914e-06, 2.8312206268310547e-06, 3.382563591003418e-06, 3.933906555175781e-06, 4.4852495193481445e-06, 5.036592483520508e-06, 5.587935447692871e-06, 6.139278411865234e-06, 6.690621376037598e-06, 7.241964340209961e-06, 7.793307304382324e-06, 8.344650268554688e-06, 8.89599323272705e-06, 9.447336196899414e-06, 9.998679161071777e-06, 1.055002212524414e-05, 1.1101365089416504e-05, 1.1652708053588867e-05, 1.220405101776123e-05, 1.2755393981933594e-05, 1.3306736946105957e-05, 1.385807991027832e-05, 1.4409422874450684e-05, 1.4960765838623047e-05, 1.551210880279541e-05, 1.6063451766967773e-05, 1.6614794731140137e-05, 1.71661376953125e-05]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 18.0, 12.0, 18.0, 26.0, 62.0, 74.0, 160.0, 248.0, 403.0, 770.0, 1520.0, 2882.0, 6188.0, 14317.0, 36123.0, 116210.0, 455269.0, 293571.0, 74536.0, 26013.0, 10522.0, 4743.0, 2304.0, 1151.0, 605.0, 273.0, 209.0, 131.0, 66.0, 34.0, 27.0, 22.0, 13.0, 9.0, 7.0, 3.0, 4.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005636215209960938, -0.0005417987704277039, -0.000519976019859314, -0.0004981532692909241, -0.0004763305187225342, -0.0004545077681541443, -0.0004326850175857544, -0.0004108622670173645, -0.0003890395164489746, -0.0003672167658805847, -0.0003453940153121948, -0.00032357126474380493, -0.00030174851417541504, -0.00027992576360702515, -0.00025810301303863525, -0.00023628026247024536, -0.00021445751190185547, -0.00019263476133346558, -0.00017081201076507568, -0.0001489892601966858, -0.0001271665096282959, -0.000105343759059906, -8.352100849151611e-05, -6.169825792312622e-05, -3.987550735473633e-05, -1.8052756786346436e-05, 3.769993782043457e-06, 2.559274435043335e-05, 4.741549491882324e-05, 6.923824548721313e-05, 9.106099605560303e-05, 0.00011288374662399292, 0.0001347064971923828, 0.0001565292477607727, 0.0001783519983291626, 0.0002001747488975525, 0.00022199749946594238, 0.00024382025003433228, 0.00026564300060272217, 0.00028746575117111206, 0.00030928850173950195, 0.00033111125230789185, 0.00035293400287628174, 0.00037475675344467163, 0.0003965795040130615, 0.0004184022545814514, 0.0004402250051498413, 0.0004620477557182312, 0.0004838705062866211, 0.000505693256855011, 0.0005275160074234009, 0.0005493387579917908, 0.0005711615085601807, 0.0005929842591285706, 0.0006148070096969604, 0.0006366297602653503, 0.0006584525108337402, 0.0006802752614021301, 0.00070209801197052, 0.0007239207625389099, 0.0007457435131072998, 0.0007675662636756897, 0.0007893890142440796, 0.0008112117648124695, 0.0008330345153808594]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 7.0, 7.0, 10.0, 9.0, 9.0, 21.0, 21.0, 30.0, 27.0, 40.0, 53.0, 54.0, 73.0, 59.0, 74.0, 68.0, 51.0, 58.0, 64.0, 45.0, 39.0, 39.0, 25.0, 25.0, 14.0, 23.0, 7.0, 13.0, 7.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00019848346710205078, -0.00019325129687786102, -0.00018801912665367126, -0.0001827869564294815, -0.00017755478620529175, -0.000172322615981102, -0.00016709044575691223, -0.00016185827553272247, -0.00015662610530853271, -0.00015139393508434296, -0.0001461617648601532, -0.00014092959463596344, -0.00013569742441177368, -0.00013046525418758392, -0.00012523308396339417, -0.0001200009137392044, -0.00011476874351501465, -0.00010953657329082489, -0.00010430440306663513, -9.907223284244537e-05, -9.384006261825562e-05, -8.860789239406586e-05, -8.33757221698761e-05, -7.814355194568634e-05, -7.291138172149658e-05, -6.767921149730682e-05, -6.244704127311707e-05, -5.721487104892731e-05, -5.198270082473755e-05, -4.675053060054779e-05, -4.151836037635803e-05, -3.6286190152168274e-05, -3.1054019927978516e-05, -2.5821849703788757e-05, -2.0589679479599e-05, -1.535750925540924e-05, -1.0125339031219482e-05, -4.893168807029724e-06, 3.390014171600342e-07, 5.5711716413497925e-06, 1.080334186553955e-05, 1.603551208972931e-05, 2.1267682313919067e-05, 2.6499852538108826e-05, 3.1732022762298584e-05, 3.696419298648834e-05, 4.21963632106781e-05, 4.742853343486786e-05, 5.266070365905762e-05, 5.7892873883247375e-05, 6.312504410743713e-05, 6.835721433162689e-05, 7.358938455581665e-05, 7.882155478000641e-05, 8.405372500419617e-05, 8.928589522838593e-05, 9.451806545257568e-05, 9.975023567676544e-05, 0.0001049824059009552, 0.00011021457612514496, 0.00011544674634933472, 0.00012067891657352448, 0.00012591108679771423, 0.000131143257021904, 0.00013637542724609375]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 3.0, 10.0, 5.0, 13.0, 20.0, 35.0, 42.0, 74.0, 140.0, 229.0, 169.0, 105.0, 51.0, 32.0, 24.0, 20.0, 17.0, 7.0, 3.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.09854555875062943, -0.09643755853176117, -0.09432956576347351, -0.09222156554460526, -0.0901135727763176, -0.08800557255744934, -0.08589757978916168, -0.08378957957029343, -0.08168157935142517, -0.07957357913255692, -0.07746558636426926, -0.075357586145401, -0.07324959337711334, -0.07114159315824509, -0.06903360038995743, -0.06692560017108917, -0.06481760740280151, -0.06270960718393326, -0.0606016144156456, -0.05849361792206764, -0.056385621428489685, -0.05427762120962143, -0.05216962471604347, -0.050061628222465515, -0.04795363172888756, -0.0458456352353096, -0.043737638741731644, -0.041629642248153687, -0.03952164202928543, -0.03741364926099777, -0.03530564904212952, -0.03319765254855156, -0.031089656054973602, -0.028981659561395645, -0.026873663067817688, -0.02476566471159458, -0.022657668218016624, -0.020549671724438667, -0.01844167336821556, -0.016333676874637604, -0.014225680381059647, -0.01211768388748169, -0.010009686462581158, -0.007901689037680626, -0.005793692544102669, -0.0036856960505247116, -0.0015776986256241798, 0.0005302987992763519, 0.002638295292854309, 0.0047462922520935535, 0.006854289211332798, 0.00896228663623333, 0.011070283129811287, 0.013178279623389244, 0.015286277048289776, 0.017394274473190308, 0.019502270966768265, 0.021610267460346222, 0.02371826395392418, 0.025826262310147285, 0.027934258803725243, 0.0300422552973032, 0.032150253653526306, 0.03425825014710426, 0.03636624664068222]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 4.0, 8.0, 10.0, 27.0, 14.0, 17.0, 23.0, 16.0, 32.0, 39.0, 36.0, 39.0, 33.0, 39.0, 49.0, 39.0, 51.0, 37.0, 57.0, 48.0, 46.0, 39.0, 47.0, 27.0, 47.0, 33.0, 27.0, 27.0, 23.0, 16.0, 5.0, 13.0, 9.0, 5.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.03575395420193672, -0.034807220101356506, -0.03386048600077629, -0.032913755625486374, -0.03196702152490616, -0.031020287424325943, -0.030073553323745728, -0.02912682108581066, -0.028180088847875595, -0.02723335474729538, -0.026286622509360313, -0.025339888408780098, -0.024393156170845032, -0.023446422070264816, -0.0224996879696846, -0.021552955731749535, -0.02060622163116932, -0.019659487530589104, -0.018712755292654037, -0.017766021192073822, -0.016819288954138756, -0.01587255485355854, -0.0149258216843009, -0.013979088515043259, -0.013032355345785618, -0.012085622176527977, -0.011138889007270336, -0.010192155838012695, -0.00924542173743248, -0.008298689499497414, -0.007351955398917198, -0.006405222229659557, -0.005458490923047066, -0.004511757753789425, -0.0035650243517011404, -0.002618290949612856, -0.001671557780355215, -0.0007248246110975742, 0.0002219090238213539, 0.0011686421930789948, 0.0021153753623366356, 0.0030621085315942764, 0.004008841700851917, 0.004955575335770845, 0.005902308505028486, 0.006849041674286127, 0.007795775309205055, 0.008742508478462696, 0.009689241647720337, 0.010635974816977978, 0.011582707986235619, 0.012529442086815834, 0.0134761743247509, 0.014422908425331116, 0.015369641594588757, 0.016316374763846397, 0.017263107001781464, 0.01820984110236168, 0.019156573340296745, 0.02010330744087696, 0.021050039678812027, 0.021996773779392242, 0.022943507879972458, 0.023890240117907524, 0.02483697421848774]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 1.0, 2.0, 5.0, 8.0, 12.0, 16.0, 19.0, 23.0, 50.0, 46.0, 65.0, 72.0, 89.0, 158.0, 292.0, 569.0, 1257.0, 5985.0, 51561.0, 3997253.0, 120522.0, 12368.0, 2049.0, 816.0, 370.0, 205.0, 122.0, 77.0, 73.0, 51.0, 40.0, 28.0, 24.0, 15.0, 13.0, 11.0, 7.0, 6.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030914306640625, -0.029906272888183594, -0.028898239135742188, -0.02789020538330078, -0.026882171630859375, -0.02587413787841797, -0.024866104125976562, -0.023858070373535156, -0.02285003662109375, -0.021842002868652344, -0.020833969116210938, -0.01982593536376953, -0.018817901611328125, -0.01780986785888672, -0.016801834106445312, -0.015793800354003906, -0.0147857666015625, -0.013777732849121094, -0.012769699096679688, -0.011761665344238281, -0.010753631591796875, -0.009745597839355469, -0.008737564086914062, -0.007729530334472656, -0.00672149658203125, -0.005713462829589844, -0.0047054290771484375, -0.0036973953247070312, -0.002689361572265625, -0.0016813278198242188, -0.0006732940673828125, 0.00033473968505859375, 0.0013427734375, 0.0023508071899414062, 0.0033588409423828125, 0.004366874694824219, 0.005374908447265625, 0.006382942199707031, 0.0073909759521484375, 0.008399009704589844, 0.00940704345703125, 0.010415077209472656, 0.011423110961914062, 0.012431144714355469, 0.013439178466796875, 0.014447212219238281, 0.015455245971679688, 0.016463279724121094, 0.0174713134765625, 0.018479347229003906, 0.019487380981445312, 0.02049541473388672, 0.021503448486328125, 0.02251148223876953, 0.023519515991210938, 0.024527549743652344, 0.02553558349609375, 0.026543617248535156, 0.027551651000976562, 0.02855968475341797, 0.029567718505859375, 0.03057575225830078, 0.03158378601074219, 0.032591819763183594, 0.033599853515625]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 8.0, 13.0, 17.0, 12.0, 12.0, 19.0, 15.0, 26.0, 18.0, 24.0, 34.0, 29.0, 33.0, 35.0, 39.0, 41.0, 45.0, 38.0, 45.0, 31.0, 39.0, 48.0, 56.0, 39.0, 32.0, 26.0, 32.0, 32.0, 34.0, 19.0, 22.0, 19.0, 15.0, 8.0, 10.0, 9.0, 5.0, 5.0, 5.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0236663818359375, -0.022939205169677734, -0.02221202850341797, -0.021484851837158203, -0.020757675170898438, -0.020030498504638672, -0.019303321838378906, -0.01857614517211914, -0.017848968505859375, -0.01712179183959961, -0.016394615173339844, -0.015667438507080078, -0.014940261840820312, -0.014213085174560547, -0.013485908508300781, -0.012758731842041016, -0.01203155517578125, -0.011304378509521484, -0.010577201843261719, -0.009850025177001953, -0.009122848510742188, -0.008395671844482422, -0.007668495178222656, -0.006941318511962891, -0.006214141845703125, -0.005486965179443359, -0.004759788513183594, -0.004032611846923828, -0.0033054351806640625, -0.002578258514404297, -0.0018510818481445312, -0.0011239051818847656, -0.000396728515625, 0.0003304481506347656, 0.0010576248168945312, 0.0017848014831542969, 0.0025119781494140625, 0.003239154815673828, 0.003966331481933594, 0.004693508148193359, 0.005420684814453125, 0.006147861480712891, 0.006875038146972656, 0.007602214813232422, 0.008329391479492188, 0.009056568145751953, 0.009783744812011719, 0.010510921478271484, 0.01123809814453125, 0.011965274810791016, 0.012692451477050781, 0.013419628143310547, 0.014146804809570312, 0.014873981475830078, 0.015601158142089844, 0.01632833480834961, 0.017055511474609375, 0.01778268814086914, 0.018509864807128906, 0.019237041473388672, 0.019964218139648438, 0.020691394805908203, 0.02141857147216797, 0.022145748138427734, 0.0228729248046875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 7.0, 17.0, 27.0, 36.0, 63.0, 118.0, 188.0, 374.0, 655.0, 1393.0, 3915.0, 24990.0, 4108986.0, 45530.0, 4736.0, 1585.0, 750.0, 406.0, 217.0, 121.0, 77.0, 38.0, 23.0, 16.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.05389404296875, -0.051609039306640625, -0.04932403564453125, -0.047039031982421875, -0.0447540283203125, -0.042469024658203125, -0.04018402099609375, -0.037899017333984375, -0.035614013671875, -0.033329010009765625, -0.03104400634765625, -0.028759002685546875, -0.0264739990234375, -0.024188995361328125, -0.02190399169921875, -0.019618988037109375, -0.017333984375, -0.015048980712890625, -0.01276397705078125, -0.010478973388671875, -0.0081939697265625, -0.005908966064453125, -0.00362396240234375, -0.001338958740234375, 0.000946044921875, 0.003231048583984375, 0.00551605224609375, 0.007801055908203125, 0.0100860595703125, 0.012371063232421875, 0.01465606689453125, 0.016941070556640625, 0.01922607421875, 0.021511077880859375, 0.02379608154296875, 0.026081085205078125, 0.0283660888671875, 0.030651092529296875, 0.03293609619140625, 0.035221099853515625, 0.037506103515625, 0.039791107177734375, 0.04207611083984375, 0.044361114501953125, 0.0466461181640625, 0.048931121826171875, 0.05121612548828125, 0.053501129150390625, 0.0557861328125, 0.058071136474609375, 0.06035614013671875, 0.06264114379882812, 0.0649261474609375, 0.06721115112304688, 0.06949615478515625, 0.07178115844726562, 0.074066162109375, 0.07635116577148438, 0.07863616943359375, 0.08092117309570312, 0.0832061767578125, 0.08549118041992188, 0.08777618408203125, 0.09006118774414062, 0.09234619140625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 16.0, 33.0, 59.0, 200.0, 3174.0, 323.0, 118.0, 70.0, 23.0, 12.0, 8.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01146697998046875, -0.011184096336364746, -0.010901212692260742, -0.010618329048156738, -0.010335445404052734, -0.01005256175994873, -0.009769678115844727, -0.009486794471740723, -0.009203910827636719, -0.008921027183532715, -0.008638143539428711, -0.008355259895324707, -0.008072376251220703, -0.007789492607116699, -0.007506608963012695, -0.007223725318908691, -0.0069408416748046875, -0.006657958030700684, -0.00637507438659668, -0.006092190742492676, -0.005809307098388672, -0.005526423454284668, -0.005243539810180664, -0.00496065616607666, -0.004677772521972656, -0.004394888877868652, -0.0041120052337646484, -0.0038291215896606445, -0.0035462379455566406, -0.0032633543014526367, -0.002980470657348633, -0.002697587013244629, -0.002414703369140625, -0.002131819725036621, -0.0018489360809326172, -0.0015660524368286133, -0.0012831687927246094, -0.0010002851486206055, -0.0007174015045166016, -0.00043451786041259766, -0.00015163421630859375, 0.00013124942779541016, 0.00041413307189941406, 0.000697016716003418, 0.0009799003601074219, 0.0012627840042114258, 0.0015456676483154297, 0.0018285512924194336, 0.0021114349365234375, 0.0023943185806274414, 0.0026772022247314453, 0.0029600858688354492, 0.003242969512939453, 0.003525853157043457, 0.003808736801147461, 0.004091620445251465, 0.004374504089355469, 0.004657387733459473, 0.0049402713775634766, 0.0052231550216674805, 0.005506038665771484, 0.005788922309875488, 0.006071805953979492, 0.006354689598083496, 0.0066375732421875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 6.0, 9.0, 5.0, 13.0, 17.0, 28.0, 29.0, 47.0, 49.0, 78.0, 120.0, 163.0, 135.0, 83.0, 57.0, 33.0, 36.0, 25.0, 13.0, 12.0, 13.0, 6.0, 4.0, 2.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04585394635796547, -0.04460207372903824, -0.04335019737482071, -0.04209832474589348, -0.04084645211696625, -0.03959457576274872, -0.03834270313382149, -0.03709083050489426, -0.03583895415067673, -0.034587081521749496, -0.03333520516753197, -0.032083332538604736, -0.030831458047032356, -0.029579583555459976, -0.028327710926532745, -0.027075836434960365, -0.025823961943387985, -0.024572087451815605, -0.023320212960243225, -0.022068340331315994, -0.020816465839743614, -0.019564591348171234, -0.018312718719244003, -0.017060844227671623, -0.015808969736099243, -0.014557095244526863, -0.013305221684277058, -0.012053348124027252, -0.010801473632454872, -0.009549599140882492, -0.008297725580632687, -0.007045852020382881, -0.005793977528810501, -0.004542103502899408, -0.0032902294769883156, -0.002038355451077223, -0.0007864814251661301, 0.0004653926007449627, 0.0017172666266560555, 0.002969140186905861, 0.004221014678478241, 0.005472888704389334, 0.0067247627303004265, 0.007976636290550232, 0.009228510782122612, 0.010480385273694992, 0.011732258833944798, 0.012984132394194603, 0.014236006885766983, 0.015487881377339363, 0.016739755868911743, 0.017991628497838974, 0.019243502989411354, 0.020495377480983734, 0.021747250109910965, 0.022999124601483345, 0.024250999093055725, 0.025502873584628105, 0.026754748076200485, 0.028006620705127716, 0.029258495196700096, 0.030510369688272476, 0.03176224231719971, 0.033014118671417236, 0.03426599130034447]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 5.0, 14.0, 10.0, 16.0, 11.0, 14.0, 23.0, 30.0, 20.0, 33.0, 37.0, 37.0, 39.0, 42.0, 44.0, 44.0, 40.0, 44.0, 54.0, 55.0, 48.0, 53.0, 34.0, 42.0, 41.0, 36.0, 22.0, 26.0, 24.0, 17.0, 7.0, 11.0, 9.0, 5.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030462054535746574, -0.029620321467518806, -0.02877858653664589, -0.02793685346841812, -0.027095120400190353, -0.026253385469317436, -0.02541165240108967, -0.02456991747021675, -0.023728184401988983, -0.022886451333761215, -0.022044716402888298, -0.02120298333466053, -0.020361248403787613, -0.019519515335559845, -0.018677782267332077, -0.01783604919910431, -0.016994314268231392, -0.016152581200003624, -0.015310846269130707, -0.014469113200902939, -0.013627379201352596, -0.012785645201802254, -0.011943912133574486, -0.011102178134024143, -0.0102604441344738, -0.009418710134923458, -0.008576976135373116, -0.007735243067145348, -0.006893509067595005, -0.0060517750680446625, -0.005210041534155607, -0.004368308000266552, -0.0035265740007162094, -0.0026848402339965105, -0.0018431064672768116, -0.0010013727005571127, -0.0001596389338374138, 0.0006820950657129288, 0.001523828599601984, 0.0023655621334910393, 0.003207296133041382, 0.004049030132591724, 0.00489076366648078, 0.005732497200369835, 0.0065742311999201775, 0.00741596519947052, 0.008257698267698288, 0.00909943226724863, 0.009941166266798973, 0.010782900266349316, 0.011624634265899658, 0.012466367334127426, 0.013308101333677769, 0.014149835333228111, 0.01499156840145588, 0.015833303332328796, 0.016675036400556564, 0.017516769468784332, 0.01835850439965725, 0.019200237467885017, 0.020041972398757935, 0.020883705466985703, 0.02172543853521347, 0.02256717160344124, 0.023408906534314156]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 13.0, 14.0, 14.0, 21.0, 34.0, 35.0, 83.0, 132.0, 187.0, 269.0, 451.0, 690.0, 1218.0, 1952.0, 3451.0, 6404.0, 11717.0, 22329.0, 46120.0, 103530.0, 345071.0, 315461.0, 98221.0, 44025.0, 21527.0, 11167.0, 5940.0, 3460.0, 1890.0, 1156.0, 723.0, 468.0, 266.0, 162.0, 102.0, 78.0, 56.0, 44.0, 23.0, 18.0, 11.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.06341552734375, -0.061548709869384766, -0.05968189239501953, -0.0578150749206543, -0.05594825744628906, -0.05408143997192383, -0.052214622497558594, -0.05034780502319336, -0.048480987548828125, -0.04661417007446289, -0.044747352600097656, -0.04288053512573242, -0.04101371765136719, -0.03914690017700195, -0.03728008270263672, -0.035413265228271484, -0.03354644775390625, -0.031679630279541016, -0.02981281280517578, -0.027945995330810547, -0.026079177856445312, -0.024212360382080078, -0.022345542907714844, -0.02047872543334961, -0.018611907958984375, -0.01674509048461914, -0.014878273010253906, -0.013011455535888672, -0.011144638061523438, -0.009277820587158203, -0.007411003112792969, -0.005544185638427734, -0.0036773681640625, -0.0018105506896972656, 5.626678466796875e-05, 0.0019230842590332031, 0.0037899017333984375, 0.005656719207763672, 0.007523536682128906, 0.00939035415649414, 0.011257171630859375, 0.01312398910522461, 0.014990806579589844, 0.016857624053955078, 0.018724441528320312, 0.020591259002685547, 0.02245807647705078, 0.024324893951416016, 0.02619171142578125, 0.028058528900146484, 0.02992534637451172, 0.03179216384887695, 0.03365898132324219, 0.03552579879760742, 0.037392616271972656, 0.03925943374633789, 0.041126251220703125, 0.04299306869506836, 0.044859886169433594, 0.04672670364379883, 0.04859352111816406, 0.0504603385925293, 0.05232715606689453, 0.054193973541259766, 0.056060791015625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 6.0, 9.0, 5.0, 12.0, 16.0, 16.0, 18.0, 26.0, 22.0, 28.0, 38.0, 45.0, 38.0, 37.0, 53.0, 56.0, 33.0, 53.0, 40.0, 49.0, 51.0, 59.0, 34.0, 47.0, 38.0, 37.0, 25.0, 27.0, 19.0, 20.0, 9.0, 9.0, 9.0, 7.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0267791748046875, -0.02602100372314453, -0.025262832641601562, -0.024504661560058594, -0.023746490478515625, -0.022988319396972656, -0.022230148315429688, -0.02147197723388672, -0.02071380615234375, -0.01995563507080078, -0.019197463989257812, -0.018439292907714844, -0.017681121826171875, -0.016922950744628906, -0.016164779663085938, -0.015406608581542969, -0.0146484375, -0.013890266418457031, -0.013132095336914062, -0.012373924255371094, -0.011615753173828125, -0.010857582092285156, -0.010099411010742188, -0.009341239929199219, -0.00858306884765625, -0.007824897766113281, -0.0070667266845703125, -0.006308555603027344, -0.005550384521484375, -0.004792213439941406, -0.0040340423583984375, -0.0032758712768554688, -0.0025177001953125, -0.0017595291137695312, -0.0010013580322265625, -0.00024318695068359375, 0.000514984130859375, 0.0012731552124023438, 0.0020313262939453125, 0.0027894973754882812, 0.00354766845703125, 0.004305839538574219, 0.0050640106201171875, 0.005822181701660156, 0.006580352783203125, 0.007338523864746094, 0.008096694946289062, 0.008854866027832031, 0.009613037109375, 0.010371208190917969, 0.011129379272460938, 0.011887550354003906, 0.012645721435546875, 0.013403892517089844, 0.014162063598632812, 0.014920234680175781, 0.01567840576171875, 0.01643657684326172, 0.017194747924804688, 0.017952919006347656, 0.018711090087890625, 0.019469261169433594, 0.020227432250976562, 0.02098560333251953, 0.0217437744140625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 10.0, 4.0, 9.0, 13.0, 25.0, 26.0, 24.0, 33.0, 56.0, 80.0, 96.0, 100.0, 149.0, 186.0, 290.0, 431.0, 552.0, 737.0, 995.0, 1586.0, 2329.0, 3352.0, 5435.0, 8867.0, 15640.0, 30690.0, 78672.0, 598814.0, 193403.0, 50011.0, 22607.0, 12111.0, 7200.0, 4451.0, 2925.0, 1973.0, 1279.0, 914.0, 649.0, 507.0, 355.0, 236.0, 204.0, 127.0, 104.0, 60.0, 60.0, 49.0, 40.0, 33.0, 22.0, 12.0, 13.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0], "bins": [-0.06982421875, -0.06769466400146484, -0.06556510925292969, -0.06343555450439453, -0.061305999755859375, -0.05917644500732422, -0.05704689025878906, -0.054917335510253906, -0.05278778076171875, -0.050658226013183594, -0.04852867126464844, -0.04639911651611328, -0.044269561767578125, -0.04214000701904297, -0.04001045227050781, -0.037880897521972656, -0.0357513427734375, -0.033621788024902344, -0.03149223327636719, -0.02936267852783203, -0.027233123779296875, -0.02510356903076172, -0.022974014282226562, -0.020844459533691406, -0.01871490478515625, -0.016585350036621094, -0.014455795288085938, -0.012326240539550781, -0.010196685791015625, -0.008067131042480469, -0.0059375762939453125, -0.0038080215454101562, -0.001678466796875, 0.00045108795166015625, 0.0025806427001953125, 0.004710197448730469, 0.006839752197265625, 0.008969306945800781, 0.011098861694335938, 0.013228416442871094, 0.01535797119140625, 0.017487525939941406, 0.019617080688476562, 0.02174663543701172, 0.023876190185546875, 0.02600574493408203, 0.028135299682617188, 0.030264854431152344, 0.0323944091796875, 0.034523963928222656, 0.03665351867675781, 0.03878307342529297, 0.040912628173828125, 0.04304218292236328, 0.04517173767089844, 0.047301292419433594, 0.04943084716796875, 0.051560401916503906, 0.05368995666503906, 0.05581951141357422, 0.057949066162109375, 0.06007862091064453, 0.06220817565917969, 0.06433773040771484, 0.06646728515625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 12.0, 10.0, 16.0, 12.0, 13.0, 16.0, 24.0, 16.0, 20.0, 29.0, 39.0, 28.0, 29.0, 36.0, 31.0, 35.0, 41.0, 47.0, 36.0, 43.0, 39.0, 42.0, 45.0, 36.0, 30.0, 29.0, 34.0, 33.0, 20.0, 27.0, 18.0, 18.0, 16.0, 17.0, 12.0, 8.0, 9.0, 7.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0180816650390625, -0.017486095428466797, -0.016890525817871094, -0.01629495620727539, -0.015699386596679688, -0.015103816986083984, -0.014508247375488281, -0.013912677764892578, -0.013317108154296875, -0.012721538543701172, -0.012125968933105469, -0.011530399322509766, -0.010934829711914062, -0.01033926010131836, -0.009743690490722656, -0.009148120880126953, -0.00855255126953125, -0.007956981658935547, -0.007361412048339844, -0.006765842437744141, -0.0061702728271484375, -0.005574703216552734, -0.004979133605957031, -0.004383563995361328, -0.003787994384765625, -0.003192424774169922, -0.0025968551635742188, -0.0020012855529785156, -0.0014057159423828125, -0.0008101463317871094, -0.00021457672119140625, 0.0003809928894042969, 0.0009765625, 0.0015721321105957031, 0.0021677017211914062, 0.0027632713317871094, 0.0033588409423828125, 0.003954410552978516, 0.004549980163574219, 0.005145549774169922, 0.005741119384765625, 0.006336688995361328, 0.006932258605957031, 0.007527828216552734, 0.008123397827148438, 0.00871896743774414, 0.009314537048339844, 0.009910106658935547, 0.01050567626953125, 0.011101245880126953, 0.011696815490722656, 0.01229238510131836, 0.012887954711914062, 0.013483524322509766, 0.014079093933105469, 0.014674663543701172, 0.015270233154296875, 0.015865802764892578, 0.01646137237548828, 0.017056941986083984, 0.017652511596679688, 0.01824808120727539, 0.018843650817871094, 0.019439220428466797, 0.0200347900390625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 7.0, 11.0, 6.0, 13.0, 24.0, 21.0, 27.0, 50.0, 51.0, 87.0, 86.0, 138.0, 169.0, 275.0, 311.0, 470.0, 633.0, 884.0, 1456.0, 2364.0, 4363.0, 10341.0, 40292.0, 930209.0, 35396.0, 9779.0, 4211.0, 2254.0, 1382.0, 924.0, 614.0, 453.0, 334.0, 237.0, 169.0, 118.0, 89.0, 80.0, 59.0, 51.0, 32.0, 18.0, 22.0, 9.0, 10.0, 15.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1636962890625, -0.1583232879638672, -0.15295028686523438, -0.14757728576660156, -0.14220428466796875, -0.13683128356933594, -0.13145828247070312, -0.1260852813720703, -0.1207122802734375, -0.11533927917480469, -0.10996627807617188, -0.10459327697753906, -0.09922027587890625, -0.09384727478027344, -0.08847427368164062, -0.08310127258300781, -0.077728271484375, -0.07235527038574219, -0.06698226928710938, -0.06160926818847656, -0.05623626708984375, -0.05086326599121094, -0.045490264892578125, -0.04011726379394531, -0.0347442626953125, -0.029371261596679688, -0.023998260498046875, -0.018625259399414062, -0.01325225830078125, -0.007879257202148438, -0.002506256103515625, 0.0028667449951171875, 0.00823974609375, 0.013612747192382812, 0.018985748291015625, 0.024358749389648438, 0.02973175048828125, 0.03510475158691406, 0.040477752685546875, 0.04585075378417969, 0.0512237548828125, 0.05659675598144531, 0.061969757080078125, 0.06734275817871094, 0.07271575927734375, 0.07808876037597656, 0.08346176147460938, 0.08883476257324219, 0.094207763671875, 0.09958076477050781, 0.10495376586914062, 0.11032676696777344, 0.11569976806640625, 0.12107276916503906, 0.12644577026367188, 0.1318187713623047, 0.1371917724609375, 0.1425647735595703, 0.14793777465820312, 0.15331077575683594, 0.15868377685546875, 0.16405677795410156, 0.16942977905273438, 0.1748027801513672, 0.18017578125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 5.0, 3.0, 7.0, 8.0, 13.0, 11.0, 6.0, 12.0, 18.0, 32.0, 71.0, 106.0, 220.0, 140.0, 108.0, 55.0, 46.0, 14.0, 11.0, 13.0, 6.0, 9.0, 6.0, 7.0, 5.0, 5.0, 5.0, 5.0, 5.0, 6.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-4.89354133605957e-05, -4.7489069402217865e-05, -4.604272544384003e-05, -4.459638148546219e-05, -4.315003752708435e-05, -4.170369356870651e-05, -4.0257349610328674e-05, -3.8811005651950836e-05, -3.7364661693573e-05, -3.591831773519516e-05, -3.447197377681732e-05, -3.3025629818439484e-05, -3.1579285860061646e-05, -3.0132941901683807e-05, -2.868659794330597e-05, -2.724025398492813e-05, -2.5793910026550293e-05, -2.4347566068172455e-05, -2.2901222109794617e-05, -2.145487815141678e-05, -2.000853419303894e-05, -1.8562190234661102e-05, -1.7115846276283264e-05, -1.5669502317905426e-05, -1.4223158359527588e-05, -1.277681440114975e-05, -1.1330470442771912e-05, -9.884126484394073e-06, -8.437782526016235e-06, -6.991438567638397e-06, -5.545094609260559e-06, -4.098750650882721e-06, -2.652406692504883e-06, -1.2060627341270447e-06, 2.4028122425079346e-07, 1.6866251826286316e-06, 3.1329691410064697e-06, 4.579313099384308e-06, 6.025657057762146e-06, 7.472001016139984e-06, 8.918344974517822e-06, 1.036468893289566e-05, 1.1811032891273499e-05, 1.3257376849651337e-05, 1.4703720808029175e-05, 1.6150064766407013e-05, 1.759640872478485e-05, 1.904275268316269e-05, 2.0489096641540527e-05, 2.1935440599918365e-05, 2.3381784558296204e-05, 2.4828128516674042e-05, 2.627447247505188e-05, 2.7720816433429718e-05, 2.9167160391807556e-05, 3.0613504350185394e-05, 3.205984830856323e-05, 3.350619226694107e-05, 3.495253622531891e-05, 3.639888018369675e-05, 3.7845224142074585e-05, 3.929156810045242e-05, 4.073791205883026e-05, 4.21842560172081e-05, 4.363059997558594e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 7.0, 8.0, 10.0, 10.0, 24.0, 47.0, 76.0, 135.0, 224.0, 574.0, 1190.0, 3092.0, 9025.0, 37594.0, 922527.0, 56179.0, 11369.0, 3695.0, 1475.0, 661.0, 295.0, 140.0, 86.0, 47.0, 23.0, 15.0, 12.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12481689453125, -0.1209878921508789, -0.11715888977050781, -0.11332988739013672, -0.10950088500976562, -0.10567188262939453, -0.10184288024902344, -0.09801387786865234, -0.09418487548828125, -0.09035587310791016, -0.08652687072753906, -0.08269786834716797, -0.07886886596679688, -0.07503986358642578, -0.07121086120605469, -0.0673818588256836, -0.0635528564453125, -0.059723854064941406, -0.05589485168457031, -0.05206584930419922, -0.048236846923828125, -0.04440784454345703, -0.04057884216308594, -0.036749839782714844, -0.03292083740234375, -0.029091835021972656, -0.025262832641601562, -0.02143383026123047, -0.017604827880859375, -0.013775825500488281, -0.009946823120117188, -0.006117820739746094, -0.002288818359375, 0.0015401840209960938, 0.0053691864013671875, 0.009198188781738281, 0.013027191162109375, 0.01685619354248047, 0.020685195922851562, 0.024514198303222656, 0.02834320068359375, 0.032172203063964844, 0.03600120544433594, 0.03983020782470703, 0.043659210205078125, 0.04748821258544922, 0.05131721496582031, 0.055146217346191406, 0.0589752197265625, 0.0628042221069336, 0.06663322448730469, 0.07046222686767578, 0.07429122924804688, 0.07812023162841797, 0.08194923400878906, 0.08577823638916016, 0.08960723876953125, 0.09343624114990234, 0.09726524353027344, 0.10109424591064453, 0.10492324829101562, 0.10875225067138672, 0.11258125305175781, 0.1164102554321289, 0.1202392578125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 3.0, 8.0, 8.0, 15.0, 19.0, 9.0, 22.0, 45.0, 50.0, 574.0, 80.0, 44.0, 28.0, 15.0, 19.0, 5.0, 9.0, 4.0, 8.0, 9.0, 3.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0178375244140625, -0.01727294921875, -0.0167083740234375, -0.016143798828125, -0.0155792236328125, -0.0150146484375, -0.0144500732421875, -0.013885498046875, -0.0133209228515625, -0.01275634765625, -0.0121917724609375, -0.011627197265625, -0.0110626220703125, -0.010498046875, -0.0099334716796875, -0.009368896484375, -0.0088043212890625, -0.00823974609375, -0.0076751708984375, -0.007110595703125, -0.0065460205078125, -0.0059814453125, -0.0054168701171875, -0.004852294921875, -0.0042877197265625, -0.00372314453125, -0.0031585693359375, -0.002593994140625, -0.0020294189453125, -0.00146484375, -0.0009002685546875, -0.000335693359375, 0.0002288818359375, 0.00079345703125, 0.0013580322265625, 0.001922607421875, 0.0024871826171875, 0.0030517578125, 0.0036163330078125, 0.004180908203125, 0.0047454833984375, 0.00531005859375, 0.0058746337890625, 0.006439208984375, 0.0070037841796875, 0.007568359375, 0.0081329345703125, 0.008697509765625, 0.0092620849609375, 0.00982666015625, 0.0103912353515625, 0.010955810546875, 0.0115203857421875, 0.0120849609375, 0.0126495361328125, 0.013214111328125, 0.0137786865234375, 0.01434326171875, 0.0149078369140625, 0.015472412109375, 0.0160369873046875, 0.0166015625, 0.0171661376953125, 0.017730712890625, 0.0182952880859375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 11.0, 22.0, 25.0, 35.0, 59.0, 122.0, 197.0, 149.0, 85.0, 76.0, 45.0, 28.0, 30.0, 20.0, 23.0, 10.0, 13.0, 5.0, 8.0, 14.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022606682032346725, -0.021328220143914223, -0.02004975825548172, -0.018771298229694366, -0.017492836341261864, -0.01621437445282936, -0.014935912564396858, -0.01365745160728693, -0.012378989718854427, -0.011100527830421925, -0.009822066873311996, -0.008543604984879494, -0.007265143562108278, -0.005986682139337063, -0.00470822025090456, -0.003429759293794632, -0.002151297405362129, -0.0008728358661755919, 0.0004056256730109453, 0.0016840873286128044, 0.00296254875138402, 0.004241010174155235, 0.005519472062587738, 0.006797933019697666, 0.008076394908130169, 0.009354856796562672, 0.0106333177536726, 0.011911779642105103, 0.013190241530537605, 0.014468702487647533, 0.01574716344475746, 0.017025625333189964, 0.018304087221622467, 0.01958254911005497, 0.020861010998487473, 0.022139471024274826, 0.02341793291270733, 0.02469639480113983, 0.025974856689572334, 0.027253318578004837, 0.02853177860379219, 0.029810240492224693, 0.031088702380657196, 0.03236716240644455, 0.0336456261575222, 0.034924086183309555, 0.03620254993438721, 0.03748100996017456, 0.038759469985961914, 0.04003793001174927, 0.04131639376282692, 0.04259485378861427, 0.043873317539691925, 0.04515177756547928, 0.04643023759126663, 0.047708701342344284, 0.048987165093421936, 0.05026562511920929, 0.05154408887028694, 0.052822548896074295, 0.05410101264715195, 0.0553794726729393, 0.056657932698726654, 0.057936396449804306, 0.05921485647559166]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 5.0, 2.0, 5.0, 8.0, 9.0, 7.0, 13.0, 11.0, 19.0, 21.0, 34.0, 23.0, 27.0, 35.0, 38.0, 37.0, 38.0, 33.0, 47.0, 44.0, 33.0, 46.0, 39.0, 47.0, 53.0, 34.0, 39.0, 43.0, 29.0, 33.0, 28.0, 21.0, 22.0, 19.0, 16.0, 12.0, 9.0, 9.0, 8.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024003896862268448, -0.023317359387874603, -0.02263082005083561, -0.021944280713796616, -0.02125774323940277, -0.020571205765008926, -0.019884666427969933, -0.01919812709093094, -0.018511589616537094, -0.01782505214214325, -0.017138512805104256, -0.016451973468065262, -0.015765435993671417, -0.015078897587954998, -0.014392359182238579, -0.01370582077652216, -0.01301928237080574, -0.012332743965089321, -0.011646205559372902, -0.010959667153656483, -0.010273128747940063, -0.009586590342223644, -0.008900051936507225, -0.008213513530790806, -0.007526975125074387, -0.006840436719357967, -0.006153898313641548, -0.005467359907925129, -0.00478082150220871, -0.0040942830964922905, -0.0034077446907758713, -0.002721206285059452, -0.002034667879343033, -0.0013481294736266136, -0.0006615910679101944, 2.4947337806224823e-05, 0.000711485743522644, 0.0013980241492390633, 0.0020845625549554825, 0.0027711009606719017, 0.003457639366388321, 0.00414417777210474, 0.004830716177821159, 0.005517254583537579, 0.006203792989253998, 0.006890331394970417, 0.007576869800686836, 0.008263408206403255, 0.008949946612119675, 0.009636485017836094, 0.010323023423552513, 0.011009561829268932, 0.011696100234985352, 0.01238263864070177, 0.01306917704641819, 0.01375571545213461, 0.014442253857851028, 0.015128792263567448, 0.015815330669283867, 0.01650187000632286, 0.017188407480716705, 0.01787494495511055, 0.018561484292149544, 0.019248023629188538, 0.019934561103582382]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 13.0, 22.0, 23.0, 44.0, 47.0, 85.0, 124.0, 172.0, 273.0, 382.0, 624.0, 983.0, 1497.0, 2368.0, 3887.0, 6309.0, 10548.0, 18360.0, 32870.0, 62272.0, 138847.0, 322393.0, 239200.0, 97523.0, 47336.0, 25583.0, 14444.0, 8713.0, 5077.0, 3076.0, 1946.0, 1215.0, 747.0, 498.0, 340.0, 245.0, 144.0, 90.0, 71.0, 49.0, 36.0, 28.0, 10.0, 9.0, 12.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.037445068359375, -0.03626728057861328, -0.03508949279785156, -0.033911705017089844, -0.032733917236328125, -0.031556129455566406, -0.030378341674804688, -0.02920055389404297, -0.02802276611328125, -0.02684497833251953, -0.025667190551757812, -0.024489402770996094, -0.023311614990234375, -0.022133827209472656, -0.020956039428710938, -0.01977825164794922, -0.0186004638671875, -0.01742267608642578, -0.016244888305664062, -0.015067100524902344, -0.013889312744140625, -0.012711524963378906, -0.011533737182617188, -0.010355949401855469, -0.00917816162109375, -0.008000373840332031, -0.0068225860595703125, -0.005644798278808594, -0.004467010498046875, -0.0032892227172851562, -0.0021114349365234375, -0.0009336471557617188, 0.000244140625, 0.0014219284057617188, 0.0025997161865234375, 0.0037775039672851562, 0.004955291748046875, 0.006133079528808594, 0.0073108673095703125, 0.008488655090332031, 0.00966644287109375, 0.010844230651855469, 0.012022018432617188, 0.013199806213378906, 0.014377593994140625, 0.015555381774902344, 0.016733169555664062, 0.01791095733642578, 0.0190887451171875, 0.02026653289794922, 0.021444320678710938, 0.022622108459472656, 0.023799896240234375, 0.024977684020996094, 0.026155471801757812, 0.02733325958251953, 0.02851104736328125, 0.02968883514404297, 0.030866622924804688, 0.032044410705566406, 0.033222198486328125, 0.034399986267089844, 0.03557777404785156, 0.03675556182861328, 0.037933349609375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 4.0, 11.0, 10.0, 12.0, 15.0, 17.0, 9.0, 28.0, 32.0, 31.0, 27.0, 37.0, 45.0, 42.0, 49.0, 42.0, 52.0, 44.0, 36.0, 51.0, 63.0, 51.0, 39.0, 29.0, 31.0, 34.0, 21.0, 28.0, 24.0, 20.0, 9.0, 13.0, 13.0, 5.0, 7.0, 3.0, 4.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0135498046875, -0.013156890869140625, -0.01276397705078125, -0.012371063232421875, -0.0119781494140625, -0.011585235595703125, -0.01119232177734375, -0.010799407958984375, -0.010406494140625, -0.010013580322265625, -0.00962066650390625, -0.009227752685546875, -0.0088348388671875, -0.008441925048828125, -0.00804901123046875, -0.007656097412109375, -0.00726318359375, -0.006870269775390625, -0.00647735595703125, -0.006084442138671875, -0.0056915283203125, -0.005298614501953125, -0.00490570068359375, -0.004512786865234375, -0.004119873046875, -0.003726959228515625, -0.00333404541015625, -0.002941131591796875, -0.0025482177734375, -0.002155303955078125, -0.00176239013671875, -0.001369476318359375, -0.0009765625, -0.000583648681640625, -0.00019073486328125, 0.000202178955078125, 0.0005950927734375, 0.000988006591796875, 0.00138092041015625, 0.001773834228515625, 0.002166748046875, 0.002559661865234375, 0.00295257568359375, 0.003345489501953125, 0.0037384033203125, 0.004131317138671875, 0.00452423095703125, 0.004917144775390625, 0.00531005859375, 0.005702972412109375, 0.00609588623046875, 0.006488800048828125, 0.0068817138671875, 0.007274627685546875, 0.00766754150390625, 0.008060455322265625, 0.008453369140625, 0.008846282958984375, 0.00923919677734375, 0.009632110595703125, 0.0100250244140625, 0.010417938232421875, 0.01081085205078125, 0.011203765869140625, 0.0115966796875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 10.0, 10.0, 17.0, 18.0, 28.0, 37.0, 67.0, 83.0, 165.0, 270.0, 563.0, 1131.0, 2528.0, 6192.0, 17095.0, 52531.0, 197695.0, 545492.0, 156627.0, 43691.0, 14545.0, 5290.0, 2243.0, 1029.0, 513.0, 270.0, 140.0, 84.0, 50.0, 43.0, 26.0, 22.0, 6.0, 11.0, 7.0, 3.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.056671142578125, -0.05497550964355469, -0.053279876708984375, -0.05158424377441406, -0.04988861083984375, -0.04819297790527344, -0.046497344970703125, -0.04480171203613281, -0.0431060791015625, -0.04141044616699219, -0.039714813232421875, -0.03801918029785156, -0.03632354736328125, -0.03462791442871094, -0.032932281494140625, -0.031236648559570312, -0.029541015625, -0.027845382690429688, -0.026149749755859375, -0.024454116821289062, -0.02275848388671875, -0.021062850952148438, -0.019367218017578125, -0.017671585083007812, -0.0159759521484375, -0.014280319213867188, -0.012584686279296875, -0.010889053344726562, -0.00919342041015625, -0.0074977874755859375, -0.005802154541015625, -0.0041065216064453125, -0.002410888671875, -0.0007152557373046875, 0.000980377197265625, 0.0026760101318359375, 0.00437164306640625, 0.0060672760009765625, 0.007762908935546875, 0.009458541870117188, 0.0111541748046875, 0.012849807739257812, 0.014545440673828125, 0.016241073608398438, 0.01793670654296875, 0.019632339477539062, 0.021327972412109375, 0.023023605346679688, 0.02471923828125, 0.026414871215820312, 0.028110504150390625, 0.029806137084960938, 0.03150177001953125, 0.03319740295410156, 0.034893035888671875, 0.03658866882324219, 0.0382843017578125, 0.03997993469238281, 0.041675567626953125, 0.04337120056152344, 0.04506683349609375, 0.04676246643066406, 0.048458099365234375, 0.05015373229980469, 0.051849365234375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 3.0, 10.0, 6.0, 25.0, 16.0, 24.0, 21.0, 36.0, 42.0, 32.0, 39.0, 48.0, 38.0, 66.0, 45.0, 44.0, 43.0, 52.0, 47.0, 48.0, 44.0, 30.0, 42.0, 27.0, 24.0, 26.0, 22.0, 20.0, 16.0, 9.0, 17.0, 7.0, 3.0, 7.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01081085205078125, -0.0104827880859375, -0.01015472412109375, -0.00982666015625, -0.00949859619140625, -0.0091705322265625, -0.00884246826171875, -0.008514404296875, -0.00818634033203125, -0.0078582763671875, -0.00753021240234375, -0.0072021484375, -0.00687408447265625, -0.0065460205078125, -0.00621795654296875, -0.005889892578125, -0.00556182861328125, -0.0052337646484375, -0.00490570068359375, -0.00457763671875, -0.00424957275390625, -0.0039215087890625, -0.00359344482421875, -0.003265380859375, -0.00293731689453125, -0.0026092529296875, -0.00228118896484375, -0.001953125, -0.00162506103515625, -0.0012969970703125, -0.00096893310546875, -0.000640869140625, -0.00031280517578125, 1.52587890625e-05, 0.00034332275390625, 0.00067138671875, 0.00099945068359375, 0.0013275146484375, 0.00165557861328125, 0.001983642578125, 0.00231170654296875, 0.0026397705078125, 0.00296783447265625, 0.0032958984375, 0.00362396240234375, 0.0039520263671875, 0.00428009033203125, 0.004608154296875, 0.00493621826171875, 0.0052642822265625, 0.00559234619140625, 0.00592041015625, 0.00624847412109375, 0.0065765380859375, 0.00690460205078125, 0.007232666015625, 0.00756072998046875, 0.0078887939453125, 0.00821685791015625, 0.008544921875, 0.00887298583984375, 0.0092010498046875, 0.00952911376953125, 0.009857177734375, 0.01018524169921875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 5.0, 8.0, 3.0, 26.0, 26.0, 31.0, 36.0, 86.0, 122.0, 174.0, 273.0, 467.0, 846.0, 1714.0, 3957.0, 11176.0, 45959.0, 632876.0, 303002.0, 32356.0, 8702.0, 3272.0, 1487.0, 737.0, 429.0, 264.0, 160.0, 107.0, 78.0, 50.0, 30.0, 20.0, 17.0, 15.0, 5.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0009851455688476562, -0.0009532570838928223, -0.0009213685989379883, -0.0008894801139831543, -0.0008575916290283203, -0.0008257031440734863, -0.0007938146591186523, -0.0007619261741638184, -0.0007300376892089844, -0.0006981492042541504, -0.0006662607192993164, -0.0006343722343444824, -0.0006024837493896484, -0.0005705952644348145, -0.0005387067794799805, -0.0005068182945251465, -0.0004749298095703125, -0.0004430413246154785, -0.00041115283966064453, -0.00037926435470581055, -0.00034737586975097656, -0.0003154873847961426, -0.0002835988998413086, -0.0002517104148864746, -0.00021982192993164062, -0.00018793344497680664, -0.00015604496002197266, -0.00012415647506713867, -9.226799011230469e-05, -6.03795051574707e-05, -2.849102020263672e-05, 3.3974647521972656e-06, 3.528594970703125e-05, 6.717443466186523e-05, 9.906291961669922e-05, 0.0001309514045715332, 0.0001628398895263672, 0.00019472837448120117, 0.00022661685943603516, 0.00025850534439086914, 0.0002903938293457031, 0.0003222823143005371, 0.0003541707992553711, 0.0003860592842102051, 0.00041794776916503906, 0.00044983625411987305, 0.00048172473907470703, 0.000513613224029541, 0.000545501708984375, 0.000577390193939209, 0.000609278678894043, 0.000641167163848877, 0.0006730556488037109, 0.0007049441337585449, 0.0007368326187133789, 0.0007687211036682129, 0.0008006095886230469, 0.0008324980735778809, 0.0008643865585327148, 0.0008962750434875488, 0.0009281635284423828, 0.0009600520133972168, 0.0009919404983520508, 0.0010238289833068848, 0.0010557174682617188]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 4.0, 9.0, 10.0, 14.0, 21.0, 15.0, 21.0, 36.0, 49.0, 62.0, 78.0, 97.0, 145.0, 127.0, 80.0, 39.0, 40.0, 25.0, 23.0, 18.0, 12.0, 11.0, 9.0, 12.0, 8.0, 2.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.5795230865478516e-05, -1.53491273522377e-05, -1.4903023838996887e-05, -1.4456920325756073e-05, -1.4010816812515259e-05, -1.3564713299274445e-05, -1.311860978603363e-05, -1.2672506272792816e-05, -1.2226402759552002e-05, -1.1780299246311188e-05, -1.1334195733070374e-05, -1.088809221982956e-05, -1.0441988706588745e-05, -9.995885193347931e-06, -9.549781680107117e-06, -9.103678166866302e-06, -8.657574653625488e-06, -8.211471140384674e-06, -7.76536762714386e-06, -7.319264113903046e-06, -6.8731606006622314e-06, -6.427057087421417e-06, -5.980953574180603e-06, -5.534850060939789e-06, -5.088746547698975e-06, -4.64264303445816e-06, -4.196539521217346e-06, -3.750436007976532e-06, -3.3043324947357178e-06, -2.8582289814949036e-06, -2.4121254682540894e-06, -1.966021955013275e-06, -1.519918441772461e-06, -1.0738149285316467e-06, -6.277114152908325e-07, -1.816079020500183e-07, 2.644956111907959e-07, 7.105991244316101e-07, 1.1567026376724243e-06, 1.6028061509132385e-06, 2.0489096641540527e-06, 2.495013177394867e-06, 2.941116690635681e-06, 3.3872202038764954e-06, 3.8333237171173096e-06, 4.279427230358124e-06, 4.725530743598938e-06, 5.171634256839752e-06, 5.617737770080566e-06, 6.063841283321381e-06, 6.509944796562195e-06, 6.956048309803009e-06, 7.402151823043823e-06, 7.848255336284637e-06, 8.294358849525452e-06, 8.740462362766266e-06, 9.18656587600708e-06, 9.632669389247894e-06, 1.0078772902488708e-05, 1.0524876415729523e-05, 1.0970979928970337e-05, 1.1417083442211151e-05, 1.1863186955451965e-05, 1.230929046869278e-05, 1.2755393981933594e-05]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 3.0, 7.0, 9.0, 17.0, 25.0, 46.0, 84.0, 172.0, 260.0, 640.0, 1555.0, 4379.0, 15029.0, 72452.0, 651687.0, 254185.0, 34664.0, 8619.0, 2676.0, 1100.0, 475.0, 211.0, 104.0, 56.0, 20.0, 21.0, 14.0, 16.0, 6.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0005612373352050781, -0.0005455538630485535, -0.0005298703908920288, -0.0005141869187355042, -0.0004985034465789795, -0.00048281997442245483, -0.0004671365022659302, -0.0004514530301094055, -0.00043576955795288086, -0.0004200860857963562, -0.00040440261363983154, -0.0003887191414833069, -0.0003730356693267822, -0.00035735219717025757, -0.0003416687250137329, -0.00032598525285720825, -0.0003103017807006836, -0.00029461830854415894, -0.0002789348363876343, -0.0002632513642311096, -0.00024756789207458496, -0.0002318844199180603, -0.00021620094776153564, -0.00020051747560501099, -0.00018483400344848633, -0.00016915053129196167, -0.000153467059135437, -0.00013778358697891235, -0.0001221001148223877, -0.00010641664266586304, -9.073317050933838e-05, -7.504969835281372e-05, -5.936622619628906e-05, -4.3682754039764404e-05, -2.7999281883239746e-05, -1.2315809726715088e-05, 3.3676624298095703e-06, 1.905113458633423e-05, 3.473460674285889e-05, 5.0418078899383545e-05, 6.61015510559082e-05, 8.178502321243286e-05, 9.746849536895752e-05, 0.00011315196752548218, 0.00012883543968200684, 0.0001445189118385315, 0.00016020238399505615, 0.0001758858561515808, 0.00019156932830810547, 0.00020725280046463013, 0.00022293627262115479, 0.00023861974477767944, 0.0002543032169342041, 0.00026998668909072876, 0.0002856701612472534, 0.0003013536334037781, 0.00031703710556030273, 0.0003327205777168274, 0.00034840404987335205, 0.0003640875220298767, 0.00037977099418640137, 0.000395454466342926, 0.0004111379384994507, 0.00042682141065597534, 0.0004425048828125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 3.0, 7.0, 5.0, 14.0, 9.0, 8.0, 8.0, 30.0, 24.0, 39.0, 49.0, 58.0, 63.0, 79.0, 75.0, 79.0, 69.0, 85.0, 47.0, 56.0, 36.0, 38.0, 28.0, 19.0, 14.0, 11.0, 14.0, 7.0, 11.0, 5.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.468461990356445e-05, -7.206015288829803e-05, -6.943568587303162e-05, -6.68112188577652e-05, -6.418675184249878e-05, -6.156228482723236e-05, -5.893781781196594e-05, -5.6313350796699524e-05, -5.3688883781433105e-05, -5.106441676616669e-05, -4.843994975090027e-05, -4.581548273563385e-05, -4.319101572036743e-05, -4.056654870510101e-05, -3.7942081689834595e-05, -3.5317614674568176e-05, -3.269314765930176e-05, -3.006868064403534e-05, -2.744421362876892e-05, -2.4819746613502502e-05, -2.2195279598236084e-05, -1.9570812582969666e-05, -1.6946345567703247e-05, -1.4321878552436829e-05, -1.169741153717041e-05, -9.072944521903992e-06, -6.448477506637573e-06, -3.824010491371155e-06, -1.1995434761047363e-06, 1.4249235391616821e-06, 4.049390554428101e-06, 6.673857569694519e-06, 9.298324584960938e-06, 1.1922791600227356e-05, 1.4547258615493774e-05, 1.7171725630760193e-05, 1.979619264602661e-05, 2.242065966129303e-05, 2.5045126676559448e-05, 2.7669593691825867e-05, 3.0294060707092285e-05, 3.2918527722358704e-05, 3.554299473762512e-05, 3.816746175289154e-05, 4.079192876815796e-05, 4.341639578342438e-05, 4.6040862798690796e-05, 4.8665329813957214e-05, 5.128979682922363e-05, 5.391426384449005e-05, 5.653873085975647e-05, 5.916319787502289e-05, 6.17876648902893e-05, 6.441213190555573e-05, 6.703659892082214e-05, 6.966106593608856e-05, 7.228553295135498e-05, 7.49099999666214e-05, 7.753446698188782e-05, 8.015893399715424e-05, 8.278340101242065e-05, 8.540786802768707e-05, 8.803233504295349e-05, 9.065680205821991e-05, 9.328126907348633e-05]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 5.0, 11.0, 14.0, 24.0, 32.0, 59.0, 128.0, 246.0, 229.0, 108.0, 58.0, 35.0, 22.0, 11.0, 11.0, 9.0, 3.0, 3.0, 1.0, 3.0], "bins": [-0.08181358128786087, -0.0802389532327652, -0.07866431772708893, -0.07708968967199326, -0.07551505416631699, -0.07394042611122131, -0.07236579805612564, -0.07079116255044937, -0.0692165344953537, -0.06764190644025803, -0.06606727093458176, -0.06449264287948608, -0.06291800737380981, -0.06134337931871414, -0.05976874753832817, -0.0581941157579422, -0.05661948770284653, -0.055044855922460556, -0.053470224142074585, -0.05189559608697891, -0.05032096430659294, -0.04874633252620697, -0.047171700745821, -0.04559706896543503, -0.04402243718504906, -0.042447805404663086, -0.040873173624277115, -0.03929854556918144, -0.03772391378879547, -0.0361492820084095, -0.03457465022802353, -0.033000022172927856, -0.031425394117832184, -0.029850762337446213, -0.02827613241970539, -0.02670150063931942, -0.025126870721578598, -0.023552238941192627, -0.021977607160806656, -0.020402977243065834, -0.018828343600034714, -0.017253711819648743, -0.01567908190190792, -0.01410445012152195, -0.012529820203781128, -0.010955188423395157, -0.00938055757433176, -0.007805926725268364, -0.006231296807527542, -0.004656665958464146, -0.0030820348765701056, -0.0015074037946760654, 6.722705438733101e-05, 0.0016418583691120148, 0.0032164892181754112, 0.004791120067238808, 0.006365750916302204, 0.0079403817653656, 0.009515012614428997, 0.011089643463492393, 0.012664275243878365, 0.014238906092941761, 0.015813536942005157, 0.01738816872239113, 0.01896279864013195]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 15.0, 6.0, 8.0, 12.0, 12.0, 13.0, 18.0, 26.0, 22.0, 17.0, 29.0, 30.0, 28.0, 42.0, 38.0, 40.0, 40.0, 33.0, 36.0, 43.0, 45.0, 35.0, 52.0, 53.0, 46.0, 37.0, 27.0, 33.0, 21.0, 24.0, 18.0, 16.0, 23.0, 14.0, 7.0, 12.0, 9.0, 10.0, 2.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.015803804621100426, -0.015293308533728123, -0.014782813377678394, -0.014272317290306091, -0.013761822134256363, -0.01325132604688406, -0.012740829959511757, -0.012230334803462029, -0.0117198396474123, -0.011209343560039997, -0.010698848403990269, -0.010188352316617966, -0.009677857160568237, -0.009167361073195934, -0.008656864985823631, -0.008146369829773903, -0.0076358737424016, -0.007125378120690584, -0.0066148824989795685, -0.0061043864116072655, -0.005593891255557537, -0.005083395168185234, -0.004572899546474218, -0.004062403924763203, -0.003551908303052187, -0.0030414126813411713, -0.0025309170596301556, -0.002020421205088496, -0.0015099255833774805, -0.0009994299616664648, -0.0004889341071248055, 2.156151458621025e-05, 0.000532057136297226, 0.0010425527580082417, 0.0015530484961345792, 0.0020635442342609167, 0.0025740398559719324, 0.003084535477682948, 0.0035950313322246075, 0.004105526953935623, 0.004616022575646639, 0.005126518197357655, 0.00563701381906867, 0.006147509440779686, 0.006658005528151989, 0.007168500684201717, 0.00767899677157402, 0.008189491927623749, 0.008699988014996052, 0.009210484102368355, 0.009720979258418083, 0.010231475345790386, 0.010741970501840115, 0.011252466589212418, 0.011762961745262146, 0.012273457832634449, 0.012783953920006752, 0.013294450007379055, 0.013804945163428783, 0.014315441250801086, 0.014825936406850815, 0.015336432494223118, 0.01584692858159542, 0.01635742373764515, 0.016867918893694878]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 8.0, 22.0, 23.0, 42.0, 56.0, 56.0, 74.0, 113.0, 134.0, 213.0, 315.0, 525.0, 926.0, 1668.0, 4869.0, 4156216.0, 24091.0, 2124.0, 1052.0, 594.0, 377.0, 230.0, 153.0, 84.0, 94.0, 56.0, 38.0, 42.0, 25.0, 19.0, 9.0, 10.0, 2.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.061859130859375, -0.0600733757019043, -0.058287620544433594, -0.05650186538696289, -0.05471611022949219, -0.052930355072021484, -0.05114459991455078, -0.04935884475708008, -0.047573089599609375, -0.04578733444213867, -0.04400157928466797, -0.042215824127197266, -0.04043006896972656, -0.03864431381225586, -0.036858558654785156, -0.03507280349731445, -0.03328704833984375, -0.03150129318237305, -0.029715538024902344, -0.02792978286743164, -0.026144027709960938, -0.024358272552490234, -0.02257251739501953, -0.020786762237548828, -0.019001007080078125, -0.017215251922607422, -0.015429496765136719, -0.013643741607666016, -0.011857986450195312, -0.01007223129272461, -0.008286476135253906, -0.006500720977783203, -0.0047149658203125, -0.002929210662841797, -0.0011434555053710938, 0.0006422996520996094, 0.0024280548095703125, 0.004213809967041016, 0.005999565124511719, 0.007785320281982422, 0.009571075439453125, 0.011356830596923828, 0.013142585754394531, 0.014928340911865234, 0.016714096069335938, 0.01849985122680664, 0.020285606384277344, 0.022071361541748047, 0.02385711669921875, 0.025642871856689453, 0.027428627014160156, 0.02921438217163086, 0.031000137329101562, 0.032785892486572266, 0.03457164764404297, 0.03635740280151367, 0.038143157958984375, 0.03992891311645508, 0.04171466827392578, 0.043500423431396484, 0.04528617858886719, 0.04707193374633789, 0.048857688903808594, 0.0506434440612793, 0.05242919921875]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 6.0, 15.0, 10.0, 18.0, 21.0, 33.0, 21.0, 28.0, 28.0, 36.0, 37.0, 43.0, 51.0, 43.0, 49.0, 62.0, 52.0, 46.0, 50.0, 44.0, 58.0, 43.0, 41.0, 25.0, 28.0, 20.0, 14.0, 21.0, 15.0, 12.0, 10.0, 7.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0158843994140625, -0.01542806625366211, -0.014971733093261719, -0.014515399932861328, -0.014059066772460938, -0.013602733612060547, -0.013146400451660156, -0.012690067291259766, -0.012233734130859375, -0.011777400970458984, -0.011321067810058594, -0.010864734649658203, -0.010408401489257812, -0.009952068328857422, -0.009495735168457031, -0.00903940200805664, -0.00858306884765625, -0.00812673568725586, -0.007670402526855469, -0.007214069366455078, -0.0067577362060546875, -0.006301403045654297, -0.005845069885253906, -0.005388736724853516, -0.004932403564453125, -0.004476070404052734, -0.004019737243652344, -0.003563404083251953, -0.0031070709228515625, -0.002650737762451172, -0.0021944046020507812, -0.0017380714416503906, -0.00128173828125, -0.0008254051208496094, -0.00036907196044921875, 8.726119995117188e-05, 0.0005435943603515625, 0.0009999275207519531, 0.0014562606811523438, 0.0019125938415527344, 0.002368927001953125, 0.0028252601623535156, 0.0032815933227539062, 0.003737926483154297, 0.0041942596435546875, 0.004650592803955078, 0.005106925964355469, 0.005563259124755859, 0.00601959228515625, 0.006475925445556641, 0.006932258605957031, 0.007388591766357422, 0.007844924926757812, 0.008301258087158203, 0.008757591247558594, 0.009213924407958984, 0.009670257568359375, 0.010126590728759766, 0.010582923889160156, 0.011039257049560547, 0.011495590209960938, 0.011951923370361328, 0.012408256530761719, 0.01286458969116211, 0.0133209228515625]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 9.0, 9.0, 6.0, 22.0, 31.0, 62.0, 95.0, 150.0, 273.0, 547.0, 1378.0, 4868.0, 3960640.0, 220216.0, 3707.0, 1147.0, 496.0, 256.0, 148.0, 83.0, 56.0, 35.0, 23.0, 12.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.052642822265625, -0.050241947174072266, -0.04784107208251953, -0.0454401969909668, -0.04303932189941406, -0.04063844680786133, -0.038237571716308594, -0.03583669662475586, -0.033435821533203125, -0.03103494644165039, -0.028634071350097656, -0.026233196258544922, -0.023832321166992188, -0.021431446075439453, -0.01903057098388672, -0.016629695892333984, -0.01422882080078125, -0.011827945709228516, -0.009427070617675781, -0.007026195526123047, -0.0046253204345703125, -0.002224445343017578, 0.00017642974853515625, 0.0025773048400878906, 0.004978179931640625, 0.007379055023193359, 0.009779930114746094, 0.012180805206298828, 0.014581680297851562, 0.016982555389404297, 0.01938343048095703, 0.021784305572509766, 0.0241851806640625, 0.026586055755615234, 0.02898693084716797, 0.0313878059387207, 0.03378868103027344, 0.03618955612182617, 0.038590431213378906, 0.04099130630493164, 0.043392181396484375, 0.04579305648803711, 0.048193931579589844, 0.05059480667114258, 0.05299568176269531, 0.05539655685424805, 0.05779743194580078, 0.060198307037353516, 0.06259918212890625, 0.06500005722045898, 0.06740093231201172, 0.06980180740356445, 0.07220268249511719, 0.07460355758666992, 0.07700443267822266, 0.07940530776977539, 0.08180618286132812, 0.08420705795288086, 0.0866079330444336, 0.08900880813598633, 0.09140968322753906, 0.0938105583190918, 0.09621143341064453, 0.09861230850219727, 0.10101318359375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 13.0, 24.0, 43.0, 171.0, 3244.0, 410.0, 105.0, 34.0, 14.0, 9.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0124053955078125, -0.012134253978729248, -0.011863112449645996, -0.011591970920562744, -0.011320829391479492, -0.01104968786239624, -0.010778546333312988, -0.010507404804229736, -0.010236263275146484, -0.009965121746063232, -0.00969398021697998, -0.009422838687896729, -0.009151697158813477, -0.008880555629730225, -0.008609414100646973, -0.00833827257156372, -0.008067131042480469, -0.007795989513397217, -0.007524847984313965, -0.007253706455230713, -0.006982564926147461, -0.006711423397064209, -0.006440281867980957, -0.006169140338897705, -0.005897998809814453, -0.005626857280731201, -0.005355715751647949, -0.005084574222564697, -0.004813432693481445, -0.004542291164398193, -0.004271149635314941, -0.0040000081062316895, -0.0037288665771484375, -0.0034577250480651855, -0.0031865835189819336, -0.0029154419898986816, -0.0026443004608154297, -0.0023731589317321777, -0.0021020174026489258, -0.0018308758735656738, -0.0015597343444824219, -0.00128859281539917, -0.001017451286315918, -0.000746309757232666, -0.00047516822814941406, -0.0002040266990661621, 6.711483001708984e-05, 0.0003382563591003418, 0.0006093978881835938, 0.0008805394172668457, 0.0011516809463500977, 0.0014228224754333496, 0.0016939640045166016, 0.0019651055335998535, 0.0022362470626831055, 0.0025073885917663574, 0.0027785301208496094, 0.0030496716499328613, 0.0033208131790161133, 0.0035919547080993652, 0.003863096237182617, 0.004134237766265869, 0.004405379295349121, 0.004676520824432373, 0.004947662353515625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 4.0, 11.0, 13.0, 12.0, 5.0, 7.0, 12.0, 25.0, 36.0, 43.0, 41.0, 71.0, 98.0, 134.0, 116.0, 72.0, 64.0, 45.0, 22.0, 34.0, 25.0, 15.0, 13.0, 10.0, 9.0, 9.0, 5.0, 6.0, 5.0, 6.0, 2.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015324462205171585, -0.014842480421066284, -0.014360497705638409, -0.013878515921533108, -0.013396533206105232, -0.012914551421999931, -0.01243256963789463, -0.01195058785378933, -0.011468605138361454, -0.010986623354256153, -0.010504640638828278, -0.010022658854722977, -0.009540677070617676, -0.0090586943551898, -0.0085767125710845, -0.008094729855656624, -0.007612748071551323, -0.007130765821784735, -0.0066487835720181465, -0.006166801787912846, -0.005684819538146257, -0.005202837288379669, -0.004720855504274368, -0.00423887325450778, -0.003756891004741192, -0.0032749087549746037, -0.002792926738038659, -0.0023109447211027145, -0.0018289624713361263, -0.0013469802215695381, -0.0008649982046335936, -0.000383016187697649, 9.89651307463646e-05, 0.000580947264097631, 0.0010629293974488974, 0.0015449115308001637, 0.00202689366415143, 0.0025088759139180183, 0.002990857930853963, 0.0034728399477899075, 0.003954822197556496, 0.004436804447323084, 0.004918786697089672, 0.005400768481194973, 0.005882750730961561, 0.006364732980728149, 0.00684671476483345, 0.0073286970146000385, 0.007810679264366627, 0.008292661048471928, 0.008774643763899803, 0.009256625548005104, 0.009738607332110405, 0.01022059004753828, 0.010702571831643581, 0.011184554547071457, 0.011666536331176758, 0.012148518115282059, 0.012630500830709934, 0.013112482614815235, 0.01359446533024311, 0.014076447114348412, 0.014558428898453712, 0.015040410682559013, 0.015522393397986889]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 15.0, 6.0, 9.0, 6.0, 12.0, 19.0, 17.0, 24.0, 13.0, 25.0, 28.0, 38.0, 38.0, 25.0, 40.0, 38.0, 46.0, 42.0, 35.0, 49.0, 53.0, 45.0, 45.0, 40.0, 35.0, 37.0, 35.0, 26.0, 20.0, 27.0, 21.0, 15.0, 16.0, 13.0, 11.0, 10.0, 5.0, 8.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012058166787028313, -0.011667068116366863, -0.011275969445705414, -0.010884870775043964, -0.010493772104382515, -0.010102673433721066, -0.009711574763059616, -0.009320475161075592, -0.008929377421736717, -0.008538278751075268, -0.008147180080413818, -0.007756081409752369, -0.0073649827390909195, -0.00697388406842947, -0.006582784932106733, -0.006191686261445284, -0.005800587125122547, -0.005409488454461098, -0.005018389783799648, -0.004627291113138199, -0.004236192442476749, -0.0038450935389846563, -0.0034539946354925632, -0.003062895964831114, -0.0026717972941696644, -0.002280698623508215, -0.0018895998364314437, -0.0014985010493546724, -0.001107402378693223, -0.0007163037080317736, -0.0003252048045396805, 6.589386612176895e-05, 0.0004569925367832184, 0.0008480912656523287, 0.001239189994521439, 0.0016302887815982103, 0.0020213874522596598, 0.002412486122921109, 0.0028035850264132023, 0.0031946836970746517, 0.003585782367736101, 0.003976881038397551, 0.004367979709059, 0.004759078845381737, 0.005150177516043186, 0.005541276186704636, 0.005932374857366085, 0.0063234735280275345, 0.006714572198688984, 0.007105670869350433, 0.007496769540011883, 0.007887868210673332, 0.008278966881334782, 0.008670065551996231, 0.009061165153980255, 0.00945226289331913, 0.009843362495303154, 0.010234461165964603, 0.010625559836626053, 0.011016658507287502, 0.011407757177948952, 0.011798855848610401, 0.01218995451927185, 0.012581054121255875, 0.01297215186059475]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 10.0, 12.0, 12.0, 38.0, 28.0, 50.0, 67.0, 92.0, 131.0, 201.0, 267.0, 381.0, 540.0, 760.0, 1147.0, 1743.0, 2677.0, 4355.0, 7574.0, 13391.0, 25996.0, 55379.0, 137410.0, 415115.0, 223961.0, 79748.0, 34979.0, 17620.0, 9692.0, 5470.0, 3236.0, 2067.0, 1331.0, 905.0, 629.0, 416.0, 336.0, 224.0, 172.0, 127.0, 84.0, 50.0, 45.0, 36.0, 16.0, 10.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.021087646484375, -0.020422697067260742, -0.019757747650146484, -0.019092798233032227, -0.01842784881591797, -0.01776289939880371, -0.017097949981689453, -0.016433000564575195, -0.015768051147460938, -0.01510310173034668, -0.014438152313232422, -0.013773202896118164, -0.013108253479003906, -0.012443304061889648, -0.01177835464477539, -0.011113405227661133, -0.010448455810546875, -0.009783506393432617, -0.00911855697631836, -0.008453607559204102, -0.007788658142089844, -0.007123708724975586, -0.006458759307861328, -0.00579380989074707, -0.0051288604736328125, -0.004463911056518555, -0.003798961639404297, -0.003134012222290039, -0.0024690628051757812, -0.0018041133880615234, -0.0011391639709472656, -0.0004742145538330078, 0.00019073486328125, 0.0008556842803955078, 0.0015206336975097656, 0.0021855831146240234, 0.0028505325317382812, 0.003515481948852539, 0.004180431365966797, 0.004845380783081055, 0.0055103302001953125, 0.00617527961730957, 0.006840229034423828, 0.007505178451538086, 0.008170127868652344, 0.008835077285766602, 0.00950002670288086, 0.010164976119995117, 0.010829925537109375, 0.011494874954223633, 0.01215982437133789, 0.012824773788452148, 0.013489723205566406, 0.014154672622680664, 0.014819622039794922, 0.01548457145690918, 0.016149520874023438, 0.016814470291137695, 0.017479419708251953, 0.01814436912536621, 0.01880931854248047, 0.019474267959594727, 0.020139217376708984, 0.020804166793823242, 0.0214691162109375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 7.0, 3.0, 4.0, 7.0, 8.0, 13.0, 13.0, 15.0, 17.0, 14.0, 21.0, 24.0, 31.0, 36.0, 32.0, 36.0, 48.0, 42.0, 46.0, 41.0, 40.0, 53.0, 49.0, 56.0, 57.0, 28.0, 33.0, 34.0, 40.0, 23.0, 16.0, 27.0, 21.0, 15.0, 11.0, 6.0, 10.0, 6.0, 6.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01233673095703125, -0.011946320533752441, -0.011555910110473633, -0.011165499687194824, -0.010775089263916016, -0.010384678840637207, -0.009994268417358398, -0.00960385799407959, -0.009213447570800781, -0.008823037147521973, -0.008432626724243164, -0.008042216300964355, -0.007651805877685547, -0.007261395454406738, -0.00687098503112793, -0.006480574607849121, -0.0060901641845703125, -0.005699753761291504, -0.005309343338012695, -0.004918932914733887, -0.004528522491455078, -0.0041381120681762695, -0.003747701644897461, -0.0033572912216186523, -0.0029668807983398438, -0.002576470375061035, -0.0021860599517822266, -0.001795649528503418, -0.0014052391052246094, -0.0010148286819458008, -0.0006244182586669922, -0.0002340078353881836, 0.000156402587890625, 0.0005468130111694336, 0.0009372234344482422, 0.0013276338577270508, 0.0017180442810058594, 0.002108454704284668, 0.0024988651275634766, 0.002889275550842285, 0.0032796859741210938, 0.0036700963973999023, 0.004060506820678711, 0.0044509172439575195, 0.004841327667236328, 0.005231738090515137, 0.005622148513793945, 0.006012558937072754, 0.0064029693603515625, 0.006793379783630371, 0.00718379020690918, 0.007574200630187988, 0.007964611053466797, 0.008355021476745605, 0.008745431900024414, 0.009135842323303223, 0.009526252746582031, 0.00991666316986084, 0.010307073593139648, 0.010697484016418457, 0.011087894439697266, 0.011478304862976074, 0.011868715286254883, 0.012259125709533691, 0.0126495361328125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 5.0, 6.0, 9.0, 4.0, 10.0, 15.0, 27.0, 42.0, 40.0, 51.0, 82.0, 117.0, 194.0, 245.0, 385.0, 513.0, 853.0, 1442.0, 2167.0, 3709.0, 6549.0, 12302.0, 26570.0, 75345.0, 605284.0, 220576.0, 48783.0, 19927.0, 9847.0, 5285.0, 2887.0, 1889.0, 1104.0, 768.0, 457.0, 323.0, 215.0, 146.0, 101.0, 89.0, 58.0, 37.0, 17.0, 12.0, 20.0, 17.0, 11.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.03729248046875, -0.03618955612182617, -0.035086631774902344, -0.033983707427978516, -0.03288078308105469, -0.03177785873413086, -0.03067493438720703, -0.029572010040283203, -0.028469085693359375, -0.027366161346435547, -0.02626323699951172, -0.02516031265258789, -0.024057388305664062, -0.022954463958740234, -0.021851539611816406, -0.020748615264892578, -0.01964569091796875, -0.018542766571044922, -0.017439842224121094, -0.016336917877197266, -0.015233993530273438, -0.01413106918334961, -0.013028144836425781, -0.011925220489501953, -0.010822296142578125, -0.009719371795654297, -0.008616447448730469, -0.007513523101806641, -0.0064105987548828125, -0.005307674407958984, -0.004204750061035156, -0.003101825714111328, -0.0019989013671875, -0.0008959770202636719, 0.00020694732666015625, 0.0013098716735839844, 0.0024127960205078125, 0.0035157203674316406, 0.004618644714355469, 0.005721569061279297, 0.006824493408203125, 0.007927417755126953, 0.009030342102050781, 0.01013326644897461, 0.011236190795898438, 0.012339115142822266, 0.013442039489746094, 0.014544963836669922, 0.01564788818359375, 0.016750812530517578, 0.017853736877441406, 0.018956661224365234, 0.020059585571289062, 0.02116250991821289, 0.02226543426513672, 0.023368358612060547, 0.024471282958984375, 0.025574207305908203, 0.02667713165283203, 0.02778005599975586, 0.028882980346679688, 0.029985904693603516, 0.031088829040527344, 0.03219175338745117, 0.033294677734375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 8.0, 4.0, 7.0, 10.0, 5.0, 12.0, 9.0, 10.0, 16.0, 17.0, 24.0, 20.0, 23.0, 25.0, 19.0, 30.0, 27.0, 31.0, 33.0, 39.0, 24.0, 39.0, 29.0, 32.0, 31.0, 40.0, 34.0, 23.0, 30.0, 32.0, 29.0, 24.0, 50.0, 27.0, 17.0, 19.0, 30.0, 22.0, 13.0, 11.0, 14.0, 9.0, 8.0, 6.0, 10.0, 9.0, 9.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0], "bins": [-0.00887298583984375, -0.00860905647277832, -0.00834512710571289, -0.008081197738647461, -0.007817268371582031, -0.0075533390045166016, -0.007289409637451172, -0.007025480270385742, -0.0067615509033203125, -0.006497621536254883, -0.006233692169189453, -0.0059697628021240234, -0.005705833435058594, -0.005441904067993164, -0.005177974700927734, -0.004914045333862305, -0.004650115966796875, -0.004386186599731445, -0.004122257232666016, -0.003858327865600586, -0.0035943984985351562, -0.0033304691314697266, -0.003066539764404297, -0.002802610397338867, -0.0025386810302734375, -0.002274751663208008, -0.002010822296142578, -0.0017468929290771484, -0.0014829635620117188, -0.001219034194946289, -0.0009551048278808594, -0.0006911754608154297, -0.00042724609375, -0.0001633167266845703, 0.00010061264038085938, 0.00036454200744628906, 0.0006284713745117188, 0.0008924007415771484, 0.0011563301086425781, 0.0014202594757080078, 0.0016841888427734375, 0.0019481182098388672, 0.002212047576904297, 0.0024759769439697266, 0.0027399063110351562, 0.003003835678100586, 0.0032677650451660156, 0.0035316944122314453, 0.003795623779296875, 0.004059553146362305, 0.004323482513427734, 0.004587411880493164, 0.004851341247558594, 0.0051152706146240234, 0.005379199981689453, 0.005643129348754883, 0.0059070587158203125, 0.006170988082885742, 0.006434917449951172, 0.0066988468170166016, 0.006962776184082031, 0.007226705551147461, 0.007490634918212891, 0.00775456428527832, 0.00801849365234375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 10.0, 6.0, 12.0, 12.0, 12.0, 21.0, 41.0, 59.0, 51.0, 91.0, 93.0, 150.0, 231.0, 316.0, 422.0, 630.0, 957.0, 1390.0, 2230.0, 3614.0, 6501.0, 13224.0, 34341.0, 242411.0, 667676.0, 41102.0, 14681.0, 7203.0, 3924.0, 2345.0, 1549.0, 1017.0, 654.0, 454.0, 344.0, 197.0, 153.0, 111.0, 91.0, 62.0, 51.0, 35.0, 27.0, 29.0, 15.0, 5.0, 2.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.034271240234375, -0.0332026481628418, -0.032134056091308594, -0.03106546401977539, -0.029996871948242188, -0.028928279876708984, -0.02785968780517578, -0.026791095733642578, -0.025722503662109375, -0.024653911590576172, -0.02358531951904297, -0.022516727447509766, -0.021448135375976562, -0.02037954330444336, -0.019310951232910156, -0.018242359161376953, -0.01717376708984375, -0.016105175018310547, -0.015036582946777344, -0.01396799087524414, -0.012899398803710938, -0.011830806732177734, -0.010762214660644531, -0.009693622589111328, -0.008625030517578125, -0.007556438446044922, -0.006487846374511719, -0.005419254302978516, -0.0043506622314453125, -0.0032820701599121094, -0.0022134780883789062, -0.0011448860168457031, -7.62939453125e-05, 0.0009922981262207031, 0.0020608901977539062, 0.0031294822692871094, 0.0041980743408203125, 0.005266666412353516, 0.006335258483886719, 0.007403850555419922, 0.008472442626953125, 0.009541034698486328, 0.010609626770019531, 0.011678218841552734, 0.012746810913085938, 0.01381540298461914, 0.014883995056152344, 0.015952587127685547, 0.01702117919921875, 0.018089771270751953, 0.019158363342285156, 0.02022695541381836, 0.021295547485351562, 0.022364139556884766, 0.02343273162841797, 0.024501323699951172, 0.025569915771484375, 0.026638507843017578, 0.02770709991455078, 0.028775691986083984, 0.029844284057617188, 0.03091287612915039, 0.031981468200683594, 0.0330500602722168, 0.03411865234375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 6.0, 6.0, 4.0, 11.0, 12.0, 15.0, 13.0, 15.0, 19.0, 14.0, 26.0, 37.0, 33.0, 57.0, 115.0, 133.0, 114.0, 106.0, 59.0, 35.0, 26.0, 23.0, 17.0, 16.0, 13.0, 9.0, 18.0, 6.0, 6.0, 6.0, 8.0, 6.0, 4.0, 0.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.153915405273438e-05, -7.907021790742874e-05, -7.660128176212311e-05, -7.413234561681747e-05, -7.166340947151184e-05, -6.919447332620621e-05, -6.672553718090057e-05, -6.425660103559494e-05, -6.17876648902893e-05, -5.931872874498367e-05, -5.684979259967804e-05, -5.4380856454372406e-05, -5.191192030906677e-05, -4.944298416376114e-05, -4.6974048018455505e-05, -4.450511187314987e-05, -4.203617572784424e-05, -3.9567239582538605e-05, -3.709830343723297e-05, -3.462936729192734e-05, -3.2160431146621704e-05, -2.969149500131607e-05, -2.7222558856010437e-05, -2.4753622710704803e-05, -2.228468656539917e-05, -1.9815750420093536e-05, -1.7346814274787903e-05, -1.487787812948227e-05, -1.2408941984176636e-05, -9.940005838871002e-06, -7.471069693565369e-06, -5.002133548259735e-06, -2.5331974029541016e-06, -6.426125764846802e-08, 2.4046748876571655e-06, 4.873611032962799e-06, 7.342547178268433e-06, 9.811483323574066e-06, 1.22804194688797e-05, 1.4749355614185333e-05, 1.7218291759490967e-05, 1.96872279047966e-05, 2.2156164050102234e-05, 2.4625100195407867e-05, 2.70940363407135e-05, 2.9562972486019135e-05, 3.203190863132477e-05, 3.45008447766304e-05, 3.6969780921936035e-05, 3.943871706724167e-05, 4.19076532125473e-05, 4.4376589357852936e-05, 4.684552550315857e-05, 4.93144616484642e-05, 5.1783397793769836e-05, 5.425233393907547e-05, 5.6721270084381104e-05, 5.919020622968674e-05, 6.165914237499237e-05, 6.4128078520298e-05, 6.659701466560364e-05, 6.906595081090927e-05, 7.15348869562149e-05, 7.400382310152054e-05, 7.647275924682617e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 9.0, 9.0, 14.0, 17.0, 44.0, 58.0, 100.0, 152.0, 302.0, 580.0, 1231.0, 2970.0, 8476.0, 29070.0, 142571.0, 764464.0, 70817.0, 17986.0, 5632.0, 2123.0, 915.0, 436.0, 227.0, 114.0, 83.0, 49.0, 30.0, 16.0, 12.0, 10.0, 11.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04327392578125, -0.042012691497802734, -0.04075145721435547, -0.0394902229309082, -0.03822898864746094, -0.03696775436401367, -0.035706520080566406, -0.03444528579711914, -0.033184051513671875, -0.03192281723022461, -0.030661582946777344, -0.029400348663330078, -0.028139114379882812, -0.026877880096435547, -0.02561664581298828, -0.024355411529541016, -0.02309417724609375, -0.021832942962646484, -0.02057170867919922, -0.019310474395751953, -0.018049240112304688, -0.016788005828857422, -0.015526771545410156, -0.01426553726196289, -0.013004302978515625, -0.01174306869506836, -0.010481834411621094, -0.009220600128173828, -0.007959365844726562, -0.006698131561279297, -0.005436897277832031, -0.004175662994384766, -0.0029144287109375, -0.0016531944274902344, -0.00039196014404296875, 0.0008692741394042969, 0.0021305084228515625, 0.003391742706298828, 0.004652976989746094, 0.005914211273193359, 0.007175445556640625, 0.00843667984008789, 0.009697914123535156, 0.010959148406982422, 0.012220382690429688, 0.013481616973876953, 0.014742851257324219, 0.016004085540771484, 0.01726531982421875, 0.018526554107666016, 0.01978778839111328, 0.021049022674560547, 0.022310256958007812, 0.023571491241455078, 0.024832725524902344, 0.02609395980834961, 0.027355194091796875, 0.02861642837524414, 0.029877662658691406, 0.031138896942138672, 0.03240013122558594, 0.0336613655090332, 0.03492259979248047, 0.036183834075927734, 0.037445068359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 8.0, 5.0, 9.0, 5.0, 16.0, 24.0, 15.0, 18.0, 22.0, 29.0, 38.0, 37.0, 51.0, 68.0, 257.0, 76.0, 62.0, 45.0, 41.0, 26.0, 13.0, 22.0, 20.0, 21.0, 16.0, 13.0, 11.0, 7.0, 1.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005199432373046875, -0.005024075508117676, -0.0048487186431884766, -0.004673361778259277, -0.004498004913330078, -0.004322648048400879, -0.00414729118347168, -0.0039719343185424805, -0.0037965774536132812, -0.003621220588684082, -0.003445863723754883, -0.0032705068588256836, -0.0030951499938964844, -0.002919793128967285, -0.002744436264038086, -0.0025690793991088867, -0.0023937225341796875, -0.0022183656692504883, -0.002043008804321289, -0.0018676519393920898, -0.0016922950744628906, -0.0015169382095336914, -0.0013415813446044922, -0.001166224479675293, -0.0009908676147460938, -0.0008155107498168945, -0.0006401538848876953, -0.0004647970199584961, -0.0002894401550292969, -0.00011408329010009766, 6.127357482910156e-05, 0.00023663043975830078, 0.0004119873046875, 0.0005873441696166992, 0.0007627010345458984, 0.0009380578994750977, 0.0011134147644042969, 0.001288771629333496, 0.0014641284942626953, 0.0016394853591918945, 0.0018148422241210938, 0.001990199089050293, 0.002165555953979492, 0.0023409128189086914, 0.0025162696838378906, 0.00269162654876709, 0.002866983413696289, 0.0030423402786254883, 0.0032176971435546875, 0.0033930540084838867, 0.003568410873413086, 0.003743767738342285, 0.003919124603271484, 0.004094481468200684, 0.004269838333129883, 0.004445195198059082, 0.004620552062988281, 0.0047959089279174805, 0.00497126579284668, 0.005146622657775879, 0.005321979522705078, 0.005497336387634277, 0.0056726932525634766, 0.005848050117492676, 0.006023406982421875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 3.0, 5.0, 1.0, 7.0, 5.0, 12.0, 9.0, 11.0, 19.0, 30.0, 22.0, 34.0, 67.0, 93.0, 161.0, 110.0, 88.0, 45.0, 61.0, 34.0, 30.0, 25.0, 19.0, 15.0, 9.0, 17.0, 12.0, 5.0, 8.0, 5.0, 8.0, 7.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01314300112426281, -0.01264999620616436, -0.01215699128806591, -0.011663987301290035, -0.011170982383191586, -0.010677977465093136, -0.01018497347831726, -0.009691968560218811, -0.009198963642120361, -0.008705958724021912, -0.008212953805923462, -0.007719949819147587, -0.007226944901049137, -0.006733939982950687, -0.006240935530513525, -0.005747931078076363, -0.005254926159977913, -0.004761921241879463, -0.004268916789442301, -0.0037759121041744947, -0.0032829074189066887, -0.0027899027336388826, -0.0022968980483710766, -0.0018038933631032705, -0.0013108886778354645, -0.0008178839925676584, -0.00032487930729985237, 0.00016812537796795368, 0.0006611300632357597, 0.0011541347485035658, 0.0016471394337713718, 0.002140144119039178, 0.0026331469416618347, 0.0031261516269296408, 0.003619156312197447, 0.004112160764634609, 0.004605165682733059, 0.005098170600831509, 0.005591175053268671, 0.0060841795057058334, 0.006577184423804283, 0.007070189341902733, 0.007563193794339895, 0.008056198246777058, 0.008549203164875507, 0.009042208082973957, 0.009535212069749832, 0.010028216987848282, 0.010521221905946732, 0.011014226824045181, 0.011507231742143631, 0.012000235728919506, 0.012493240647017956, 0.012986245565116405, 0.01347924955189228, 0.01397225446999073, 0.01446525938808918, 0.01495826430618763, 0.01545126922428608, 0.01594427414238453, 0.01643727719783783, 0.01693028211593628, 0.01742328703403473, 0.01791629195213318, 0.01840929687023163]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 10.0, 12.0, 8.0, 9.0, 9.0, 18.0, 14.0, 13.0, 16.0, 18.0, 28.0, 27.0, 30.0, 28.0, 39.0, 39.0, 23.0, 24.0, 41.0, 47.0, 41.0, 52.0, 41.0, 44.0, 35.0, 37.0, 32.0, 37.0, 31.0, 32.0, 18.0, 31.0, 12.0, 21.0, 14.0, 13.0, 13.0, 11.0, 11.0, 2.0, 5.0, 6.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.010240460745990276, -0.009896199218928814, -0.009551937691867352, -0.009207676164805889, -0.008863414637744427, -0.008519153110682964, -0.008174890652298927, -0.007830629125237465, -0.00748636806383729, -0.007142106536775827, -0.006797845009714365, -0.006453583016991615, -0.006109321489930153, -0.0057650599628686905, -0.005420798435807228, -0.005076536908745766, -0.004732275381684303, -0.004388013854622841, -0.0040437523275613785, -0.0036994905676692724, -0.00335522904060781, -0.0030109675135463476, -0.0026667057536542416, -0.002322444226592779, -0.0019781826995313168, -0.0016339211724698544, -0.0012896595289930701, -0.0009453978855162859, -0.0006011363584548235, -0.0002568748313933611, 8.738692849874496e-05, 0.00043164845556020737, 0.0007759090512990952, 0.0011201705783605576, 0.0014644322218373418, 0.001808693865314126, 0.0021529553923755884, 0.002497216919437051, 0.002841478679329157, 0.0031857402063906193, 0.0035300017334520817, 0.003874263260513544, 0.0042185247875750065, 0.004562786780297756, 0.004907048307359219, 0.005251309834420681, 0.005595571361482143, 0.005939832888543606, 0.006284094415605068, 0.006628355942666531, 0.006972617469727993, 0.007316878996789455, 0.007661140523850918, 0.00800540205091238, 0.008349664509296417, 0.00869392603635788, 0.009038187563419342, 0.009382449090480804, 0.009726710617542267, 0.01007097214460373, 0.010415233671665192, 0.010759495198726654, 0.011103756725788116, 0.011448018252849579, 0.011792279779911041]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 13.0, 17.0, 28.0, 29.0, 53.0, 79.0, 115.0, 146.0, 218.0, 350.0, 478.0, 734.0, 1119.0, 1698.0, 2706.0, 4472.0, 7344.0, 11949.0, 20817.0, 37265.0, 68258.0, 147128.0, 375126.0, 186915.0, 80039.0, 42227.0, 23565.0, 13908.0, 8024.0, 5020.0, 3029.0, 1919.0, 1245.0, 794.0, 545.0, 379.0, 260.0, 171.0, 102.0, 81.0, 55.0, 33.0, 25.0, 21.0, 17.0, 12.0, 6.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.019805908203125, -0.019113779067993164, -0.018421649932861328, -0.017729520797729492, -0.017037391662597656, -0.01634526252746582, -0.015653133392333984, -0.014961004257202148, -0.014268875122070312, -0.013576745986938477, -0.01288461685180664, -0.012192487716674805, -0.011500358581542969, -0.010808229446411133, -0.010116100311279297, -0.009423971176147461, -0.008731842041015625, -0.008039712905883789, -0.007347583770751953, -0.006655454635620117, -0.005963325500488281, -0.005271196365356445, -0.004579067230224609, -0.0038869380950927734, -0.0031948089599609375, -0.0025026798248291016, -0.0018105506896972656, -0.0011184215545654297, -0.00042629241943359375, 0.0002658367156982422, 0.0009579658508300781, 0.001650094985961914, 0.00234222412109375, 0.003034353256225586, 0.003726482391357422, 0.004418611526489258, 0.005110740661621094, 0.00580286979675293, 0.006494998931884766, 0.0071871280670166016, 0.007879257202148438, 0.008571386337280273, 0.00926351547241211, 0.009955644607543945, 0.010647773742675781, 0.011339902877807617, 0.012032032012939453, 0.012724161148071289, 0.013416290283203125, 0.014108419418334961, 0.014800548553466797, 0.015492677688598633, 0.01618480682373047, 0.016876935958862305, 0.01756906509399414, 0.018261194229125977, 0.018953323364257812, 0.01964545249938965, 0.020337581634521484, 0.02102971076965332, 0.021721839904785156, 0.022413969039916992, 0.023106098175048828, 0.023798227310180664, 0.0244903564453125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 6.0, 10.0, 13.0, 7.0, 8.0, 13.0, 10.0, 14.0, 23.0, 25.0, 25.0, 24.0, 35.0, 23.0, 32.0, 31.0, 33.0, 35.0, 38.0, 42.0, 46.0, 54.0, 55.0, 45.0, 27.0, 31.0, 32.0, 27.0, 34.0, 30.0, 29.0, 21.0, 14.0, 16.0, 15.0, 17.0, 16.0, 7.0, 6.0, 6.0, 5.0, 5.0, 4.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00522613525390625, -0.00503164529800415, -0.004837155342102051, -0.004642665386199951, -0.0044481754302978516, -0.004253685474395752, -0.004059195518493652, -0.0038647055625915527, -0.003670215606689453, -0.0034757256507873535, -0.003281235694885254, -0.0030867457389831543, -0.0028922557830810547, -0.002697765827178955, -0.0025032758712768555, -0.002308785915374756, -0.0021142959594726562, -0.0019198060035705566, -0.001725316047668457, -0.0015308260917663574, -0.0013363361358642578, -0.0011418461799621582, -0.0009473562240600586, -0.000752866268157959, -0.0005583763122558594, -0.00036388635635375977, -0.00016939640045166016, 2.5093555450439453e-05, 0.00021958351135253906, 0.00041407346725463867, 0.0006085634231567383, 0.0008030533790588379, 0.0009975433349609375, 0.0011920332908630371, 0.0013865232467651367, 0.0015810132026672363, 0.001775503158569336, 0.0019699931144714355, 0.002164483070373535, 0.0023589730262756348, 0.0025534629821777344, 0.002747952938079834, 0.0029424428939819336, 0.003136932849884033, 0.003331422805786133, 0.0035259127616882324, 0.003720402717590332, 0.003914892673492432, 0.004109382629394531, 0.004303872585296631, 0.0044983625411987305, 0.00469285249710083, 0.00488734245300293, 0.005081832408905029, 0.005276322364807129, 0.0054708123207092285, 0.005665302276611328, 0.005859792232513428, 0.006054282188415527, 0.006248772144317627, 0.0064432621002197266, 0.006637752056121826, 0.006832242012023926, 0.007026731967926025, 0.007221221923828125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 7.0, 13.0, 22.0, 22.0, 41.0, 65.0, 97.0, 139.0, 263.0, 488.0, 918.0, 1815.0, 3749.0, 8099.0, 18775.0, 45376.0, 126586.0, 486885.0, 235289.0, 70007.0, 27439.0, 11838.0, 5367.0, 2440.0, 1241.0, 686.0, 347.0, 213.0, 109.0, 76.0, 43.0, 35.0, 20.0, 16.0, 10.0, 6.0, 9.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02490234375, -0.02403545379638672, -0.023168563842773438, -0.022301673889160156, -0.021434783935546875, -0.020567893981933594, -0.019701004028320312, -0.01883411407470703, -0.01796722412109375, -0.01710033416748047, -0.016233444213867188, -0.015366554260253906, -0.014499664306640625, -0.013632774353027344, -0.012765884399414062, -0.011898994445800781, -0.0110321044921875, -0.010165214538574219, -0.009298324584960938, -0.008431434631347656, -0.007564544677734375, -0.006697654724121094, -0.0058307647705078125, -0.004963874816894531, -0.00409698486328125, -0.0032300949096679688, -0.0023632049560546875, -0.0014963150024414062, -0.000629425048828125, 0.00023746490478515625, 0.0011043548583984375, 0.0019712448120117188, 0.002838134765625, 0.0037050247192382812, 0.0045719146728515625, 0.005438804626464844, 0.006305694580078125, 0.007172584533691406, 0.008039474487304688, 0.008906364440917969, 0.00977325439453125, 0.010640144348144531, 0.011507034301757812, 0.012373924255371094, 0.013240814208984375, 0.014107704162597656, 0.014974594116210938, 0.01584148406982422, 0.0167083740234375, 0.01757526397705078, 0.018442153930664062, 0.019309043884277344, 0.020175933837890625, 0.021042823791503906, 0.021909713745117188, 0.02277660369873047, 0.02364349365234375, 0.02451038360595703, 0.025377273559570312, 0.026244163513183594, 0.027111053466796875, 0.027977943420410156, 0.028844833374023438, 0.02971172332763672, 0.03057861328125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 8.0, 5.0, 4.0, 9.0, 11.0, 19.0, 18.0, 26.0, 22.0, 26.0, 46.0, 45.0, 57.0, 47.0, 58.0, 46.0, 61.0, 64.0, 48.0, 53.0, 48.0, 34.0, 41.0, 36.0, 34.0, 27.0, 26.0, 24.0, 15.0, 10.0, 12.0, 8.0, 10.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0078582763671875, -0.007638752460479736, -0.007419228553771973, -0.007199704647064209, -0.006980180740356445, -0.006760656833648682, -0.006541132926940918, -0.006321609020233154, -0.006102085113525391, -0.005882561206817627, -0.005663037300109863, -0.0054435133934021, -0.005223989486694336, -0.005004465579986572, -0.004784941673278809, -0.004565417766571045, -0.004345893859863281, -0.004126369953155518, -0.003906846046447754, -0.0036873221397399902, -0.0034677982330322266, -0.003248274326324463, -0.0030287504196166992, -0.0028092265129089355, -0.002589702606201172, -0.002370178699493408, -0.0021506547927856445, -0.0019311308860778809, -0.0017116069793701172, -0.0014920830726623535, -0.0012725591659545898, -0.0010530352592468262, -0.0008335113525390625, -0.0006139874458312988, -0.00039446353912353516, -0.00017493963241577148, 4.458427429199219e-05, 0.00026410818099975586, 0.00048363208770751953, 0.0007031559944152832, 0.0009226799011230469, 0.0011422038078308105, 0.0013617277145385742, 0.0015812516212463379, 0.0018007755279541016, 0.0020202994346618652, 0.002239823341369629, 0.0024593472480773926, 0.0026788711547851562, 0.00289839506149292, 0.0031179189682006836, 0.0033374428749084473, 0.003556966781616211, 0.0037764906883239746, 0.003996014595031738, 0.004215538501739502, 0.004435062408447266, 0.004654586315155029, 0.004874110221862793, 0.005093634128570557, 0.00531315803527832, 0.005532681941986084, 0.005752205848693848, 0.005971729755401611, 0.006191253662109375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 3.0, 12.0, 9.0, 18.0, 27.0, 46.0, 55.0, 102.0, 171.0, 336.0, 602.0, 1325.0, 3495.0, 12104.0, 100077.0, 860423.0, 55796.0, 8868.0, 2748.0, 1135.0, 528.0, 281.0, 136.0, 86.0, 53.0, 43.0, 20.0, 16.0, 14.0, 4.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006036758422851562, -0.0005816370248794556, -0.0005595982074737549, -0.0005375593900680542, -0.0005155205726623535, -0.0004934817552566528, -0.00047144293785095215, -0.00044940412044525146, -0.0004273653030395508, -0.0004053264856338501, -0.0003832876682281494, -0.00036124885082244873, -0.00033921003341674805, -0.00031717121601104736, -0.0002951323986053467, -0.000273093581199646, -0.0002510547637939453, -0.00022901594638824463, -0.00020697712898254395, -0.00018493831157684326, -0.00016289949417114258, -0.0001408606767654419, -0.00011882185935974121, -9.678304195404053e-05, -7.474422454833984e-05, -5.270540714263916e-05, -3.0666589736938477e-05, -8.627772331237793e-06, 1.341104507446289e-05, 3.5449862480163574e-05, 5.748867988586426e-05, 7.952749729156494e-05, 0.00010156631469726562, 0.0001236051321029663, 0.000145643949508667, 0.00016768276691436768, 0.00018972158432006836, 0.00021176040172576904, 0.00023379921913146973, 0.0002558380365371704, 0.0002778768539428711, 0.0002999156713485718, 0.00032195448875427246, 0.00034399330615997314, 0.00036603212356567383, 0.0003880709409713745, 0.0004101097583770752, 0.0004321485757827759, 0.00045418739318847656, 0.00047622621059417725, 0.0004982650279998779, 0.0005203038454055786, 0.0005423426628112793, 0.00056438148021698, 0.0005864202976226807, 0.0006084591150283813, 0.000630497932434082, 0.0006525367498397827, 0.0006745755672454834, 0.0006966143846511841, 0.0007186532020568848, 0.0007406920194625854, 0.0007627308368682861, 0.0007847696542739868, 0.0008068084716796875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 14.0, 18.0, 28.0, 26.0, 39.0, 71.0, 105.0, 175.0, 157.0, 108.0, 53.0, 53.0, 41.0, 26.0, 12.0, 12.0, 10.0, 3.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3113021850585938e-05, -1.2747012078762054e-05, -1.2381002306938171e-05, -1.2014992535114288e-05, -1.1648982763290405e-05, -1.1282972991466522e-05, -1.091696321964264e-05, -1.0550953447818756e-05, -1.0184943675994873e-05, -9.81893390417099e-06, -9.452924132347107e-06, -9.086914360523224e-06, -8.72090458869934e-06, -8.354894816875458e-06, -7.988885045051575e-06, -7.622875273227692e-06, -7.256865501403809e-06, -6.8908557295799255e-06, -6.5248459577560425e-06, -6.1588361859321594e-06, -5.792826414108276e-06, -5.426816642284393e-06, -5.06080687046051e-06, -4.694797098636627e-06, -4.328787326812744e-06, -3.962777554988861e-06, -3.596767783164978e-06, -3.230758011341095e-06, -2.864748239517212e-06, -2.498738467693329e-06, -2.132728695869446e-06, -1.7667189240455627e-06, -1.4007091522216797e-06, -1.0346993803977966e-06, -6.686896085739136e-07, -3.026798367500305e-07, 6.332993507385254e-08, 4.293397068977356e-07, 7.953494787216187e-07, 1.1613592505455017e-06, 1.5273690223693848e-06, 1.8933787941932678e-06, 2.259388566017151e-06, 2.625398337841034e-06, 2.991408109664917e-06, 3.3574178814888e-06, 3.723427653312683e-06, 4.089437425136566e-06, 4.455447196960449e-06, 4.821456968784332e-06, 5.187466740608215e-06, 5.553476512432098e-06, 5.9194862842559814e-06, 6.2854960560798645e-06, 6.6515058279037476e-06, 7.017515599727631e-06, 7.383525371551514e-06, 7.749535143375397e-06, 8.11554491519928e-06, 8.481554687023163e-06, 8.847564458847046e-06, 9.213574230670929e-06, 9.579584002494812e-06, 9.945593774318695e-06, 1.0311603546142578e-05]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 18.0, 18.0, 25.0, 31.0, 55.0, 79.0, 112.0, 149.0, 245.0, 408.0, 704.0, 1206.0, 2047.0, 4259.0, 8332.0, 18160.0, 41546.0, 107317.0, 397969.0, 310242.0, 89318.0, 34933.0, 15924.0, 7202.0, 3623.0, 1928.0, 1038.0, 616.0, 347.0, 228.0, 145.0, 89.0, 68.0, 51.0, 26.0, 19.0, 21.0, 9.0, 7.0, 11.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-0.0001302957534790039, -0.0001263357698917389, -0.00012237578630447388, -0.00011841580271720886, -0.00011445581912994385, -0.00011049583554267883, -0.00010653585195541382, -0.0001025758683681488, -9.861588478088379e-05, -9.465590119361877e-05, -9.069591760635376e-05, -8.673593401908875e-05, -8.277595043182373e-05, -7.881596684455872e-05, -7.48559832572937e-05, -7.089599967002869e-05, -6.693601608276367e-05, -6.297603249549866e-05, -5.901604890823364e-05, -5.505606532096863e-05, -5.109608173370361e-05, -4.71360981464386e-05, -4.3176114559173584e-05, -3.921613097190857e-05, -3.5256147384643555e-05, -3.129616379737854e-05, -2.7336180210113525e-05, -2.337619662284851e-05, -1.9416213035583496e-05, -1.545622944831848e-05, -1.1496245861053467e-05, -7.536262273788452e-06, -3.5762786865234375e-06, 3.8370490074157715e-07, 4.343688488006592e-06, 8.303672075271606e-06, 1.2263655662536621e-05, 1.6223639249801636e-05, 2.018362283706665e-05, 2.4143606424331665e-05, 2.810359001159668e-05, 3.2063573598861694e-05, 3.602355718612671e-05, 3.9983540773391724e-05, 4.394352436065674e-05, 4.790350794792175e-05, 5.186349153518677e-05, 5.582347512245178e-05, 5.97834587097168e-05, 6.374344229698181e-05, 6.770342588424683e-05, 7.166340947151184e-05, 7.562339305877686e-05, 7.958337664604187e-05, 8.354336023330688e-05, 8.75033438205719e-05, 9.146332740783691e-05, 9.542331099510193e-05, 9.938329458236694e-05, 0.00010334327816963196, 0.00010730326175689697, 0.00011126324534416199, 0.000115223228931427, 0.00011918321251869202, 0.00012314319610595703]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 4.0, 7.0, 3.0, 10.0, 19.0, 13.0, 17.0, 27.0, 28.0, 43.0, 39.0, 42.0, 50.0, 59.0, 63.0, 67.0, 62.0, 76.0, 65.0, 43.0, 53.0, 51.0, 28.0, 31.0, 24.0, 23.0, 15.0, 11.0, 14.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.606081008911133e-05, -3.48677858710289e-05, -3.367476165294647e-05, -3.2481737434864044e-05, -3.1288713216781616e-05, -3.0095688998699188e-05, -2.890266478061676e-05, -2.7709640562534332e-05, -2.6516616344451904e-05, -2.5323592126369476e-05, -2.413056790828705e-05, -2.293754369020462e-05, -2.1744519472122192e-05, -2.0551495254039764e-05, -1.9358471035957336e-05, -1.816544681787491e-05, -1.697242259979248e-05, -1.5779398381710052e-05, -1.4586374163627625e-05, -1.3393349945545197e-05, -1.2200325727462769e-05, -1.100730150938034e-05, -9.814277291297913e-06, -8.621253073215485e-06, -7.428228855133057e-06, -6.235204637050629e-06, -5.042180418968201e-06, -3.849156200885773e-06, -2.6561319828033447e-06, -1.4631077647209167e-06, -2.7008354663848877e-07, 9.229406714439392e-07, 2.115964889526367e-06, 3.308989107608795e-06, 4.502013325691223e-06, 5.695037543773651e-06, 6.888061761856079e-06, 8.081085979938507e-06, 9.274110198020935e-06, 1.0467134416103363e-05, 1.1660158634185791e-05, 1.2853182852268219e-05, 1.4046207070350647e-05, 1.5239231288433075e-05, 1.6432255506515503e-05, 1.762527972459793e-05, 1.881830394268036e-05, 2.0011328160762787e-05, 2.1204352378845215e-05, 2.2397376596927643e-05, 2.359040081501007e-05, 2.47834250330925e-05, 2.5976449251174927e-05, 2.7169473469257355e-05, 2.8362497687339783e-05, 2.955552190542221e-05, 3.074854612350464e-05, 3.194157034158707e-05, 3.3134594559669495e-05, 3.432761877775192e-05, 3.552064299583435e-05, 3.671366721391678e-05, 3.7906691431999207e-05, 3.9099715650081635e-05, 4.029273986816406e-05]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 7.0, 7.0, 14.0, 28.0, 15.0, 18.0, 25.0, 47.0, 64.0, 121.0, 140.0, 148.0, 99.0, 66.0, 40.0, 38.0, 12.0, 21.0, 11.0, 13.0, 11.0, 9.0, 5.0, 10.0, 3.0, 3.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01410786621272564, -0.013716993853449821, -0.013326120562851429, -0.012935248203575611, -0.012544375844299793, -0.0121535025537014, -0.011762630194425583, -0.011371757835149765, -0.010980885475873947, -0.01059001311659813, -0.010199139825999737, -0.009808267466723919, -0.009417395107448101, -0.009026521816849709, -0.00863564945757389, -0.008244777098298073, -0.007853904739022255, -0.00746303191408515, -0.007072159554809332, -0.006681286729872227, -0.006290414370596409, -0.005899541545659304, -0.0055086687207221985, -0.005117796361446381, -0.004726923070847988, -0.004336050245910883, -0.003945177886635065, -0.00355430506169796, -0.003163432702422142, -0.002772559877485037, -0.0023816872853785753, -0.001990814693272114, -0.001599942333996296, -0.0012090697418898344, -0.000818197091575712, -0.00042732444126158953, -3.6451849155128e-05, 0.00035442085936665535, 0.0007452934514731169, 0.0011361660435795784, 0.00152703863568604, 0.0019179112277925014, 0.002308783819898963, 0.0026996564120054245, 0.0030905292369425297, 0.003481401829048991, 0.0038722744211554527, 0.004263146780431271, 0.004654019605368376, 0.005044892430305481, 0.005435764789581299, 0.005826637614518404, 0.006217509973794222, 0.006608382798731327, 0.006999255158007145, 0.00739012798294425, 0.007781000807881355, 0.008171873167157173, 0.008562746457755566, 0.008953618817031384, 0.009344491176307201, 0.009735364466905594, 0.010126236826181412, 0.01051710918545723, 0.010907981544733047]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 9.0, 7.0, 5.0, 6.0, 2.0, 10.0, 19.0, 16.0, 17.0, 27.0, 30.0, 22.0, 31.0, 22.0, 25.0, 26.0, 36.0, 35.0, 42.0, 32.0, 45.0, 45.0, 38.0, 45.0, 39.0, 42.0, 45.0, 33.0, 31.0, 26.0, 26.0, 31.0, 19.0, 15.0, 16.0, 20.0, 19.0, 9.0, 9.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.006566388998180628, -0.0063355593010783195, -0.006104730069637299, -0.005873900838196278, -0.005643071141093969, -0.005412241443991661, -0.00518141221255064, -0.004950582981109619, -0.004719753284007311, -0.004488923586905003, -0.004258094355463982, -0.004027265124022961, -0.0037964354269206524, -0.0035656059626489878, -0.003334776498377323, -0.0031039470341056585, -0.002873117569833994, -0.0026422881055623293, -0.0024114586412906647, -0.002180629177019, -0.0019497997127473354, -0.0017189702484756708, -0.0014881407842040062, -0.0012573113199323416, -0.001026481855660677, -0.0007956523913890123, -0.0005648229271173477, -0.0003339934628456831, -0.00010316399857401848, 0.00012766546569764614, 0.00035849492996931076, 0.0005893243942409754, 0.0008201533928513527, 0.0010509828571230173, 0.001281812321394682, 0.0015126417856663465, 0.0017434712499380112, 0.001974300714209676, 0.0022051301784813404, 0.002435959642753005, 0.0026667891070246696, 0.0028976185712963343, 0.003128448035567999, 0.0033592774998396635, 0.003590106964111328, 0.0038209364283829927, 0.004051765892654657, 0.004282595589756966, 0.004513424821197987, 0.004744254052639008, 0.004975083749741316, 0.005205913446843624, 0.005436742678284645, 0.005667571909725666, 0.005898401606827974, 0.006129231303930283, 0.0063600605353713036, 0.0065908897668123245, 0.006821719463914633, 0.007052549161016941, 0.007283378392457962, 0.007514207623898983, 0.007745037321001291, 0.0079758670181036, 0.00820669624954462]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 9.0, 8.0, 10.0, 15.0, 21.0, 34.0, 38.0, 43.0, 71.0, 89.0, 116.0, 153.0, 179.0, 265.0, 344.0, 466.0, 659.0, 973.0, 1521.0, 2393.0, 5970.0, 106560.0, 4025451.0, 38131.0, 4093.0, 2149.0, 1316.0, 865.0, 589.0, 432.0, 323.0, 222.0, 170.0, 141.0, 120.0, 74.0, 72.0, 47.0, 45.0, 24.0, 13.0, 19.0, 13.0, 8.0, 10.0, 5.0, 5.0, 3.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01654052734375, -0.01597738265991211, -0.015414237976074219, -0.014851093292236328, -0.014287948608398438, -0.013724803924560547, -0.013161659240722656, -0.012598514556884766, -0.012035369873046875, -0.011472225189208984, -0.010909080505371094, -0.010345935821533203, -0.009782791137695312, -0.009219646453857422, -0.008656501770019531, -0.00809335708618164, -0.00753021240234375, -0.006967067718505859, -0.006403923034667969, -0.005840778350830078, -0.0052776336669921875, -0.004714488983154297, -0.004151344299316406, -0.0035881996154785156, -0.003025054931640625, -0.0024619102478027344, -0.0018987655639648438, -0.0013356208801269531, -0.0007724761962890625, -0.00020933151245117188, 0.00035381317138671875, 0.0009169578552246094, 0.0014801025390625, 0.0020432472229003906, 0.0026063919067382812, 0.003169536590576172, 0.0037326812744140625, 0.004295825958251953, 0.004858970642089844, 0.005422115325927734, 0.005985260009765625, 0.006548404693603516, 0.007111549377441406, 0.007674694061279297, 0.008237838745117188, 0.008800983428955078, 0.009364128112792969, 0.00992727279663086, 0.01049041748046875, 0.01105356216430664, 0.011616706848144531, 0.012179851531982422, 0.012742996215820312, 0.013306140899658203, 0.013869285583496094, 0.014432430267333984, 0.014995574951171875, 0.015558719635009766, 0.016121864318847656, 0.016685009002685547, 0.017248153686523438, 0.017811298370361328, 0.01837444305419922, 0.01893758773803711, 0.019500732421875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 4.0, 7.0, 10.0, 10.0, 17.0, 15.0, 22.0, 22.0, 21.0, 21.0, 43.0, 31.0, 24.0, 28.0, 30.0, 53.0, 37.0, 42.0, 47.0, 44.0, 48.0, 48.0, 41.0, 44.0, 35.0, 34.0, 29.0, 34.0, 21.0, 19.0, 25.0, 15.0, 20.0, 15.0, 13.0, 5.0, 8.0, 4.0, 6.0, 0.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.005748748779296875, -0.00555795431137085, -0.005367159843444824, -0.005176365375518799, -0.0049855709075927734, -0.004794776439666748, -0.004603981971740723, -0.004413187503814697, -0.004222393035888672, -0.0040315985679626465, -0.003840804100036621, -0.0036500096321105957, -0.0034592151641845703, -0.003268420696258545, -0.0030776262283325195, -0.002886831760406494, -0.0026960372924804688, -0.0025052428245544434, -0.002314448356628418, -0.0021236538887023926, -0.0019328594207763672, -0.0017420649528503418, -0.0015512704849243164, -0.001360476016998291, -0.0011696815490722656, -0.0009788870811462402, -0.0007880926132202148, -0.0005972981452941895, -0.00040650367736816406, -0.00021570920944213867, -2.491474151611328e-05, 0.0001658797264099121, 0.0003566741943359375, 0.0005474686622619629, 0.0007382631301879883, 0.0009290575981140137, 0.001119852066040039, 0.0013106465339660645, 0.0015014410018920898, 0.0016922354698181152, 0.0018830299377441406, 0.002073824405670166, 0.0022646188735961914, 0.002455413341522217, 0.002646207809448242, 0.0028370022773742676, 0.003027796745300293, 0.0032185912132263184, 0.0034093856811523438, 0.003600180149078369, 0.0037909746170043945, 0.00398176908493042, 0.004172563552856445, 0.004363358020782471, 0.004554152488708496, 0.0047449469566345215, 0.004935741424560547, 0.005126535892486572, 0.005317330360412598, 0.005508124828338623, 0.0056989192962646484, 0.005889713764190674, 0.006080508232116699, 0.006271302700042725, 0.00646209716796875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 7.0, 10.0, 18.0, 27.0, 41.0, 61.0, 88.0, 132.0, 186.0, 314.0, 498.0, 796.0, 1342.0, 2497.0, 5696.0, 20276.0, 3667167.0, 468725.0, 15954.0, 4880.0, 2293.0, 1223.0, 727.0, 475.0, 278.0, 177.0, 126.0, 80.0, 56.0, 36.0, 25.0, 21.0, 15.0, 10.0, 5.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0198974609375, -0.01918506622314453, -0.018472671508789062, -0.017760276794433594, -0.017047882080078125, -0.016335487365722656, -0.015623092651367188, -0.014910697937011719, -0.01419830322265625, -0.013485908508300781, -0.012773513793945312, -0.012061119079589844, -0.011348724365234375, -0.010636329650878906, -0.009923934936523438, -0.009211540222167969, -0.0084991455078125, -0.007786750793457031, -0.0070743560791015625, -0.006361961364746094, -0.005649566650390625, -0.004937171936035156, -0.0042247772216796875, -0.0035123825073242188, -0.00279998779296875, -0.0020875930786132812, -0.0013751983642578125, -0.0006628036499023438, 4.9591064453125e-05, 0.0007619857788085938, 0.0014743804931640625, 0.0021867752075195312, 0.002899169921875, 0.0036115646362304688, 0.0043239593505859375, 0.005036354064941406, 0.005748748779296875, 0.006461143493652344, 0.0071735382080078125, 0.007885932922363281, 0.00859832763671875, 0.009310722351074219, 0.010023117065429688, 0.010735511779785156, 0.011447906494140625, 0.012160301208496094, 0.012872695922851562, 0.013585090637207031, 0.0142974853515625, 0.015009880065917969, 0.015722274780273438, 0.016434669494628906, 0.017147064208984375, 0.017859458923339844, 0.018571853637695312, 0.01928424835205078, 0.01999664306640625, 0.02070903778076172, 0.021421432495117188, 0.022133827209472656, 0.022846221923828125, 0.023558616638183594, 0.024271011352539062, 0.02498340606689453, 0.02569580078125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 11.0, 4.0, 11.0, 24.0, 44.0, 96.0, 245.0, 2858.0, 520.0, 152.0, 47.0, 13.0, 9.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00438690185546875, -0.004264205694198608, -0.004141509532928467, -0.004018813371658325, -0.0038961172103881836, -0.003773421049118042, -0.0036507248878479004, -0.003528028726577759, -0.003405332565307617, -0.0032826364040374756, -0.003159940242767334, -0.0030372440814971924, -0.0029145479202270508, -0.002791851758956909, -0.0026691555976867676, -0.002546459436416626, -0.0024237632751464844, -0.0023010671138763428, -0.002178370952606201, -0.0020556747913360596, -0.001932978630065918, -0.0018102824687957764, -0.0016875863075256348, -0.0015648901462554932, -0.0014421939849853516, -0.00131949782371521, -0.0011968016624450684, -0.0010741055011749268, -0.0009514093399047852, -0.0008287131786346436, -0.000706017017364502, -0.0005833208560943604, -0.00046062469482421875, -0.00033792853355407715, -0.00021523237228393555, -9.253621101379395e-05, 3.0159950256347656e-05, 0.00015285611152648926, 0.00027555227279663086, 0.00039824843406677246, 0.0005209445953369141, 0.0006436407566070557, 0.0007663369178771973, 0.0008890330791473389, 0.0010117292404174805, 0.001134425401687622, 0.0012571215629577637, 0.0013798177242279053, 0.0015025138854980469, 0.0016252100467681885, 0.00174790620803833, 0.0018706023693084717, 0.0019932985305786133, 0.002115994691848755, 0.0022386908531188965, 0.002361387014389038, 0.0024840831756591797, 0.0026067793369293213, 0.002729475498199463, 0.0028521716594696045, 0.002974867820739746, 0.0030975639820098877, 0.0032202601432800293, 0.003342956304550171, 0.0034656524658203125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 3.0, 1.0, 2.0, 9.0, 7.0, 10.0, 5.0, 12.0, 12.0, 23.0, 12.0, 23.0, 21.0, 29.0, 48.0, 65.0, 76.0, 88.0, 120.0, 104.0, 68.0, 48.0, 39.0, 23.0, 28.0, 13.0, 18.0, 9.0, 12.0, 13.0, 9.0, 7.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0], "bins": [-0.0066308979876339436, -0.006426646374166012, -0.00622239476069808, -0.006018143147230148, -0.005813891533762217, -0.005609639920294285, -0.005405387841165066, -0.005201136227697134, -0.004996884614229202, -0.0047926330007612705, -0.004588381387293339, -0.004384129773825407, -0.004179878160357475, -0.003975626081228256, -0.003771374700590968, -0.0035671228542923927, -0.0033628714736551046, -0.003158619860187173, -0.002954368246719241, -0.0027501164004206657, -0.002545864786952734, -0.0023416131734848022, -0.0021373615600168705, -0.001933109830133617, -0.0017288582166656852, -0.0015246066031977534, -0.0013203548733144999, -0.001116103259846568, -0.0009118515881709754, -0.0007075999164953828, -0.000503348303027451, -0.00029909657314419746, -9.484495967626572e-05, 0.00010940669744741172, 0.00031365835457108915, 0.0005179099971428514, 0.000722161668818444, 0.0009264133404940367, 0.0011306649539619684, 0.001334916683845222, 0.0015391682973131537, 0.0017434199107810855, 0.001947671640664339, 0.002151923254132271, 0.0023561748676002026, 0.0025604264810681343, 0.002764678094536066, 0.0029689299408346415, 0.003173181554302573, 0.003377433167770505, 0.0035816847812384367, 0.003785936627537012, 0.003990188241004944, 0.004194439854472876, 0.004398691467940807, 0.004602943081408739, 0.004807194694876671, 0.005011446308344603, 0.005215697921812534, 0.005419949535280466, 0.005624201148748398, 0.005828453227877617, 0.006032704375684261, 0.00623695645481348, 0.006441208068281412]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 10.0, 6.0, 6.0, 10.0, 16.0, 11.0, 17.0, 26.0, 24.0, 34.0, 24.0, 22.0, 39.0, 26.0, 30.0, 37.0, 35.0, 41.0, 41.0, 48.0, 57.0, 54.0, 32.0, 40.0, 31.0, 38.0, 34.0, 35.0, 20.0, 27.0, 18.0, 16.0, 19.0, 17.0, 10.0, 14.0, 8.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.005718897096812725, -0.005536563228815794, -0.00535422982648015, -0.005171895958483219, -0.004989562090486288, -0.004807228222489357, -0.004624894820153713, -0.004442560952156782, -0.004260227084159851, -0.00407789321616292, -0.0038955595809966326, -0.003713225945830345, -0.003530892077833414, -0.0033485584426671267, -0.0031662248075008392, -0.002983890939503908, -0.0028015575371682644, -0.002619223902001977, -0.002436890034005046, -0.0022545563988387585, -0.0020722225308418274, -0.00188988889567554, -0.0017075552605092525, -0.0015252215089276433, -0.001342887757346034, -0.0011605540057644248, -0.0009782202541828156, -0.0007958866190165281, -0.0006135528674349189, -0.00043121911585330963, -0.0002488854806870222, -6.655172910541296e-05, 0.00011578155681490898, 0.0002981152792926878, 0.00048044900177046657, 0.0006627826951444149, 0.0008451164467260242, 0.0010274501983076334, 0.0012097838334739208, 0.00139211758505553, 0.0015744513366371393, 0.0017567850882187486, 0.0019391188398003578, 0.0021214524749666452, 0.0023037861101329327, 0.0024861199781298637, 0.002668453613296151, 0.0028507872484624386, 0.0030331211164593697, 0.003215454751625657, 0.003397788619622588, 0.0035801222547888756, 0.0037624561227858067, 0.003944789990782738, 0.0041271233931183815, 0.004309457261115313, 0.004491791129112244, 0.004674124997109175, 0.0048564583994448185, 0.00503879226744175, 0.005221126135438681, 0.005403460003435612, 0.0055857934057712555, 0.005768127273768187, 0.00595046067610383]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 16.0, 18.0, 19.0, 28.0, 33.0, 38.0, 59.0, 88.0, 129.0, 191.0, 267.0, 386.0, 600.0, 981.0, 1614.0, 2723.0, 4945.0, 9246.0, 18827.0, 40517.0, 103704.0, 339738.0, 340174.0, 103333.0, 40838.0, 18529.0, 9243.0, 4974.0, 2801.0, 1617.0, 962.0, 636.0, 386.0, 251.0, 186.0, 117.0, 92.0, 66.0, 36.0, 32.0, 32.0, 26.0, 17.0, 12.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00934600830078125, -0.009053945541381836, -0.008761882781982422, -0.008469820022583008, -0.008177757263183594, -0.00788569450378418, -0.007593631744384766, -0.0073015689849853516, -0.0070095062255859375, -0.0067174434661865234, -0.006425380706787109, -0.006133317947387695, -0.005841255187988281, -0.005549192428588867, -0.005257129669189453, -0.004965066909790039, -0.004673004150390625, -0.004380941390991211, -0.004088878631591797, -0.003796815872192383, -0.0035047531127929688, -0.0032126903533935547, -0.0029206275939941406, -0.0026285648345947266, -0.0023365020751953125, -0.0020444393157958984, -0.0017523765563964844, -0.0014603137969970703, -0.0011682510375976562, -0.0008761882781982422, -0.0005841255187988281, -0.00029206275939941406, 0.0, 0.00029206275939941406, 0.0005841255187988281, 0.0008761882781982422, 0.0011682510375976562, 0.0014603137969970703, 0.0017523765563964844, 0.0020444393157958984, 0.0023365020751953125, 0.0026285648345947266, 0.0029206275939941406, 0.0032126903533935547, 0.0035047531127929688, 0.003796815872192383, 0.004088878631591797, 0.004380941390991211, 0.004673004150390625, 0.004965066909790039, 0.005257129669189453, 0.005549192428588867, 0.005841255187988281, 0.006133317947387695, 0.006425380706787109, 0.0067174434661865234, 0.0070095062255859375, 0.0073015689849853516, 0.007593631744384766, 0.00788569450378418, 0.008177757263183594, 0.008469820022583008, 0.008761882781982422, 0.009053945541381836, 0.00934600830078125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 6.0, 4.0, 5.0, 7.0, 10.0, 9.0, 15.0, 12.0, 20.0, 25.0, 21.0, 26.0, 27.0, 33.0, 36.0, 32.0, 30.0, 39.0, 33.0, 43.0, 39.0, 37.0, 56.0, 57.0, 40.0, 37.0, 27.0, 42.0, 35.0, 37.0, 22.0, 19.0, 22.0, 12.0, 13.0, 18.0, 14.0, 5.0, 4.0, 11.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00626373291015625, -0.00607454776763916, -0.00588536262512207, -0.0056961774826049805, -0.005506992340087891, -0.005317807197570801, -0.005128622055053711, -0.004939436912536621, -0.004750251770019531, -0.004561066627502441, -0.0043718814849853516, -0.004182696342468262, -0.003993511199951172, -0.003804326057434082, -0.003615140914916992, -0.0034259557723999023, -0.0032367706298828125, -0.0030475854873657227, -0.002858400344848633, -0.002669215202331543, -0.002480030059814453, -0.0022908449172973633, -0.0021016597747802734, -0.0019124746322631836, -0.0017232894897460938, -0.001534104347229004, -0.001344919204711914, -0.0011557340621948242, -0.0009665489196777344, -0.0007773637771606445, -0.0005881786346435547, -0.00039899349212646484, -0.000209808349609375, -2.0623207092285156e-05, 0.0001685619354248047, 0.00035774707794189453, 0.0005469322204589844, 0.0007361173629760742, 0.0009253025054931641, 0.001114487648010254, 0.0013036727905273438, 0.0014928579330444336, 0.0016820430755615234, 0.0018712282180786133, 0.002060413360595703, 0.002249598503112793, 0.002438783645629883, 0.0026279687881469727, 0.0028171539306640625, 0.0030063390731811523, 0.003195524215698242, 0.003384709358215332, 0.003573894500732422, 0.0037630796432495117, 0.0039522647857666016, 0.004141449928283691, 0.004330635070800781, 0.004519820213317871, 0.004709005355834961, 0.004898190498352051, 0.005087375640869141, 0.0052765607833862305, 0.00546574592590332, 0.00565493106842041, 0.0058441162109375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 3.0, 4.0, 8.0, 13.0, 10.0, 23.0, 22.0, 27.0, 48.0, 93.0, 136.0, 262.0, 496.0, 1008.0, 1960.0, 4033.0, 9597.0, 28154.0, 139221.0, 738975.0, 88013.0, 21820.0, 7845.0, 3277.0, 1635.0, 805.0, 458.0, 223.0, 109.0, 82.0, 50.0, 32.0, 28.0, 15.0, 16.0, 5.0, 8.0, 9.0, 11.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016326904296875, -0.01580667495727539, -0.015286445617675781, -0.014766216278076172, -0.014245986938476562, -0.013725757598876953, -0.013205528259277344, -0.012685298919677734, -0.012165069580078125, -0.011644840240478516, -0.011124610900878906, -0.010604381561279297, -0.010084152221679688, -0.009563922882080078, -0.009043693542480469, -0.00852346420288086, -0.00800323486328125, -0.007483005523681641, -0.006962776184082031, -0.006442546844482422, -0.0059223175048828125, -0.005402088165283203, -0.004881858825683594, -0.004361629486083984, -0.003841400146484375, -0.0033211708068847656, -0.0028009414672851562, -0.002280712127685547, -0.0017604827880859375, -0.0012402534484863281, -0.0007200241088867188, -0.00019979476928710938, 0.0003204345703125, 0.0008406639099121094, 0.0013608932495117188, 0.0018811225891113281, 0.0024013519287109375, 0.002921581268310547, 0.0034418106079101562, 0.003962039947509766, 0.004482269287109375, 0.005002498626708984, 0.005522727966308594, 0.006042957305908203, 0.0065631866455078125, 0.007083415985107422, 0.007603645324707031, 0.00812387466430664, 0.00864410400390625, 0.00916433334350586, 0.009684562683105469, 0.010204792022705078, 0.010725021362304688, 0.011245250701904297, 0.011765480041503906, 0.012285709381103516, 0.012805938720703125, 0.013326168060302734, 0.013846397399902344, 0.014366626739501953, 0.014886856079101562, 0.015407085418701172, 0.01592731475830078, 0.01644754409790039, 0.0169677734375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 5.0, 7.0, 13.0, 9.0, 11.0, 11.0, 15.0, 14.0, 24.0, 18.0, 12.0, 34.0, 24.0, 29.0, 31.0, 38.0, 37.0, 32.0, 41.0, 39.0, 44.0, 34.0, 33.0, 40.0, 41.0, 33.0, 34.0, 38.0, 28.0, 26.0, 19.0, 35.0, 19.0, 23.0, 19.0, 12.0, 12.0, 12.0, 6.0, 17.0, 8.0, 4.0, 1.0, 7.0, 5.0, 2.0, 2.0, 3.0, 3.0], "bins": [-0.0044403076171875, -0.004319608211517334, -0.004198908805847168, -0.004078209400177002, -0.003957509994506836, -0.00383681058883667, -0.003716111183166504, -0.003595411777496338, -0.003474712371826172, -0.003354012966156006, -0.00323331356048584, -0.003112614154815674, -0.002991914749145508, -0.002871215343475342, -0.0027505159378051758, -0.0026298165321350098, -0.0025091171264648438, -0.0023884177207946777, -0.0022677183151245117, -0.0021470189094543457, -0.0020263195037841797, -0.0019056200981140137, -0.0017849206924438477, -0.0016642212867736816, -0.0015435218811035156, -0.0014228224754333496, -0.0013021230697631836, -0.0011814236640930176, -0.0010607242584228516, -0.0009400248527526855, -0.0008193254470825195, -0.0006986260414123535, -0.0005779266357421875, -0.0004572272300720215, -0.00033652782440185547, -0.00021582841873168945, -9.512901306152344e-05, 2.5570392608642578e-05, 0.0001462697982788086, 0.0002669692039489746, 0.0003876686096191406, 0.0005083680152893066, 0.0006290674209594727, 0.0007497668266296387, 0.0008704662322998047, 0.0009911656379699707, 0.0011118650436401367, 0.0012325644493103027, 0.0013532638549804688, 0.0014739632606506348, 0.0015946626663208008, 0.0017153620719909668, 0.0018360614776611328, 0.001956760883331299, 0.002077460289001465, 0.002198159694671631, 0.002318859100341797, 0.002439558506011963, 0.002560257911682129, 0.002680957317352295, 0.002801656723022461, 0.002922356128692627, 0.003043055534362793, 0.003163754940032959, 0.003284454345703125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 3.0, 6.0, 11.0, 15.0, 15.0, 20.0, 32.0, 43.0, 64.0, 81.0, 129.0, 148.0, 262.0, 365.0, 568.0, 998.0, 1781.0, 3341.0, 7615.0, 21175.0, 122746.0, 814728.0, 49637.0, 13184.0, 5349.0, 2566.0, 1349.0, 806.0, 488.0, 335.0, 184.0, 144.0, 95.0, 73.0, 50.0, 45.0, 32.0, 15.0, 16.0, 7.0, 8.0, 8.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00768280029296875, -0.007458746433258057, -0.007234692573547363, -0.00701063871383667, -0.0067865848541259766, -0.006562530994415283, -0.00633847713470459, -0.0061144232749938965, -0.005890369415283203, -0.00566631555557251, -0.005442261695861816, -0.005218207836151123, -0.00499415397644043, -0.004770100116729736, -0.004546046257019043, -0.00432199239730835, -0.004097938537597656, -0.003873884677886963, -0.0036498308181762695, -0.003425776958465576, -0.003201723098754883, -0.0029776692390441895, -0.002753615379333496, -0.0025295615196228027, -0.0023055076599121094, -0.002081453800201416, -0.0018573999404907227, -0.0016333460807800293, -0.001409292221069336, -0.0011852383613586426, -0.0009611845016479492, -0.0007371306419372559, -0.0005130767822265625, -0.00028902292251586914, -6.496906280517578e-05, 0.00015908479690551758, 0.00038313865661621094, 0.0006071925163269043, 0.0008312463760375977, 0.001055300235748291, 0.0012793540954589844, 0.0015034079551696777, 0.001727461814880371, 0.0019515156745910645, 0.002175569534301758, 0.002399623394012451, 0.0026236772537231445, 0.002847731113433838, 0.0030717849731445312, 0.0032958388328552246, 0.003519892692565918, 0.0037439465522766113, 0.003968000411987305, 0.004192054271697998, 0.004416108131408691, 0.004640161991119385, 0.004864215850830078, 0.0050882697105407715, 0.005312323570251465, 0.005536377429962158, 0.0057604312896728516, 0.005984485149383545, 0.006208539009094238, 0.006432592868804932, 0.006656646728515625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 9.0, 5.0, 7.0, 10.0, 8.0, 11.0, 12.0, 17.0, 33.0, 42.0, 38.0, 63.0, 88.0, 91.0, 144.0, 98.0, 72.0, 66.0, 28.0, 47.0, 33.0, 14.0, 12.0, 7.0, 10.0, 9.0, 8.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.173154830932617e-05, -8.904840797185898e-05, -8.636526763439178e-05, -8.368212729692459e-05, -8.09989869594574e-05, -7.83158466219902e-05, -7.563270628452301e-05, -7.294956594705582e-05, -7.026642560958862e-05, -6.758328527212143e-05, -6.490014493465424e-05, -6.221700459718704e-05, -5.953386425971985e-05, -5.6850723922252655e-05, -5.416758358478546e-05, -5.148444324731827e-05, -4.8801302909851074e-05, -4.611816257238388e-05, -4.343502223491669e-05, -4.0751881897449493e-05, -3.80687415599823e-05, -3.5385601222515106e-05, -3.270246088504791e-05, -3.001932054758072e-05, -2.7336180210113525e-05, -2.4653039872646332e-05, -2.1969899535179138e-05, -1.9286759197711945e-05, -1.660361886024475e-05, -1.3920478522777557e-05, -1.1237338185310364e-05, -8.55419784784317e-06, -5.8710575103759766e-06, -3.187917172908783e-06, -5.047768354415894e-07, 2.1783635020256042e-06, 4.861503839492798e-06, 7.5446441769599915e-06, 1.0227784514427185e-05, 1.2910924851894379e-05, 1.5594065189361572e-05, 1.8277205526828766e-05, 2.096034586429596e-05, 2.3643486201763153e-05, 2.6326626539230347e-05, 2.900976687669754e-05, 3.1692907214164734e-05, 3.437604755163193e-05, 3.705918788909912e-05, 3.9742328226566315e-05, 4.242546856403351e-05, 4.51086089015007e-05, 4.7791749238967896e-05, 5.047488957643509e-05, 5.315802991390228e-05, 5.5841170251369476e-05, 5.852431058883667e-05, 6.120745092630386e-05, 6.389059126377106e-05, 6.657373160123825e-05, 6.925687193870544e-05, 7.194001227617264e-05, 7.462315261363983e-05, 7.730629295110703e-05, 7.998943328857422e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 10.0, 10.0, 8.0, 19.0, 32.0, 41.0, 58.0, 90.0, 157.0, 243.0, 350.0, 543.0, 1002.0, 1847.0, 3590.0, 8068.0, 21541.0, 79196.0, 712926.0, 163849.0, 33031.0, 11521.0, 4788.0, 2443.0, 1269.0, 715.0, 425.0, 273.0, 171.0, 94.0, 68.0, 46.0, 41.0, 22.0, 19.0, 8.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00582122802734375, -0.00561833381652832, -0.005415439605712891, -0.005212545394897461, -0.005009651184082031, -0.0048067569732666016, -0.004603862762451172, -0.004400968551635742, -0.0041980743408203125, -0.003995180130004883, -0.003792285919189453, -0.0035893917083740234, -0.0033864974975585938, -0.003183603286743164, -0.0029807090759277344, -0.0027778148651123047, -0.002574920654296875, -0.0023720264434814453, -0.0021691322326660156, -0.001966238021850586, -0.0017633438110351562, -0.0015604496002197266, -0.0013575553894042969, -0.0011546611785888672, -0.0009517669677734375, -0.0007488727569580078, -0.0005459785461425781, -0.00034308433532714844, -0.00014019012451171875, 6.270408630371094e-05, 0.0002655982971191406, 0.0004684925079345703, 0.00067138671875, 0.0008742809295654297, 0.0010771751403808594, 0.001280069351196289, 0.0014829635620117188, 0.0016858577728271484, 0.0018887519836425781, 0.002091646194458008, 0.0022945404052734375, 0.002497434616088867, 0.002700328826904297, 0.0029032230377197266, 0.0031061172485351562, 0.003309011459350586, 0.0035119056701660156, 0.0037147998809814453, 0.003917694091796875, 0.004120588302612305, 0.004323482513427734, 0.004526376724243164, 0.004729270935058594, 0.0049321651458740234, 0.005135059356689453, 0.005337953567504883, 0.0055408477783203125, 0.005743741989135742, 0.005946636199951172, 0.0061495304107666016, 0.006352424621582031, 0.006555318832397461, 0.006758213043212891, 0.00696110725402832, 0.00716400146484375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 3.0, 6.0, 5.0, 5.0, 8.0, 15.0, 16.0, 15.0, 27.0, 45.0, 34.0, 71.0, 66.0, 130.0, 154.0, 94.0, 72.0, 44.0, 42.0, 25.0, 19.0, 17.0, 15.0, 20.0, 14.0, 6.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0013246536254882812, -0.0012869387865066528, -0.0012492239475250244, -0.001211509108543396, -0.0011737942695617676, -0.0011360794305801392, -0.0010983645915985107, -0.0010606497526168823, -0.001022934913635254, -0.0009852200746536255, -0.0009475052356719971, -0.0009097903966903687, -0.0008720755577087402, -0.0008343607187271118, -0.0007966458797454834, -0.000758931040763855, -0.0007212162017822266, -0.0006835013628005981, -0.0006457865238189697, -0.0006080716848373413, -0.0005703568458557129, -0.0005326420068740845, -0.0004949271678924561, -0.00045721232891082764, -0.0004194974899291992, -0.0003817826509475708, -0.0003440678119659424, -0.00030635297298431396, -0.00026863813400268555, -0.00023092329502105713, -0.0001932084560394287, -0.0001554936170578003, -0.00011777877807617188, -8.006393909454346e-05, -4.234910011291504e-05, -4.634261131286621e-06, 3.30805778503418e-05, 7.079541683197021e-05, 0.00010851025581359863, 0.00014622509479522705, 0.00018393993377685547, 0.0002216547727584839, 0.0002593696117401123, 0.0002970844507217407, 0.00033479928970336914, 0.00037251412868499756, 0.000410228967666626, 0.0004479438066482544, 0.0004856586456298828, 0.0005233734846115112, 0.0005610883235931396, 0.0005988031625747681, 0.0006365180015563965, 0.0006742328405380249, 0.0007119476795196533, 0.0007496625185012817, 0.0007873773574829102, 0.0008250921964645386, 0.000862807035446167, 0.0009005218744277954, 0.0009382367134094238, 0.0009759515523910522, 0.0010136663913726807, 0.001051381230354309, 0.0010890960693359375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 6.0, 5.0, 11.0, 4.0, 19.0, 12.0, 16.0, 25.0, 25.0, 36.0, 37.0, 36.0, 72.0, 102.0, 126.0, 121.0, 51.0, 45.0, 50.0, 26.0, 31.0, 14.0, 15.0, 17.0, 19.0, 12.0, 8.0, 11.0, 3.0, 8.0, 2.0, 5.0, 3.0, 1.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.006300482898950577, -0.006079658400267363, -0.005858833901584148, -0.005638009402900934, -0.00541718490421772, -0.005196360405534506, -0.004975535906851292, -0.0047547114081680775, -0.004533886909484863, -0.004313062410801649, -0.004092237912118435, -0.0038714134134352207, -0.0036505889147520065, -0.0034297644160687923, -0.003208939917385578, -0.002988115418702364, -0.002767290687188506, -0.002546466188505292, -0.0023256416898220778, -0.0021048171911388636, -0.0018839926924556494, -0.0016631680773571134, -0.0014423435786738992, -0.001221519079990685, -0.0010006945813074708, -0.0007798700826242566, -0.0005590455839410424, -0.0003382210270501673, -0.00011739652836695313, 0.00010342802852392197, 0.00032425252720713615, 0.0005450770258903503, 0.0007659015245735645, 0.0009867260232567787, 0.001207550521939993, 0.001428375020623207, 0.0016491995193064213, 0.0018700241344049573, 0.0020908485166728497, 0.002311673015356064, 0.002532497514039278, 0.0027533220127224922, 0.0029741465114057064, 0.0031949710100889206, 0.0034157955087721348, 0.003636620007455349, 0.003857444506138563, 0.004078269004821777, 0.004299093969166279, 0.004519918467849493, 0.004740742966532707, 0.004961567465215921, 0.005182391963899136, 0.00540321646258235, 0.005624040961265564, 0.005844865459948778, 0.006065689958631992, 0.0062865144573152065, 0.006507338955998421, 0.006728163454681635, 0.006948987953364849, 0.007169812452048063, 0.0073906369507312775, 0.007611461449414492, 0.007832285948097706]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 7.0, 11.0, 6.0, 12.0, 11.0, 20.0, 23.0, 29.0, 32.0, 27.0, 27.0, 23.0, 32.0, 31.0, 42.0, 34.0, 43.0, 45.0, 49.0, 52.0, 43.0, 35.0, 44.0, 38.0, 40.0, 29.0, 33.0, 24.0, 27.0, 19.0, 16.0, 19.0, 14.0, 12.0, 13.0, 9.0, 3.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005949061363935471, -0.0057600741274654865, -0.0055710868909955025, -0.005382099654525518, -0.005193112418055534, -0.005004124715924263, -0.004815137479454279, -0.004626150242984295, -0.004437163006514311, -0.004248175770044327, -0.004059188533574343, -0.003870201064273715, -0.003681213827803731, -0.003492226591333747, -0.003303239122033119, -0.003114251885563135, -0.002925264649093151, -0.002736277412623167, -0.002547290176153183, -0.0023583027068525553, -0.0021693154703825712, -0.001980328233912587, -0.0017913408810272813, -0.0016023535281419754, -0.0014133662916719913, -0.0012243790552020073, -0.0010353917023167014, -0.0008464044076390564, -0.0006574171129614115, -0.0004684298182837665, -0.00027944252360612154, -9.045517072081566e-05, 9.853160008788109e-05, 0.00028751889476552606, 0.000476506189443171, 0.000665493484120816, 0.000854480778798461, 0.001043468015268445, 0.001232455368153751, 0.0014214427210390568, 0.0016104299575090408, 0.0017994171939790249, 0.001988404430449009, 0.0021773918997496367, 0.0023663791362196207, 0.0025553663726896048, 0.0027443538419902325, 0.0029333410784602165, 0.0031223283149302006, 0.0033113155514001846, 0.0035003027878701687, 0.0036892902571707964, 0.0038782774936407804, 0.004067264962941408, 0.004256252199411392, 0.004445239435881376, 0.00463422667235136, 0.004823213908821344, 0.005012201145291328, 0.0052011883817613125, 0.0053901756182312965, 0.005579163320362568, 0.005768150556832552, 0.005957137793302536, 0.00614612502977252]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 9.0, 6.0, 10.0, 6.0, 5.0, 23.0, 24.0, 40.0, 90.0, 119.0, 224.0, 506.0, 1038.0, 2303.0, 5253.0, 12191.0, 29836.0, 79124.0, 285865.0, 450126.0, 112837.0, 40219.0, 16246.0, 6771.0, 3049.0, 1327.0, 614.0, 281.0, 144.0, 99.0, 49.0, 26.0, 16.0, 19.0, 11.0, 10.0, 8.0, 4.0, 7.0, 4.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0186920166015625, -0.01802825927734375, -0.017364501953125, -0.01670074462890625, -0.0160369873046875, -0.01537322998046875, -0.01470947265625, -0.01404571533203125, -0.0133819580078125, -0.01271820068359375, -0.012054443359375, -0.01139068603515625, -0.0107269287109375, -0.01006317138671875, -0.0093994140625, -0.00873565673828125, -0.0080718994140625, -0.00740814208984375, -0.006744384765625, -0.00608062744140625, -0.0054168701171875, -0.00475311279296875, -0.00408935546875, -0.00342559814453125, -0.0027618408203125, -0.00209808349609375, -0.001434326171875, -0.00077056884765625, -0.0001068115234375, 0.00055694580078125, 0.001220703125, 0.00188446044921875, 0.0025482177734375, 0.00321197509765625, 0.003875732421875, 0.00453948974609375, 0.0052032470703125, 0.00586700439453125, 0.00653076171875, 0.00719451904296875, 0.0078582763671875, 0.00852203369140625, 0.009185791015625, 0.00984954833984375, 0.0105133056640625, 0.01117706298828125, 0.0118408203125, 0.01250457763671875, 0.0131683349609375, 0.01383209228515625, 0.014495849609375, 0.01515960693359375, 0.0158233642578125, 0.01648712158203125, 0.01715087890625, 0.01781463623046875, 0.0184783935546875, 0.01914215087890625, 0.019805908203125, 0.02046966552734375, 0.0211334228515625, 0.02179718017578125, 0.0224609375, 0.02312469482421875, 0.0237884521484375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 4.0, 6.0, 11.0, 15.0, 17.0, 21.0, 27.0, 42.0, 45.0, 42.0, 45.0, 58.0, 52.0, 75.0, 69.0, 72.0, 59.0, 58.0, 55.0, 46.0, 46.0, 35.0, 21.0, 30.0, 20.0, 14.0, 6.0, 7.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036792755126953125, -0.00350835919380188, -0.0033374428749084473, -0.0031665265560150146, -0.002995610237121582, -0.0028246939182281494, -0.002653777599334717, -0.002482861280441284, -0.0023119449615478516, -0.002141028642654419, -0.0019701123237609863, -0.0017991960048675537, -0.001628279685974121, -0.0014573633670806885, -0.0012864470481872559, -0.0011155307292938232, -0.0009446144104003906, -0.000773698091506958, -0.0006027817726135254, -0.0004318654537200928, -0.00026094913482666016, -9.003281593322754e-05, 8.088350296020508e-05, 0.0002517998218536377, 0.0004227161407470703, 0.0005936324596405029, 0.0007645487785339355, 0.0009354650974273682, 0.0011063814163208008, 0.0012772977352142334, 0.001448214054107666, 0.0016191303730010986, 0.0017900466918945312, 0.001960963010787964, 0.0021318793296813965, 0.002302795648574829, 0.0024737119674682617, 0.0026446282863616943, 0.002815544605255127, 0.0029864609241485596, 0.003157377243041992, 0.003328293561935425, 0.0034992098808288574, 0.00367012619972229, 0.0038410425186157227, 0.004011958837509155, 0.004182875156402588, 0.0043537914752960205, 0.004524707794189453, 0.004695624113082886, 0.004866540431976318, 0.005037456750869751, 0.005208373069763184, 0.005379289388656616, 0.005550205707550049, 0.0057211220264434814, 0.005892038345336914, 0.006062954664230347, 0.006233870983123779, 0.006404787302017212, 0.0065757036209106445, 0.006746619939804077, 0.00691753625869751, 0.007088452577590942, 0.007259368896484375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 12.0, 6.0, 6.0, 14.0, 25.0, 33.0, 39.0, 45.0, 86.0, 120.0, 185.0, 278.0, 460.0, 829.0, 1491.0, 2565.0, 4677.0, 8420.0, 15234.0, 28038.0, 56936.0, 132177.0, 366067.0, 248124.0, 91164.0, 42325.0, 22084.0, 11862.0, 6630.0, 3651.0, 2041.0, 1144.0, 698.0, 391.0, 234.0, 146.0, 104.0, 58.0, 40.0, 28.0, 24.0, 16.0, 14.0, 8.0, 8.0, 5.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.011322021484375, -0.01095438003540039, -0.010586738586425781, -0.010219097137451172, -0.009851455688476562, -0.009483814239501953, -0.009116172790527344, -0.008748531341552734, -0.008380889892578125, -0.008013248443603516, -0.007645606994628906, -0.007277965545654297, -0.0069103240966796875, -0.006542682647705078, -0.006175041198730469, -0.005807399749755859, -0.00543975830078125, -0.005072116851806641, -0.004704475402832031, -0.004336833953857422, -0.0039691925048828125, -0.003601551055908203, -0.0032339096069335938, -0.0028662681579589844, -0.002498626708984375, -0.0021309852600097656, -0.0017633438110351562, -0.0013957023620605469, -0.0010280609130859375, -0.0006604194641113281, -0.00029277801513671875, 7.486343383789062e-05, 0.0004425048828125, 0.0008101463317871094, 0.0011777877807617188, 0.0015454292297363281, 0.0019130706787109375, 0.002280712127685547, 0.0026483535766601562, 0.0030159950256347656, 0.003383636474609375, 0.0037512779235839844, 0.004118919372558594, 0.004486560821533203, 0.0048542022705078125, 0.005221843719482422, 0.005589485168457031, 0.005957126617431641, 0.00632476806640625, 0.006692409515380859, 0.007060050964355469, 0.007427692413330078, 0.0077953338623046875, 0.008162975311279297, 0.008530616760253906, 0.008898258209228516, 0.009265899658203125, 0.009633541107177734, 0.010001182556152344, 0.010368824005126953, 0.010736465454101562, 0.011104106903076172, 0.011471748352050781, 0.01183938980102539, 0.01220703125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 1.0, 6.0, 7.0, 7.0, 6.0, 13.0, 10.0, 15.0, 13.0, 19.0, 26.0, 28.0, 25.0, 23.0, 21.0, 30.0, 27.0, 57.0, 30.0, 36.0, 52.0, 32.0, 37.0, 40.0, 46.0, 29.0, 46.0, 38.0, 28.0, 42.0, 30.0, 24.0, 20.0, 23.0, 15.0, 13.0, 14.0, 16.0, 21.0, 10.0, 6.0, 4.0, 4.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.003070831298828125, -0.0029787421226501465, -0.002886652946472168, -0.0027945637702941895, -0.002702474594116211, -0.0026103854179382324, -0.002518296241760254, -0.0024262070655822754, -0.002334117889404297, -0.0022420287132263184, -0.00214993953704834, -0.0020578503608703613, -0.001965761184692383, -0.0018736720085144043, -0.0017815828323364258, -0.0016894936561584473, -0.0015974044799804688, -0.0015053153038024902, -0.0014132261276245117, -0.0013211369514465332, -0.0012290477752685547, -0.0011369585990905762, -0.0010448694229125977, -0.0009527802467346191, -0.0008606910705566406, -0.0007686018943786621, -0.0006765127182006836, -0.0005844235420227051, -0.0004923343658447266, -0.00040024518966674805, -0.00030815601348876953, -0.00021606683731079102, -0.0001239776611328125, -3.1888484954833984e-05, 6.020069122314453e-05, 0.00015228986740112305, 0.00024437904357910156, 0.0003364682197570801, 0.0004285573959350586, 0.0005206465721130371, 0.0006127357482910156, 0.0007048249244689941, 0.0007969141006469727, 0.0008890032768249512, 0.0009810924530029297, 0.0010731816291809082, 0.0011652708053588867, 0.0012573599815368652, 0.0013494491577148438, 0.0014415383338928223, 0.0015336275100708008, 0.0016257166862487793, 0.0017178058624267578, 0.0018098950386047363, 0.0019019842147827148, 0.0019940733909606934, 0.002086162567138672, 0.0021782517433166504, 0.002270340919494629, 0.0023624300956726074, 0.002454519271850586, 0.0025466084480285645, 0.002638697624206543, 0.0027307868003845215, 0.0028228759765625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 7.0, 19.0, 17.0, 18.0, 44.0, 62.0, 104.0, 149.0, 243.0, 399.0, 687.0, 1340.0, 2631.0, 5991.0, 16242.0, 61136.0, 594697.0, 300237.0, 42353.0, 12342.0, 4840.0, 2219.0, 1123.0, 642.0, 379.0, 224.0, 141.0, 84.0, 65.0, 29.0, 27.0, 19.0, 9.0, 12.0, 9.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003802776336669922, -0.00036967918276786804, -0.0003590807318687439, -0.00034848228096961975, -0.0003378838300704956, -0.00032728537917137146, -0.0003166869282722473, -0.00030608847737312317, -0.000295490026473999, -0.0002848915755748749, -0.00027429312467575073, -0.0002636946737766266, -0.00025309622287750244, -0.0002424977719783783, -0.00023189932107925415, -0.00022130087018013, -0.00021070241928100586, -0.00020010396838188171, -0.00018950551748275757, -0.00017890706658363342, -0.00016830861568450928, -0.00015771016478538513, -0.00014711171388626099, -0.00013651326298713684, -0.0001259148120880127, -0.00011531636118888855, -0.0001047179102897644, -9.411945939064026e-05, -8.352100849151611e-05, -7.292255759239197e-05, -6.232410669326782e-05, -5.172565579414368e-05, -4.112720489501953e-05, -3.0528753995895386e-05, -1.993030309677124e-05, -9.331852197647095e-06, 1.2665987014770508e-06, 1.1865049600601196e-05, 2.2463500499725342e-05, 3.306195139884949e-05, 4.366040229797363e-05, 5.425885319709778e-05, 6.485730409622192e-05, 7.545575499534607e-05, 8.605420589447021e-05, 9.665265679359436e-05, 0.0001072511076927185, 0.00011784955859184265, 0.0001284480094909668, 0.00013904646039009094, 0.0001496449112892151, 0.00016024336218833923, 0.00017084181308746338, 0.00018144026398658752, 0.00019203871488571167, 0.00020263716578483582, 0.00021323561668395996, 0.0002238340675830841, 0.00023443251848220825, 0.0002450309693813324, 0.00025562942028045654, 0.0002662278711795807, 0.00027682632207870483, 0.000287424772977829, 0.0002980232238769531]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 6.0, 13.0, 8.0, 17.0, 15.0, 24.0, 52.0, 83.0, 150.0, 179.0, 165.0, 119.0, 45.0, 31.0, 16.0, 15.0, 9.0, 11.0, 10.0, 6.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0609626770019531e-05, -1.027621328830719e-05, -9.942799806594849e-06, -9.609386324882507e-06, -9.275972843170166e-06, -8.942559361457825e-06, -8.609145879745483e-06, -8.275732398033142e-06, -7.9423189163208e-06, -7.6089054346084595e-06, -7.275491952896118e-06, -6.942078471183777e-06, -6.6086649894714355e-06, -6.275251507759094e-06, -5.941838026046753e-06, -5.608424544334412e-06, -5.27501106262207e-06, -4.941597580909729e-06, -4.608184099197388e-06, -4.274770617485046e-06, -3.941357135772705e-06, -3.6079436540603638e-06, -3.2745301723480225e-06, -2.941116690635681e-06, -2.60770320892334e-06, -2.2742897272109985e-06, -1.9408762454986572e-06, -1.607462763786316e-06, -1.2740492820739746e-06, -9.406358003616333e-07, -6.07222318649292e-07, -2.738088369369507e-07, 5.960464477539063e-08, 3.9301812648773193e-07, 7.264316082000732e-07, 1.0598450899124146e-06, 1.3932585716247559e-06, 1.7266720533370972e-06, 2.0600855350494385e-06, 2.3934990167617798e-06, 2.726912498474121e-06, 3.0603259801864624e-06, 3.3937394618988037e-06, 3.727152943611145e-06, 4.060566425323486e-06, 4.393979907035828e-06, 4.727393388748169e-06, 5.06080687046051e-06, 5.3942203521728516e-06, 5.727633833885193e-06, 6.061047315597534e-06, 6.3944607973098755e-06, 6.727874279022217e-06, 7.061287760734558e-06, 7.394701242446899e-06, 7.72811472415924e-06, 8.061528205871582e-06, 8.394941687583923e-06, 8.728355169296265e-06, 9.061768651008606e-06, 9.395182132720947e-06, 9.728595614433289e-06, 1.006200909614563e-05, 1.0395422577857971e-05, 1.0728836059570312e-05]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 7.0, 14.0, 14.0, 23.0, 37.0, 42.0, 89.0, 122.0, 210.0, 323.0, 564.0, 800.0, 1425.0, 2722.0, 4904.0, 9866.0, 20594.0, 44051.0, 115068.0, 395280.0, 292340.0, 88302.0, 36718.0, 17005.0, 8234.0, 4305.0, 2289.0, 1284.0, 743.0, 439.0, 281.0, 165.0, 97.0, 69.0, 30.0, 33.0, 13.0, 11.0, 12.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.89897346496582e-05, -8.590798825025558e-05, -8.282624185085297e-05, -7.974449545145035e-05, -7.666274905204773e-05, -7.358100265264511e-05, -7.049925625324249e-05, -6.741750985383987e-05, -6.433576345443726e-05, -6.125401705503464e-05, -5.817227065563202e-05, -5.50905242562294e-05, -5.200877785682678e-05, -4.8927031457424164e-05, -4.5845285058021545e-05, -4.276353865861893e-05, -3.968179225921631e-05, -3.660004585981369e-05, -3.351829946041107e-05, -3.0436553061008453e-05, -2.7354806661605835e-05, -2.4273060262203217e-05, -2.1191313862800598e-05, -1.810956746339798e-05, -1.5027821063995361e-05, -1.1946074664592743e-05, -8.864328265190125e-06, -5.782581865787506e-06, -2.7008354663848877e-06, 3.809109330177307e-07, 3.462657332420349e-06, 6.5444037318229675e-06, 9.626150131225586e-06, 1.2707896530628204e-05, 1.5789642930030823e-05, 1.887138932943344e-05, 2.195313572883606e-05, 2.5034882128238678e-05, 2.8116628527641296e-05, 3.1198374927043915e-05, 3.428012132644653e-05, 3.736186772584915e-05, 4.044361412525177e-05, 4.352536052465439e-05, 4.660710692405701e-05, 4.9688853323459625e-05, 5.2770599722862244e-05, 5.585234612226486e-05, 5.893409252166748e-05, 6.20158389210701e-05, 6.509758532047272e-05, 6.817933171987534e-05, 7.126107811927795e-05, 7.434282451868057e-05, 7.742457091808319e-05, 8.050631731748581e-05, 8.358806371688843e-05, 8.666981011629105e-05, 8.975155651569366e-05, 9.283330291509628e-05, 9.59150493144989e-05, 9.899679571390152e-05, 0.00010207854211330414, 0.00010516028851270676, 0.00010824203491210938]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 0.0, 3.0, 7.0, 11.0, 11.0, 18.0, 18.0, 16.0, 21.0, 32.0, 31.0, 40.0, 44.0, 49.0, 44.0, 45.0, 47.0, 53.0, 51.0, 61.0, 57.0, 49.0, 41.0, 48.0, 29.0, 31.0, 22.0, 25.0, 22.0, 21.0, 11.0, 14.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.765655517578125e-05, -2.6845373213291168e-05, -2.6034191250801086e-05, -2.5223009288311005e-05, -2.4411827325820923e-05, -2.360064536333084e-05, -2.278946340084076e-05, -2.1978281438350677e-05, -2.1167099475860596e-05, -2.0355917513370514e-05, -1.9544735550880432e-05, -1.873355358839035e-05, -1.792237162590027e-05, -1.7111189663410187e-05, -1.6300007700920105e-05, -1.5488825738430023e-05, -1.4677643775939941e-05, -1.386646181344986e-05, -1.3055279850959778e-05, -1.2244097888469696e-05, -1.1432915925979614e-05, -1.0621733963489532e-05, -9.81055200099945e-06, -8.999370038509369e-06, -8.188188076019287e-06, -7.377006113529205e-06, -6.5658241510391235e-06, -5.754642188549042e-06, -4.94346022605896e-06, -4.132278263568878e-06, -3.3210963010787964e-06, -2.5099143385887146e-06, -1.6987323760986328e-06, -8.87550413608551e-07, -7.636845111846924e-08, 7.348135113716125e-07, 1.5459954738616943e-06, 2.357177436351776e-06, 3.168359398841858e-06, 3.97954136133194e-06, 4.7907233238220215e-06, 5.601905286312103e-06, 6.413087248802185e-06, 7.224269211292267e-06, 8.035451173782349e-06, 8.84663313627243e-06, 9.657815098762512e-06, 1.0468997061252594e-05, 1.1280179023742676e-05, 1.2091360986232758e-05, 1.290254294872284e-05, 1.3713724911212921e-05, 1.4524906873703003e-05, 1.5336088836193085e-05, 1.6147270798683167e-05, 1.6958452761173248e-05, 1.776963472366333e-05, 1.8580816686153412e-05, 1.9391998648643494e-05, 2.0203180611133575e-05, 2.1014362573623657e-05, 2.182554453611374e-05, 2.263672649860382e-05, 2.3447908461093903e-05, 2.4259090423583984e-05]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 8.0, 4.0, 9.0, 8.0, 13.0, 13.0, 24.0, 34.0, 55.0, 86.0, 150.0, 198.0, 114.0, 78.0, 68.0, 43.0, 32.0, 16.0, 11.0, 14.0, 8.0, 6.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00774313835427165, -0.007481791079044342, -0.007220443803817034, -0.0069590965285897255, -0.0066977497190237045, -0.006436402443796396, -0.006175055168569088, -0.00591370789334178, -0.0056523606181144714, -0.005391013342887163, -0.005129666067659855, -0.004868319258093834, -0.004606971982866526, -0.004345624707639217, -0.004084277432411909, -0.003822930157184601, -0.00356158334761858, -0.0033002360723912716, -0.003038889029994607, -0.0027775417547672987, -0.002516194712370634, -0.002254847437143326, -0.0019935001619160175, -0.001732153003104031, -0.0014708058442920446, -0.0012094586854800582, -0.0009481114684604108, -0.0006867642514407635, -0.00042541709262877703, -0.00016406993381679058, 9.727734141051769e-05, 0.00035862450022250414, 0.0006199721246957779, 0.0008813192835077643, 0.0011426664423197508, 0.001404013717547059, 0.0016653608763590455, 0.001926708035171032, 0.0021880553103983402, 0.0024494025856256485, 0.002710749628022313, 0.0029720969032496214, 0.003233443945646286, 0.0034947912208735943, 0.0037561384961009026, 0.0040174853056669235, 0.004278833046555519, 0.00454017985612154, 0.004801527131348848, 0.005062874406576157, 0.005324221681803465, 0.005585568957030773, 0.005846915766596794, 0.006108263041824102, 0.006369610317051411, 0.006630957592278719, 0.006892304867506027, 0.0071536521427333355, 0.007414999417960644, 0.007676346227526665, 0.00793769396841526, 0.008199040777981281, 0.008460387587547302, 0.008721735328435898, 0.008983082138001919]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 9.0, 7.0, 16.0, 14.0, 12.0, 26.0, 22.0, 33.0, 27.0, 39.0, 46.0, 44.0, 33.0, 47.0, 46.0, 55.0, 65.0, 54.0, 57.0, 51.0, 36.0, 45.0, 24.0, 33.0, 34.0, 24.0, 27.0, 22.0, 13.0, 9.0, 14.0, 6.0, 6.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004100169986486435, -0.003943602554500103, -0.0037870346568524837, -0.003630466992035508, -0.0034738993272185326, -0.0033173318952322006, -0.003160764230415225, -0.0030041965655982494, -0.002847628900781274, -0.0026910612359642982, -0.0025344935711473227, -0.002377925906330347, -0.002221358474344015, -0.002064790576696396, -0.001908223144710064, -0.0017516554798930883, -0.0015950878150761127, -0.0014385201502591372, -0.0012819524854421616, -0.0011253849370405078, -0.0009688172722235322, -0.0008122496074065566, -0.0006556820007972419, -0.0004991143941879272, -0.00034254672937095165, -0.00018597909365780652, -2.941145794466138e-05, 0.00012715617776848376, 0.0002837238134816289, 0.0004402914782986045, 0.0005968590849079192, 0.0007534266915172338, 0.0009099938906729221, 0.0010665615554898977, 0.0012231292203068733, 0.001379696768708527, 0.0015362644335255027, 0.0016928320983424783, 0.001849399646744132, 0.0020059673115611076, 0.0021625349763780832, 0.002319102641195059, 0.0024756703060120344, 0.00263223797082901, 0.002788805402815342, 0.002945373300462961, 0.003101940732449293, 0.0032585083972662687, 0.0034150760620832443, 0.00357164372690022, 0.0037282113917171955, 0.003884779056534171, 0.004041346721351147, 0.004197914153337479, 0.004354482050985098, 0.00451104948297143, 0.004667617380619049, 0.004824184812605381, 0.004980752710253, 0.005137320142239332, 0.0052938880398869514, 0.005450455471873283, 0.005607023369520903, 0.005763590801507235, 0.0059201582334935665]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 7.0, 11.0, 16.0, 20.0, 16.0, 25.0, 54.0, 74.0, 94.0, 126.0, 180.0, 346.0, 509.0, 857.0, 1644.0, 3172.0, 7365.0, 136878.0, 4019068.0, 14078.0, 4481.0, 2256.0, 1123.0, 685.0, 387.0, 268.0, 134.0, 133.0, 82.0, 47.0, 34.0, 17.0, 25.0, 21.0, 11.0, 11.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01446533203125, -0.01397085189819336, -0.013476371765136719, -0.012981891632080078, -0.012487411499023438, -0.011992931365966797, -0.011498451232910156, -0.011003971099853516, -0.010509490966796875, -0.010015010833740234, -0.009520530700683594, -0.009026050567626953, -0.008531570434570312, -0.008037090301513672, -0.007542610168457031, -0.007048130035400391, -0.00655364990234375, -0.006059169769287109, -0.005564689636230469, -0.005070209503173828, -0.0045757293701171875, -0.004081249237060547, -0.0035867691040039062, -0.0030922889709472656, -0.002597808837890625, -0.0021033287048339844, -0.0016088485717773438, -0.0011143684387207031, -0.0006198883056640625, -0.00012540817260742188, 0.00036907196044921875, 0.0008635520935058594, 0.0013580322265625, 0.0018525123596191406, 0.0023469924926757812, 0.002841472625732422, 0.0033359527587890625, 0.003830432891845703, 0.004324913024902344, 0.004819393157958984, 0.005313873291015625, 0.005808353424072266, 0.006302833557128906, 0.006797313690185547, 0.0072917938232421875, 0.007786273956298828, 0.008280754089355469, 0.00877523422241211, 0.00926971435546875, 0.00976419448852539, 0.010258674621582031, 0.010753154754638672, 0.011247634887695312, 0.011742115020751953, 0.012236595153808594, 0.012731075286865234, 0.013225555419921875, 0.013720035552978516, 0.014214515686035156, 0.014708995819091797, 0.015203475952148438, 0.015697956085205078, 0.01619243621826172, 0.01668691635131836, 0.017181396484375]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 5.0, 5.0, 6.0, 6.0, 9.0, 11.0, 18.0, 19.0, 20.0, 22.0, 25.0, 39.0, 35.0, 37.0, 30.0, 42.0, 48.0, 45.0, 54.0, 58.0, 55.0, 47.0, 48.0, 41.0, 42.0, 40.0, 30.0, 21.0, 31.0, 22.0, 17.0, 11.0, 15.0, 18.0, 5.0, 6.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002941131591796875, -0.002840965986251831, -0.002740800380706787, -0.002640634775161743, -0.0025404691696166992, -0.0024403035640716553, -0.0023401379585266113, -0.0022399723529815674, -0.0021398067474365234, -0.0020396411418914795, -0.0019394755363464355, -0.0018393099308013916, -0.0017391443252563477, -0.0016389787197113037, -0.0015388131141662598, -0.0014386475086212158, -0.0013384819030761719, -0.001238316297531128, -0.001138150691986084, -0.00103798508644104, -0.0009378194808959961, -0.0008376538753509521, -0.0007374882698059082, -0.0006373226642608643, -0.0005371570587158203, -0.00043699145317077637, -0.0003368258476257324, -0.00023666024208068848, -0.00013649463653564453, -3.6329030990600586e-05, 6.383657455444336e-05, 0.0001640021800994873, 0.00026416778564453125, 0.0003643333911895752, 0.00046449899673461914, 0.0005646646022796631, 0.000664830207824707, 0.000764995813369751, 0.0008651614189147949, 0.0009653270244598389, 0.0010654926300048828, 0.0011656582355499268, 0.0012658238410949707, 0.0013659894466400146, 0.0014661550521850586, 0.0015663206577301025, 0.0016664862632751465, 0.0017666518688201904, 0.0018668174743652344, 0.0019669830799102783, 0.0020671486854553223, 0.002167314291000366, 0.00226747989654541, 0.002367645502090454, 0.002467811107635498, 0.002567976713180542, 0.002668142318725586, 0.00276830792427063, 0.002868473529815674, 0.0029686391353607178, 0.0030688047409057617, 0.0031689703464508057, 0.0032691359519958496, 0.0033693015575408936, 0.0034694671630859375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 3.0, 3.0, 9.0, 13.0, 16.0, 20.0, 28.0, 34.0, 52.0, 92.0, 143.0, 303.0, 663.0, 1698.0, 5041.0, 22910.0, 4055665.0, 94294.0, 8670.0, 2673.0, 1005.0, 425.0, 215.0, 121.0, 66.0, 28.0, 34.0, 17.0, 18.0, 10.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169830322265625, -0.016322612762451172, -0.015662193298339844, -0.015001773834228516, -0.014341354370117188, -0.01368093490600586, -0.013020515441894531, -0.012360095977783203, -0.011699676513671875, -0.011039257049560547, -0.010378837585449219, -0.00971841812133789, -0.009057998657226562, -0.008397579193115234, -0.007737159729003906, -0.007076740264892578, -0.00641632080078125, -0.005755901336669922, -0.005095481872558594, -0.004435062408447266, -0.0037746429443359375, -0.0031142234802246094, -0.0024538040161132812, -0.0017933845520019531, -0.001132965087890625, -0.0004725456237792969, 0.00018787384033203125, 0.0008482933044433594, 0.0015087127685546875, 0.0021691322326660156, 0.0028295516967773438, 0.003489971160888672, 0.004150390625, 0.004810810089111328, 0.005471229553222656, 0.006131649017333984, 0.0067920684814453125, 0.007452487945556641, 0.008112907409667969, 0.008773326873779297, 0.009433746337890625, 0.010094165802001953, 0.010754585266113281, 0.01141500473022461, 0.012075424194335938, 0.012735843658447266, 0.013396263122558594, 0.014056682586669922, 0.01471710205078125, 0.015377521514892578, 0.016037940979003906, 0.016698360443115234, 0.017358779907226562, 0.01801919937133789, 0.01867961883544922, 0.019340038299560547, 0.020000457763671875, 0.020660877227783203, 0.02132129669189453, 0.02198171615600586, 0.022642135620117188, 0.023302555084228516, 0.023962974548339844, 0.024623394012451172, 0.0252838134765625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 9.0, 11.0, 8.0, 21.0, 92.0, 405.0, 2888.0, 438.0, 109.0, 25.0, 20.0, 9.0, 7.0, 4.0, 7.0, 2.0, 4.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00446319580078125, -0.004362955689430237, -0.004262715578079224, -0.0041624754667282104, -0.004062235355377197, -0.003961995244026184, -0.003861755132675171, -0.0037615150213241577, -0.0036612749099731445, -0.0035610347986221313, -0.003460794687271118, -0.003360554575920105, -0.003260314464569092, -0.0031600743532180786, -0.0030598342418670654, -0.0029595941305160522, -0.002859354019165039, -0.002759113907814026, -0.0026588737964630127, -0.0025586336851119995, -0.0024583935737609863, -0.002358153462409973, -0.00225791335105896, -0.0021576732397079468, -0.0020574331283569336, -0.0019571930170059204, -0.0018569529056549072, -0.001756712794303894, -0.0016564726829528809, -0.0015562325716018677, -0.0014559924602508545, -0.0013557523488998413, -0.0012555122375488281, -0.001155272126197815, -0.0010550320148468018, -0.0009547919034957886, -0.0008545517921447754, -0.0007543116807937622, -0.000654071569442749, -0.0005538314580917358, -0.00045359134674072266, -0.00035335123538970947, -0.0002531111240386963, -0.0001528710126876831, -5.263090133666992e-05, 4.760921001434326e-05, 0.00014784932136535645, 0.00024808943271636963, 0.0003483295440673828, 0.000448569655418396, 0.0005488097667694092, 0.0006490498781204224, 0.0007492899894714355, 0.0008495301008224487, 0.0009497702121734619, 0.001050010323524475, 0.0011502504348754883, 0.0012504905462265015, 0.0013507306575775146, 0.0014509707689285278, 0.001551210880279541, 0.0016514509916305542, 0.0017516911029815674, 0.0018519312143325806, 0.0019521713256835938]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 1.0, 5.0, 6.0, 7.0, 7.0, 25.0, 27.0, 21.0, 37.0, 50.0, 59.0, 127.0, 166.0, 157.0, 90.0, 53.0, 38.0, 27.0, 26.0, 14.0, 16.0, 8.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004850286990404129, -0.004687699489295483, -0.004525111988186836, -0.004362524952739477, -0.004199937451630831, -0.004037349950522184, -0.003874762449413538, -0.0037121749483048916, -0.003549587680026889, -0.0033870001789182425, -0.0032244129106402397, -0.0030618254095315933, -0.002899237908422947, -0.002736650640144944, -0.002574063139036298, -0.002411475870758295, -0.0022488883696496487, -0.0020863008685410023, -0.0019237136002629995, -0.0017611260991543531, -0.0015985387144610286, -0.001435951329767704, -0.0012733638286590576, -0.001110776443965733, -0.0009481890592724085, -0.0007856016745790839, -0.0006230142316780984, -0.0004604268178809434, -0.0002978394040837884, -0.00013525201939046383, 2.733542351052165e-05, 0.00018992286641150713, 0.0003525097854435444, 0.000515097170136869, 0.0006776846130378544, 0.0008402720559388399, 0.0010028594406321645, 0.001165446825325489, 0.0013280343264341354, 0.00149062171112746, 0.0016532090958207846, 0.0018157964805141091, 0.0019783838652074337, 0.00214097136631608, 0.0023035588674247265, 0.0024661461357027292, 0.0026287336368113756, 0.0027913209050893784, 0.0029539084061980247, 0.003116495907306671, 0.003279083175584674, 0.0034416706766933203, 0.003604257944971323, 0.0037668454460799694, 0.003929432947188616, 0.004092020448297262, 0.004254607483744621, 0.004417194984853268, 0.004579782485961914, 0.004742369521409273, 0.0049049570225179195, 0.005067544523626566, 0.005230132024735212, 0.005392719525843859, 0.005555307026952505]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 6.0, 9.0, 12.0, 5.0, 7.0, 17.0, 18.0, 17.0, 12.0, 27.0, 28.0, 30.0, 21.0, 33.0, 36.0, 29.0, 24.0, 35.0, 36.0, 35.0, 41.0, 37.0, 36.0, 40.0, 30.0, 38.0, 29.0, 25.0, 28.0, 24.0, 26.0, 18.0, 15.0, 29.0, 15.0, 20.0, 14.0, 15.0, 15.0, 8.0, 15.0, 6.0, 8.0, 5.0, 7.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.0025053133722394705, -0.0024283272214233875, -0.0023513410706073046, -0.0022743549197912216, -0.0021973687689751387, -0.0021203826181590557, -0.0020433964673429728, -0.00196641031652689, -0.0018894241657108068, -0.001812438014894724, -0.001735451864078641, -0.001658465713262558, -0.001581479562446475, -0.001504493411630392, -0.0014275072608143091, -0.0013505211099982262, -0.0012735349591821432, -0.0011965488083660603, -0.0011195626575499773, -0.0010425765067338943, -0.0009655903559178114, -0.0008886042051017284, -0.0008116180542856455, -0.0007346319034695625, -0.0006576457526534796, -0.0005806596018373966, -0.0005036734510213137, -0.0004266873002052307, -0.00034970114938914776, -0.0002727149985730648, -0.00019572884775698185, -0.0001187426969408989, -4.1756778955459595e-05, 3.522937186062336e-05, 0.00011221552267670631, 0.00018920167349278927, 0.0002661878243088722, 0.0003431739751249552, 0.00042016012594103813, 0.0004971462767571211, 0.000574132427573204, 0.000651118578389287, 0.00072810472920537, 0.0008050908800214529, 0.0008820770308375359, 0.0009590631816536188, 0.0010360493324697018, 0.0011130354832857847, 0.0011900216341018677, 0.0012670077849179506, 0.0013439939357340336, 0.0014209800865501165, 0.0014979662373661995, 0.0015749523881822824, 0.0016519385389983654, 0.0017289246898144484, 0.0018059108406305313, 0.0018828969914466143, 0.0019598831422626972, 0.00203686929307878, 0.002113855443894863, 0.002190841594710946, 0.002267827745527029, 0.002344813896343112, 0.002421800047159195]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 6.0, 9.0, 19.0, 37.0, 33.0, 52.0, 67.0, 126.0, 216.0, 378.0, 705.0, 1113.0, 2196.0, 3972.0, 7737.0, 15944.0, 34512.0, 83602.0, 239844.0, 412678.0, 143408.0, 54483.0, 23644.0, 11337.0, 5607.0, 3087.0, 1558.0, 938.0, 482.0, 305.0, 143.0, 96.0, 73.0, 50.0, 28.0, 19.0, 18.0, 11.0, 3.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0035381317138671875, -0.0034249722957611084, -0.0033118128776550293, -0.00319865345954895, -0.003085494041442871, -0.002972334623336792, -0.002859175205230713, -0.002746015787124634, -0.0026328563690185547, -0.0025196969509124756, -0.0024065375328063965, -0.0022933781147003174, -0.0021802186965942383, -0.002067059278488159, -0.00195389986038208, -0.001840740442276001, -0.0017275810241699219, -0.0016144216060638428, -0.0015012621879577637, -0.0013881027698516846, -0.0012749433517456055, -0.0011617839336395264, -0.0010486245155334473, -0.0009354650974273682, -0.0008223056793212891, -0.00070914626121521, -0.0005959868431091309, -0.00048282742500305176, -0.00036966800689697266, -0.00025650858879089355, -0.00014334917068481445, -3.018975257873535e-05, 8.296966552734375e-05, 0.00019612908363342285, 0.00030928850173950195, 0.00042244791984558105, 0.0005356073379516602, 0.0006487667560577393, 0.0007619261741638184, 0.0008750855922698975, 0.0009882450103759766, 0.0011014044284820557, 0.0012145638465881348, 0.0013277232646942139, 0.001440882682800293, 0.001554042100906372, 0.0016672015190124512, 0.0017803609371185303, 0.0018935203552246094, 0.0020066797733306885, 0.0021198391914367676, 0.0022329986095428467, 0.0023461580276489258, 0.002459317445755005, 0.002572476863861084, 0.002685636281967163, 0.002798795700073242, 0.0029119551181793213, 0.0030251145362854004, 0.0031382739543914795, 0.0032514333724975586, 0.0033645927906036377, 0.003477752208709717, 0.003590911626815796, 0.003704071044921875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 6.0, 6.0, 8.0, 12.0, 9.0, 11.0, 21.0, 9.0, 24.0, 21.0, 29.0, 21.0, 33.0, 39.0, 30.0, 33.0, 36.0, 37.0, 31.0, 37.0, 42.0, 50.0, 25.0, 39.0, 33.0, 36.0, 42.0, 28.0, 28.0, 33.0, 19.0, 23.0, 17.0, 19.0, 15.0, 14.0, 14.0, 12.0, 11.0, 15.0, 7.0, 7.0, 5.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 4.0], "bins": [-0.0029582977294921875, -0.0028717517852783203, -0.002785205841064453, -0.002698659896850586, -0.0026121139526367188, -0.0025255680084228516, -0.0024390220642089844, -0.002352476119995117, -0.00226593017578125, -0.002179384231567383, -0.0020928382873535156, -0.0020062923431396484, -0.0019197463989257812, -0.001833200454711914, -0.0017466545104980469, -0.0016601085662841797, -0.0015735626220703125, -0.0014870166778564453, -0.0014004707336425781, -0.001313924789428711, -0.0012273788452148438, -0.0011408329010009766, -0.0010542869567871094, -0.0009677410125732422, -0.000881195068359375, -0.0007946491241455078, -0.0007081031799316406, -0.0006215572357177734, -0.0005350112915039062, -0.00044846534729003906, -0.0003619194030761719, -0.0002753734588623047, -0.0001888275146484375, -0.00010228157043457031, -1.5735626220703125e-05, 7.081031799316406e-05, 0.00015735626220703125, 0.00024390220642089844, 0.0003304481506347656, 0.0004169940948486328, 0.0005035400390625, 0.0005900859832763672, 0.0006766319274902344, 0.0007631778717041016, 0.0008497238159179688, 0.0009362697601318359, 0.0010228157043457031, 0.0011093616485595703, 0.0011959075927734375, 0.0012824535369873047, 0.0013689994812011719, 0.001455545425415039, 0.0015420913696289062, 0.0016286373138427734, 0.0017151832580566406, 0.0018017292022705078, 0.001888275146484375, 0.001974821090698242, 0.0020613670349121094, 0.0021479129791259766, 0.0022344589233398438, 0.002321004867553711, 0.002407550811767578, 0.0024940967559814453, 0.0025806427001953125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 11.0, 8.0, 10.0, 26.0, 25.0, 30.0, 36.0, 60.0, 67.0, 122.0, 143.0, 213.0, 304.0, 446.0, 597.0, 945.0, 1442.0, 2318.0, 3746.0, 6151.0, 10644.0, 19925.0, 42113.0, 111036.0, 455593.0, 250892.0, 73127.0, 30664.0, 15414.0, 8649.0, 4934.0, 3050.0, 1940.0, 1243.0, 812.0, 562.0, 346.0, 271.0, 186.0, 132.0, 97.0, 55.0, 46.0, 33.0, 13.0, 26.0, 25.0, 10.0, 7.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0028514862060546875, -0.002758920192718506, -0.0026663541793823242, -0.0025737881660461426, -0.002481222152709961, -0.0023886561393737793, -0.0022960901260375977, -0.002203524112701416, -0.0021109580993652344, -0.0020183920860290527, -0.001925826072692871, -0.0018332600593566895, -0.0017406940460205078, -0.0016481280326843262, -0.0015555620193481445, -0.0014629960060119629, -0.0013704299926757812, -0.0012778639793395996, -0.001185297966003418, -0.0010927319526672363, -0.0010001659393310547, -0.000907599925994873, -0.0008150339126586914, -0.0007224678993225098, -0.0006299018859863281, -0.0005373358726501465, -0.00044476985931396484, -0.0003522038459777832, -0.00025963783264160156, -0.00016707181930541992, -7.450580596923828e-05, 1.806020736694336e-05, 0.000110626220703125, 0.00020319223403930664, 0.0002957582473754883, 0.0003883242607116699, 0.00048089027404785156, 0.0005734562873840332, 0.0006660223007202148, 0.0007585883140563965, 0.0008511543273925781, 0.0009437203407287598, 0.0010362863540649414, 0.001128852367401123, 0.0012214183807373047, 0.0013139843940734863, 0.001406550407409668, 0.0014991164207458496, 0.0015916824340820312, 0.0016842484474182129, 0.0017768144607543945, 0.0018693804740905762, 0.001961946487426758, 0.0020545125007629395, 0.002147078514099121, 0.0022396445274353027, 0.0023322105407714844, 0.002424776554107666, 0.0025173425674438477, 0.0026099085807800293, 0.002702474594116211, 0.0027950406074523926, 0.0028876066207885742, 0.002980172634124756, 0.0030727386474609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 7.0, 2.0, 7.0, 6.0, 8.0, 11.0, 15.0, 13.0, 15.0, 23.0, 22.0, 27.0, 36.0, 33.0, 40.0, 26.0, 44.0, 39.0, 32.0, 43.0, 44.0, 43.0, 22.0, 46.0, 32.0, 32.0, 38.0, 32.0, 27.0, 30.0, 26.0, 29.0, 27.0, 23.0, 22.0, 7.0, 12.0, 14.0, 11.0, 12.0, 5.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018148422241210938, -0.0017572790384292603, -0.0016997158527374268, -0.0016421526670455933, -0.0015845894813537598, -0.0015270262956619263, -0.0014694631099700928, -0.0014118999242782593, -0.0013543367385864258, -0.0012967735528945923, -0.0012392103672027588, -0.0011816471815109253, -0.0011240839958190918, -0.0010665208101272583, -0.0010089576244354248, -0.0009513944387435913, -0.0008938312530517578, -0.0008362680673599243, -0.0007787048816680908, -0.0007211416959762573, -0.0006635785102844238, -0.0006060153245925903, -0.0005484521389007568, -0.0004908889532089233, -0.00043332576751708984, -0.00037576258182525635, -0.00031819939613342285, -0.00026063621044158936, -0.00020307302474975586, -0.00014550983905792236, -8.794665336608887e-05, -3.038346767425537e-05, 2.7179718017578125e-05, 8.474290370941162e-05, 0.00014230608940124512, 0.0001998692750930786, 0.0002574324607849121, 0.0003149956464767456, 0.0003725588321685791, 0.0004301220178604126, 0.0004876852035522461, 0.0005452483892440796, 0.0006028115749359131, 0.0006603747606277466, 0.0007179379463195801, 0.0007755011320114136, 0.0008330643177032471, 0.0008906275033950806, 0.0009481906890869141, 0.0010057538747787476, 0.001063317060470581, 0.0011208802461624146, 0.001178443431854248, 0.0012360066175460815, 0.001293569803237915, 0.0013511329889297485, 0.001408696174621582, 0.0014662593603134155, 0.001523822546005249, 0.0015813857316970825, 0.001638948917388916, 0.0016965121030807495, 0.001754075288772583, 0.0018116384744644165, 0.00186920166015625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 1.0, 7.0, 12.0, 13.0, 20.0, 21.0, 28.0, 53.0, 63.0, 97.0, 108.0, 174.0, 241.0, 362.0, 546.0, 895.0, 1352.0, 2250.0, 3956.0, 7846.0, 17647.0, 56201.0, 684821.0, 208987.0, 35323.0, 12882.0, 6108.0, 3289.0, 1835.0, 1143.0, 697.0, 477.0, 341.0, 195.0, 170.0, 97.0, 85.0, 42.0, 45.0, 30.0, 26.0, 14.0, 12.0, 13.0, 7.0, 4.0, 7.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008993148803710938, -0.0008719190955162048, -0.0008445233106613159, -0.000817127525806427, -0.0007897317409515381, -0.0007623359560966492, -0.0007349401712417603, -0.0007075443863868713, -0.0006801486015319824, -0.0006527528166770935, -0.0006253570318222046, -0.0005979612469673157, -0.0005705654621124268, -0.0005431696772575378, -0.0005157738924026489, -0.00048837810754776, -0.0004609823226928711, -0.0004335865378379822, -0.00040619075298309326, -0.00037879496812820435, -0.00035139918327331543, -0.0003240033984184265, -0.0002966076135635376, -0.0002692118287086487, -0.00024181604385375977, -0.00021442025899887085, -0.00018702447414398193, -0.00015962868928909302, -0.0001322329044342041, -0.00010483711957931519, -7.744133472442627e-05, -5.0045549869537354e-05, -2.2649765014648438e-05, 4.7460198402404785e-06, 3.2141804695129395e-05, 5.953758955001831e-05, 8.693337440490723e-05, 0.00011432915925979614, 0.00014172494411468506, 0.00016912072896957397, 0.0001965165138244629, 0.0002239122986793518, 0.0002513080835342407, 0.00027870386838912964, 0.00030609965324401855, 0.00033349543809890747, 0.0003608912229537964, 0.0003882870078086853, 0.0004156827926635742, 0.00044307857751846313, 0.00047047436237335205, 0.000497870147228241, 0.0005252659320831299, 0.0005526617169380188, 0.0005800575017929077, 0.0006074532866477966, 0.0006348490715026855, 0.0006622448563575745, 0.0006896406412124634, 0.0007170364260673523, 0.0007444322109222412, 0.0007718279957771301, 0.000799223780632019, 0.000826619565486908, 0.0008540153503417969]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 4.0, 7.0, 10.0, 10.0, 19.0, 14.0, 28.0, 41.0, 57.0, 81.0, 108.0, 83.0, 105.0, 91.0, 82.0, 74.0, 43.0, 46.0, 19.0, 15.0, 17.0, 16.0, 6.0, 7.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5093555450439453e-05, -2.4334527552127838e-05, -2.3575499653816223e-05, -2.2816471755504608e-05, -2.2057443857192993e-05, -2.1298415958881378e-05, -2.0539388060569763e-05, -1.9780360162258148e-05, -1.9021332263946533e-05, -1.8262304365634918e-05, -1.7503276467323303e-05, -1.6744248569011688e-05, -1.5985220670700073e-05, -1.5226192772388458e-05, -1.4467164874076843e-05, -1.3708136975765228e-05, -1.2949109077453613e-05, -1.2190081179141998e-05, -1.1431053280830383e-05, -1.0672025382518768e-05, -9.912997484207153e-06, -9.153969585895538e-06, -8.394941687583923e-06, -7.635913789272308e-06, -6.876885890960693e-06, -6.117857992649078e-06, -5.358830094337463e-06, -4.599802196025848e-06, -3.840774297714233e-06, -3.0817463994026184e-06, -2.3227185010910034e-06, -1.5636906027793884e-06, -8.046627044677734e-07, -4.563480615615845e-08, 7.133930921554565e-07, 1.4724209904670715e-06, 2.2314488887786865e-06, 2.9904767870903015e-06, 3.7495046854019165e-06, 4.5085325837135315e-06, 5.2675604820251465e-06, 6.0265883803367615e-06, 6.7856162786483765e-06, 7.5446441769599915e-06, 8.303672075271606e-06, 9.062699973583221e-06, 9.821727871894836e-06, 1.0580755770206451e-05, 1.1339783668518066e-05, 1.2098811566829681e-05, 1.2857839465141296e-05, 1.3616867363452911e-05, 1.4375895261764526e-05, 1.5134923160076141e-05, 1.5893951058387756e-05, 1.665297895669937e-05, 1.7412006855010986e-05, 1.81710347533226e-05, 1.8930062651634216e-05, 1.968909054994583e-05, 2.0448118448257446e-05, 2.120714634656906e-05, 2.1966174244880676e-05, 2.272520214319229e-05, 2.3484230041503906e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 4.0, 5.0, 10.0, 7.0, 16.0, 23.0, 39.0, 74.0, 99.0, 195.0, 297.0, 518.0, 864.0, 1639.0, 3420.0, 7787.0, 20075.0, 63958.0, 557884.0, 310171.0, 51480.0, 16825.0, 6688.0, 3006.0, 1533.0, 795.0, 446.0, 246.0, 166.0, 94.0, 60.0, 39.0, 23.0, 17.0, 10.0, 9.0, 9.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0009703636169433594, -0.0009389743208885193, -0.0009075850248336792, -0.0008761957287788391, -0.000844806432723999, -0.0008134171366691589, -0.0007820278406143188, -0.0007506385445594788, -0.0007192492485046387, -0.0006878599524497986, -0.0006564706563949585, -0.0006250813603401184, -0.0005936920642852783, -0.0005623027682304382, -0.0005309134721755981, -0.0004995241761207581, -0.00046813488006591797, -0.0004367455840110779, -0.0004053562879562378, -0.0003739669919013977, -0.0003425776958465576, -0.00031118839979171753, -0.00027979910373687744, -0.00024840980768203735, -0.00021702051162719727, -0.00018563121557235718, -0.0001542419195175171, -0.000122852623462677, -9.146332740783691e-05, -6.0074031352996826e-05, -2.8684735298156738e-05, 2.7045607566833496e-06, 3.409385681152344e-05, 6.548315286636353e-05, 9.687244892120361e-05, 0.0001282617449760437, 0.0001596510410308838, 0.00019104033708572388, 0.00022242963314056396, 0.00025381892919540405, 0.00028520822525024414, 0.00031659752130508423, 0.0003479868173599243, 0.0003793761134147644, 0.0004107654094696045, 0.0004421547055244446, 0.00047354400157928467, 0.0005049332976341248, 0.0005363225936889648, 0.0005677118897438049, 0.000599101185798645, 0.0006304904818534851, 0.0006618797779083252, 0.0006932690739631653, 0.0007246583700180054, 0.0007560476660728455, 0.0007874369621276855, 0.0008188262581825256, 0.0008502155542373657, 0.0008816048502922058, 0.0009129941463470459, 0.000944383442401886, 0.0009757727384567261, 0.0010071620345115662, 0.0010385513305664062]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 3.0, 12.0, 3.0, 4.0, 12.0, 13.0, 19.0, 24.0, 30.0, 27.0, 42.0, 43.0, 54.0, 70.0, 98.0, 140.0, 84.0, 64.0, 51.0, 45.0, 32.0, 17.0, 21.0, 16.0, 17.0, 11.0, 16.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018477439880371094, -0.00017921626567840576, -0.00017365813255310059, -0.0001680999994277954, -0.00016254186630249023, -0.00015698373317718506, -0.00015142560005187988, -0.0001458674669265747, -0.00014030933380126953, -0.00013475120067596436, -0.00012919306755065918, -0.000123634934425354, -0.00011807680130004883, -0.00011251866817474365, -0.00010696053504943848, -0.0001014024019241333, -9.584426879882812e-05, -9.028613567352295e-05, -8.472800254821777e-05, -7.91698694229126e-05, -7.361173629760742e-05, -6.805360317230225e-05, -6.249547004699707e-05, -5.6937336921691895e-05, -5.137920379638672e-05, -4.582107067108154e-05, -4.026293754577637e-05, -3.470480442047119e-05, -2.9146671295166016e-05, -2.358853816986084e-05, -1.8030405044555664e-05, -1.2472271919250488e-05, -6.9141387939453125e-06, -1.3560056686401367e-06, 4.202127456665039e-06, 9.760260581970215e-06, 1.531839370727539e-05, 2.0876526832580566e-05, 2.6434659957885742e-05, 3.199279308319092e-05, 3.7550926208496094e-05, 4.310905933380127e-05, 4.8667192459106445e-05, 5.422532558441162e-05, 5.97834587097168e-05, 6.534159183502197e-05, 7.089972496032715e-05, 7.645785808563232e-05, 8.20159912109375e-05, 8.757412433624268e-05, 9.313225746154785e-05, 9.869039058685303e-05, 0.0001042485237121582, 0.00010980665683746338, 0.00011536478996276855, 0.00012092292308807373, 0.0001264810562133789, 0.00013203918933868408, 0.00013759732246398926, 0.00014315545558929443, 0.0001487135887145996, 0.00015427172183990479, 0.00015982985496520996, 0.00016538798809051514, 0.0001709461212158203]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 11.0, 14.0, 8.0, 14.0, 30.0, 29.0, 42.0, 45.0, 87.0, 157.0, 183.0, 121.0, 73.0, 46.0, 29.0, 35.0, 16.0, 10.0, 11.0, 9.0, 5.0, 8.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004358283709734678, -0.004179053939878941, -0.00399982463568449, -0.003820595098659396, -0.003641365561634302, -0.003462136024609208, -0.003282906487584114, -0.00310367695055902, -0.002924447413533926, -0.002745217876508832, -0.002565988339483738, -0.002386758802458644, -0.00220752926543355, -0.002028299728408456, -0.0018490701913833618, -0.0016698406543582678, -0.0014906111173331738, -0.0013113815803080797, -0.0011321520432829857, -0.0009529225062578917, -0.0007736929692327976, -0.0005944634322077036, -0.00041523389518260956, -0.00023600435815751553, -5.6774821132421494e-05, 0.00012245471589267254, 0.00030168425291776657, 0.0004809137899428606, 0.0006601433269679546, 0.0008393728639930487, 0.0010186024010181427, 0.0011978319380432367, 0.001377061940729618, 0.001556291477754712, 0.0017355210147798061, 0.0019147505518049002, 0.002093980088829994, 0.0022732096258550882, 0.0024524391628801823, 0.0026316686999052763, 0.0028108982369303703, 0.0029901277739554644, 0.0031693573109805584, 0.0033485868480056524, 0.0035278163850307465, 0.0037070459220558405, 0.0038862754590809345, 0.004065505228936672, 0.004244734533131123, 0.004423963837325573, 0.004603193607181311, 0.004782423377037048, 0.004961652681231499, 0.005140881985425949, 0.005320111755281687, 0.0054993415251374245, 0.005678570829331875, 0.005857800133526325, 0.006037029903382063, 0.006216259673237801, 0.006395488977432251, 0.006574718281626701, 0.006753948051482439, 0.006933177821338177, 0.007112407125532627]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 9.0, 5.0, 14.0, 5.0, 8.0, 17.0, 17.0, 20.0, 13.0, 30.0, 25.0, 27.0, 25.0, 32.0, 31.0, 34.0, 30.0, 30.0, 35.0, 45.0, 39.0, 38.0, 28.0, 41.0, 39.0, 37.0, 22.0, 23.0, 32.0, 26.0, 19.0, 21.0, 16.0, 27.0, 14.0, 17.0, 19.0, 14.0, 12.0, 11.0, 12.0, 8.0, 5.0, 6.0, 3.0, 3.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-0.002559978049248457, -0.0024806433357298374, -0.002401308622211218, -0.0023219739086925983, -0.002242639195173979, -0.0021633044816553593, -0.0020839697681367397, -0.00200463505461812, -0.0019253003410995007, -0.0018459656275808811, -0.0017666309140622616, -0.001687296200543642, -0.0016079614870250225, -0.001528626773506403, -0.0014492920599877834, -0.001369957346469164, -0.0012906226329505444, -0.0012112879194319248, -0.0011319532059133053, -0.0010526184923946857, -0.0009732837788760662, -0.0008939490653574467, -0.0008146143518388271, -0.0007352796383202076, -0.0006559449248015881, -0.0005766102112829685, -0.000497275497764349, -0.00041794078424572945, -0.0003386060707271099, -0.00025927135720849037, -0.00017993664368987083, -0.0001006019301712513, -2.1267449483275414e-05, 5.8067264035344124e-05, 0.00013740197755396366, 0.0002167366910725832, 0.00029607140459120274, 0.0003754061181098223, 0.0004547408316284418, 0.0005340755451470613, 0.0006134102586656809, 0.0006927449721843004, 0.00077207968570292, 0.0008514143992215395, 0.000930749112740159, 0.0010100838262587786, 0.0010894185397773981, 0.0011687532532960176, 0.0012480879668146372, 0.0013274226803332567, 0.0014067573938518763, 0.0014860921073704958, 0.0015654268208891153, 0.0016447615344077349, 0.0017240962479263544, 0.001803430961444974, 0.0018827656749635935, 0.001962100388482213, 0.0020414351020008326, 0.002120769815519452, 0.0022001045290380716, 0.002279439242556691, 0.0023587739560753107, 0.0024381086695939302, 0.0025174433831125498]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 11.0, 9.0, 18.0, 27.0, 23.0, 46.0, 63.0, 98.0, 154.0, 235.0, 335.0, 557.0, 843.0, 1328.0, 2135.0, 3417.0, 5445.0, 8934.0, 15256.0, 26972.0, 50265.0, 101463.0, 235666.0, 309067.0, 138823.0, 65653.0, 34003.0, 18952.0, 11001.0, 6677.0, 4057.0, 2548.0, 1572.0, 995.0, 652.0, 425.0, 270.0, 180.0, 118.0, 84.0, 60.0, 44.0, 23.0, 21.0, 9.0, 9.0, 7.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.005908966064453125, -0.005713284015655518, -0.00551760196685791, -0.005321919918060303, -0.005126237869262695, -0.004930555820465088, -0.0047348737716674805, -0.004539191722869873, -0.004343509674072266, -0.004147827625274658, -0.003952145576477051, -0.0037564635276794434, -0.003560781478881836, -0.0033650994300842285, -0.003169417381286621, -0.0029737353324890137, -0.0027780532836914062, -0.002582371234893799, -0.0023866891860961914, -0.002191007137298584, -0.0019953250885009766, -0.0017996430397033691, -0.0016039609909057617, -0.0014082789421081543, -0.0012125968933105469, -0.0010169148445129395, -0.000821232795715332, -0.0006255507469177246, -0.0004298686981201172, -0.00023418664932250977, -3.8504600524902344e-05, 0.00015717744827270508, 0.0003528594970703125, 0.0005485415458679199, 0.0007442235946655273, 0.0009399056434631348, 0.0011355876922607422, 0.0013312697410583496, 0.001526951789855957, 0.0017226338386535645, 0.0019183158874511719, 0.0021139979362487793, 0.0023096799850463867, 0.002505362033843994, 0.0027010440826416016, 0.002896726131439209, 0.0030924081802368164, 0.003288090229034424, 0.0034837722778320312, 0.0036794543266296387, 0.003875136375427246, 0.0040708184242248535, 0.004266500473022461, 0.004462182521820068, 0.004657864570617676, 0.004853546619415283, 0.005049228668212891, 0.005244910717010498, 0.0054405927658081055, 0.005636274814605713, 0.00583195686340332, 0.006027638912200928, 0.006223320960998535, 0.006419003009796143, 0.00661468505859375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 9.0, 5.0, 8.0, 10.0, 8.0, 21.0, 24.0, 22.0, 23.0, 33.0, 36.0, 45.0, 46.0, 51.0, 38.0, 50.0, 46.0, 42.0, 44.0, 62.0, 44.0, 43.0, 41.0, 41.0, 31.0, 26.0, 18.0, 18.0, 26.0, 19.0, 14.0, 13.0, 8.0, 8.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019311904907226562, -0.0018659979104995728, -0.0018008053302764893, -0.0017356127500534058, -0.0016704201698303223, -0.0016052275896072388, -0.0015400350093841553, -0.0014748424291610718, -0.0014096498489379883, -0.0013444572687149048, -0.0012792646884918213, -0.0012140721082687378, -0.0011488795280456543, -0.0010836869478225708, -0.0010184943675994873, -0.0009533017873764038, -0.0008881092071533203, -0.0008229166269302368, -0.0007577240467071533, -0.0006925314664840698, -0.0006273388862609863, -0.0005621463060379028, -0.0004969537258148193, -0.00043176114559173584, -0.00036656856536865234, -0.00030137598514556885, -0.00023618340492248535, -0.00017099082469940186, -0.00010579824447631836, -4.060566425323486e-05, 2.4586915969848633e-05, 8.977949619293213e-05, 0.00015497207641601562, 0.00022016465663909912, 0.0002853572368621826, 0.0003505498170852661, 0.0004157423973083496, 0.0004809349775314331, 0.0005461275577545166, 0.0006113201379776001, 0.0006765127182006836, 0.0007417052984237671, 0.0008068978786468506, 0.0008720904588699341, 0.0009372830390930176, 0.001002475619316101, 0.0010676681995391846, 0.001132860779762268, 0.0011980533599853516, 0.001263245940208435, 0.0013284385204315186, 0.001393631100654602, 0.0014588236808776855, 0.001524016261100769, 0.0015892088413238525, 0.001654401421546936, 0.0017195940017700195, 0.001784786581993103, 0.0018499791622161865, 0.00191517174243927, 0.0019803643226623535, 0.002045556902885437, 0.0021107494831085205, 0.002175942063331604, 0.0022411346435546875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 9.0, 8.0, 13.0, 13.0, 33.0, 40.0, 60.0, 82.0, 119.0, 205.0, 304.0, 481.0, 797.0, 1323.0, 2336.0, 4074.0, 7430.0, 13399.0, 25508.0, 48218.0, 100995.0, 269758.0, 333484.0, 119888.0, 55936.0, 28917.0, 15622.0, 8291.0, 4677.0, 2563.0, 1504.0, 887.0, 570.0, 378.0, 219.0, 120.0, 94.0, 62.0, 44.0, 26.0, 21.0, 16.0, 12.0, 7.0, 7.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00580596923828125, -0.005625128746032715, -0.00544428825378418, -0.0052634477615356445, -0.005082607269287109, -0.004901766777038574, -0.004720926284790039, -0.004540085792541504, -0.004359245300292969, -0.004178404808044434, -0.0039975643157958984, -0.0038167238235473633, -0.003635883331298828, -0.003455042839050293, -0.003274202346801758, -0.0030933618545532227, -0.0029125213623046875, -0.0027316808700561523, -0.002550840377807617, -0.002369999885559082, -0.002189159393310547, -0.0020083189010620117, -0.0018274784088134766, -0.0016466379165649414, -0.0014657974243164062, -0.001284956932067871, -0.001104116439819336, -0.0009232759475708008, -0.0007424354553222656, -0.0005615949630737305, -0.0003807544708251953, -0.00019991397857666016, -1.9073486328125e-05, 0.00016176700592041016, 0.0003426074981689453, 0.0005234479904174805, 0.0007042884826660156, 0.0008851289749145508, 0.001065969467163086, 0.001246809959411621, 0.0014276504516601562, 0.0016084909439086914, 0.0017893314361572266, 0.0019701719284057617, 0.002151012420654297, 0.002331852912902832, 0.002512693405151367, 0.0026935338973999023, 0.0028743743896484375, 0.0030552148818969727, 0.003236055374145508, 0.003416895866394043, 0.003597736358642578, 0.0037785768508911133, 0.0039594173431396484, 0.004140257835388184, 0.004321098327636719, 0.004501938819885254, 0.004682779312133789, 0.004863619804382324, 0.005044460296630859, 0.0052253007888793945, 0.00540614128112793, 0.005586981773376465, 0.005767822265625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 3.0, 7.0, 8.0, 12.0, 14.0, 13.0, 21.0, 24.0, 26.0, 30.0, 27.0, 36.0, 31.0, 37.0, 33.0, 44.0, 43.0, 43.0, 49.0, 42.0, 43.0, 47.0, 40.0, 41.0, 39.0, 44.0, 24.0, 29.0, 17.0, 30.0, 15.0, 19.0, 14.0, 11.0, 14.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0016222000122070312, -0.0015712827444076538, -0.0015203654766082764, -0.001469448208808899, -0.0014185309410095215, -0.001367613673210144, -0.0013166964054107666, -0.0012657791376113892, -0.0012148618698120117, -0.0011639446020126343, -0.0011130273342132568, -0.0010621100664138794, -0.001011192798614502, -0.0009602755308151245, -0.0009093582630157471, -0.0008584409952163696, -0.0008075237274169922, -0.0007566064596176147, -0.0007056891918182373, -0.0006547719240188599, -0.0006038546562194824, -0.000552937388420105, -0.0005020201206207275, -0.0004511028528213501, -0.00040018558502197266, -0.0003492683172225952, -0.0002983510494232178, -0.00024743378162384033, -0.0001965165138244629, -0.00014559924602508545, -9.468197822570801e-05, -4.3764710426330566e-05, 7.152557373046875e-06, 5.8069825172424316e-05, 0.00010898709297180176, 0.0001599043607711792, 0.00021082162857055664, 0.0002617388963699341, 0.0003126561641693115, 0.00036357343196868896, 0.0004144906997680664, 0.00046540796756744385, 0.0005163252353668213, 0.0005672425031661987, 0.0006181597709655762, 0.0006690770387649536, 0.0007199943065643311, 0.0007709115743637085, 0.0008218288421630859, 0.0008727461099624634, 0.0009236633777618408, 0.0009745806455612183, 0.0010254979133605957, 0.0010764151811599731, 0.0011273324489593506, 0.001178249716758728, 0.0012291669845581055, 0.001280084252357483, 0.0013310015201568604, 0.0013819187879562378, 0.0014328360557556152, 0.0014837533235549927, 0.0015346705913543701, 0.0015855878591537476, 0.001636505126953125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 11.0, 4.0, 9.0, 15.0, 28.0, 26.0, 45.0, 57.0, 93.0, 170.0, 262.0, 446.0, 738.0, 1509.0, 3050.0, 6965.0, 19358.0, 73138.0, 686165.0, 201450.0, 34722.0, 11210.0, 4517.0, 2078.0, 1033.0, 544.0, 326.0, 192.0, 150.0, 70.0, 53.0, 36.0, 25.0, 14.0, 7.0, 13.0, 3.0, 7.0, 0.0, 1.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00017344951629638672, -0.00016815215349197388, -0.00016285479068756104, -0.0001575574278831482, -0.00015226006507873535, -0.0001469627022743225, -0.00014166533946990967, -0.00013636797666549683, -0.00013107061386108398, -0.00012577325105667114, -0.0001204758882522583, -0.00011517852544784546, -0.00010988116264343262, -0.00010458379983901978, -9.928643703460693e-05, -9.398907423019409e-05, -8.869171142578125e-05, -8.339434862136841e-05, -7.809698581695557e-05, -7.279962301254272e-05, -6.750226020812988e-05, -6.220489740371704e-05, -5.69075345993042e-05, -5.161017179489136e-05, -4.6312808990478516e-05, -4.1015446186065674e-05, -3.571808338165283e-05, -3.042072057723999e-05, -2.512335777282715e-05, -1.9825994968414307e-05, -1.4528632164001465e-05, -9.231269359588623e-06, -3.933906555175781e-06, 1.3634562492370605e-06, 6.660819053649902e-06, 1.1958181858062744e-05, 1.7255544662475586e-05, 2.2552907466888428e-05, 2.785027027130127e-05, 3.314763307571411e-05, 3.844499588012695e-05, 4.3742358684539795e-05, 4.903972148895264e-05, 5.433708429336548e-05, 5.963444709777832e-05, 6.493180990219116e-05, 7.0229172706604e-05, 7.552653551101685e-05, 8.082389831542969e-05, 8.612126111984253e-05, 9.141862392425537e-05, 9.671598672866821e-05, 0.00010201334953308105, 0.0001073107123374939, 0.00011260807514190674, 0.00011790543794631958, 0.00012320280075073242, 0.00012850016355514526, 0.0001337975263595581, 0.00013909488916397095, 0.0001443922519683838, 0.00014968961477279663, 0.00015498697757720947, 0.00016028434038162231, 0.00016558170318603516]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 9.0, 13.0, 6.0, 15.0, 10.0, 23.0, 20.0, 45.0, 54.0, 119.0, 172.0, 161.0, 121.0, 61.0, 48.0, 32.0, 22.0, 10.0, 11.0, 6.0, 9.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.059906005859375e-06, -8.794479072093964e-06, -8.529052138328552e-06, -8.263625204563141e-06, -7.99819827079773e-06, -7.732771337032318e-06, -7.467344403266907e-06, -7.201917469501495e-06, -6.936490535736084e-06, -6.671063601970673e-06, -6.405636668205261e-06, -6.14020973443985e-06, -5.8747828006744385e-06, -5.609355866909027e-06, -5.343928933143616e-06, -5.078501999378204e-06, -4.813075065612793e-06, -4.547648131847382e-06, -4.28222119808197e-06, -4.016794264316559e-06, -3.7513673305511475e-06, -3.485940396785736e-06, -3.2205134630203247e-06, -2.9550865292549133e-06, -2.689659595489502e-06, -2.4242326617240906e-06, -2.158805727958679e-06, -1.8933787941932678e-06, -1.6279518604278564e-06, -1.362524926662445e-06, -1.0970979928970337e-06, -8.316710591316223e-07, -5.662441253662109e-07, -3.0081719160079956e-07, -3.5390257835388184e-08, 2.300366759300232e-07, 4.954636096954346e-07, 7.60890543460846e-07, 1.0263174772262573e-06, 1.2917444109916687e-06, 1.55717134475708e-06, 1.8225982785224915e-06, 2.088025212287903e-06, 2.353452146053314e-06, 2.6188790798187256e-06, 2.884306013584137e-06, 3.1497329473495483e-06, 3.4151598811149597e-06, 3.680586814880371e-06, 3.9460137486457825e-06, 4.211440682411194e-06, 4.476867616176605e-06, 4.742294549942017e-06, 5.007721483707428e-06, 5.273148417472839e-06, 5.538575351238251e-06, 5.804002285003662e-06, 6.0694292187690735e-06, 6.334856152534485e-06, 6.600283086299896e-06, 6.865710020065308e-06, 7.131136953830719e-06, 7.39656388759613e-06, 7.661990821361542e-06, 7.927417755126953e-06]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 5.0, 12.0, 17.0, 14.0, 15.0, 22.0, 37.0, 81.0, 93.0, 135.0, 193.0, 290.0, 502.0, 682.0, 1159.0, 1907.0, 3185.0, 5835.0, 10286.0, 19658.0, 42572.0, 100057.0, 325510.0, 349332.0, 100435.0, 41616.0, 20587.0, 10283.0, 5817.0, 3083.0, 1888.0, 1166.0, 680.0, 444.0, 349.0, 190.0, 124.0, 87.0, 58.0, 47.0, 31.0, 17.0, 15.0, 14.0, 9.0, 6.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.988908767700195e-05, -4.837755113840103e-05, -4.686601459980011e-05, -4.535447806119919e-05, -4.3842941522598267e-05, -4.2331404983997345e-05, -4.081986844539642e-05, -3.93083319067955e-05, -3.779679536819458e-05, -3.628525882959366e-05, -3.477372229099274e-05, -3.3262185752391815e-05, -3.1750649213790894e-05, -3.0239112675189972e-05, -2.872757613658905e-05, -2.721603959798813e-05, -2.5704503059387207e-05, -2.4192966520786285e-05, -2.2681429982185364e-05, -2.1169893443584442e-05, -1.965835690498352e-05, -1.81468203663826e-05, -1.6635283827781677e-05, -1.5123747289180756e-05, -1.3612210750579834e-05, -1.2100674211978912e-05, -1.058913767337799e-05, -9.077601134777069e-06, -7.5660645961761475e-06, -6.054528057575226e-06, -4.542991518974304e-06, -3.0314549803733826e-06, -1.519918441772461e-06, -8.381903171539307e-09, 1.5031546354293823e-06, 3.014691174030304e-06, 4.526227712631226e-06, 6.037764251232147e-06, 7.549300789833069e-06, 9.06083732843399e-06, 1.0572373867034912e-05, 1.2083910405635834e-05, 1.3595446944236755e-05, 1.5106983482837677e-05, 1.66185200214386e-05, 1.813005656003952e-05, 1.9641593098640442e-05, 2.1153129637241364e-05, 2.2664666175842285e-05, 2.4176202714443207e-05, 2.568773925304413e-05, 2.719927579164505e-05, 2.871081233024597e-05, 3.0222348868846893e-05, 3.1733885407447815e-05, 3.3245421946048737e-05, 3.475695848464966e-05, 3.626849502325058e-05, 3.77800315618515e-05, 3.929156810045242e-05, 4.0803104639053345e-05, 4.2314641177654266e-05, 4.382617771625519e-05, 4.533771425485611e-05, 4.684925079345703e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 9.0, 14.0, 12.0, 17.0, 25.0, 20.0, 21.0, 25.0, 44.0, 43.0, 59.0, 57.0, 64.0, 71.0, 53.0, 53.0, 57.0, 57.0, 44.0, 32.0, 33.0, 41.0, 15.0, 20.0, 18.0, 18.0, 15.0, 10.0, 8.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.329183578491211e-05, -1.2860633432865143e-05, -1.2429431080818176e-05, -1.199822872877121e-05, -1.1567026376724243e-05, -1.1135824024677277e-05, -1.070462167263031e-05, -1.0273419320583344e-05, -9.842216968536377e-06, -9.41101461648941e-06, -8.979812264442444e-06, -8.548609912395477e-06, -8.11740756034851e-06, -7.686205208301544e-06, -7.255002856254578e-06, -6.823800504207611e-06, -6.3925981521606445e-06, -5.961395800113678e-06, -5.5301934480667114e-06, -5.098991096019745e-06, -4.667788743972778e-06, -4.236586391925812e-06, -3.8053840398788452e-06, -3.3741816878318787e-06, -2.942979335784912e-06, -2.5117769837379456e-06, -2.080574631690979e-06, -1.6493722796440125e-06, -1.218169927597046e-06, -7.869675755500793e-07, -3.557652235031128e-07, 7.543712854385376e-08, 5.066394805908203e-07, 9.378418326377869e-07, 1.3690441846847534e-06, 1.80024653673172e-06, 2.2314488887786865e-06, 2.662651240825653e-06, 3.0938535928726196e-06, 3.525055944919586e-06, 3.956258296966553e-06, 4.387460649013519e-06, 4.818663001060486e-06, 5.249865353107452e-06, 5.681067705154419e-06, 6.1122700572013855e-06, 6.543472409248352e-06, 6.974674761295319e-06, 7.405877113342285e-06, 7.837079465389252e-06, 8.268281817436218e-06, 8.699484169483185e-06, 9.130686521530151e-06, 9.561888873577118e-06, 9.993091225624084e-06, 1.0424293577671051e-05, 1.0855495929718018e-05, 1.1286698281764984e-05, 1.171790063381195e-05, 1.2149102985858917e-05, 1.2580305337905884e-05, 1.301150768995285e-05, 1.3442710041999817e-05, 1.3873912394046783e-05, 1.430511474609375e-05]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 7.0, 2.0, 5.0, 11.0, 8.0, 9.0, 9.0, 9.0, 18.0, 29.0, 24.0, 36.0, 45.0, 64.0, 90.0, 128.0, 116.0, 86.0, 74.0, 48.0, 36.0, 35.0, 11.0, 12.0, 13.0, 18.0, 7.0, 9.0, 9.0, 2.0, 3.0, 10.0, 5.0, 4.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003235005075111985, -0.003137350780889392, -0.003039696253836155, -0.0029420419596135616, -0.0028443874325603247, -0.0027467331383377314, -0.0026490786112844944, -0.002551424317061901, -0.002453770022839308, -0.0023561157286167145, -0.0022584612015634775, -0.002160806907340884, -0.0020631523802876472, -0.001965498086065054, -0.0018678436754271388, -0.0017701892647892237, -0.0016725347377359867, -0.0015748803270980716, -0.0014772259164601564, -0.0013795716222375631, -0.0012819170951843262, -0.0011842628009617329, -0.0010866083903238177, -0.0009889539796859026, -0.0008912995690479875, -0.0007936451584100723, -0.0006959907477721572, -0.000598336395341903, -0.0005006819847039878, -0.0004030275740660727, -0.0003053732216358185, -0.00020771881099790335, -0.00011006440035998821, -1.2410004273988307e-05, 8.52443918120116e-05, 0.00018289877334609628, 0.0002805531839840114, 0.00037820759462192655, 0.00047586194705218077, 0.0005735163576900959, 0.000671170768328011, 0.0007688251789659262, 0.0008664795896038413, 0.0009641339420340955, 0.0010617882944643497, 0.0011594428215175867, 0.00125709711574018, 0.0013547515263780951, 0.0014524059370160103, 0.0015500603476539254, 0.0016477147582918406, 0.0017453690525144339, 0.0018430235795676708, 0.0019406778737902641, 0.0020383321680128574, 0.0021359866950660944, 0.0022336412221193314, 0.0023312955163419247, 0.0024289500433951616, 0.002526604337617755, 0.002624258864670992, 0.002721913158893585, 0.0028195674531161785, 0.0029172219801694155, 0.0030148762743920088]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 2.0, 8.0, 10.0, 13.0, 7.0, 11.0, 19.0, 17.0, 16.0, 24.0, 30.0, 26.0, 26.0, 28.0, 36.0, 38.0, 50.0, 34.0, 37.0, 36.0, 43.0, 35.0, 38.0, 40.0, 38.0, 39.0, 35.0, 27.0, 27.0, 32.0, 20.0, 27.0, 21.0, 23.0, 18.0, 4.0, 10.0, 13.0, 9.0, 8.0, 9.0, 3.0, 10.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.0023254542611539364, -0.0022560730576515198, -0.0021866916213184595, -0.0021173101849853992, -0.0020479289814829826, -0.001978547777980566, -0.0019091663416475058, -0.0018397850217297673, -0.0017704037018120289, -0.0017010223818942904, -0.001631641061976552, -0.0015622597420588136, -0.0014928784221410751, -0.0014234971022233367, -0.0013541157823055983, -0.0012847344623878598, -0.0012153531424701214, -0.001145971822552383, -0.0010765905026346445, -0.001007209182716906, -0.0009378278627991676, -0.0008684465428814292, -0.0007990652229636908, -0.0007296839030459523, -0.0006603025831282139, -0.0005909212632104754, -0.000521539943292737, -0.00045215862337499857, -0.00038277730345726013, -0.0003133959835395217, -0.00024401466362178326, -0.00017463334370404482, -0.00010525225661695004, -3.58709366992116e-05, 3.351038321852684e-05, 0.00010289170313626528, 0.00017227302305400372, 0.00024165434297174215, 0.0003110356628894806, 0.00038041698280721903, 0.00044979830272495747, 0.0005191796226426959, 0.0005885609425604343, 0.0006579422624781728, 0.0007273235823959112, 0.0007967049023136497, 0.0008660862222313881, 0.0009354675421491265, 0.001004848862066865, 0.0010742301819846034, 0.0011436115019023418, 0.0012129928218200803, 0.0012823741417378187, 0.0013517554616555572, 0.0014211367815732956, 0.001490518101491034, 0.0015598994214087725, 0.001629280741326511, 0.0016986620612442493, 0.0017680433811619878, 0.0018374247010797262, 0.0019068060209974647, 0.001976187340915203, 0.0020455685444176197, 0.00211494998075068]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 12.0, 5.0, 18.0, 15.0, 36.0, 23.0, 46.0, 66.0, 81.0, 115.0, 188.0, 234.0, 381.0, 578.0, 957.0, 1713.0, 3419.0, 9457.0, 167626.0, 3984510.0, 14682.0, 4734.0, 2100.0, 1132.0, 707.0, 450.0, 290.0, 198.0, 129.0, 112.0, 72.0, 48.0, 37.0, 29.0, 19.0, 17.0, 11.0, 12.0, 6.0, 11.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0129547119140625, -0.01256406307220459, -0.01217341423034668, -0.01178276538848877, -0.01139211654663086, -0.01100146770477295, -0.010610818862915039, -0.010220170021057129, -0.009829521179199219, -0.009438872337341309, -0.009048223495483398, -0.008657574653625488, -0.008266925811767578, -0.007876276969909668, -0.007485628128051758, -0.007094979286193848, -0.0067043304443359375, -0.006313681602478027, -0.005923032760620117, -0.005532383918762207, -0.005141735076904297, -0.004751086235046387, -0.0043604373931884766, -0.003969788551330566, -0.0035791397094726562, -0.003188490867614746, -0.002797842025756836, -0.0024071931838989258, -0.0020165443420410156, -0.0016258955001831055, -0.0012352466583251953, -0.0008445978164672852, -0.000453948974609375, -6.330013275146484e-05, 0.0003273487091064453, 0.0007179975509643555, 0.0011086463928222656, 0.0014992952346801758, 0.001889944076538086, 0.002280592918395996, 0.0026712417602539062, 0.0030618906021118164, 0.0034525394439697266, 0.0038431882858276367, 0.004233837127685547, 0.004624485969543457, 0.005015134811401367, 0.005405783653259277, 0.0057964324951171875, 0.006187081336975098, 0.006577730178833008, 0.006968379020690918, 0.007359027862548828, 0.007749676704406738, 0.008140325546264648, 0.008530974388122559, 0.008921623229980469, 0.009312272071838379, 0.009702920913696289, 0.0100935697555542, 0.01048421859741211, 0.01087486743927002, 0.01126551628112793, 0.01165616512298584, 0.01204681396484375]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 3.0, 7.0, 8.0, 16.0, 7.0, 13.0, 19.0, 30.0, 25.0, 32.0, 27.0, 34.0, 33.0, 47.0, 48.0, 49.0, 31.0, 37.0, 50.0, 46.0, 50.0, 50.0, 44.0, 41.0, 34.0, 29.0, 29.0, 24.0, 30.0, 29.0, 10.0, 10.0, 14.0, 8.0, 8.0, 6.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016279220581054688, -0.0015789121389389038, -0.0015299022197723389, -0.001480892300605774, -0.001431882381439209, -0.001382872462272644, -0.001333862543106079, -0.0012848526239395142, -0.0012358427047729492, -0.0011868327856063843, -0.0011378228664398193, -0.0010888129472732544, -0.0010398030281066895, -0.0009907931089401245, -0.0009417831897735596, -0.0008927732706069946, -0.0008437633514404297, -0.0007947534322738647, -0.0007457435131072998, -0.0006967335939407349, -0.0006477236747741699, -0.000598713755607605, -0.00054970383644104, -0.0005006939172744751, -0.00045168399810791016, -0.0004026740789413452, -0.0003536641597747803, -0.00030465424060821533, -0.0002556443214416504, -0.00020663440227508545, -0.0001576244831085205, -0.00010861456394195557, -5.9604644775390625e-05, -1.0594725608825684e-05, 3.841519355773926e-05, 8.74251127243042e-05, 0.00013643503189086914, 0.00018544495105743408, 0.00023445487022399902, 0.00028346478939056396, 0.0003324747085571289, 0.00038148462772369385, 0.0004304945468902588, 0.00047950446605682373, 0.0005285143852233887, 0.0005775243043899536, 0.0006265342235565186, 0.0006755441427230835, 0.0007245540618896484, 0.0007735639810562134, 0.0008225739002227783, 0.0008715838193893433, 0.0009205937385559082, 0.0009696036577224731, 0.001018613576889038, 0.001067623496055603, 0.001116633415222168, 0.001165643334388733, 0.0012146532535552979, 0.0012636631727218628, 0.0013126730918884277, 0.0013616830110549927, 0.0014106929302215576, 0.0014597028493881226, 0.0015087127685546875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 5.0, 3.0, 5.0, 11.0, 15.0, 24.0, 56.0, 76.0, 129.0, 251.0, 482.0, 1084.0, 2632.0, 7009.0, 27294.0, 3883671.0, 246235.0, 16577.0, 5042.0, 1952.0, 843.0, 436.0, 188.0, 109.0, 73.0, 31.0, 18.0, 16.0, 11.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01113128662109375, -0.010811805725097656, -0.010492324829101562, -0.010172843933105469, -0.009853363037109375, -0.009533882141113281, -0.009214401245117188, -0.008894920349121094, -0.008575439453125, -0.008255958557128906, -0.007936477661132812, -0.007616996765136719, -0.007297515869140625, -0.006978034973144531, -0.0066585540771484375, -0.006339073181152344, -0.00601959228515625, -0.005700111389160156, -0.0053806304931640625, -0.005061149597167969, -0.004741668701171875, -0.004422187805175781, -0.0041027069091796875, -0.0037832260131835938, -0.0034637451171875, -0.0031442642211914062, -0.0028247833251953125, -0.0025053024291992188, -0.002185821533203125, -0.0018663406372070312, -0.0015468597412109375, -0.0012273788452148438, -0.00090789794921875, -0.0005884170532226562, -0.0002689361572265625, 5.054473876953125e-05, 0.000370025634765625, 0.0006895065307617188, 0.0010089874267578125, 0.0013284683227539062, 0.00164794921875, 0.0019674301147460938, 0.0022869110107421875, 0.0026063919067382812, 0.002925872802734375, 0.0032453536987304688, 0.0035648345947265625, 0.0038843154907226562, 0.00420379638671875, 0.004523277282714844, 0.0048427581787109375, 0.005162239074707031, 0.005481719970703125, 0.005801200866699219, 0.0061206817626953125, 0.006440162658691406, 0.0067596435546875, 0.007079124450683594, 0.0073986053466796875, 0.007718086242675781, 0.008037567138671875, 0.008357048034667969, 0.008676528930664062, 0.008996009826660156, 0.00931549072265625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 8.0, 2.0, 7.0, 6.0, 9.0, 12.0, 17.0, 34.0, 119.0, 381.0, 2638.0, 514.0, 149.0, 61.0, 33.0, 16.0, 10.0, 8.0, 9.0, 3.0, 3.0, 10.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001190185546875, -0.0011470615863800049, -0.0011039376258850098, -0.0010608136653900146, -0.0010176897048950195, -0.0009745657444000244, -0.0009314417839050293, -0.0008883178234100342, -0.0008451938629150391, -0.0008020699024200439, -0.0007589459419250488, -0.0007158219814300537, -0.0006726980209350586, -0.0006295740604400635, -0.0005864500999450684, -0.0005433261394500732, -0.0005002021789550781, -0.000457078218460083, -0.0004139542579650879, -0.0003708302974700928, -0.00032770633697509766, -0.00028458237648010254, -0.00024145841598510742, -0.0001983344554901123, -0.0001552104949951172, -0.00011208653450012207, -6.896257400512695e-05, -2.5838613510131836e-05, 1.728534698486328e-05, 6.04093074798584e-05, 0.00010353326797485352, 0.00014665722846984863, 0.00018978118896484375, 0.00023290514945983887, 0.000276029109954834, 0.0003191530704498291, 0.0003622770309448242, 0.00040540099143981934, 0.00044852495193481445, 0.0004916489124298096, 0.0005347728729248047, 0.0005778968334197998, 0.0006210207939147949, 0.00066414475440979, 0.0007072687149047852, 0.0007503926753997803, 0.0007935166358947754, 0.0008366405963897705, 0.0008797645568847656, 0.0009228885173797607, 0.0009660124778747559, 0.001009136438369751, 0.001052260398864746, 0.0010953843593597412, 0.0011385083198547363, 0.0011816322803497314, 0.0012247562408447266, 0.0012678802013397217, 0.0013110041618347168, 0.001354128122329712, 0.001397252082824707, 0.0014403760433197021, 0.0014835000038146973, 0.0015266239643096924, 0.0015697479248046875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 13.0, 12.0, 13.0, 17.0, 21.0, 25.0, 44.0, 60.0, 95.0, 148.0, 158.0, 108.0, 88.0, 43.0, 28.0, 29.0, 27.0, 14.0, 12.0, 11.0, 7.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003198405960574746, -0.003112602047622204, -0.0030267981346696615, -0.0029409942217171192, -0.002855190308764577, -0.0027693863958120346, -0.0026835824828594923, -0.00259777856990695, -0.0025119746569544077, -0.0024261707440018654, -0.002340366831049323, -0.0022545629180967808, -0.0021687590051442385, -0.002082955092191696, -0.001997151179239154, -0.0019113472662866116, -0.0018255432369187474, -0.0017397393239662051, -0.0016539354110136628, -0.0015681314980611205, -0.0014823275851085782, -0.001396523672156036, -0.0013107196427881718, -0.0012249157298356295, -0.0011391118168830872, -0.0010533079039305449, -0.0009675039909780025, -0.0008817000780254602, -0.0007958961650729179, -0.0007100922521203756, -0.0006242882809601724, -0.0005384843680076301, -0.0004526805132627487, -0.0003668766003102064, -0.0002810726873576641, -0.00019526874530129135, -0.00010946483234874904, -2.3660919396206737e-05, 6.214302266016603e-05, 0.00014794693561270833, 0.00023375084856525064, 0.00031955476151779294, 0.00040535867447033525, 0.0004911626456305385, 0.0005769665585830808, 0.0006627704715356231, 0.0007485743844881654, 0.0008343782974407077, 0.00092018221039325, 0.0010059861233457923, 0.0010917900362983346, 0.001177593949250877, 0.0012633978622034192, 0.0013492017751559615, 0.0014350058045238256, 0.001520809717476368, 0.0016066136304289103, 0.0016924175433814526, 0.0017782214563339949, 0.0018640253692865372, 0.0019498292822390795, 0.0020356331951916218, 0.002121437108144164, 0.0022072410210967064, 0.0022930449340492487]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 8.0, 7.0, 14.0, 5.0, 13.0, 24.0, 16.0, 17.0, 21.0, 28.0, 43.0, 27.0, 29.0, 46.0, 43.0, 51.0, 49.0, 30.0, 51.0, 41.0, 44.0, 37.0, 44.0, 29.0, 31.0, 38.0, 31.0, 21.0, 25.0, 21.0, 18.0, 14.0, 26.0, 11.0, 8.0, 7.0, 4.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001528700813651085, -0.0014785992680117488, -0.0014284978387877345, -0.0013783962931483984, -0.0013282947475090623, -0.0012781932018697262, -0.001228091772645712, -0.0011779902270063758, -0.0011278886813670397, -0.0010777871357277036, -0.0010276857065036893, -0.0009775841608643532, -0.0009274826152250171, -0.0008773811277933419, -0.0008272796403616667, -0.0007771780947223306, -0.0007270766654983163, -0.0006769751780666411, -0.000626873632427305, -0.0005767721449956298, -0.0005266705993562937, -0.0004765691119246185, -0.0004264676244929433, -0.00037636610795743763, -0.000326264591421932, -0.00027616307488642633, -0.0002260615729028359, -0.00017596007091924548, -0.00012585855438373983, -7.575703784823418e-05, -2.565555041655898e-05, 2.444596611894667e-05, 7.454759906977415e-05, 0.0001246491156052798, 0.00017475061758887023, 0.00022485211957246065, 0.0002749536361079663, 0.00032505515264347196, 0.00037515664007514715, 0.0004252581566106528, 0.00047535967314615846, 0.0005254611605778337, 0.0005755627062171698, 0.000625664193648845, 0.0006757656810805202, 0.0007258672267198563, 0.0007759687141515315, 0.0008260702015832067, 0.0008761717472225428, 0.000926273234654218, 0.0009763747802935541, 0.0010264762677252293, 0.0010765778133645654, 0.0011266793590039015, 0.0011767807882279158, 0.0012268823338672519, 0.001276983879506588, 0.001327085425145924, 0.0013771868543699384, 0.0014272884000092745, 0.0014773899456486106, 0.0015274914912879467, 0.001577592920511961, 0.001627694466151297, 0.0016777958953753114]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 8.0, 10.0, 16.0, 19.0, 28.0, 64.0, 58.0, 98.0, 130.0, 205.0, 267.0, 412.0, 637.0, 856.0, 1223.0, 1920.0, 2749.0, 4092.0, 6173.0, 9416.0, 14496.0, 22615.0, 36677.0, 63726.0, 121414.0, 255534.0, 237130.0, 111874.0, 59593.0, 34924.0, 21433.0, 13624.0, 8906.0, 6114.0, 3878.0, 2578.0, 1718.0, 1284.0, 839.0, 530.0, 429.0, 276.0, 166.0, 118.0, 89.0, 74.0, 41.0, 30.0, 28.0, 16.0, 7.0, 13.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0010442733764648438, -0.001011580228805542, -0.0009788870811462402, -0.0009461939334869385, -0.0009135007858276367, -0.000880807638168335, -0.0008481144905090332, -0.0008154213428497314, -0.0007827281951904297, -0.0007500350475311279, -0.0007173418998718262, -0.0006846487522125244, -0.0006519556045532227, -0.0006192624568939209, -0.0005865693092346191, -0.0005538761615753174, -0.0005211830139160156, -0.0004884898662567139, -0.0004557967185974121, -0.00042310357093811035, -0.0003904104232788086, -0.00035771727561950684, -0.0003250241279602051, -0.0002923309803009033, -0.00025963783264160156, -0.0002269446849822998, -0.00019425153732299805, -0.0001615583896636963, -0.00012886524200439453, -9.617209434509277e-05, -6.347894668579102e-05, -3.078579902648926e-05, 1.9073486328125e-06, 3.460049629211426e-05, 6.729364395141602e-05, 9.998679161071777e-05, 0.00013267993927001953, 0.0001653730869293213, 0.00019806623458862305, 0.0002307593822479248, 0.00026345252990722656, 0.0002961456775665283, 0.0003288388252258301, 0.00036153197288513184, 0.0003942251205444336, 0.00042691826820373535, 0.0004596114158630371, 0.0004923045635223389, 0.0005249977111816406, 0.0005576908588409424, 0.0005903840065002441, 0.0006230771541595459, 0.0006557703018188477, 0.0006884634494781494, 0.0007211565971374512, 0.0007538497447967529, 0.0007865428924560547, 0.0008192360401153564, 0.0008519291877746582, 0.00088462233543396, 0.0009173154830932617, 0.0009500086307525635, 0.0009827017784118652, 0.001015394926071167, 0.0010480880737304688]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 9.0, 10.0, 5.0, 11.0, 8.0, 17.0, 23.0, 13.0, 16.0, 21.0, 34.0, 31.0, 36.0, 32.0, 49.0, 39.0, 49.0, 44.0, 40.0, 47.0, 32.0, 43.0, 44.0, 38.0, 40.0, 29.0, 27.0, 32.0, 16.0, 24.0, 24.0, 13.0, 9.0, 20.0, 19.0, 14.0, 6.0, 6.0, 5.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0017223358154296875, -0.0016705989837646484, -0.0016188621520996094, -0.0015671253204345703, -0.0015153884887695312, -0.0014636516571044922, -0.0014119148254394531, -0.001360177993774414, -0.001308441162109375, -0.001256704330444336, -0.0012049674987792969, -0.0011532306671142578, -0.0011014938354492188, -0.0010497570037841797, -0.0009980201721191406, -0.0009462833404541016, -0.0008945465087890625, -0.0008428096771240234, -0.0007910728454589844, -0.0007393360137939453, -0.0006875991821289062, -0.0006358623504638672, -0.0005841255187988281, -0.0005323886871337891, -0.00048065185546875, -0.00042891502380371094, -0.0003771781921386719, -0.0003254413604736328, -0.00027370452880859375, -0.0002219676971435547, -0.00017023086547851562, -0.00011849403381347656, -6.67572021484375e-05, -1.5020370483398438e-05, 3.6716461181640625e-05, 8.845329284667969e-05, 0.00014019012451171875, 0.0001919269561767578, 0.00024366378784179688, 0.00029540061950683594, 0.000347137451171875, 0.00039887428283691406, 0.0004506111145019531, 0.0005023479461669922, 0.0005540847778320312, 0.0006058216094970703, 0.0006575584411621094, 0.0007092952728271484, 0.0007610321044921875, 0.0008127689361572266, 0.0008645057678222656, 0.0009162425994873047, 0.0009679794311523438, 0.0010197162628173828, 0.0010714530944824219, 0.001123189926147461, 0.0011749267578125, 0.001226663589477539, 0.0012784004211425781, 0.0013301372528076172, 0.0013818740844726562, 0.0014336109161376953, 0.0014853477478027344, 0.0015370845794677734, 0.0015888214111328125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 11.0, 13.0, 8.0, 21.0, 36.0, 42.0, 58.0, 103.0, 113.0, 176.0, 232.0, 387.0, 556.0, 838.0, 1241.0, 1968.0, 2983.0, 4731.0, 7962.0, 13801.0, 26596.0, 57590.0, 158108.0, 486684.0, 163050.0, 58689.0, 26969.0, 14123.0, 8035.0, 4810.0, 3011.0, 1915.0, 1204.0, 785.0, 536.0, 396.0, 245.0, 168.0, 114.0, 77.0, 59.0, 40.0, 28.0, 10.0, 8.0, 15.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0014514923095703125, -0.001406848430633545, -0.0013622045516967773, -0.0013175606727600098, -0.0012729167938232422, -0.0012282729148864746, -0.001183629035949707, -0.0011389851570129395, -0.0010943412780761719, -0.0010496973991394043, -0.0010050535202026367, -0.0009604096412658691, -0.0009157657623291016, -0.000871121883392334, -0.0008264780044555664, -0.0007818341255187988, -0.0007371902465820312, -0.0006925463676452637, -0.0006479024887084961, -0.0006032586097717285, -0.0005586147308349609, -0.0005139708518981934, -0.0004693269729614258, -0.0004246830940246582, -0.0003800392150878906, -0.00033539533615112305, -0.00029075145721435547, -0.0002461075782775879, -0.0002014636993408203, -0.00015681982040405273, -0.00011217594146728516, -6.753206253051758e-05, -2.288818359375e-05, 2.1755695343017578e-05, 6.639957427978516e-05, 0.00011104345321655273, 0.0001556873321533203, 0.0002003312110900879, 0.00024497509002685547, 0.00028961896896362305, 0.0003342628479003906, 0.0003789067268371582, 0.0004235506057739258, 0.00046819448471069336, 0.0005128383636474609, 0.0005574822425842285, 0.0006021261215209961, 0.0006467700004577637, 0.0006914138793945312, 0.0007360577583312988, 0.0007807016372680664, 0.000825345516204834, 0.0008699893951416016, 0.0009146332740783691, 0.0009592771530151367, 0.0010039210319519043, 0.0010485649108886719, 0.0010932087898254395, 0.001137852668762207, 0.0011824965476989746, 0.0012271404266357422, 0.0012717843055725098, 0.0013164281845092773, 0.001361072063446045, 0.0014057159423828125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 13.0, 12.0, 10.0, 8.0, 12.0, 18.0, 19.0, 17.0, 23.0, 29.0, 31.0, 32.0, 33.0, 31.0, 29.0, 37.0, 34.0, 51.0, 40.0, 28.0, 42.0, 38.0, 30.0, 32.0, 30.0, 36.0, 31.0, 27.0, 32.0, 23.0, 26.0, 18.0, 20.0, 21.0, 6.0, 12.0, 6.0, 12.0, 6.0, 5.0, 9.0, 5.0, 6.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0009098052978515625, -0.0008797943592071533, -0.0008497834205627441, -0.000819772481918335, -0.0007897615432739258, -0.0007597506046295166, -0.0007297396659851074, -0.0006997287273406982, -0.0006697177886962891, -0.0006397068500518799, -0.0006096959114074707, -0.0005796849727630615, -0.0005496740341186523, -0.0005196630954742432, -0.000489652156829834, -0.0004596412181854248, -0.0004296302795410156, -0.00039961934089660645, -0.00036960840225219727, -0.0003395974636077881, -0.0003095865249633789, -0.0002795755863189697, -0.00024956464767456055, -0.00021955370903015137, -0.0001895427703857422, -0.000159531831741333, -0.00012952089309692383, -9.950995445251465e-05, -6.949901580810547e-05, -3.948807716369629e-05, -9.47713851928711e-06, 2.053380012512207e-05, 5.054473876953125e-05, 8.055567741394043e-05, 0.00011056661605834961, 0.0001405775547027588, 0.00017058849334716797, 0.00020059943199157715, 0.00023061037063598633, 0.0002606213092803955, 0.0002906322479248047, 0.00032064318656921387, 0.00035065412521362305, 0.0003806650638580322, 0.0004106760025024414, 0.0004406869411468506, 0.00047069787979125977, 0.0005007088184356689, 0.0005307197570800781, 0.0005607306957244873, 0.0005907416343688965, 0.0006207525730133057, 0.0006507635116577148, 0.000680774450302124, 0.0007107853889465332, 0.0007407963275909424, 0.0007708072662353516, 0.0008008182048797607, 0.0008308291435241699, 0.0008608400821685791, 0.0008908510208129883, 0.0009208619594573975, 0.0009508728981018066, 0.0009808838367462158, 0.001010894775390625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 13.0, 13.0, 17.0, 44.0, 65.0, 69.0, 68.0, 115.0, 161.0, 205.0, 325.0, 448.0, 629.0, 892.0, 1303.0, 1947.0, 3011.0, 4854.0, 8489.0, 16758.0, 41807.0, 199901.0, 646215.0, 69283.0, 23730.0, 10872.0, 6092.0, 3751.0, 2422.0, 1474.0, 1040.0, 737.0, 510.0, 357.0, 217.0, 171.0, 153.0, 107.0, 67.0, 52.0, 47.0, 30.0, 28.0, 20.0, 15.0, 9.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0002605915069580078, -0.00025250017642974854, -0.00024440884590148926, -0.00023631751537322998, -0.0002282261848449707, -0.00022013485431671143, -0.00021204352378845215, -0.00020395219326019287, -0.0001958608627319336, -0.00018776953220367432, -0.00017967820167541504, -0.00017158687114715576, -0.00016349554061889648, -0.0001554042100906372, -0.00014731287956237793, -0.00013922154903411865, -0.00013113021850585938, -0.0001230388879776001, -0.00011494755744934082, -0.00010685622692108154, -9.876489639282227e-05, -9.067356586456299e-05, -8.258223533630371e-05, -7.449090480804443e-05, -6.639957427978516e-05, -5.830824375152588e-05, -5.02169132232666e-05, -4.2125582695007324e-05, -3.403425216674805e-05, -2.594292163848877e-05, -1.7851591110229492e-05, -9.760260581970215e-06, -1.6689300537109375e-06, 6.42240047454834e-06, 1.4513731002807617e-05, 2.2605061531066895e-05, 3.069639205932617e-05, 3.878772258758545e-05, 4.6879053115844727e-05, 5.4970383644104004e-05, 6.306171417236328e-05, 7.115304470062256e-05, 7.924437522888184e-05, 8.733570575714111e-05, 9.542703628540039e-05, 0.00010351836681365967, 0.00011160969734191895, 0.00011970102787017822, 0.0001277923583984375, 0.00013588368892669678, 0.00014397501945495605, 0.00015206634998321533, 0.0001601576805114746, 0.0001682490110397339, 0.00017634034156799316, 0.00018443167209625244, 0.00019252300262451172, 0.000200614333152771, 0.00020870566368103027, 0.00021679699420928955, 0.00022488832473754883, 0.0002329796552658081, 0.00024107098579406738, 0.00024916231632232666, 0.00025725364685058594]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0, 6.0, 2.0, 7.0, 8.0, 1.0, 8.0, 12.0, 7.0, 10.0, 12.0, 12.0, 20.0, 28.0, 20.0, 25.0, 36.0, 42.0, 45.0, 52.0, 52.0, 47.0, 65.0, 61.0, 50.0, 47.0, 63.0, 35.0, 31.0, 32.0, 30.0, 23.0, 15.0, 12.0, 10.0, 14.0, 16.0, 3.0, 6.0, 12.0, 3.0, 10.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.298324584960938e-06, -9.01147723197937e-06, -8.724629878997803e-06, -8.437782526016235e-06, -8.150935173034668e-06, -7.8640878200531e-06, -7.577240467071533e-06, -7.290393114089966e-06, -7.0035457611083984e-06, -6.716698408126831e-06, -6.429851055145264e-06, -6.143003702163696e-06, -5.856156349182129e-06, -5.5693089962005615e-06, -5.282461643218994e-06, -4.995614290237427e-06, -4.708766937255859e-06, -4.421919584274292e-06, -4.135072231292725e-06, -3.848224878311157e-06, -3.56137752532959e-06, -3.2745301723480225e-06, -2.987682819366455e-06, -2.7008354663848877e-06, -2.4139881134033203e-06, -2.127140760421753e-06, -1.8402934074401855e-06, -1.5534460544586182e-06, -1.2665987014770508e-06, -9.797513484954834e-07, -6.92903995513916e-07, -4.0605664253234863e-07, -1.1920928955078125e-07, 1.6763806343078613e-07, 4.544854164123535e-07, 7.413327693939209e-07, 1.0281801223754883e-06, 1.3150274753570557e-06, 1.601874828338623e-06, 1.8887221813201904e-06, 2.175569534301758e-06, 2.462416887283325e-06, 2.7492642402648926e-06, 3.03611159324646e-06, 3.3229589462280273e-06, 3.6098062992095947e-06, 3.896653652191162e-06, 4.1835010051727295e-06, 4.470348358154297e-06, 4.757195711135864e-06, 5.044043064117432e-06, 5.330890417098999e-06, 5.617737770080566e-06, 5.904585123062134e-06, 6.191432476043701e-06, 6.4782798290252686e-06, 6.765127182006836e-06, 7.051974534988403e-06, 7.338821887969971e-06, 7.625669240951538e-06, 7.912516593933105e-06, 8.199363946914673e-06, 8.48621129989624e-06, 8.773058652877808e-06, 9.059906005859375e-06]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 4.0, 8.0, 9.0, 24.0, 30.0, 48.0, 84.0, 160.0, 332.0, 670.0, 1491.0, 3567.0, 10399.0, 41456.0, 511619.0, 423867.0, 38673.0, 9838.0, 3522.0, 1455.0, 643.0, 270.0, 153.0, 86.0, 47.0, 33.0, 15.0, 12.0, 10.0, 8.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004696846008300781, -0.00045452266931533813, -0.00043936073780059814, -0.00042419880628585815, -0.00040903687477111816, -0.0003938749432563782, -0.0003787130117416382, -0.0003635510802268982, -0.0003483891487121582, -0.0003332272171974182, -0.0003180652856826782, -0.00030290335416793823, -0.00028774142265319824, -0.00027257949113845825, -0.00025741755962371826, -0.00024225562810897827, -0.00022709369659423828, -0.0002119317650794983, -0.0001967698335647583, -0.0001816079020500183, -0.00016644597053527832, -0.00015128403902053833, -0.00013612210750579834, -0.00012096017599105835, -0.00010579824447631836, -9.063631296157837e-05, -7.547438144683838e-05, -6.031244993209839e-05, -4.51505184173584e-05, -2.9988586902618408e-05, -1.4826655387878418e-05, 3.3527612686157227e-07, 1.5497207641601562e-05, 3.065913915634155e-05, 4.582107067108154e-05, 6.098300218582153e-05, 7.614493370056152e-05, 9.130686521530151e-05, 0.0001064687967300415, 0.0001216307282447815, 0.00013679265975952148, 0.00015195459127426147, 0.00016711652278900146, 0.00018227845430374146, 0.00019744038581848145, 0.00021260231733322144, 0.00022776424884796143, 0.00024292618036270142, 0.0002580881118774414, 0.0002732500433921814, 0.0002884119749069214, 0.0003035739064216614, 0.00031873583793640137, 0.00033389776945114136, 0.00034905970096588135, 0.00036422163248062134, 0.00037938356399536133, 0.0003945454955101013, 0.0004097074270248413, 0.0004248693585395813, 0.0004400312900543213, 0.0004551932215690613, 0.00047035515308380127, 0.00048551708459854126, 0.0005006790161132812]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 5.0, 3.0, 6.0, 7.0, 5.0, 4.0, 8.0, 7.0, 13.0, 22.0, 22.0, 38.0, 37.0, 66.0, 72.0, 83.0, 131.0, 104.0, 86.0, 68.0, 51.0, 36.0, 26.0, 25.0, 20.0, 10.0, 10.0, 9.0, 3.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.812810897827148e-05, -6.605498492717743e-05, -6.398186087608337e-05, -6.190873682498932e-05, -5.9835612773895264e-05, -5.776248872280121e-05, -5.568936467170715e-05, -5.36162406206131e-05, -5.154311656951904e-05, -4.946999251842499e-05, -4.739686846733093e-05, -4.532374441623688e-05, -4.325062036514282e-05, -4.117749631404877e-05, -3.910437226295471e-05, -3.703124821186066e-05, -3.49581241607666e-05, -3.2885000109672546e-05, -3.081187605857849e-05, -2.8738752007484436e-05, -2.666562795639038e-05, -2.4592503905296326e-05, -2.251937985420227e-05, -2.0446255803108215e-05, -1.837313175201416e-05, -1.6300007700920105e-05, -1.422688364982605e-05, -1.2153759598731995e-05, -1.008063554763794e-05, -8.007511496543884e-06, -5.934387445449829e-06, -3.861263394355774e-06, -1.7881393432617188e-06, 2.849847078323364e-07, 2.3581087589263916e-06, 4.431232810020447e-06, 6.504356861114502e-06, 8.577480912208557e-06, 1.0650604963302612e-05, 1.2723729014396667e-05, 1.4796853065490723e-05, 1.6869977116584778e-05, 1.8943101167678833e-05, 2.1016225218772888e-05, 2.3089349269866943e-05, 2.5162473320961e-05, 2.7235597372055054e-05, 2.930872142314911e-05, 3.1381845474243164e-05, 3.345496952533722e-05, 3.5528093576431274e-05, 3.760121762752533e-05, 3.9674341678619385e-05, 4.174746572971344e-05, 4.3820589780807495e-05, 4.589371383190155e-05, 4.7966837882995605e-05, 5.003996193408966e-05, 5.2113085985183716e-05, 5.418621003627777e-05, 5.6259334087371826e-05, 5.833245813846588e-05, 6.0405582189559937e-05, 6.247870624065399e-05, 6.455183029174805e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 11.0, 7.0, 7.0, 15.0, 19.0, 18.0, 19.0, 34.0, 50.0, 63.0, 96.0, 136.0, 149.0, 90.0, 65.0, 55.0, 28.0, 29.0, 20.0, 17.0, 17.0, 6.0, 12.0, 6.0, 9.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0026861666701734066, -0.0026075050700455904, -0.002528843702748418, -0.0024501821026206017, -0.002371520735323429, -0.002292859135195613, -0.0022141975350677967, -0.002135536167770624, -0.002056874567642808, -0.0019782129675149918, -0.0018995516002178192, -0.001820890000090003, -0.0017422285163775086, -0.0016635670326650143, -0.001584905432537198, -0.0015062439488247037, -0.0014275824651122093, -0.001348920981399715, -0.0012702594976872206, -0.0011915978975594044, -0.00111293641384691, -0.0010342749301344156, -0.0009556133882142603, -0.000876951846294105, -0.0007982903625816107, -0.0007196288788691163, -0.000640967336948961, -0.0005623057950288057, -0.00048364431131631136, -0.00040498279849998653, -0.0003263212856836617, -0.0002476597437635064, -0.00016899826005101204, -9.033674723468721e-05, -1.1675234418362379e-05, 6.698627839796245e-05, 0.00014564779121428728, 0.0002243093040306121, 0.00030297081684693694, 0.00038163235876709223, 0.0004602938424795866, 0.000538955326192081, 0.0006176168681122363, 0.0006962784100323915, 0.0007749398937448859, 0.0008536013774573803, 0.0009322629193775356, 0.0010109244612976909, 0.0010895859450101852, 0.0011682474287226796, 0.001246908912435174, 0.0013255705125629902, 0.0014042319962754846, 0.001482893479987979, 0.0015615550801157951, 0.0016402165638282895, 0.0017188780475407839, 0.0017975395312532783, 0.0018762010149657726, 0.001954862615093589, 0.002033524215221405, 0.0021121855825185776, 0.0021908471826463938, 0.00226950878277421, 0.0023481701500713825]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 8.0, 12.0, 10.0, 15.0, 21.0, 15.0, 20.0, 25.0, 23.0, 42.0, 27.0, 36.0, 43.0, 45.0, 48.0, 45.0, 33.0, 49.0, 40.0, 48.0, 40.0, 35.0, 32.0, 29.0, 39.0, 29.0, 20.0, 26.0, 23.0, 19.0, 14.0, 21.0, 12.0, 10.0, 5.0, 5.0, 7.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001546455081552267, -0.0014955091755837202, -0.0014445632696151733, -0.0013936174800619483, -0.0013426715740934014, -0.0012917256681248546, -0.0012407797621563077, -0.0011898339726030827, -0.0011388880666345358, -0.001087942160665989, -0.001036996254697442, -0.000986050465144217, -0.0009351045591756701, -0.0008841586532071233, -0.0008332127472385764, -0.0007822668994776905, -0.0007313209935091436, -0.0006803750875405967, -0.0006294292397797108, -0.0005784833338111639, -0.000527537486050278, -0.0004765915800817311, -0.00042564570321701467, -0.00037469982635229826, -0.00032375394948758185, -0.00027280807262286544, -0.00022186219575814903, -0.0001709163043415174, -0.00011997042747680098, -6.902453606016934e-05, -1.807865919545293e-05, 3.286721766926348e-05, 8.381309453397989e-05, 0.0001347589713986963, 0.00018570484826341271, 0.00023665073968004435, 0.00028759660199284554, 0.0003385425079613924, 0.0003894883848261088, 0.0004404342616908252, 0.0004913801094517112, 0.000542326015420258, 0.000593271863181144, 0.0006442177691496909, 0.0006951636169105768, 0.0007461095228791237, 0.0007970554288476706, 0.0008480012766085565, 0.0008989471825771034, 0.0009498930885456502, 0.0010008389363065362, 0.001051784842275083, 0.00110273074824363, 0.001153676537796855, 0.0012046224437654018, 0.0012555683497339487, 0.0013065142557024956, 0.0013574601616710424, 0.0014084060676395893, 0.0014593518571928144, 0.0015102977631613612, 0.001561243669129908, 0.001612189575098455, 0.00166313536465168, 0.0017140812706202269]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 9.0, 18.0, 23.0, 33.0, 45.0, 64.0, 89.0, 160.0, 192.0, 286.0, 428.0, 619.0, 946.0, 1438.0, 2203.0, 3479.0, 5416.0, 8901.0, 14293.0, 24740.0, 44027.0, 86683.0, 204685.0, 339686.0, 151477.0, 68595.0, 36352.0, 20464.0, 12142.0, 7455.0, 4823.0, 2998.0, 1931.0, 1242.0, 818.0, 551.0, 393.0, 244.0, 197.0, 126.0, 82.0, 67.0, 36.0, 29.0, 23.0, 16.0, 6.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.00399017333984375, -0.003873974084854126, -0.003757774829864502, -0.003641575574874878, -0.003525376319885254, -0.00340917706489563, -0.003292977809906006, -0.003176778554916382, -0.003060579299926758, -0.002944380044937134, -0.0028281807899475098, -0.0027119815349578857, -0.0025957822799682617, -0.0024795830249786377, -0.0023633837699890137, -0.0022471845149993896, -0.0021309852600097656, -0.0020147860050201416, -0.0018985867500305176, -0.0017823874950408936, -0.0016661882400512695, -0.0015499889850616455, -0.0014337897300720215, -0.0013175904750823975, -0.0012013912200927734, -0.0010851919651031494, -0.0009689927101135254, -0.0008527934551239014, -0.0007365942001342773, -0.0006203949451446533, -0.0005041956901550293, -0.0003879964351654053, -0.00027179718017578125, -0.00015559792518615723, -3.93986701965332e-05, 7.680058479309082e-05, 0.00019299983978271484, 0.00030919909477233887, 0.0004253983497619629, 0.0005415976047515869, 0.0006577968597412109, 0.000773996114730835, 0.000890195369720459, 0.001006394624710083, 0.001122593879699707, 0.001238793134689331, 0.001354992389678955, 0.001471191644668579, 0.0015873908996582031, 0.0017035901546478271, 0.0018197894096374512, 0.0019359886646270752, 0.0020521879196166992, 0.0021683871746063232, 0.0022845864295959473, 0.0024007856845855713, 0.0025169849395751953, 0.0026331841945648193, 0.0027493834495544434, 0.0028655827045440674, 0.0029817819595336914, 0.0030979812145233154, 0.0032141804695129395, 0.0033303797245025635, 0.0034465789794921875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 4.0, 7.0, 5.0, 8.0, 18.0, 19.0, 15.0, 13.0, 26.0, 29.0, 31.0, 43.0, 32.0, 54.0, 50.0, 49.0, 47.0, 45.0, 52.0, 53.0, 48.0, 38.0, 47.0, 42.0, 31.0, 25.0, 34.0, 23.0, 25.0, 28.0, 9.0, 11.0, 8.0, 9.0, 4.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0011758804321289062, -0.0011420994997024536, -0.001108318567276001, -0.0010745376348495483, -0.0010407567024230957, -0.001006975769996643, -0.0009731948375701904, -0.0009394139051437378, -0.0009056329727172852, -0.0008718520402908325, -0.0008380711078643799, -0.0008042901754379272, -0.0007705092430114746, -0.000736728310585022, -0.0007029473781585693, -0.0006691664457321167, -0.0006353855133056641, -0.0006016045808792114, -0.0005678236484527588, -0.0005340427160263062, -0.0005002617835998535, -0.0004664808511734009, -0.00043269991874694824, -0.0003989189863204956, -0.00036513805389404297, -0.00033135712146759033, -0.0002975761890411377, -0.00026379525661468506, -0.00023001432418823242, -0.00019623339176177979, -0.00016245245933532715, -0.0001286715269088745, -9.489059448242188e-05, -6.110966205596924e-05, -2.73287296295166e-05, 6.452202796936035e-06, 4.023313522338867e-05, 7.401406764984131e-05, 0.00010779500007629395, 0.00014157593250274658, 0.00017535686492919922, 0.00020913779735565186, 0.0002429187297821045, 0.00027669966220855713, 0.00031048059463500977, 0.0003442615270614624, 0.00037804245948791504, 0.0004118233919143677, 0.0004456043243408203, 0.00047938525676727295, 0.0005131661891937256, 0.0005469471216201782, 0.0005807280540466309, 0.0006145089864730835, 0.0006482899188995361, 0.0006820708513259888, 0.0007158517837524414, 0.000749632716178894, 0.0007834136486053467, 0.0008171945810317993, 0.000850975513458252, 0.0008847564458847046, 0.0009185373783111572, 0.0009523183107376099, 0.0009860992431640625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 6.0, 16.0, 18.0, 38.0, 40.0, 71.0, 135.0, 251.0, 399.0, 744.0, 1487.0, 3044.0, 6068.0, 13538.0, 31585.0, 78137.0, 241151.0, 444733.0, 136808.0, 50637.0, 21204.0, 9423.0, 4273.0, 2157.0, 1104.0, 613.0, 343.0, 178.0, 109.0, 79.0, 36.0, 29.0, 21.0, 22.0, 15.0, 11.0, 5.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034275054931640625, -0.0033018290996551514, -0.0031761527061462402, -0.003050476312637329, -0.002924799919128418, -0.002799123525619507, -0.0026734471321105957, -0.0025477707386016846, -0.0024220943450927734, -0.0022964179515838623, -0.002170741558074951, -0.00204506516456604, -0.001919388771057129, -0.0017937123775482178, -0.0016680359840393066, -0.0015423595905303955, -0.0014166831970214844, -0.0012910068035125732, -0.0011653304100036621, -0.001039654016494751, -0.0009139776229858398, -0.0007883012294769287, -0.0006626248359680176, -0.0005369484424591064, -0.0004112720489501953, -0.0002855956554412842, -0.00015991926193237305, -3.4242868423461914e-05, 9.143352508544922e-05, 0.00021710991859436035, 0.0003427863121032715, 0.0004684627056121826, 0.0005941390991210938, 0.0007198154926300049, 0.000845491886138916, 0.0009711682796478271, 0.0010968446731567383, 0.0012225210666656494, 0.0013481974601745605, 0.0014738738536834717, 0.0015995502471923828, 0.001725226640701294, 0.001850903034210205, 0.001976579427719116, 0.0021022558212280273, 0.0022279322147369385, 0.0023536086082458496, 0.0024792850017547607, 0.002604961395263672, 0.002730637788772583, 0.002856314182281494, 0.0029819905757904053, 0.0031076669692993164, 0.0032333433628082275, 0.0033590197563171387, 0.00348469614982605, 0.003610372543334961, 0.003736048936843872, 0.003861725330352783, 0.003987401723861694, 0.0041130781173706055, 0.004238754510879517, 0.004364430904388428, 0.004490107297897339, 0.00461578369140625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 7.0, 4.0, 14.0, 13.0, 12.0, 11.0, 15.0, 14.0, 26.0, 32.0, 27.0, 29.0, 33.0, 39.0, 35.0, 32.0, 29.0, 49.0, 41.0, 54.0, 40.0, 39.0, 49.0, 45.0, 37.0, 32.0, 38.0, 26.0, 31.0, 38.0, 28.0, 17.0, 13.0, 11.0, 6.0, 7.0, 11.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0009322166442871094, -0.0009067356586456299, -0.0008812546730041504, -0.0008557736873626709, -0.0008302927017211914, -0.0008048117160797119, -0.0007793307304382324, -0.0007538497447967529, -0.0007283687591552734, -0.0007028877735137939, -0.0006774067878723145, -0.000651925802230835, -0.0006264448165893555, -0.000600963830947876, -0.0005754828453063965, -0.000550001859664917, -0.0005245208740234375, -0.000499039888381958, -0.0004735589027404785, -0.000448077917098999, -0.00042259693145751953, -0.00039711594581604004, -0.00037163496017456055, -0.00034615397453308105, -0.00032067298889160156, -0.00029519200325012207, -0.0002697110176086426, -0.0002442300319671631, -0.0002187490463256836, -0.0001932680606842041, -0.0001677870750427246, -0.00014230608940124512, -0.00011682510375976562, -9.134411811828613e-05, -6.586313247680664e-05, -4.038214683532715e-05, -1.4901161193847656e-05, 1.0579824447631836e-05, 3.606081008911133e-05, 6.154179573059082e-05, 8.702278137207031e-05, 0.0001125037670135498, 0.0001379847526550293, 0.0001634657382965088, 0.00018894672393798828, 0.00021442770957946777, 0.00023990869522094727, 0.00026538968086242676, 0.00029087066650390625, 0.00031635165214538574, 0.00034183263778686523, 0.0003673136234283447, 0.0003927946090698242, 0.0004182755947113037, 0.0004437565803527832, 0.0004692375659942627, 0.0004947185516357422, 0.0005201995372772217, 0.0005456805229187012, 0.0005711615085601807, 0.0005966424942016602, 0.0006221234798431396, 0.0006476044654846191, 0.0006730854511260986, 0.0006985664367675781]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 7.0, 9.0, 20.0, 15.0, 28.0, 48.0, 64.0, 106.0, 185.0, 347.0, 709.0, 1610.0, 4588.0, 17698.0, 125937.0, 807363.0, 71096.0, 12332.0, 3669.0, 1352.0, 601.0, 320.0, 150.0, 104.0, 58.0, 38.0, 24.0, 21.0, 16.0, 7.0, 7.0, 5.0, 1.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011992454528808594, -0.00011584348976612091, -0.00011176243424415588, -0.00010768137872219086, -0.00010360032320022583, -9.95192676782608e-05, -9.543821215629578e-05, -9.135715663433075e-05, -8.727610111236572e-05, -8.31950455904007e-05, -7.911399006843567e-05, -7.503293454647064e-05, -7.095187902450562e-05, -6.687082350254059e-05, -6.278976798057556e-05, -5.8708712458610535e-05, -5.462765693664551e-05, -5.054660141468048e-05, -4.6465545892715454e-05, -4.238449037075043e-05, -3.83034348487854e-05, -3.4222379326820374e-05, -3.0141323804855347e-05, -2.606026828289032e-05, -2.1979212760925293e-05, -1.7898157238960266e-05, -1.381710171699524e-05, -9.736046195030212e-06, -5.6549906730651855e-06, -1.5739351511001587e-06, 2.507120370864868e-06, 6.588175892829895e-06, 1.0669231414794922e-05, 1.4750286936759949e-05, 1.8831342458724976e-05, 2.2912397980690002e-05, 2.699345350265503e-05, 3.1074509024620056e-05, 3.515556454658508e-05, 3.923662006855011e-05, 4.331767559051514e-05, 4.7398731112480164e-05, 5.147978663444519e-05, 5.556084215641022e-05, 5.9641897678375244e-05, 6.372295320034027e-05, 6.78040087223053e-05, 7.188506424427032e-05, 7.596611976623535e-05, 8.004717528820038e-05, 8.41282308101654e-05, 8.820928633213043e-05, 9.229034185409546e-05, 9.637139737606049e-05, 0.00010045245289802551, 0.00010453350841999054, 0.00010861456394195557, 0.0001126956194639206, 0.00011677667498588562, 0.00012085773050785065, 0.00012493878602981567, 0.0001290198415517807, 0.00013310089707374573, 0.00013718195259571075, 0.00014126300811767578]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 5.0, 3.0, 2.0, 7.0, 5.0, 6.0, 10.0, 20.0, 20.0, 46.0, 87.0, 94.0, 171.0, 165.0, 112.0, 88.0, 63.0, 23.0, 24.0, 21.0, 8.0, 12.0, 6.0, 1.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.000301361083984e-06, -8.781440556049347e-06, -8.56257975101471e-06, -8.343718945980072e-06, -8.124858140945435e-06, -7.905997335910797e-06, -7.68713653087616e-06, -7.468275725841522e-06, -7.249414920806885e-06, -7.030554115772247e-06, -6.81169331073761e-06, -6.592832505702972e-06, -6.373971700668335e-06, -6.1551108956336975e-06, -5.93625009059906e-06, -5.717389285564423e-06, -5.498528480529785e-06, -5.279667675495148e-06, -5.06080687046051e-06, -4.841946065425873e-06, -4.623085260391235e-06, -4.404224455356598e-06, -4.1853636503219604e-06, -3.966502845287323e-06, -3.7476420402526855e-06, -3.528781235218048e-06, -3.3099204301834106e-06, -3.091059625148773e-06, -2.8721988201141357e-06, -2.6533380150794983e-06, -2.434477210044861e-06, -2.2156164050102234e-06, -1.996755599975586e-06, -1.7778947949409485e-06, -1.559033989906311e-06, -1.3401731848716736e-06, -1.1213123798370361e-06, -9.024515748023987e-07, -6.835907697677612e-07, -4.647299647331238e-07, -2.4586915969848633e-07, -2.7008354663848877e-08, 1.9185245037078857e-07, 4.10713255405426e-07, 6.295740604400635e-07, 8.484348654747009e-07, 1.0672956705093384e-06, 1.2861564755439758e-06, 1.5050172805786133e-06, 1.7238780856132507e-06, 1.942738890647888e-06, 2.1615996956825256e-06, 2.380460500717163e-06, 2.5993213057518005e-06, 2.818182110786438e-06, 3.0370429158210754e-06, 3.255903720855713e-06, 3.4747645258903503e-06, 3.693625330924988e-06, 3.912486135959625e-06, 4.131346940994263e-06, 4.3502077460289e-06, 4.569068551063538e-06, 4.787929356098175e-06, 5.0067901611328125e-06]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 8.0, 15.0, 31.0, 20.0, 38.0, 69.0, 119.0, 184.0, 319.0, 522.0, 891.0, 1646.0, 3168.0, 6539.0, 15331.0, 40697.0, 134011.0, 508384.0, 234822.0, 62044.0, 21227.0, 9235.0, 4296.0, 2165.0, 1138.0, 647.0, 384.0, 201.0, 137.0, 85.0, 54.0, 30.0, 27.0, 23.0, 8.0, 8.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5822391510009766e-05, -3.4574419260025024e-05, -3.332644701004028e-05, -3.207847476005554e-05, -3.08305025100708e-05, -2.958253026008606e-05, -2.833455801010132e-05, -2.7086585760116577e-05, -2.5838613510131836e-05, -2.4590641260147095e-05, -2.3342669010162354e-05, -2.2094696760177612e-05, -2.084672451019287e-05, -1.959875226020813e-05, -1.835078001022339e-05, -1.7102807760238647e-05, -1.5854835510253906e-05, -1.4606863260269165e-05, -1.3358891010284424e-05, -1.2110918760299683e-05, -1.0862946510314941e-05, -9.6149742603302e-06, -8.367002010345459e-06, -7.119029760360718e-06, -5.8710575103759766e-06, -4.623085260391235e-06, -3.375113010406494e-06, -2.127140760421753e-06, -8.791685104370117e-07, 3.688037395477295e-07, 1.6167759895324707e-06, 2.864748239517212e-06, 4.112720489501953e-06, 5.360692739486694e-06, 6.6086649894714355e-06, 7.856637239456177e-06, 9.104609489440918e-06, 1.035258173942566e-05, 1.16005539894104e-05, 1.2848526239395142e-05, 1.4096498489379883e-05, 1.5344470739364624e-05, 1.6592442989349365e-05, 1.7840415239334106e-05, 1.9088387489318848e-05, 2.033635973930359e-05, 2.158433198928833e-05, 2.283230423927307e-05, 2.4080276489257812e-05, 2.5328248739242554e-05, 2.6576220989227295e-05, 2.7824193239212036e-05, 2.9072165489196777e-05, 3.032013773918152e-05, 3.156810998916626e-05, 3.2816082239151e-05, 3.406405448913574e-05, 3.5312026739120483e-05, 3.6559998989105225e-05, 3.7807971239089966e-05, 3.905594348907471e-05, 4.030391573905945e-05, 4.155188798904419e-05, 4.279986023902893e-05, 4.404783248901367e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 7.0, 4.0, 7.0, 5.0, 15.0, 23.0, 22.0, 29.0, 44.0, 42.0, 41.0, 69.0, 75.0, 43.0, 71.0, 47.0, 66.0, 39.0, 67.0, 48.0, 51.0, 29.0, 30.0, 29.0, 22.0, 14.0, 15.0, 15.0, 4.0, 5.0, 2.0, 5.0, 0.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.894371032714844e-06, -9.612180292606354e-06, -9.329989552497864e-06, -9.047798812389374e-06, -8.765608072280884e-06, -8.483417332172394e-06, -8.201226592063904e-06, -7.919035851955414e-06, -7.636845111846924e-06, -7.354654371738434e-06, -7.072463631629944e-06, -6.790272891521454e-06, -6.508082151412964e-06, -6.225891411304474e-06, -5.943700671195984e-06, -5.661509931087494e-06, -5.379319190979004e-06, -5.097128450870514e-06, -4.814937710762024e-06, -4.532746970653534e-06, -4.250556230545044e-06, -3.968365490436554e-06, -3.686174750328064e-06, -3.403984010219574e-06, -3.121793270111084e-06, -2.839602530002594e-06, -2.557411789894104e-06, -2.275221049785614e-06, -1.993030309677124e-06, -1.710839569568634e-06, -1.428648829460144e-06, -1.146458089351654e-06, -8.642673492431641e-07, -5.820766091346741e-07, -2.998858690261841e-07, -1.7695128917694092e-08, 2.644956111907959e-07, 5.466863512992859e-07, 8.288770914077759e-07, 1.1110678315162659e-06, 1.3932585716247559e-06, 1.6754493117332458e-06, 1.957640051841736e-06, 2.239830791950226e-06, 2.522021532058716e-06, 2.804212272167206e-06, 3.086403012275696e-06, 3.368593752384186e-06, 3.6507844924926758e-06, 3.932975232601166e-06, 4.215165972709656e-06, 4.497356712818146e-06, 4.779547452926636e-06, 5.061738193035126e-06, 5.343928933143616e-06, 5.626119673252106e-06, 5.908310413360596e-06, 6.190501153469086e-06, 6.472691893577576e-06, 6.754882633686066e-06, 7.037073373794556e-06, 7.319264113903046e-06, 7.601454854011536e-06, 7.883645594120026e-06, 8.165836334228516e-06]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 4.0, 9.0, 16.0, 23.0, 36.0, 63.0, 110.0, 274.0, 213.0, 109.0, 55.0, 31.0, 15.0, 10.0, 7.0, 11.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0040811714716255665, -0.0039835465140640736, -0.0038859210908412933, -0.0037882961332798004, -0.003690670942887664, -0.0035930457524955273, -0.0034954205621033907, -0.003397795371711254, -0.0033001701813191175, -0.003202544990926981, -0.0031049198005348444, -0.003007294610142708, -0.002909669652581215, -0.0028120444621890783, -0.0027144192717969418, -0.002616794081404805, -0.0025191688910126686, -0.002421543700620532, -0.0023239185102283955, -0.0022262935526669025, -0.002128668362274766, -0.0020310431718826294, -0.0019334179814904928, -0.0018357927910983562, -0.0017381678335368633, -0.0016405426431447268, -0.001542917569167912, -0.0014452923787757754, -0.0013476671883836389, -0.0012500421144068241, -0.0011524169240146875, -0.001054791733622551, -0.0009571665432304144, -0.0008595414110459387, -0.0007619162206538022, -0.0006642910884693265, -0.0005666658980771899, -0.00046904076589271426, -0.0003714156337082386, -0.00027379044331610203, -0.00017616531113162637, -7.854015711927786e-05, 1.9084996893070638e-05, 0.00011671014362946153, 0.00021433530491776764, 0.00031196046620607376, 0.0004095855983905494, 0.000507210788782686, 0.0006048359209671617, 0.0007024610531516373, 0.0008000862435437739, 0.0008977113757282495, 0.0009953365661203861, 0.0010929617565125227, 0.0011905868304893374, 0.001288212020881474, 0.0013858370948582888, 0.0014834622852504253, 0.00158108735922724, 0.0016787125496193767, 0.0017763377400115132, 0.001873962813988328, 0.0019715880043804646, 0.002069213194772601, 0.0021668383851647377]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 3.0, 15.0, 11.0, 16.0, 13.0, 27.0, 25.0, 24.0, 33.0, 31.0, 28.0, 34.0, 37.0, 38.0, 52.0, 49.0, 55.0, 60.0, 39.0, 48.0, 38.0, 34.0, 43.0, 30.0, 26.0, 33.0, 25.0, 21.0, 22.0, 16.0, 9.0, 15.0, 4.0, 13.0, 5.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.0012106747599318624, -0.0011751882266253233, -0.001139701809734106, -0.001104215276427567, -0.001068728743121028, -0.0010332422098144889, -0.0009977556765079498, -0.0009622692596167326, -0.0009267827263101935, -0.0008912961930036545, -0.0008558097179047763, -0.0008203232428058982, -0.0007848367094993591, -0.0007493501761928201, -0.0007138637010939419, -0.0006783772259950638, -0.0006428906926885247, -0.0006074041593819857, -0.0005719176842831075, -0.0005364312091842294, -0.0005009446758776903, -0.0004654581716749817, -0.0004299716674722731, -0.0003944851632695645, -0.0003589986590668559, -0.0003235121548641473, -0.0002880256506614387, -0.0002525391464587301, -0.0002170526422560215, -0.0001815661380533129, -0.0001460796338506043, -0.0001105931296478957, -7.510674186050892e-05, -3.962023765780032e-05, -4.133733455091715e-06, 3.135277074761689e-05, 6.683927495032549e-05, 0.00010232577915303409, 0.0001378122833557427, 0.0001732987875584513, 0.0002087852917611599, 0.0002442717959638685, 0.0002797583001665771, 0.0003152448043692857, 0.0003507313085719943, 0.0003862178127747029, 0.0004217043169774115, 0.0004571908211801201, 0.0004926773253828287, 0.0005281638586893678, 0.0005636503337882459, 0.0005991368088871241, 0.0006346233421936631, 0.0006701098755002022, 0.0007055963505990803, 0.0007410828256979585, 0.0007765693590044975, 0.0008120558923110366, 0.0008475423674099147, 0.0008830288425087929, 0.0009185153758153319, 0.000954001909121871, 0.0009894883260130882, 0.0010249748593196273, 0.0010604613926261663]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 5.0, 11.0, 14.0, 16.0, 9.0, 27.0, 30.0, 43.0, 60.0, 95.0, 147.0, 261.0, 510.0, 1109.0, 3013.0, 9059.0, 39696.0, 4095448.0, 31436.0, 8035.0, 2751.0, 1170.0, 518.0, 287.0, 166.0, 87.0, 86.0, 38.0, 40.0, 28.0, 14.0, 12.0, 10.0, 14.0, 6.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00701141357421875, -0.006795287132263184, -0.006579160690307617, -0.006363034248352051, -0.006146907806396484, -0.005930781364440918, -0.0057146549224853516, -0.005498528480529785, -0.005282402038574219, -0.005066275596618652, -0.004850149154663086, -0.0046340227127075195, -0.004417896270751953, -0.004201769828796387, -0.00398564338684082, -0.003769516944885254, -0.0035533905029296875, -0.003337264060974121, -0.0031211376190185547, -0.0029050111770629883, -0.002688884735107422, -0.0024727582931518555, -0.002256631851196289, -0.0020405054092407227, -0.0018243789672851562, -0.0016082525253295898, -0.0013921260833740234, -0.001175999641418457, -0.0009598731994628906, -0.0007437467575073242, -0.0005276203155517578, -0.0003114938735961914, -9.5367431640625e-05, 0.0001207590103149414, 0.0003368854522705078, 0.0005530118942260742, 0.0007691383361816406, 0.000985264778137207, 0.0012013912200927734, 0.0014175176620483398, 0.0016336441040039062, 0.0018497705459594727, 0.002065896987915039, 0.0022820234298706055, 0.002498149871826172, 0.0027142763137817383, 0.0029304027557373047, 0.003146529197692871, 0.0033626556396484375, 0.003578782081604004, 0.0037949085235595703, 0.004011034965515137, 0.004227161407470703, 0.0044432878494262695, 0.004659414291381836, 0.004875540733337402, 0.005091667175292969, 0.005307793617248535, 0.0055239200592041016, 0.005740046501159668, 0.005956172943115234, 0.006172299385070801, 0.006388425827026367, 0.006604552268981934, 0.0068206787109375]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 10.0, 10.0, 16.0, 12.0, 17.0, 14.0, 34.0, 20.0, 41.0, 31.0, 35.0, 37.0, 38.0, 46.0, 59.0, 52.0, 46.0, 47.0, 54.0, 38.0, 36.0, 35.0, 35.0, 33.0, 34.0, 38.0, 24.0, 16.0, 20.0, 4.0, 8.0, 13.0, 8.0, 9.0, 4.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0006513595581054688, -0.0006312578916549683, -0.0006111562252044678, -0.0005910545587539673, -0.0005709528923034668, -0.0005508512258529663, -0.0005307495594024658, -0.0005106478929519653, -0.0004905462265014648, -0.00047044456005096436, -0.00045034289360046387, -0.0004302412271499634, -0.0004101395606994629, -0.0003900378942489624, -0.0003699362277984619, -0.0003498345613479614, -0.00032973289489746094, -0.00030963122844696045, -0.00028952956199645996, -0.00026942789554595947, -0.000249326229095459, -0.0002292245626449585, -0.000209122896194458, -0.00018902122974395752, -0.00016891956329345703, -0.00014881789684295654, -0.00012871623039245605, -0.00010861456394195557, -8.851289749145508e-05, -6.841123104095459e-05, -4.83095645904541e-05, -2.8207898139953613e-05, -8.106231689453125e-06, 1.1995434761047363e-05, 3.209710121154785e-05, 5.219876766204834e-05, 7.230043411254883e-05, 9.240210056304932e-05, 0.0001125037670135498, 0.0001326054334640503, 0.00015270709991455078, 0.00017280876636505127, 0.00019291043281555176, 0.00021301209926605225, 0.00023311376571655273, 0.0002532154321670532, 0.0002733170986175537, 0.0002934187650680542, 0.0003135204315185547, 0.0003336220979690552, 0.00035372376441955566, 0.00037382543087005615, 0.00039392709732055664, 0.00041402876377105713, 0.0004341304302215576, 0.0004542320966720581, 0.0004743337631225586, 0.0004944354295730591, 0.0005145370960235596, 0.0005346387624740601, 0.0005547404289245605, 0.000574842095375061, 0.0005949437618255615, 0.000615045428276062, 0.0006351470947265625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 6.0, 1.0, 18.0, 14.0, 20.0, 26.0, 52.0, 43.0, 85.0, 105.0, 170.0, 265.0, 453.0, 697.0, 1283.0, 2244.0, 4440.0, 10138.0, 28297.0, 158301.0, 3838845.0, 107024.0, 23202.0, 8991.0, 4211.0, 2162.0, 1234.0, 713.0, 435.0, 269.0, 188.0, 106.0, 73.0, 41.0, 38.0, 25.0, 22.0, 7.0, 7.0, 6.0, 6.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0034694671630859375, -0.0033742189407348633, -0.003278970718383789, -0.003183722496032715, -0.0030884742736816406, -0.0029932260513305664, -0.002897977828979492, -0.002802729606628418, -0.0027074813842773438, -0.0026122331619262695, -0.0025169849395751953, -0.002421736717224121, -0.002326488494873047, -0.0022312402725219727, -0.0021359920501708984, -0.0020407438278198242, -0.00194549560546875, -0.0018502473831176758, -0.0017549991607666016, -0.0016597509384155273, -0.0015645027160644531, -0.001469254493713379, -0.0013740062713623047, -0.0012787580490112305, -0.0011835098266601562, -0.001088261604309082, -0.0009930133819580078, -0.0008977651596069336, -0.0008025169372558594, -0.0007072687149047852, -0.0006120204925537109, -0.0005167722702026367, -0.0004215240478515625, -0.0003262758255004883, -0.00023102760314941406, -0.00013577938079833984, -4.0531158447265625e-05, 5.4717063903808594e-05, 0.0001499652862548828, 0.00024521350860595703, 0.00034046173095703125, 0.00043570995330810547, 0.0005309581756591797, 0.0006262063980102539, 0.0007214546203613281, 0.0008167028427124023, 0.0009119510650634766, 0.0010071992874145508, 0.001102447509765625, 0.0011976957321166992, 0.0012929439544677734, 0.0013881921768188477, 0.0014834403991699219, 0.001578688621520996, 0.0016739368438720703, 0.0017691850662231445, 0.0018644332885742188, 0.001959681510925293, 0.002054929733276367, 0.0021501779556274414, 0.0022454261779785156, 0.00234067440032959, 0.002435922622680664, 0.0025311708450317383, 0.0026264190673828125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 7.0, 9.0, 11.0, 9.0, 9.0, 9.0, 19.0, 20.0, 25.0, 30.0, 44.0, 77.0, 237.0, 627.0, 2089.0, 482.0, 171.0, 61.0, 30.0, 24.0, 15.0, 14.0, 11.0, 7.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.00045561790466308594, -0.00043900683522224426, -0.0004223957657814026, -0.0004057846963405609, -0.00038917362689971924, -0.00037256255745887756, -0.0003559514880180359, -0.0003393404185771942, -0.00032272934913635254, -0.00030611827969551086, -0.0002895072102546692, -0.0002728961408138275, -0.00025628507137298584, -0.00023967400193214417, -0.0002230629324913025, -0.00020645186305046082, -0.00018984079360961914, -0.00017322972416877747, -0.0001566186547279358, -0.00014000758528709412, -0.00012339651584625244, -0.00010678544640541077, -9.017437696456909e-05, -7.356330752372742e-05, -5.695223808288574e-05, -4.034116864204407e-05, -2.3730099201202393e-05, -7.119029760360718e-06, 9.492039680480957e-06, 2.6103109121322632e-05, 4.271417856216431e-05, 5.932524800300598e-05, 7.593631744384766e-05, 9.254738688468933e-05, 0.000109158456325531, 0.00012576952576637268, 0.00014238059520721436, 0.00015899166464805603, 0.0001756027340888977, 0.00019221380352973938, 0.00020882487297058105, 0.00022543594241142273, 0.0002420470118522644, 0.0002586580812931061, 0.00027526915073394775, 0.00029188022017478943, 0.0003084912896156311, 0.0003251023590564728, 0.00034171342849731445, 0.00035832449793815613, 0.0003749355673789978, 0.0003915466368198395, 0.00040815770626068115, 0.00042476877570152283, 0.0004413798451423645, 0.0004579909145832062, 0.00047460198402404785, 0.0004912130534648895, 0.0005078241229057312, 0.0005244351923465729, 0.0005410462617874146, 0.0005576573312282562, 0.0005742684006690979, 0.0005908794701099396, 0.0006074905395507812]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 7.0, 7.0, 11.0, 12.0, 20.0, 33.0, 59.0, 101.0, 209.0, 243.0, 121.0, 81.0, 37.0, 23.0, 15.0, 8.0, 10.0, 0.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0026527184527367353, -0.002591090276837349, -0.002529462333768606, -0.0024678341578692198, -0.002406206214800477, -0.0023445780389010906, -0.002282950095832348, -0.0022213219199329615, -0.0021596939768642187, -0.0020980658009648323, -0.0020364378578960896, -0.001974809681996703, -0.0019131817389279604, -0.0018515536794438958, -0.0017899256199598312, -0.0017282974440604448, -0.0016666693845763803, -0.0016050413250923157, -0.001543413265608251, -0.0014817852061241865, -0.001420157146640122, -0.0013585290871560574, -0.001296900911256671, -0.0012352729681879282, -0.0011736447922885418, -0.0011120167328044772, -0.0010503886733204126, -0.000988760613836348, -0.0009271325543522835, -0.0008655044948682189, -0.0008038763771764934, -0.0007422483176924288, -0.000680620432831347, -0.0006189923733472824, -0.0005573643138632178, -0.0004957362543791533, -0.0004341081657912582, -0.00037248010630719364, -0.0003108520177192986, -0.000249223958235234, -0.00018759589875116944, -0.00012596783926710486, -6.433976523112506e-05, -2.7116911951452494e-06, 5.891636828891933e-05, 0.00012054442777298391, 0.00018217251636087894, 0.00024380057584494352, 0.0003054286353290081, 0.0003670566948130727, 0.00042868475429713726, 0.0004903128137812018, 0.0005519408732652664, 0.000613568932749331, 0.0006751970504410565, 0.0007368251099251211, 0.0007984531694091856, 0.0008600812288932502, 0.0009217092883773148, 0.0009833374060690403, 0.0010449654655531049, 0.0011065935250371695, 0.001168221584521234, 0.0012298496440052986, 0.0012914777034893632]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 4.0, 5.0, 6.0, 11.0, 6.0, 9.0, 12.0, 9.0, 13.0, 16.0, 22.0, 21.0, 27.0, 30.0, 22.0, 20.0, 28.0, 26.0, 37.0, 42.0, 43.0, 49.0, 41.0, 32.0, 36.0, 36.0, 27.0, 36.0, 44.0, 30.0, 28.0, 33.0, 28.0, 25.0, 25.0, 13.0, 11.0, 13.0, 12.0, 11.0, 9.0, 10.0, 5.0, 9.0, 5.0, 4.0, 1.0, 4.0, 6.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00056170963216573, -0.0005429800949059427, -0.0005242504994384944, -0.0005055209621787071, -0.0004867914249189198, -0.000468061858555302, -0.00044933229219168425, -0.0004306027549318969, -0.00041187318856827915, -0.00039314362220466137, -0.00037441408494487405, -0.00035568451858125627, -0.0003369549522176385, -0.00031822541495785117, -0.0002994958485942334, -0.0002807662822306156, -0.0002620367449708283, -0.00024330719315912575, -0.0002245776413474232, -0.00020584807498380542, -0.00018711852317210287, -0.00016838897136040032, -0.00014965940499678254, -0.00013092985318508, -0.00011220030137337744, -9.347074956167489e-05, -7.474119047401473e-05, -5.601163502433337e-05, -3.7282079574652016e-05, -1.8552527762949467e-05, 1.7703132471069694e-07, 1.890659041237086e-05, 3.763614222407341e-05, 5.6365697673754767e-05, 7.509525312343612e-05, 9.382481221109629e-05, 0.00011255436402279884, 0.00013128391583450139, 0.00015001348219811916, 0.0001687430340098217, 0.00018747258582152426, 0.0002062021376332268, 0.00022493168944492936, 0.00024366125580854714, 0.0002623908221721649, 0.00028112035943195224, 0.00029984992579557, 0.0003185794921591878, 0.0003373090294189751, 0.0003560385957825929, 0.0003747681330423802, 0.000393497699405998, 0.0004122272366657853, 0.0004309568030294031, 0.00044968636939302087, 0.0004684159066528082, 0.00048714547301642597, 0.0005058750393800437, 0.0005246045766398311, 0.0005433341138996184, 0.0005620637093670666, 0.0005807932466268539, 0.0005995227838866413, 0.0006182523793540895, 0.0006369819166138768]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 7.0, 6.0, 15.0, 20.0, 27.0, 34.0, 67.0, 65.0, 95.0, 147.0, 240.0, 304.0, 440.0, 546.0, 797.0, 1193.0, 1707.0, 2581.0, 4054.0, 6347.0, 10360.0, 18139.0, 32544.0, 64404.0, 141080.0, 324477.0, 231874.0, 97408.0, 47184.0, 25055.0, 13879.0, 8244.0, 5099.0, 3240.0, 2091.0, 1426.0, 975.0, 637.0, 489.0, 364.0, 246.0, 180.0, 149.0, 94.0, 64.0, 59.0, 31.0, 27.0, 13.0, 17.0, 8.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0006461143493652344, -0.000625118613243103, -0.0006041228771209717, -0.0005831271409988403, -0.000562131404876709, -0.0005411356687545776, -0.0005201399326324463, -0.0004991441965103149, -0.0004781484603881836, -0.00045715272426605225, -0.0004361569881439209, -0.00041516125202178955, -0.0003941655158996582, -0.00037316977977752686, -0.0003521740436553955, -0.00033117830753326416, -0.0003101825714111328, -0.00028918683528900146, -0.0002681910991668701, -0.00024719536304473877, -0.00022619962692260742, -0.00020520389080047607, -0.00018420815467834473, -0.00016321241855621338, -0.00014221668243408203, -0.00012122094631195068, -0.00010022521018981934, -7.922947406768799e-05, -5.823373794555664e-05, -3.723800182342529e-05, -1.6242265701293945e-05, 4.753470420837402e-06, 2.574920654296875e-05, 4.67449426651001e-05, 6.774067878723145e-05, 8.873641490936279e-05, 0.00010973215103149414, 0.0001307278871536255, 0.00015172362327575684, 0.00017271935939788818, 0.00019371509552001953, 0.00021471083164215088, 0.00023570656776428223, 0.0002567023038864136, 0.0002776980400085449, 0.00029869377613067627, 0.0003196895122528076, 0.00034068524837493896, 0.0003616809844970703, 0.00038267672061920166, 0.000403672456741333, 0.00042466819286346436, 0.0004456639289855957, 0.00046665966510772705, 0.0004876554012298584, 0.0005086511373519897, 0.0005296468734741211, 0.0005506426095962524, 0.0005716383457183838, 0.0005926340818405151, 0.0006136298179626465, 0.0006346255540847778, 0.0006556212902069092, 0.0006766170263290405, 0.0006976127624511719]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 6.0, 6.0, 6.0, 5.0, 8.0, 4.0, 10.0, 13.0, 10.0, 15.0, 10.0, 20.0, 27.0, 18.0, 20.0, 26.0, 24.0, 25.0, 22.0, 29.0, 40.0, 45.0, 45.0, 40.0, 47.0, 42.0, 33.0, 42.0, 25.0, 38.0, 28.0, 34.0, 29.0, 29.0, 24.0, 25.0, 19.0, 11.0, 18.0, 16.0, 9.0, 9.0, 10.0, 7.0, 10.0, 4.0, 9.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0006098747253417969, -0.0005899369716644287, -0.0005699992179870605, -0.0005500614643096924, -0.0005301237106323242, -0.0005101859569549561, -0.0004902482032775879, -0.0004703104496002197, -0.00045037269592285156, -0.0004304349422454834, -0.00041049718856811523, -0.00039055943489074707, -0.0003706216812133789, -0.00035068392753601074, -0.0003307461738586426, -0.0003108084201812744, -0.00029087066650390625, -0.0002709329128265381, -0.0002509951591491699, -0.00023105740547180176, -0.0002111196517944336, -0.00019118189811706543, -0.00017124414443969727, -0.0001513063907623291, -0.00013136863708496094, -0.00011143088340759277, -9.149312973022461e-05, -7.155537605285645e-05, -5.161762237548828e-05, -3.167986869812012e-05, -1.1742115020751953e-05, 8.195638656616211e-06, 2.8133392333984375e-05, 4.807114601135254e-05, 6.80088996887207e-05, 8.794665336608887e-05, 0.00010788440704345703, 0.0001278221607208252, 0.00014775991439819336, 0.00016769766807556152, 0.0001876354217529297, 0.00020757317543029785, 0.00022751092910766602, 0.0002474486827850342, 0.00026738643646240234, 0.0002873241901397705, 0.00030726194381713867, 0.00032719969749450684, 0.000347137451171875, 0.00036707520484924316, 0.00038701295852661133, 0.0004069507122039795, 0.00042688846588134766, 0.0004468262195587158, 0.000466763973236084, 0.00048670172691345215, 0.0005066394805908203, 0.0005265772342681885, 0.0005465149879455566, 0.0005664527416229248, 0.000586390495300293, 0.0006063282489776611, 0.0006262660026550293, 0.0006462037563323975, 0.0006661415100097656]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 8.0, 9.0, 14.0, 17.0, 26.0, 36.0, 31.0, 59.0, 88.0, 105.0, 136.0, 176.0, 259.0, 355.0, 562.0, 803.0, 1275.0, 2028.0, 3213.0, 5750.0, 10791.0, 22720.0, 58152.0, 229045.0, 535808.0, 106770.0, 35104.0, 15541.0, 7887.0, 4334.0, 2560.0, 1582.0, 1054.0, 712.0, 436.0, 327.0, 230.0, 145.0, 114.0, 78.0, 56.0, 50.0, 37.0, 24.0, 17.0, 6.0, 9.0, 5.0, 3.0, 8.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009136199951171875, -0.0008843839168548584, -0.0008551478385925293, -0.0008259117603302002, -0.0007966756820678711, -0.000767439603805542, -0.0007382035255432129, -0.0007089674472808838, -0.0006797313690185547, -0.0006504952907562256, -0.0006212592124938965, -0.0005920231342315674, -0.0005627870559692383, -0.0005335509777069092, -0.0005043148994445801, -0.000475078821182251, -0.0004458427429199219, -0.0004166066646575928, -0.00038737058639526367, -0.00035813450813293457, -0.00032889842987060547, -0.00029966235160827637, -0.00027042627334594727, -0.00024119019508361816, -0.00021195411682128906, -0.00018271803855895996, -0.00015348196029663086, -0.00012424588203430176, -9.500980377197266e-05, -6.577372550964355e-05, -3.653764724731445e-05, -7.3015689849853516e-06, 2.193450927734375e-05, 5.117058753967285e-05, 8.040666580200195e-05, 0.00010964274406433105, 0.00013887882232666016, 0.00016811490058898926, 0.00019735097885131836, 0.00022658705711364746, 0.00025582313537597656, 0.00028505921363830566, 0.00031429529190063477, 0.00034353137016296387, 0.00037276744842529297, 0.00040200352668762207, 0.00043123960494995117, 0.0004604756832122803, 0.0004897117614746094, 0.0005189478397369385, 0.0005481839179992676, 0.0005774199962615967, 0.0006066560745239258, 0.0006358921527862549, 0.000665128231048584, 0.0006943643093109131, 0.0007236003875732422, 0.0007528364658355713, 0.0007820725440979004, 0.0008113086223602295, 0.0008405447006225586, 0.0008697807788848877, 0.0008990168571472168, 0.0009282529354095459, 0.000957489013671875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 7.0, 7.0, 10.0, 6.0, 5.0, 14.0, 18.0, 20.0, 20.0, 26.0, 29.0, 31.0, 33.0, 46.0, 40.0, 51.0, 48.0, 42.0, 42.0, 34.0, 42.0, 42.0, 46.0, 43.0, 28.0, 32.0, 30.0, 33.0, 22.0, 29.0, 20.0, 12.0, 19.0, 7.0, 11.0, 15.0, 7.0, 5.0, 4.0, 4.0, 4.0, 6.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0005068778991699219, -0.0004922784864902496, -0.0004776790738105774, -0.00046307966113090515, -0.0004484802484512329, -0.00043388083577156067, -0.00041928142309188843, -0.0004046820104122162, -0.00039008259773254395, -0.0003754831850528717, -0.00036088377237319946, -0.0003462843596935272, -0.000331684947013855, -0.00031708553433418274, -0.0003024861216545105, -0.00028788670897483826, -0.000273287296295166, -0.0002586878836154938, -0.00024408847093582153, -0.0002294890582561493, -0.00021488964557647705, -0.0002002902328968048, -0.00018569082021713257, -0.00017109140753746033, -0.00015649199485778809, -0.00014189258217811584, -0.0001272931694984436, -0.00011269375681877136, -9.809434413909912e-05, -8.349493145942688e-05, -6.889551877975464e-05, -5.42961061000824e-05, -3.9696693420410156e-05, -2.5097280740737915e-05, -1.0497868061065674e-05, 4.101544618606567e-06, 1.870095729827881e-05, 3.330036997795105e-05, 4.789978265762329e-05, 6.249919533729553e-05, 7.709860801696777e-05, 9.169802069664001e-05, 0.00010629743337631226, 0.0001208968460559845, 0.00013549625873565674, 0.00015009567141532898, 0.00016469508409500122, 0.00017929449677467346, 0.0001938939094543457, 0.00020849332213401794, 0.00022309273481369019, 0.00023769214749336243, 0.00025229156017303467, 0.0002668909728527069, 0.00028149038553237915, 0.0002960897982120514, 0.00031068921089172363, 0.0003252886235713959, 0.0003398880362510681, 0.00035448744893074036, 0.0003690868616104126, 0.00038368627429008484, 0.0003982856869697571, 0.0004128850996494293, 0.00042748451232910156]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 6.0, 6.0, 10.0, 15.0, 17.0, 25.0, 24.0, 49.0, 73.0, 94.0, 156.0, 236.0, 358.0, 621.0, 1162.0, 2118.0, 4656.0, 12175.0, 43991.0, 648614.0, 283018.0, 32947.0, 9856.0, 3931.0, 1785.0, 974.0, 591.0, 332.0, 207.0, 124.0, 113.0, 66.0, 54.0, 39.0, 23.0, 23.0, 13.0, 13.0, 14.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017821788787841797, -0.0001722574234008789, -0.00016629695892333984, -0.00016033649444580078, -0.00015437602996826172, -0.00014841556549072266, -0.0001424551010131836, -0.00013649463653564453, -0.00013053417205810547, -0.0001245737075805664, -0.00011861324310302734, -0.00011265277862548828, -0.00010669231414794922, -0.00010073184967041016, -9.47713851928711e-05, -8.881092071533203e-05, -8.285045623779297e-05, -7.68899917602539e-05, -7.092952728271484e-05, -6.496906280517578e-05, -5.900859832763672e-05, -5.3048133850097656e-05, -4.7087669372558594e-05, -4.112720489501953e-05, -3.516674041748047e-05, -2.9206275939941406e-05, -2.3245811462402344e-05, -1.728534698486328e-05, -1.1324882507324219e-05, -5.364418029785156e-06, 5.960464477539062e-07, 6.556510925292969e-06, 1.2516975402832031e-05, 1.8477439880371094e-05, 2.4437904357910156e-05, 3.039836883544922e-05, 3.635883331298828e-05, 4.2319297790527344e-05, 4.8279762268066406e-05, 5.424022674560547e-05, 6.020069122314453e-05, 6.61611557006836e-05, 7.212162017822266e-05, 7.808208465576172e-05, 8.404254913330078e-05, 9.000301361083984e-05, 9.59634780883789e-05, 0.00010192394256591797, 0.00010788440704345703, 0.0001138448715209961, 0.00011980533599853516, 0.00012576580047607422, 0.00013172626495361328, 0.00013768672943115234, 0.0001436471939086914, 0.00014960765838623047, 0.00015556812286376953, 0.0001615285873413086, 0.00016748905181884766, 0.00017344951629638672, 0.00017940998077392578, 0.00018537044525146484, 0.0001913309097290039, 0.00019729137420654297, 0.00020325183868408203]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 7.0, 4.0, 9.0, 18.0, 18.0, 26.0, 32.0, 41.0, 62.0, 67.0, 82.0, 74.0, 107.0, 91.0, 72.0, 75.0, 58.0, 43.0, 20.0, 17.0, 20.0, 15.0, 8.0, 6.0, 7.0, 5.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1086463928222656e-05, -1.0708346962928772e-05, -1.0330229997634888e-05, -9.952113032341003e-06, -9.573996067047119e-06, -9.195879101753235e-06, -8.81776213645935e-06, -8.439645171165466e-06, -8.061528205871582e-06, -7.683411240577698e-06, -7.3052942752838135e-06, -6.927177309989929e-06, -6.549060344696045e-06, -6.170943379402161e-06, -5.792826414108276e-06, -5.414709448814392e-06, -5.036592483520508e-06, -4.6584755182266235e-06, -4.280358552932739e-06, -3.902241587638855e-06, -3.5241246223449707e-06, -3.1460076570510864e-06, -2.767890691757202e-06, -2.389773726463318e-06, -2.0116567611694336e-06, -1.6335397958755493e-06, -1.255422830581665e-06, -8.773058652877808e-07, -4.991888999938965e-07, -1.210719347000122e-07, 2.5704503059387207e-07, 6.351619958877563e-07, 1.0132789611816406e-06, 1.391395926475525e-06, 1.7695128917694092e-06, 2.1476298570632935e-06, 2.5257468223571777e-06, 2.903863787651062e-06, 3.2819807529449463e-06, 3.6600977182388306e-06, 4.038214683532715e-06, 4.416331648826599e-06, 4.794448614120483e-06, 5.172565579414368e-06, 5.550682544708252e-06, 5.928799510002136e-06, 6.3069164752960205e-06, 6.685033440589905e-06, 7.063150405883789e-06, 7.441267371177673e-06, 7.819384336471558e-06, 8.197501301765442e-06, 8.575618267059326e-06, 8.95373523235321e-06, 9.331852197647095e-06, 9.709969162940979e-06, 1.0088086128234863e-05, 1.0466203093528748e-05, 1.0844320058822632e-05, 1.1222437024116516e-05, 1.16005539894104e-05, 1.1978670954704285e-05, 1.2356787919998169e-05, 1.2734904885292053e-05, 1.3113021850585938e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 5.0, 5.0, 8.0, 16.0, 18.0, 25.0, 40.0, 60.0, 80.0, 161.0, 259.0, 394.0, 730.0, 1354.0, 2467.0, 5492.0, 14612.0, 52493.0, 408101.0, 479715.0, 55625.0, 15054.0, 5909.0, 2640.0, 1363.0, 735.0, 448.0, 246.0, 171.0, 108.0, 71.0, 55.0, 23.0, 23.0, 11.0, 11.0, 6.0, 5.0, 6.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001558065414428711, -0.0001502465456724167, -0.00014468654990196228, -0.00013912655413150787, -0.00013356655836105347, -0.00012800656259059906, -0.00012244656682014465, -0.00011688657104969025, -0.00011132657527923584, -0.00010576657950878143, -0.00010020658373832703, -9.464658796787262e-05, -8.908659219741821e-05, -8.35265964269638e-05, -7.79666006565094e-05, -7.240660488605499e-05, -6.684660911560059e-05, -6.128661334514618e-05, -5.572661757469177e-05, -5.0166621804237366e-05, -4.460662603378296e-05, -3.904663026332855e-05, -3.3486634492874146e-05, -2.792663872241974e-05, -2.2366642951965332e-05, -1.6806647181510925e-05, -1.1246651411056519e-05, -5.686655640602112e-06, -1.2665987014770508e-07, 5.433335900306702e-06, 1.0993331670761108e-05, 1.6553327441215515e-05, 2.2113323211669922e-05, 2.767331898212433e-05, 3.3233314752578735e-05, 3.879331052303314e-05, 4.435330629348755e-05, 4.9913302063941956e-05, 5.547329783439636e-05, 6.103329360485077e-05, 6.659328937530518e-05, 7.215328514575958e-05, 7.771328091621399e-05, 8.32732766866684e-05, 8.88332724571228e-05, 9.439326822757721e-05, 9.995326399803162e-05, 0.00010551325976848602, 0.00011107325553894043, 0.00011663325130939484, 0.00012219324707984924, 0.00012775324285030365, 0.00013331323862075806, 0.00013887323439121246, 0.00014443323016166687, 0.00014999322593212128, 0.00015555322170257568, 0.0001611132174730301, 0.0001666732132434845, 0.0001722332090139389, 0.0001777932047843933, 0.00018335320055484772, 0.00018891319632530212, 0.00019447319209575653, 0.00020003318786621094]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 3.0, 12.0, 5.0, 11.0, 17.0, 25.0, 33.0, 49.0, 47.0, 89.0, 83.0, 127.0, 122.0, 83.0, 71.0, 60.0, 44.0, 37.0, 21.0, 10.0, 7.0, 10.0, 7.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7670135498046875e-05, -3.6621466279029846e-05, -3.557279706001282e-05, -3.452412784099579e-05, -3.347545862197876e-05, -3.242678940296173e-05, -3.13781201839447e-05, -3.0329450964927673e-05, -2.9280781745910645e-05, -2.8232112526893616e-05, -2.7183443307876587e-05, -2.6134774088859558e-05, -2.508610486984253e-05, -2.40374356508255e-05, -2.298876643180847e-05, -2.1940097212791443e-05, -2.0891427993774414e-05, -1.9842758774757385e-05, -1.8794089555740356e-05, -1.7745420336723328e-05, -1.66967511177063e-05, -1.564808189868927e-05, -1.4599412679672241e-05, -1.3550743460655212e-05, -1.2502074241638184e-05, -1.1453405022621155e-05, -1.0404735803604126e-05, -9.356066584587097e-06, -8.307397365570068e-06, -7.2587281465530396e-06, -6.210058927536011e-06, -5.161389708518982e-06, -4.112720489501953e-06, -3.0640512704849243e-06, -2.0153820514678955e-06, -9.667128324508667e-07, 8.195638656616211e-08, 1.130625605583191e-06, 2.1792948246002197e-06, 3.2279640436172485e-06, 4.276633262634277e-06, 5.325302481651306e-06, 6.373971700668335e-06, 7.422640919685364e-06, 8.471310138702393e-06, 9.519979357719421e-06, 1.056864857673645e-05, 1.1617317795753479e-05, 1.2665987014770508e-05, 1.3714656233787537e-05, 1.4763325452804565e-05, 1.5811994671821594e-05, 1.6860663890838623e-05, 1.7909333109855652e-05, 1.895800232887268e-05, 2.000667154788971e-05, 2.1055340766906738e-05, 2.2104009985923767e-05, 2.3152679204940796e-05, 2.4201348423957825e-05, 2.5250017642974854e-05, 2.6298686861991882e-05, 2.734735608100891e-05, 2.839602530002594e-05, 2.944469451904297e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 7.0, 7.0, 8.0, 13.0, 24.0, 26.0, 59.0, 106.0, 204.0, 228.0, 130.0, 74.0, 38.0, 27.0, 16.0, 11.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002422218443825841, -0.002363307634368539, -0.002304396592080593, -0.002245485782623291, -0.0021865747403353453, -0.002127663930878043, -0.0020687528885900974, -0.0020098420791327953, -0.0019509312696754932, -0.0018920203438028693, -0.0018331094179302454, -0.0017741986084729433, -0.0017152876826003194, -0.0016563767567276955, -0.0015974658308550715, -0.0015385549049824476, -0.0014796439791098237, -0.0014207330532371998, -0.0013618221273645759, -0.001302911201491952, -0.0012440003920346498, -0.001185089466162026, -0.001126178540289402, -0.001067267614416778, -0.0010083566885441542, -0.0009494457626715302, -0.0008905348950065672, -0.0008316239691339433, -0.0007727131014689803, -0.0007138021755963564, -0.0006548912497237325, -0.0005959803238511086, -0.0005370695143938065, -0.000478158617625013, -0.00041924772085621953, -0.0003603367949835956, -0.00030142589821480215, -0.00024251500144600868, -0.00018360407557338476, -0.0001246931788045913, -6.578228203579783e-05, -6.8713779910467565e-06, 5.203952605370432e-05, 0.00011095043737441301, 0.00016986133414320648, 0.00022877223091199994, 0.00028768315678462386, 0.0003465940535534173, 0.0004055049503222108, 0.00046441584709100425, 0.0005233267438597977, 0.0005822376697324216, 0.0006411485373973846, 0.0007000594632700086, 0.0007589703891426325, 0.0008178813150152564, 0.0008767921826802194, 0.0009357031085528433, 0.0009946139762178063, 0.0010535249020904303, 0.0011124358279630542, 0.001171346753835678, 0.0012302575632929802, 0.0012891684891656041, 0.001348079415038228]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 3.0, 6.0, 12.0, 5.0, 11.0, 10.0, 11.0, 11.0, 17.0, 19.0, 25.0, 27.0, 24.0, 29.0, 19.0, 28.0, 25.0, 33.0, 43.0, 50.0, 39.0, 44.0, 35.0, 43.0, 32.0, 28.0, 39.0, 37.0, 34.0, 29.0, 33.0, 27.0, 23.0, 25.0, 15.0, 13.0, 9.0, 10.0, 11.0, 12.0, 9.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005788164562545717, -0.0005596099072135985, -0.0005404032999649644, -0.0005211967509239912, -0.000501990201883018, -0.00048278365284204483, -0.0004635770746972412, -0.00044437049655243754, -0.00042516394751146436, -0.00040595739847049117, -0.00038675082032568753, -0.0003675442421808839, -0.0003483376931399107, -0.0003291311440989375, -0.00030992456595413387, -0.0002907179878093302, -0.00027151143876835704, -0.00025230488972738385, -0.0002330983115825802, -0.0002138917479896918, -0.00019468518439680338, -0.00017547862080391496, -0.00015627205721102655, -0.00013706549361813813, -0.00011785893002524972, -9.86523664323613e-05, -7.944580283947289e-05, -6.0239239246584475e-05, -4.103267565369606e-05, -2.1826112060807645e-05, -2.6195484679192305e-06, 1.6587015124969184e-05, 3.5793520510196686e-05, 5.50000841030851e-05, 7.420664769597352e-05, 9.341321128886193e-05, 0.00011261977488175035, 0.00013182633847463876, 0.00015103290206752717, 0.0001702394656604156, 0.000189446029253304, 0.00020865259284619242, 0.00022785915643908083, 0.0002470657345838845, 0.00026627228362485766, 0.00028547883266583085, 0.0003046854108106345, 0.00032389198895543814, 0.0003430985379964113, 0.0003623050870373845, 0.00038151166518218815, 0.0004007182433269918, 0.000419924792367965, 0.00043913134140893817, 0.0004583379195537418, 0.00047754449769854546, 0.0004967510467395186, 0.0005159575957804918, 0.000535164144821465, 0.0005543707520700991, 0.0005735773011110723, 0.0005927838501520455, 0.0006119904574006796, 0.0006311970064416528, 0.000650403555482626]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 6.0, 5.0, 5.0, 5.0, 12.0, 11.0, 23.0, 28.0, 45.0, 57.0, 82.0, 152.0, 175.0, 306.0, 442.0, 643.0, 969.0, 1413.0, 2180.0, 3330.0, 5039.0, 7973.0, 12516.0, 20494.0, 34481.0, 63204.0, 129734.0, 279611.0, 243165.0, 107701.0, 54083.0, 30790.0, 18023.0, 11273.0, 7187.0, 4435.0, 2986.0, 1962.0, 1345.0, 893.0, 575.0, 408.0, 257.0, 178.0, 122.0, 73.0, 51.0, 48.0, 24.0, 15.0, 9.0, 9.0, 3.0, 7.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012674331665039062, -0.001223549246788025, -0.0011796653270721436, -0.0011357814073562622, -0.0010918974876403809, -0.0010480135679244995, -0.0010041296482086182, -0.0009602457284927368, -0.0009163618087768555, -0.0008724778890609741, -0.0008285939693450928, -0.0007847100496292114, -0.0007408261299133301, -0.0006969422101974487, -0.0006530582904815674, -0.000609174370765686, -0.0005652904510498047, -0.0005214065313339233, -0.000477522611618042, -0.00043363869190216064, -0.0003897547721862793, -0.00034587085247039795, -0.0003019869327545166, -0.00025810301303863525, -0.0002142190933227539, -0.00017033517360687256, -0.0001264512538909912, -8.256733417510986e-05, -3.8683414459228516e-05, 5.200505256652832e-06, 4.908442497253418e-05, 9.296834468841553e-05, 0.00013685226440429688, 0.00018073618412017822, 0.00022462010383605957, 0.0002685040235519409, 0.00031238794326782227, 0.0003562718629837036, 0.00040015578269958496, 0.0004440397024154663, 0.00048792362213134766, 0.000531807541847229, 0.0005756914615631104, 0.0006195753812789917, 0.000663459300994873, 0.0007073432207107544, 0.0007512271404266357, 0.0007951110601425171, 0.0008389949798583984, 0.0008828788995742798, 0.0009267628192901611, 0.0009706467390060425, 0.0010145306587219238, 0.0010584145784378052, 0.0011022984981536865, 0.0011461824178695679, 0.0011900663375854492, 0.0012339502573013306, 0.001277834177017212, 0.0013217180967330933, 0.0013656020164489746, 0.001409485936164856, 0.0014533698558807373, 0.0014972537755966187, 0.0015411376953125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 14.0, 7.0, 15.0, 17.0, 11.0, 15.0, 22.0, 26.0, 25.0, 25.0, 40.0, 30.0, 38.0, 47.0, 51.0, 46.0, 41.0, 45.0, 34.0, 46.0, 36.0, 31.0, 42.0, 36.0, 33.0, 29.0, 23.0, 26.0, 17.0, 21.0, 13.0, 15.0, 10.0, 7.0, 3.0, 6.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.000362396240234375, -0.00035003572702407837, -0.00033767521381378174, -0.0003253147006034851, -0.0003129541873931885, -0.00030059367418289185, -0.0002882331609725952, -0.0002758726477622986, -0.00026351213455200195, -0.0002511516213417053, -0.0002387911081314087, -0.00022643059492111206, -0.00021407008171081543, -0.0002017095685005188, -0.00018934905529022217, -0.00017698854207992554, -0.0001646280288696289, -0.00015226751565933228, -0.00013990700244903564, -0.00012754648923873901, -0.00011518597602844238, -0.00010282546281814575, -9.046494960784912e-05, -7.810443639755249e-05, -6.574392318725586e-05, -5.338340997695923e-05, -4.10228967666626e-05, -2.8662383556365967e-05, -1.6301870346069336e-05, -3.941357135772705e-06, 8.419156074523926e-06, 2.0779669284820557e-05, 3.314018249511719e-05, 4.550069570541382e-05, 5.786120891571045e-05, 7.022172212600708e-05, 8.258223533630371e-05, 9.494274854660034e-05, 0.00010730326175689697, 0.0001196637749671936, 0.00013202428817749023, 0.00014438480138778687, 0.0001567453145980835, 0.00016910582780838013, 0.00018146634101867676, 0.0001938268542289734, 0.00020618736743927002, 0.00021854788064956665, 0.00023090839385986328, 0.0002432689070701599, 0.00025562942028045654, 0.0002679899334907532, 0.0002803504467010498, 0.00029271095991134644, 0.00030507147312164307, 0.0003174319863319397, 0.00032979249954223633, 0.00034215301275253296, 0.0003545135259628296, 0.0003668740391731262, 0.00037923455238342285, 0.0003915950655937195, 0.0004039555788040161, 0.00041631609201431274, 0.0004286766052246094]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 9.0, 2.0, 3.0, 7.0, 15.0, 16.0, 10.0, 15.0, 15.0, 38.0, 42.0, 73.0, 77.0, 125.0, 201.0, 357.0, 646.0, 1185.0, 2731.0, 5921.0, 14601.0, 39917.0, 135582.0, 511069.0, 238929.0, 60580.0, 20915.0, 8303.0, 3577.0, 1607.0, 824.0, 448.0, 234.0, 149.0, 73.0, 68.0, 48.0, 34.0, 24.0, 22.0, 20.0, 8.0, 20.0, 8.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00258636474609375, -0.0025117993354797363, -0.0024372339248657227, -0.002362668514251709, -0.0022881031036376953, -0.0022135376930236816, -0.002138972282409668, -0.0020644068717956543, -0.0019898414611816406, -0.001915276050567627, -0.0018407106399536133, -0.0017661452293395996, -0.001691579818725586, -0.0016170144081115723, -0.0015424489974975586, -0.001467883586883545, -0.0013933181762695312, -0.0013187527656555176, -0.001244187355041504, -0.0011696219444274902, -0.0010950565338134766, -0.0010204911231994629, -0.0009459257125854492, -0.0008713603019714355, -0.0007967948913574219, -0.0007222294807434082, -0.0006476640701293945, -0.0005730986595153809, -0.0004985332489013672, -0.0004239678382873535, -0.00034940242767333984, -0.00027483701705932617, -0.0002002716064453125, -0.00012570619583129883, -5.1140785217285156e-05, 2.3424625396728516e-05, 9.799003601074219e-05, 0.00017255544662475586, 0.00024712085723876953, 0.0003216862678527832, 0.0003962516784667969, 0.00047081708908081055, 0.0005453824996948242, 0.0006199479103088379, 0.0006945133209228516, 0.0007690787315368652, 0.0008436441421508789, 0.0009182095527648926, 0.0009927749633789062, 0.00106734037399292, 0.0011419057846069336, 0.0012164711952209473, 0.001291036605834961, 0.0013656020164489746, 0.0014401674270629883, 0.001514732837677002, 0.0015892982482910156, 0.0016638636589050293, 0.001738429069519043, 0.0018129944801330566, 0.0018875598907470703, 0.001962125301361084, 0.0020366907119750977, 0.0021112561225891113, 0.002185821533203125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 9.0, 6.0, 8.0, 8.0, 12.0, 8.0, 9.0, 12.0, 19.0, 26.0, 27.0, 28.0, 30.0, 52.0, 38.0, 48.0, 36.0, 57.0, 45.0, 50.0, 36.0, 48.0, 42.0, 34.0, 35.0, 31.0, 27.0, 25.0, 35.0, 28.0, 22.0, 26.0, 14.0, 14.0, 11.0, 7.0, 6.0, 6.0, 3.0, 2.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00035834312438964844, -0.00034617260098457336, -0.0003340020775794983, -0.0003218315541744232, -0.00030966103076934814, -0.00029749050736427307, -0.000285319983959198, -0.0002731494605541229, -0.00026097893714904785, -0.0002488084137439728, -0.0002366378903388977, -0.00022446736693382263, -0.00021229684352874756, -0.00020012632012367249, -0.0001879557967185974, -0.00017578527331352234, -0.00016361474990844727, -0.0001514442265033722, -0.00013927370309829712, -0.00012710317969322205, -0.00011493265628814697, -0.0001027621328830719, -9.059160947799683e-05, -7.842108607292175e-05, -6.625056266784668e-05, -5.4080039262771606e-05, -4.190951585769653e-05, -2.973899245262146e-05, -1.7568469047546387e-05, -5.3979456424713135e-06, 6.77257776260376e-06, 1.8943101167678833e-05, 3.1113624572753906e-05, 4.328414797782898e-05, 5.545467138290405e-05, 6.762519478797913e-05, 7.97957181930542e-05, 9.196624159812927e-05, 0.00010413676500320435, 0.00011630728840827942, 0.0001284778118133545, 0.00014064833521842957, 0.00015281885862350464, 0.0001649893820285797, 0.00017715990543365479, 0.00018933042883872986, 0.00020150095224380493, 0.00021367147564888, 0.00022584199905395508, 0.00023801252245903015, 0.0002501830458641052, 0.0002623535692691803, 0.00027452409267425537, 0.00028669461607933044, 0.0002988651394844055, 0.0003110356628894806, 0.00032320618629455566, 0.00033537670969963074, 0.0003475472331047058, 0.0003597177565097809, 0.00037188827991485596, 0.00038405880331993103, 0.0003962293267250061, 0.0004083998501300812, 0.00042057037353515625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 9.0, 12.0, 12.0, 15.0, 27.0, 46.0, 89.0, 172.0, 286.0, 508.0, 1085.0, 2849.0, 9648.0, 49034.0, 734784.0, 217188.0, 23679.0, 5490.0, 1883.0, 831.0, 401.0, 187.0, 110.0, 68.0, 34.0, 35.0, 25.0, 20.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3511390686035156e-05, -4.188716411590576e-05, -4.026293754577637e-05, -3.863871097564697e-05, -3.701448440551758e-05, -3.5390257835388184e-05, -3.376603126525879e-05, -3.2141804695129395e-05, -3.0517578125e-05, -2.8893351554870605e-05, -2.726912498474121e-05, -2.5644898414611816e-05, -2.4020671844482422e-05, -2.2396445274353027e-05, -2.0772218704223633e-05, -1.9147992134094238e-05, -1.7523765563964844e-05, -1.589953899383545e-05, -1.4275312423706055e-05, -1.265108585357666e-05, -1.1026859283447266e-05, -9.402632713317871e-06, -7.778406143188477e-06, -6.154179573059082e-06, -4.5299530029296875e-06, -2.905726432800293e-06, -1.2814998626708984e-06, 3.427267074584961e-07, 1.9669532775878906e-06, 3.591179847717285e-06, 5.21540641784668e-06, 6.839632987976074e-06, 8.463859558105469e-06, 1.0088086128234863e-05, 1.1712312698364258e-05, 1.3336539268493652e-05, 1.4960765838623047e-05, 1.658499240875244e-05, 1.8209218978881836e-05, 1.983344554901123e-05, 2.1457672119140625e-05, 2.308189868927002e-05, 2.4706125259399414e-05, 2.633035182952881e-05, 2.7954578399658203e-05, 2.9578804969787598e-05, 3.120303153991699e-05, 3.282725811004639e-05, 3.445148468017578e-05, 3.6075711250305176e-05, 3.769993782043457e-05, 3.9324164390563965e-05, 4.094839096069336e-05, 4.2572617530822754e-05, 4.419684410095215e-05, 4.582107067108154e-05, 4.744529724121094e-05, 4.906952381134033e-05, 5.0693750381469727e-05, 5.231797695159912e-05, 5.3942203521728516e-05, 5.556643009185791e-05, 5.7190656661987305e-05, 5.88148832321167e-05, 6.0439109802246094e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 5.0, 8.0, 13.0, 15.0, 12.0, 31.0, 31.0, 77.0, 111.0, 250.0, 154.0, 102.0, 76.0, 26.0, 38.0, 13.0, 19.0, 3.0, 4.0, 5.0, 1.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.589557647705078e-06, -4.441477358341217e-06, -4.293397068977356e-06, -4.145316779613495e-06, -3.997236490249634e-06, -3.849156200885773e-06, -3.7010759115219116e-06, -3.5529956221580505e-06, -3.4049153327941895e-06, -3.2568350434303284e-06, -3.1087547540664673e-06, -2.960674464702606e-06, -2.812594175338745e-06, -2.664513885974884e-06, -2.516433596611023e-06, -2.368353307247162e-06, -2.2202730178833008e-06, -2.0721927285194397e-06, -1.9241124391555786e-06, -1.7760321497917175e-06, -1.6279518604278564e-06, -1.4798715710639954e-06, -1.3317912817001343e-06, -1.1837109923362732e-06, -1.0356307029724121e-06, -8.87550413608551e-07, -7.394701242446899e-07, -5.913898348808289e-07, -4.4330954551696777e-07, -2.952292561531067e-07, -1.471489667892456e-07, 9.313225746154785e-10, 1.4901161193847656e-07, 2.9709190130233765e-07, 4.4517219066619873e-07, 5.932524800300598e-07, 7.413327693939209e-07, 8.89413058757782e-07, 1.037493348121643e-06, 1.1855736374855042e-06, 1.3336539268493652e-06, 1.4817342162132263e-06, 1.6298145055770874e-06, 1.7778947949409485e-06, 1.9259750843048096e-06, 2.0740553736686707e-06, 2.2221356630325317e-06, 2.370215952396393e-06, 2.518296241760254e-06, 2.666376531124115e-06, 2.814456820487976e-06, 2.962537109851837e-06, 3.1106173992156982e-06, 3.2586976885795593e-06, 3.4067779779434204e-06, 3.5548582673072815e-06, 3.7029385566711426e-06, 3.851018846035004e-06, 3.999099135398865e-06, 4.147179424762726e-06, 4.295259714126587e-06, 4.443340003490448e-06, 4.591420292854309e-06, 4.73950058221817e-06, 4.887580871582031e-06]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 5.0, 11.0, 14.0, 22.0, 24.0, 27.0, 48.0, 64.0, 110.0, 198.0, 413.0, 826.0, 1816.0, 4033.0, 11502.0, 39832.0, 241357.0, 614146.0, 98740.0, 22681.0, 7253.0, 2738.0, 1335.0, 595.0, 280.0, 182.0, 100.0, 67.0, 36.0, 25.0, 17.0, 14.0, 15.0, 7.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.218650817871094e-05, -3.1366944313049316e-05, -3.0547380447387695e-05, -2.9727816581726074e-05, -2.8908252716064453e-05, -2.8088688850402832e-05, -2.726912498474121e-05, -2.644956111907959e-05, -2.562999725341797e-05, -2.4810433387756348e-05, -2.3990869522094727e-05, -2.3171305656433105e-05, -2.2351741790771484e-05, -2.1532177925109863e-05, -2.0712614059448242e-05, -1.989305019378662e-05, -1.9073486328125e-05, -1.825392246246338e-05, -1.7434358596801758e-05, -1.6614794731140137e-05, -1.5795230865478516e-05, -1.4975666999816895e-05, -1.4156103134155273e-05, -1.3336539268493652e-05, -1.2516975402832031e-05, -1.169741153717041e-05, -1.0877847671508789e-05, -1.0058283805847168e-05, -9.238719940185547e-06, -8.419156074523926e-06, -7.599592208862305e-06, -6.780028343200684e-06, -5.9604644775390625e-06, -5.140900611877441e-06, -4.32133674621582e-06, -3.5017728805541992e-06, -2.682209014892578e-06, -1.862645149230957e-06, -1.043081283569336e-06, -2.2351741790771484e-07, 5.960464477539062e-07, 1.4156103134155273e-06, 2.2351741790771484e-06, 3.0547380447387695e-06, 3.874301910400391e-06, 4.693865776062012e-06, 5.513429641723633e-06, 6.332993507385254e-06, 7.152557373046875e-06, 7.972121238708496e-06, 8.791685104370117e-06, 9.611248970031738e-06, 1.043081283569336e-05, 1.125037670135498e-05, 1.2069940567016602e-05, 1.2889504432678223e-05, 1.3709068298339844e-05, 1.4528632164001465e-05, 1.5348196029663086e-05, 1.6167759895324707e-05, 1.6987323760986328e-05, 1.780688762664795e-05, 1.862645149230957e-05, 1.944601535797119e-05, 2.0265579223632812e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 12.0, 6.0, 16.0, 9.0, 18.0, 25.0, 22.0, 49.0, 42.0, 70.0, 59.0, 56.0, 89.0, 60.0, 112.0, 49.0, 70.0, 45.0, 31.0, 36.0, 29.0, 21.0, 8.0, 14.0, 6.0, 6.0, 11.0, 7.0, 4.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.933906555175781e-06, -3.789551556110382e-06, -3.645196557044983e-06, -3.5008415579795837e-06, -3.3564865589141846e-06, -3.2121315598487854e-06, -3.0677765607833862e-06, -2.923421561717987e-06, -2.779066562652588e-06, -2.6347115635871887e-06, -2.4903565645217896e-06, -2.3460015654563904e-06, -2.201646566390991e-06, -2.057291567325592e-06, -1.912936568260193e-06, -1.7685815691947937e-06, -1.6242265701293945e-06, -1.4798715710639954e-06, -1.3355165719985962e-06, -1.191161572933197e-06, -1.0468065738677979e-06, -9.024515748023987e-07, -7.580965757369995e-07, -6.137415766716003e-07, -4.6938657760620117e-07, -3.25031578540802e-07, -1.8067657947540283e-07, -3.632158041000366e-08, 1.0803341865539551e-07, 2.523884177207947e-07, 3.9674341678619385e-07, 5.41098415851593e-07, 6.854534149169922e-07, 8.298084139823914e-07, 9.741634130477905e-07, 1.1185184121131897e-06, 1.2628734111785889e-06, 1.407228410243988e-06, 1.5515834093093872e-06, 1.6959384083747864e-06, 1.8402934074401855e-06, 1.9846484065055847e-06, 2.129003405570984e-06, 2.273358404636383e-06, 2.4177134037017822e-06, 2.5620684027671814e-06, 2.7064234018325806e-06, 2.8507784008979797e-06, 2.995133399963379e-06, 3.139488399028778e-06, 3.2838433980941772e-06, 3.4281983971595764e-06, 3.5725533962249756e-06, 3.7169083952903748e-06, 3.861263394355774e-06, 4.005618393421173e-06, 4.149973392486572e-06, 4.2943283915519714e-06, 4.438683390617371e-06, 4.58303838968277e-06, 4.727393388748169e-06, 4.871748387813568e-06, 5.016103386878967e-06, 5.1604583859443665e-06, 5.304813385009766e-06]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 13.0, 14.0, 21.0, 33.0, 60.0, 108.0, 220.0, 238.0, 120.0, 67.0, 39.0, 26.0, 16.0, 9.0, 11.0, 0.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0015372860943898559, -0.001489462680183351, -0.0014416391495615244, -0.0013938157353550196, -0.001345992204733193, -0.001298168790526688, -0.0012503452599048615, -0.0012025218456983566, -0.0011546984314918518, -0.001106875017285347, -0.0010590514866635203, -0.0010112280724570155, -0.0009634045418351889, -0.000915581127628684, -0.0008677576552145183, -0.0008199341828003526, -0.0007721106521785259, -0.0007242871797643602, -0.0006764637073501945, -0.0006286402931436896, -0.000580816762521863, -0.0005329933483153582, -0.0004851698759011924, -0.0004373464034870267, -0.00038952293107286096, -0.0003416994586586952, -0.0002938759862445295, -0.0002460525429341942, -0.00019822907052002847, -0.00015040559810586274, -0.00010258215479552746, -5.475868238136172e-05, -6.935209967195988e-06, 4.088825517101213e-05, 8.871172030922025e-05, 0.00013653517817147076, 0.0001843586505856365, 0.00023218212299980223, 0.0002800055663101375, 0.00032782903872430325, 0.000375652511138469, 0.0004234759835526347, 0.00047129945596680045, 0.0005191229283809662, 0.000566946342587471, 0.0006147698732092977, 0.0006625932874158025, 0.0007104167598299682, 0.000758240232244134, 0.0008060637046582997, 0.0008538871770724654, 0.0009017105912789702, 0.0009495341219007969, 0.0009973575361073017, 0.0010451809503138065, 0.0010930044809356332, 0.0011408280115574598, 0.0011886514257639647, 0.0012364749563857913, 0.0012842983705922961, 0.0013321219012141228, 0.0013799453154206276, 0.0014277687296271324, 0.001475592260248959, 0.0015234156744554639]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 10.0, 8.0, 6.0, 8.0, 13.0, 6.0, 12.0, 13.0, 15.0, 27.0, 21.0, 30.0, 27.0, 30.0, 40.0, 36.0, 39.0, 36.0, 34.0, 39.0, 45.0, 26.0, 45.0, 33.0, 45.0, 34.0, 49.0, 30.0, 39.0, 26.0, 23.0, 25.0, 17.0, 14.0, 8.0, 16.0, 18.0, 9.0, 13.0, 5.0, 9.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00048091515782289207, -0.0004660561098717153, -0.00045119706192053854, -0.0004363380139693618, -0.000421478966018185, -0.00040661991806700826, -0.00039176089921966195, -0.00037690182216465473, -0.0003620428033173084, -0.00034718375536613166, -0.0003323247074149549, -0.00031746565946377814, -0.0003026066115126014, -0.0002877475635614246, -0.00027288851561024785, -0.00025802949676290154, -0.00024317041970789433, -0.00022831137175671756, -0.0002134523238055408, -0.00019859327585436404, -0.00018373422790318727, -0.0001688751799520105, -0.00015401614655274898, -0.00013915709860157222, -0.00012429805065039545, -0.00010943900269921869, -9.457995474804193e-05, -7.972091407282278e-05, -6.486186612164602e-05, -5.0002818170469254e-05, -3.5143777495250106e-05, -2.0284729544073343e-05, -5.425652489066124e-06, 9.433393643121235e-06, 2.4292439775308594e-05, 3.915148408850655e-05, 5.401053203968331e-05, 6.886957999086007e-05, 8.372862066607922e-05, 9.858766861725599e-05, 0.00011344671656843275, 0.0001283057645196095, 0.00014316481247078627, 0.0001580238458700478, 0.00017288289382122457, 0.00018774194177240133, 0.0002026009897235781, 0.00021746003767475486, 0.00023231908562593162, 0.0002471781335771084, 0.00026203718152828515, 0.0002768962294794619, 0.00029175527743063867, 0.00030661432538181543, 0.00032147334422916174, 0.00033633242128416896, 0.00035119144013151526, 0.000366050488082692, 0.0003809095360338688, 0.00039576858398504555, 0.0004106276319362223, 0.0004254866798873991, 0.00044034572783857584, 0.00045520474668592215, 0.00047006382374092937]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 8.0, 11.0, 18.0, 14.0, 26.0, 37.0, 46.0, 61.0, 80.0, 114.0, 133.0, 179.0, 242.0, 357.0, 487.0, 766.0, 1179.0, 1849.0, 3429.0, 7165.0, 189481.0, 3935173.0, 39953.0, 5461.0, 2865.0, 1620.0, 1011.0, 684.0, 475.0, 347.0, 224.0, 182.0, 145.0, 98.0, 80.0, 73.0, 48.0, 28.0, 32.0, 21.0, 25.0, 9.0, 10.0, 11.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0014162063598632812, -0.0013679414987564087, -0.0013196766376495361, -0.0012714117765426636, -0.001223146915435791, -0.0011748820543289185, -0.001126617193222046, -0.0010783523321151733, -0.0010300874710083008, -0.0009818226099014282, -0.0009335577487945557, -0.0008852928876876831, -0.0008370280265808105, -0.000788763165473938, -0.0007404983043670654, -0.0006922334432601929, -0.0006439685821533203, -0.0005957037210464478, -0.0005474388599395752, -0.0004991739988327026, -0.0004509091377258301, -0.0004026442766189575, -0.00035437941551208496, -0.0003061145544052124, -0.00025784969329833984, -0.00020958483219146729, -0.00016131997108459473, -0.00011305510997772217, -6.479024887084961e-05, -1.652538776397705e-05, 3.173947334289551e-05, 8.000433444976807e-05, 0.00012826919555664062, 0.00017653405666351318, 0.00022479891777038574, 0.0002730637788772583, 0.00032132863998413086, 0.0003695935010910034, 0.000417858362197876, 0.00046612322330474854, 0.0005143880844116211, 0.0005626529455184937, 0.0006109178066253662, 0.0006591826677322388, 0.0007074475288391113, 0.0007557123899459839, 0.0008039772510528564, 0.000852242112159729, 0.0009005069732666016, 0.0009487718343734741, 0.0009970366954803467, 0.0010453015565872192, 0.0010935664176940918, 0.0011418312788009644, 0.001190096139907837, 0.0012383610010147095, 0.001286625862121582, 0.0013348907232284546, 0.0013831555843353271, 0.0014314204454421997, 0.0014796853065490723, 0.0015279501676559448, 0.0015762150287628174, 0.00162447988986969, 0.0016727447509765625]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 5.0, 6.0, 10.0, 15.0, 3.0, 12.0, 10.0, 11.0, 19.0, 8.0, 25.0, 30.0, 22.0, 21.0, 33.0, 45.0, 29.0, 34.0, 35.0, 28.0, 43.0, 30.0, 32.0, 37.0, 40.0, 29.0, 39.0, 33.0, 34.0, 31.0, 26.0, 28.0, 21.0, 21.0, 19.0, 22.0, 16.0, 11.0, 13.0, 7.0, 11.0, 14.0, 8.0, 7.0, 8.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.0003497600555419922, -0.00033831968903541565, -0.0003268793225288391, -0.0003154389560222626, -0.00030399858951568604, -0.0002925582230091095, -0.00028111785650253296, -0.0002696774899959564, -0.0002582371234893799, -0.00024679675698280334, -0.0002353563904762268, -0.00022391602396965027, -0.00021247565746307373, -0.0002010352909564972, -0.00018959492444992065, -0.00017815455794334412, -0.00016671419143676758, -0.00015527382493019104, -0.0001438334584236145, -0.00013239309191703796, -0.00012095272541046143, -0.00010951235890388489, -9.807199239730835e-05, -8.663162589073181e-05, -7.519125938415527e-05, -6.375089287757874e-05, -5.23105263710022e-05, -4.087015986442566e-05, -2.942979335784912e-05, -1.7989426851272583e-05, -6.549060344696045e-06, 4.891306161880493e-06, 1.633167266845703e-05, 2.777203917503357e-05, 3.921240568161011e-05, 5.0652772188186646e-05, 6.209313869476318e-05, 7.353350520133972e-05, 8.497387170791626e-05, 9.64142382144928e-05, 0.00010785460472106934, 0.00011929497122764587, 0.0001307353377342224, 0.00014217570424079895, 0.0001536160707473755, 0.00016505643725395203, 0.00017649680376052856, 0.0001879371702671051, 0.00019937753677368164, 0.00021081790328025818, 0.00022225826978683472, 0.00023369863629341125, 0.0002451390027999878, 0.00025657936930656433, 0.00026801973581314087, 0.0002794601023197174, 0.00029090046882629395, 0.0003023408353328705, 0.000313781201839447, 0.00032522156834602356, 0.0003366619348526001, 0.00034810230135917664, 0.0003595426678657532, 0.0003709830343723297, 0.00038242340087890625]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 6.0, 4.0, 11.0, 14.0, 37.0, 43.0, 103.0, 215.0, 502.0, 1284.0, 4273.0, 21307.0, 4053813.0, 100274.0, 8761.0, 2227.0, 767.0, 338.0, 132.0, 58.0, 36.0, 18.0, 11.0, 9.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031585693359375, -0.003044724464416504, -0.002930879592895508, -0.0028170347213745117, -0.0027031898498535156, -0.0025893449783325195, -0.0024755001068115234, -0.0023616552352905273, -0.0022478103637695312, -0.002133965492248535, -0.002020120620727539, -0.001906275749206543, -0.0017924308776855469, -0.0016785860061645508, -0.0015647411346435547, -0.0014508962631225586, -0.0013370513916015625, -0.0012232065200805664, -0.0011093616485595703, -0.0009955167770385742, -0.0008816719055175781, -0.000767827033996582, -0.0006539821624755859, -0.0005401372909545898, -0.00042629241943359375, -0.00031244754791259766, -0.00019860267639160156, -8.475780487060547e-05, 2.9087066650390625e-05, 0.00014293193817138672, 0.0002567768096923828, 0.0003706216812133789, 0.000484466552734375, 0.0005983114242553711, 0.0007121562957763672, 0.0008260011672973633, 0.0009398460388183594, 0.0010536909103393555, 0.0011675357818603516, 0.0012813806533813477, 0.0013952255249023438, 0.0015090703964233398, 0.001622915267944336, 0.001736760139465332, 0.0018506050109863281, 0.0019644498825073242, 0.0020782947540283203, 0.0021921396255493164, 0.0023059844970703125, 0.0024198293685913086, 0.0025336742401123047, 0.0026475191116333008, 0.002761363983154297, 0.002875208854675293, 0.002989053726196289, 0.003102898597717285, 0.0032167434692382812, 0.0033305883407592773, 0.0034444332122802734, 0.0035582780838012695, 0.0036721229553222656, 0.0037859678268432617, 0.003899812698364258, 0.004013657569885254, 0.00412750244140625]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 2.0, 5.0, 4.0, 8.0, 16.0, 39.0, 114.0, 309.0, 2083.0, 1058.0, 227.0, 73.0, 36.0, 13.0, 12.0, 12.0, 13.0, 5.0, 7.0, 8.0, 4.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003693103790283203, -0.00035809725522994995, -0.0003468841314315796, -0.00033567100763320923, -0.00032445788383483887, -0.0003132447600364685, -0.00030203163623809814, -0.0002908185124397278, -0.0002796053886413574, -0.00026839226484298706, -0.0002571791410446167, -0.00024596601724624634, -0.00023475289344787598, -0.00022353976964950562, -0.00021232664585113525, -0.0002011135220527649, -0.00018990039825439453, -0.00017868727445602417, -0.0001674741506576538, -0.00015626102685928345, -0.00014504790306091309, -0.00013383477926254272, -0.00012262165546417236, -0.000111408531665802, -0.00010019540786743164, -8.898228406906128e-05, -7.776916027069092e-05, -6.655603647232056e-05, -5.5342912673950195e-05, -4.4129788875579834e-05, -3.291666507720947e-05, -2.170354127883911e-05, -1.049041748046875e-05, 7.227063179016113e-07, 1.1935830116271973e-05, 2.3148953914642334e-05, 3.4362077713012695e-05, 4.557520151138306e-05, 5.678832530975342e-05, 6.800144910812378e-05, 7.921457290649414e-05, 9.04276967048645e-05, 0.00010164082050323486, 0.00011285394430160522, 0.00012406706809997559, 0.00013528019189834595, 0.0001464933156967163, 0.00015770643949508667, 0.00016891956329345703, 0.0001801326870918274, 0.00019134581089019775, 0.00020255893468856812, 0.00021377205848693848, 0.00022498518228530884, 0.0002361983060836792, 0.00024741142988204956, 0.0002586245536804199, 0.0002698376774787903, 0.00028105080127716064, 0.000292263925075531, 0.00030347704887390137, 0.00031469017267227173, 0.0003259032964706421, 0.00033711642026901245, 0.0003483295440673828]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 17.0, 19.0, 40.0, 82.0, 134.0, 292.0, 183.0, 86.0, 68.0, 25.0, 20.0, 8.0, 7.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014710359973832965, -0.0014286439400166273, -0.0013862518826499581, -0.001343859825283289, -0.0013014677679166198, -0.0012590757105499506, -0.0012166835367679596, -0.0011742915958166122, -0.0011318994220346212, -0.001089507364667952, -0.0010471153073012829, -0.0010047232499346137, -0.0009623311925679445, -0.0009199391352012753, -0.0008775470196269453, -0.0008351549622602761, -0.0007927629631012678, -0.0007503709057345986, -0.0007079788483679295, -0.0006655867910012603, -0.0006231947336345911, -0.0005808026762679219, -0.0005384105606935918, -0.0004960185033269227, -0.0004536264459602535, -0.0004112343885935843, -0.0003688423312269151, -0.0003264502447564155, -0.0002840581873897463, -0.00024166613002307713, -0.0001992740435525775, -0.00015688198618590832, -0.00011449004523456097, -7.209798059193417e-05, -2.9705915949307382e-05, 1.2686155969277024e-05, 5.50782133359462e-05, 9.747027070261538e-05, 0.00013986235717311502, 0.0001822544145397842, 0.00022464647190645337, 0.00026703852927312255, 0.0003094305866397917, 0.00035182267311029136, 0.00039421473047696054, 0.0004366067878436297, 0.00047899887431412935, 0.0005213909316807985, 0.0005637829890474677, 0.0006061750464141369, 0.0006485671037808061, 0.0006909591611474752, 0.0007333512185141444, 0.0007757432758808136, 0.0008181353914551437, 0.0008605274488218129, 0.000902919506188482, 0.0009453115635551512, 0.0009877036791294813, 0.0010300957364961505, 0.0010724877938628197, 0.0011148798512294888, 0.001157271908596158, 0.0011996639659628272, 0.0012420560233294964]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 7.0, 1.0, 4.0, 5.0, 5.0, 8.0, 11.0, 13.0, 8.0, 16.0, 23.0, 15.0, 24.0, 25.0, 28.0, 31.0, 30.0, 42.0, 31.0, 29.0, 31.0, 38.0, 50.0, 45.0, 37.0, 40.0, 39.0, 48.0, 48.0, 21.0, 28.0, 21.0, 24.0, 29.0, 21.0, 15.0, 24.0, 20.0, 16.0, 16.0, 11.0, 5.0, 5.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00038281764136627316, -0.00037043250631541014, -0.0003580473712645471, -0.0003456622362136841, -0.00033327710116282105, -0.000320891966111958, -0.000308506831061095, -0.00029612169601023197, -0.00028373656095936894, -0.0002713514259085059, -0.0002589662908576429, -0.00024658115580677986, -0.00023419602075591683, -0.0002218108857050538, -0.00020942575065419078, -0.00019704061560332775, -0.00018465549510437995, -0.00017227036005351692, -0.0001598852250026539, -0.00014750008995179087, -0.00013511495490092784, -0.00012272983440198004, -0.0001103446920751594, -9.795955702429637e-05, -8.557442197343335e-05, -7.318928692257032e-05, -6.080415187170729e-05, -4.841902045882307e-05, -3.603388540796004e-05, -2.3648753995075822e-05, -1.1263618944212794e-05, 1.1215161066502333e-06, 1.350665115751326e-05, 2.589178620837629e-05, 3.8276921259239316e-05, 5.0662052672123536e-05, 6.304719136096537e-05, 7.543231913587078e-05, 8.781745418673381e-05, 0.00010020258923759684, 0.00011258772428845987, 0.00012497285206336528, 0.0001373579871142283, 0.00014974312216509134, 0.00016212825721595436, 0.0001745133922668174, 0.00018689852731768042, 0.00019928366236854345, 0.00021166879741940647, 0.0002240539324702695, 0.00023643906752113253, 0.00024882418802008033, 0.00026120932307094336, 0.0002735944581218064, 0.0002859795931726694, 0.00029836472822353244, 0.00031074986327439547, 0.0003231349983252585, 0.0003355201333761215, 0.00034790526842698455, 0.0003602904034778476, 0.0003726755385287106, 0.00038506067357957363, 0.00039744580863043666, 0.0004098309436812997]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 5.0, 12.0, 16.0, 16.0, 30.0, 45.0, 56.0, 85.0, 100.0, 151.0, 230.0, 347.0, 490.0, 782.0, 1161.0, 2107.0, 3574.0, 6655.0, 12466.0, 25613.0, 55219.0, 127714.0, 304656.0, 284542.0, 119802.0, 51831.0, 24135.0, 11776.0, 6279.0, 3310.0, 1949.0, 1136.0, 673.0, 481.0, 351.0, 206.0, 155.0, 127.0, 79.0, 60.0, 33.0, 28.0, 25.0, 16.0, 8.0, 6.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.00040268898010253906, -0.000390470027923584, -0.0003782510757446289, -0.00036603212356567383, -0.00035381317138671875, -0.00034159421920776367, -0.0003293752670288086, -0.0003171563148498535, -0.00030493736267089844, -0.00029271841049194336, -0.0002804994583129883, -0.0002682805061340332, -0.0002560615539550781, -0.00024384260177612305, -0.00023162364959716797, -0.0002194046974182129, -0.0002071857452392578, -0.00019496679306030273, -0.00018274784088134766, -0.00017052888870239258, -0.0001583099365234375, -0.00014609098434448242, -0.00013387203216552734, -0.00012165307998657227, -0.00010943412780761719, -9.721517562866211e-05, -8.499622344970703e-05, -7.277727127075195e-05, -6.0558319091796875e-05, -4.83393669128418e-05, -3.612041473388672e-05, -2.390146255493164e-05, -1.1682510375976562e-05, 5.364418029785156e-07, 1.2755393981933594e-05, 2.4974346160888672e-05, 3.719329833984375e-05, 4.941225051879883e-05, 6.16312026977539e-05, 7.385015487670898e-05, 8.606910705566406e-05, 9.828805923461914e-05, 0.00011050701141357422, 0.0001227259635925293, 0.00013494491577148438, 0.00014716386795043945, 0.00015938282012939453, 0.0001716017723083496, 0.0001838207244873047, 0.00019603967666625977, 0.00020825862884521484, 0.00022047758102416992, 0.000232696533203125, 0.0002449154853820801, 0.00025713443756103516, 0.00026935338973999023, 0.0002815723419189453, 0.0002937912940979004, 0.00030601024627685547, 0.00031822919845581055, 0.0003304481506347656, 0.0003426671028137207, 0.0003548860549926758, 0.00036710500717163086, 0.00037932395935058594]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 9.0, 7.0, 11.0, 15.0, 17.0, 17.0, 13.0, 21.0, 25.0, 23.0, 33.0, 33.0, 35.0, 35.0, 36.0, 36.0, 44.0, 44.0, 45.0, 41.0, 42.0, 42.0, 56.0, 37.0, 31.0, 30.0, 22.0, 35.0, 23.0, 24.0, 24.0, 14.0, 12.0, 17.0, 16.0, 3.0, 9.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004317760467529297, -0.00041820108890533447, -0.00040462613105773926, -0.00039105117321014404, -0.00037747621536254883, -0.0003639012575149536, -0.0003503262996673584, -0.0003367513418197632, -0.00032317638397216797, -0.00030960142612457275, -0.00029602646827697754, -0.0002824515104293823, -0.0002688765525817871, -0.0002553015947341919, -0.00024172663688659668, -0.00022815167903900146, -0.00021457672119140625, -0.00020100176334381104, -0.00018742680549621582, -0.0001738518476486206, -0.0001602768898010254, -0.00014670193195343018, -0.00013312697410583496, -0.00011955201625823975, -0.00010597705841064453, -9.240210056304932e-05, -7.88271427154541e-05, -6.525218486785889e-05, -5.167722702026367e-05, -3.810226917266846e-05, -2.4527311325073242e-05, -1.0952353477478027e-05, 2.6226043701171875e-06, 1.6197562217712402e-05, 2.9772520065307617e-05, 4.334747791290283e-05, 5.692243576049805e-05, 7.049739360809326e-05, 8.407235145568848e-05, 9.764730930328369e-05, 0.0001112222671508789, 0.00012479722499847412, 0.00013837218284606934, 0.00015194714069366455, 0.00016552209854125977, 0.00017909705638885498, 0.0001926720142364502, 0.0002062469720840454, 0.00021982192993164062, 0.00023339688777923584, 0.00024697184562683105, 0.00026054680347442627, 0.0002741217613220215, 0.0002876967191696167, 0.0003012716770172119, 0.00031484663486480713, 0.00032842159271240234, 0.00034199655055999756, 0.0003555715084075928, 0.000369146466255188, 0.0003827214241027832, 0.0003962963819503784, 0.00040987133979797363, 0.00042344629764556885, 0.00043702125549316406]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 8.0, 6.0, 9.0, 5.0, 11.0, 11.0, 19.0, 39.0, 55.0, 41.0, 77.0, 109.0, 148.0, 208.0, 343.0, 538.0, 843.0, 1471.0, 2537.0, 5015.0, 10342.0, 23892.0, 67202.0, 299847.0, 486855.0, 92535.0, 30457.0, 12499.0, 5959.0, 3005.0, 1668.0, 993.0, 619.0, 376.0, 230.0, 187.0, 106.0, 72.0, 62.0, 48.0, 33.0, 25.0, 16.0, 10.0, 7.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0005354881286621094, -0.0005188211798667908, -0.0005021542310714722, -0.00048548728227615356, -0.00046882033348083496, -0.00045215338468551636, -0.00043548643589019775, -0.00041881948709487915, -0.00040215253829956055, -0.00038548558950424194, -0.00036881864070892334, -0.00035215169191360474, -0.00033548474311828613, -0.00031881779432296753, -0.0003021508455276489, -0.0002854838967323303, -0.0002688169479370117, -0.0002521499991416931, -0.0002354830503463745, -0.0002188161015510559, -0.0002021491527557373, -0.0001854822039604187, -0.0001688152551651001, -0.0001521483063697815, -0.0001354813575744629, -0.00011881440877914429, -0.00010214745998382568, -8.548051118850708e-05, -6.881356239318848e-05, -5.214661359786987e-05, -3.547966480255127e-05, -1.8812716007232666e-05, -2.1457672119140625e-06, 1.4521181583404541e-05, 3.1188130378723145e-05, 4.785507917404175e-05, 6.452202796936035e-05, 8.118897676467896e-05, 9.785592555999756e-05, 0.00011452287435531616, 0.00013118982315063477, 0.00014785677194595337, 0.00016452372074127197, 0.00018119066953659058, 0.00019785761833190918, 0.00021452456712722778, 0.0002311915159225464, 0.000247858464717865, 0.0002645254135131836, 0.0002811923623085022, 0.0002978593111038208, 0.0003145262598991394, 0.000331193208694458, 0.0003478601574897766, 0.0003645271062850952, 0.0003811940550804138, 0.0003978610038757324, 0.000414527952671051, 0.00043119490146636963, 0.00044786185026168823, 0.00046452879905700684, 0.00048119574785232544, 0.000497862696647644, 0.0005145296454429626, 0.0005311965942382812]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 8.0, 7.0, 12.0, 15.0, 12.0, 12.0, 19.0, 22.0, 29.0, 38.0, 40.0, 52.0, 45.0, 56.0, 53.0, 49.0, 47.0, 42.0, 45.0, 39.0, 48.0, 52.0, 38.0, 36.0, 37.0, 29.0, 25.0, 17.0, 17.0, 10.0, 15.0, 5.0, 9.0, 6.0, 4.0, 3.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003247261047363281, -0.0003144890069961548, -0.00030425190925598145, -0.0002940148115158081, -0.00028377771377563477, -0.0002735406160354614, -0.0002633035182952881, -0.00025306642055511475, -0.0002428293228149414, -0.00023259222507476807, -0.00022235512733459473, -0.0002121180295944214, -0.00020188093185424805, -0.0001916438341140747, -0.00018140673637390137, -0.00017116963863372803, -0.0001609325408935547, -0.00015069544315338135, -0.000140458345413208, -0.00013022124767303467, -0.00011998414993286133, -0.00010974705219268799, -9.950995445251465e-05, -8.927285671234131e-05, -7.903575897216797e-05, -6.879866123199463e-05, -5.856156349182129e-05, -4.832446575164795e-05, -3.808736801147461e-05, -2.785027027130127e-05, -1.761317253112793e-05, -7.37607479095459e-06, 2.86102294921875e-06, 1.309812068939209e-05, 2.333521842956543e-05, 3.357231616973877e-05, 4.380941390991211e-05, 5.404651165008545e-05, 6.428360939025879e-05, 7.452070713043213e-05, 8.475780487060547e-05, 9.499490261077881e-05, 0.00010523200035095215, 0.00011546909809112549, 0.00012570619583129883, 0.00013594329357147217, 0.0001461803913116455, 0.00015641748905181885, 0.0001666545867919922, 0.00017689168453216553, 0.00018712878227233887, 0.0001973658800125122, 0.00020760297775268555, 0.0002178400754928589, 0.00022807717323303223, 0.00023831427097320557, 0.0002485513687133789, 0.00025878846645355225, 0.0002690255641937256, 0.0002792626619338989, 0.00028949975967407227, 0.0002997368574142456, 0.00030997395515441895, 0.0003202110528945923, 0.0003304481506347656]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 4.0, 2.0, 2.0, 15.0, 6.0, 14.0, 26.0, 29.0, 29.0, 49.0, 57.0, 92.0, 119.0, 167.0, 252.0, 363.0, 524.0, 875.0, 1569.0, 2883.0, 7207.0, 26419.0, 454390.0, 512528.0, 26513.0, 7241.0, 3002.0, 1493.0, 909.0, 548.0, 366.0, 257.0, 157.0, 128.0, 84.0, 68.0, 41.0, 42.0, 20.0, 13.0, 14.0, 12.0, 9.0, 8.0, 4.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016558170318603516, -0.00016006268560886383, -0.0001545436680316925, -0.00014902465045452118, -0.00014350563287734985, -0.00013798661530017853, -0.0001324675977230072, -0.00012694858014583588, -0.00012142956256866455, -0.00011591054499149323, -0.0001103915274143219, -0.00010487250983715057, -9.935349225997925e-05, -9.383447468280792e-05, -8.83154571056366e-05, -8.279643952846527e-05, -7.727742195129395e-05, -7.175840437412262e-05, -6.62393867969513e-05, -6.072036921977997e-05, -5.520135164260864e-05, -4.968233406543732e-05, -4.416331648826599e-05, -3.8644298911094666e-05, -3.312528133392334e-05, -2.7606263756752014e-05, -2.208724617958069e-05, -1.6568228602409363e-05, -1.1049211025238037e-05, -5.5301934480667114e-06, -1.1175870895385742e-08, 5.50784170627594e-06, 1.1026859283447266e-05, 1.654587686061859e-05, 2.2064894437789917e-05, 2.7583912014961243e-05, 3.310292959213257e-05, 3.8621947169303894e-05, 4.414096474647522e-05, 4.9659982323646545e-05, 5.517899990081787e-05, 6.06980174779892e-05, 6.621703505516052e-05, 7.173605263233185e-05, 7.725507020950317e-05, 8.27740877866745e-05, 8.829310536384583e-05, 9.381212294101715e-05, 9.933114051818848e-05, 0.0001048501580953598, 0.00011036917567253113, 0.00011588819324970245, 0.00012140721082687378, 0.0001269262284040451, 0.00013244524598121643, 0.00013796426355838776, 0.00014348328113555908, 0.0001490022987127304, 0.00015452131628990173, 0.00016004033386707306, 0.00016555935144424438, 0.0001710783690214157, 0.00017659738659858704, 0.00018211640417575836, 0.0001876354217529297]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 12.0, 6.0, 3.0, 5.0, 15.0, 12.0, 13.0, 18.0, 18.0, 24.0, 39.0, 46.0, 55.0, 66.0, 64.0, 95.0, 61.0, 70.0, 68.0, 46.0, 49.0, 23.0, 41.0, 22.0, 13.0, 29.0, 8.0, 14.0, 12.0, 8.0, 6.0, 5.0, 9.0, 4.0, 2.0, 1.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.854534149169922e-06, -6.579793989658356e-06, -6.3050538301467896e-06, -6.030313670635223e-06, -5.755573511123657e-06, -5.480833351612091e-06, -5.206093192100525e-06, -4.931353032588959e-06, -4.656612873077393e-06, -4.381872713565826e-06, -4.10713255405426e-06, -3.832392394542694e-06, -3.557652235031128e-06, -3.2829120755195618e-06, -3.0081719160079956e-06, -2.7334317564964294e-06, -2.4586915969848633e-06, -2.183951437473297e-06, -1.909211277961731e-06, -1.6344711184501648e-06, -1.3597309589385986e-06, -1.0849907994270325e-06, -8.102506399154663e-07, -5.355104804039001e-07, -2.60770320892334e-07, 1.3969838619232178e-08, 2.8870999813079834e-07, 5.634501576423645e-07, 8.381903171539307e-07, 1.1129304766654968e-06, 1.387670636177063e-06, 1.6624107956886292e-06, 1.9371509552001953e-06, 2.2118911147117615e-06, 2.4866312742233276e-06, 2.761371433734894e-06, 3.03611159324646e-06, 3.310851752758026e-06, 3.5855919122695923e-06, 3.8603320717811584e-06, 4.135072231292725e-06, 4.409812390804291e-06, 4.684552550315857e-06, 4.959292709827423e-06, 5.234032869338989e-06, 5.508773028850555e-06, 5.783513188362122e-06, 6.058253347873688e-06, 6.332993507385254e-06, 6.60773366689682e-06, 6.882473826408386e-06, 7.157213985919952e-06, 7.4319541454315186e-06, 7.706694304943085e-06, 7.981434464454651e-06, 8.256174623966217e-06, 8.530914783477783e-06, 8.80565494298935e-06, 9.080395102500916e-06, 9.355135262012482e-06, 9.629875421524048e-06, 9.904615581035614e-06, 1.017935574054718e-05, 1.0454095900058746e-05, 1.0728836059570312e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 12.0, 18.0, 27.0, 39.0, 77.0, 145.0, 409.0, 1507.0, 7197.0, 149587.0, 873527.0, 12704.0, 2292.0, 613.0, 181.0, 70.0, 47.0, 35.0, 18.0, 17.0, 4.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006189346313476562, -0.000603891909122467, -0.0005888491868972778, -0.0005738064646720886, -0.0005587637424468994, -0.0005437210202217102, -0.000528678297996521, -0.0005136355757713318, -0.0004985928535461426, -0.00048355013132095337, -0.00046850740909576416, -0.00045346468687057495, -0.00043842196464538574, -0.00042337924242019653, -0.0004083365201950073, -0.0003932937979698181, -0.0003782510757446289, -0.0003632083535194397, -0.0003481656312942505, -0.0003331229090690613, -0.00031808018684387207, -0.00030303746461868286, -0.00028799474239349365, -0.00027295202016830444, -0.00025790929794311523, -0.00024286657571792603, -0.00022782385349273682, -0.0002127811312675476, -0.0001977384090423584, -0.0001826956868171692, -0.00016765296459197998, -0.00015261024236679077, -0.00013756752014160156, -0.00012252479791641235, -0.00010748207569122314, -9.243935346603394e-05, -7.739663124084473e-05, -6.235390901565552e-05, -4.731118679046631e-05, -3.22684645652771e-05, -1.722574234008789e-05, -2.1830201148986816e-06, 1.2859702110290527e-05, 2.7902424335479736e-05, 4.2945146560668945e-05, 5.7987868785858154e-05, 7.303059101104736e-05, 8.807331323623657e-05, 0.00010311603546142578, 0.00011815875768661499, 0.0001332014799118042, 0.0001482442021369934, 0.00016328692436218262, 0.00017832964658737183, 0.00019337236881256104, 0.00020841509103775024, 0.00022345781326293945, 0.00023850053548812866, 0.00025354325771331787, 0.0002685859799385071, 0.0002836287021636963, 0.0002986714243888855, 0.0003137141466140747, 0.0003287568688392639, 0.0003437995910644531]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 9.0, 15.0, 22.0, 37.0, 63.0, 117.0, 242.0, 224.0, 111.0, 48.0, 29.0, 18.0, 14.0, 13.0, 3.0, 3.0, 8.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7120113372802734e-05, -2.575572580099106e-05, -2.4391338229179382e-05, -2.3026950657367706e-05, -2.166256308555603e-05, -2.0298175513744354e-05, -1.8933787941932678e-05, -1.7569400370121002e-05, -1.6205012798309326e-05, -1.484062522649765e-05, -1.3476237654685974e-05, -1.2111850082874298e-05, -1.0747462511062622e-05, -9.383074939250946e-06, -8.01868736743927e-06, -6.654299795627594e-06, -5.289912223815918e-06, -3.925524652004242e-06, -2.561137080192566e-06, -1.1967495083808899e-06, 1.6763806343078613e-07, 1.5320256352424622e-06, 2.896413207054138e-06, 4.260800778865814e-06, 5.62518835067749e-06, 6.989575922489166e-06, 8.353963494300842e-06, 9.718351066112518e-06, 1.1082738637924194e-05, 1.244712620973587e-05, 1.3811513781547546e-05, 1.5175901353359222e-05, 1.65402889251709e-05, 1.7904676496982574e-05, 1.926906406879425e-05, 2.0633451640605927e-05, 2.1997839212417603e-05, 2.336222678422928e-05, 2.4726614356040955e-05, 2.609100192785263e-05, 2.7455389499664307e-05, 2.8819777071475983e-05, 3.018416464328766e-05, 3.1548552215099335e-05, 3.291293978691101e-05, 3.427732735872269e-05, 3.564171493053436e-05, 3.700610250234604e-05, 3.8370490074157715e-05, 3.973487764596939e-05, 4.109926521778107e-05, 4.246365278959274e-05, 4.382804036140442e-05, 4.5192427933216095e-05, 4.655681550502777e-05, 4.792120307683945e-05, 4.928559064865112e-05, 5.06499782204628e-05, 5.2014365792274475e-05, 5.337875336408615e-05, 5.474314093589783e-05, 5.61075285077095e-05, 5.747191607952118e-05, 5.8836303651332855e-05, 6.020069122314453e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 11.0, 18.0, 26.0, 36.0, 70.0, 121.0, 246.0, 197.0, 99.0, 59.0, 51.0, 16.0, 18.0, 9.0, 1.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0015250238357111812, -0.0014877825742587447, -0.0014505411963909864, -0.00141329993493855, -0.0013760585570707917, -0.0013388172956183553, -0.001301575917750597, -0.0012643346562981606, -0.001227093394845724, -0.0011898521333932877, -0.0011526107555255294, -0.001115369494073093, -0.0010781281162053347, -0.0010408868547528982, -0.00100364547688514, -0.0009664042154327035, -0.0009291628375649452, -0.0008919215179048479, -0.0008546801982447505, -0.0008174388785846531, -0.0007801975589245558, -0.0007429562974721193, -0.000705714977812022, -0.0006684736581519246, -0.0006312323384918272, -0.0005939910188317299, -0.0005567496991716325, -0.0005195083795115352, -0.00048226708895526826, -0.0004450257692951709, -0.000407784478738904, -0.00037054315907880664, -0.00033330178121104836, -0.000296060461550951, -0.00025881914189085364, -0.00022157785133458674, -0.00018433653167448938, -0.00014709521201439202, -0.00010985390690620989, -7.261260179802775e-05, -3.537128213793039e-05, 1.8700302462093532e-06, 3.91113426303491e-05, 7.635265501448885e-05, 0.00011359396739862859, 0.00015083528705872595, 0.00018807659216690809, 0.00022531789727509022, 0.0002625592169351876, 0.00029980053659528494, 0.0003370418562553823, 0.0003742831468116492, 0.00041152446647174656, 0.0004487657861318439, 0.00048600707668811083, 0.0005232483963482082, 0.0005604897160083055, 0.0005977310356684029, 0.0006349723553285003, 0.0006722136749885976, 0.000709454994648695, 0.0007466962561011314, 0.0007839375757612288, 0.0008211788954213262, 0.0008584202150814235]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 5.0, 1.0, 3.0, 6.0, 5.0, 5.0, 14.0, 15.0, 8.0, 17.0, 19.0, 17.0, 17.0, 31.0, 29.0, 33.0, 27.0, 36.0, 32.0, 35.0, 31.0, 45.0, 36.0, 48.0, 45.0, 32.0, 41.0, 52.0, 39.0, 33.0, 21.0, 26.0, 20.0, 27.0, 24.0, 20.0, 19.0, 18.0, 20.0, 18.0, 7.0, 3.0, 8.0, 6.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00037157119368202984, -0.00035944435512647033, -0.00034731748746708035, -0.00033519064891152084, -0.0003230638103559613, -0.0003109369718004018, -0.00029881010414101183, -0.0002866832655854523, -0.0002745564270298928, -0.0002624295884743333, -0.0002503027208149433, -0.0002381758822593838, -0.00022604904370382428, -0.00021392219059634954, -0.0002017953374888748, -0.00018966849893331528, -0.00017754164582584053, -0.0001654147927183658, -0.00015328795416280627, -0.00014116110105533153, -0.000129034262499772, -0.00011690740939229727, -0.00010478056356078014, -9.265371772926301e-05, -8.052687189774588e-05, -6.840002606622875e-05, -5.627318023471162e-05, -4.414633076521568e-05, -3.201948493369855e-05, -1.989263910218142e-05, -7.765789632685483e-06, 4.361056198831648e-06, 1.6487902030348778e-05, 2.8614747861865908e-05, 4.074159369338304e-05, 5.2868443162878975e-05, 6.49952853564173e-05, 7.712213846389204e-05, 8.924898429540917e-05, 0.0001013758301269263, 0.00011350267595844343, 0.00012562952178996056, 0.0001377563748974353, 0.00014988321345299482, 0.00016201006656046957, 0.00017413690511602908, 0.00018626375822350383, 0.00019839059677906334, 0.0002105174498865381, 0.00022264430299401283, 0.00023477114154957235, 0.00024689798010513186, 0.00025902484776452184, 0.00027115168632008135, 0.00028327852487564087, 0.00029540539253503084, 0.00030753223109059036, 0.0003196590696461499, 0.00033178593730553985, 0.00034391277586109936, 0.0003560396144166589, 0.0003681664529722184, 0.00038029332063160837, 0.0003924201591871679, 0.0004045469977427274]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 9.0, 11.0, 17.0, 22.0, 27.0, 45.0, 52.0, 84.0, 120.0, 181.0, 263.0, 400.0, 583.0, 970.0, 1390.0, 2189.0, 3462.0, 5280.0, 8450.0, 13606.0, 21702.0, 36073.0, 63471.0, 123612.0, 253653.0, 242734.0, 117797.0, 60859.0, 35015.0, 21109.0, 12896.0, 8096.0, 5220.0, 3159.0, 2115.0, 1352.0, 863.0, 544.0, 388.0, 218.0, 180.0, 116.0, 81.0, 48.0, 27.0, 16.0, 16.0, 14.0, 12.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.000881195068359375, -0.0008544623851776123, -0.0008277297019958496, -0.0008009970188140869, -0.0007742643356323242, -0.0007475316524505615, -0.0007207989692687988, -0.0006940662860870361, -0.0006673336029052734, -0.0006406009197235107, -0.000613868236541748, -0.0005871355533599854, -0.0005604028701782227, -0.00053367018699646, -0.0005069375038146973, -0.00048020482063293457, -0.0004534721374511719, -0.0004267394542694092, -0.0004000067710876465, -0.0003732740879058838, -0.0003465414047241211, -0.0003198087215423584, -0.0002930760383605957, -0.000266343355178833, -0.0002396106719970703, -0.00021287798881530762, -0.00018614530563354492, -0.00015941262245178223, -0.00013267993927001953, -0.00010594725608825684, -7.921457290649414e-05, -5.2481889724731445e-05, -2.574920654296875e-05, 9.834766387939453e-07, 2.771615982055664e-05, 5.4448843002319336e-05, 8.118152618408203e-05, 0.00010791420936584473, 0.00013464689254760742, 0.00016137957572937012, 0.0001881122589111328, 0.0002148449420928955, 0.0002415776252746582, 0.0002683103084564209, 0.0002950429916381836, 0.0003217756748199463, 0.000348508358001709, 0.0003752410411834717, 0.0004019737243652344, 0.00042870640754699707, 0.00045543909072875977, 0.00048217177391052246, 0.0005089044570922852, 0.0005356371402740479, 0.0005623698234558105, 0.0005891025066375732, 0.0006158351898193359, 0.0006425678730010986, 0.0006693005561828613, 0.000696033239364624, 0.0007227659225463867, 0.0007494986057281494, 0.0007762312889099121, 0.0008029639720916748, 0.0008296966552734375]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 10.0, 12.0, 12.0, 9.0, 12.0, 15.0, 21.0, 18.0, 24.0, 26.0, 43.0, 37.0, 31.0, 38.0, 42.0, 33.0, 48.0, 41.0, 49.0, 51.0, 50.0, 41.0, 54.0, 33.0, 21.0, 33.0, 26.0, 32.0, 25.0, 21.0, 19.0, 16.0, 15.0, 15.0, 8.0, 6.0, 6.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002963542938232422, -0.0002862699329853058, -0.0002761855721473694, -0.000266101211309433, -0.0002560168504714966, -0.0002459324896335602, -0.00023584812879562378, -0.00022576376795768738, -0.00021567940711975098, -0.00020559504628181458, -0.00019551068544387817, -0.00018542632460594177, -0.00017534196376800537, -0.00016525760293006897, -0.00015517324209213257, -0.00014508888125419617, -0.00013500452041625977, -0.00012492015957832336, -0.00011483579874038696, -0.00010475143790245056, -9.466707706451416e-05, -8.458271622657776e-05, -7.449835538864136e-05, -6.441399455070496e-05, -5.4329633712768555e-05, -4.424527287483215e-05, -3.416091203689575e-05, -2.407655119895935e-05, -1.399219036102295e-05, -3.907829523086548e-06, 6.1765313148498535e-06, 1.6260892152786255e-05, 2.6345252990722656e-05, 3.642961382865906e-05, 4.651397466659546e-05, 5.659833550453186e-05, 6.668269634246826e-05, 7.676705718040466e-05, 8.685141801834106e-05, 9.693577885627747e-05, 0.00010702013969421387, 0.00011710450053215027, 0.00012718886137008667, 0.00013727322220802307, 0.00014735758304595947, 0.00015744194388389587, 0.00016752630472183228, 0.00017761066555976868, 0.00018769502639770508, 0.00019777938723564148, 0.00020786374807357788, 0.00021794810891151428, 0.00022803246974945068, 0.00023811683058738708, 0.0002482011914253235, 0.0002582855522632599, 0.0002683699131011963, 0.0002784542739391327, 0.0002885386347770691, 0.0002986229956150055, 0.0003087073564529419, 0.0003187917172908783, 0.0003288760781288147, 0.0003389604389667511, 0.0003490447998046875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 13.0, 13.0, 7.0, 10.0, 15.0, 22.0, 37.0, 52.0, 69.0, 93.0, 132.0, 220.0, 369.0, 609.0, 1238.0, 2247.0, 4461.0, 9178.0, 19502.0, 44746.0, 116074.0, 370805.0, 309920.0, 96848.0, 38393.0, 17009.0, 7946.0, 3824.0, 1992.0, 1111.0, 600.0, 325.0, 218.0, 157.0, 89.0, 42.0, 37.0, 40.0, 21.0, 20.0, 15.0, 12.0, 4.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.001323699951171875, -0.0012834817171096802, -0.0012432634830474854, -0.0012030452489852905, -0.0011628270149230957, -0.0011226087808609009, -0.001082390546798706, -0.0010421723127365112, -0.0010019540786743164, -0.0009617358446121216, -0.0009215176105499268, -0.0008812993764877319, -0.0008410811424255371, -0.0008008629083633423, -0.0007606446743011475, -0.0007204264402389526, -0.0006802082061767578, -0.000639989972114563, -0.0005997717380523682, -0.0005595535039901733, -0.0005193352699279785, -0.0004791170358657837, -0.00043889880180358887, -0.00039868056774139404, -0.0003584623336791992, -0.0003182440996170044, -0.00027802586555480957, -0.00023780763149261475, -0.00019758939743041992, -0.0001573711633682251, -0.00011715292930603027, -7.693469524383545e-05, -3.6716461181640625e-05, 3.5017728805541992e-06, 4.3720006942749023e-05, 8.393824100494385e-05, 0.00012415647506713867, 0.0001643747091293335, 0.00020459294319152832, 0.00024481117725372314, 0.00028502941131591797, 0.0003252476453781128, 0.0003654658794403076, 0.00040568411350250244, 0.00044590234756469727, 0.0004861205816268921, 0.0005263388156890869, 0.0005665570497512817, 0.0006067752838134766, 0.0006469935178756714, 0.0006872117519378662, 0.000727429986000061, 0.0007676482200622559, 0.0008078664541244507, 0.0008480846881866455, 0.0008883029222488403, 0.0009285211563110352, 0.00096873939037323, 0.0010089576244354248, 0.0010491758584976196, 0.0010893940925598145, 0.0011296123266220093, 0.001169830560684204, 0.001210048794746399, 0.0012502670288085938]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 4.0, 2.0, 6.0, 11.0, 6.0, 5.0, 16.0, 15.0, 23.0, 14.0, 24.0, 20.0, 31.0, 23.0, 32.0, 29.0, 32.0, 27.0, 49.0, 41.0, 51.0, 37.0, 35.0, 49.0, 49.0, 37.0, 47.0, 23.0, 26.0, 37.0, 40.0, 16.0, 21.0, 21.0, 17.0, 13.0, 13.0, 14.0, 12.0, 9.0, 5.0, 1.0, 1.0, 5.0, 1.0, 3.0, 6.0, 4.0, 1.0, 1.0], "bins": [-0.00027561187744140625, -0.00026786699891090393, -0.0002601221203804016, -0.0002523772418498993, -0.00024463236331939697, -0.00023688748478889465, -0.00022914260625839233, -0.00022139772772789001, -0.0002136528491973877, -0.00020590797066688538, -0.00019816309213638306, -0.00019041821360588074, -0.00018267333507537842, -0.0001749284565448761, -0.00016718357801437378, -0.00015943869948387146, -0.00015169382095336914, -0.00014394894242286682, -0.0001362040638923645, -0.00012845918536186218, -0.00012071430683135986, -0.00011296942830085754, -0.00010522454977035522, -9.74796712398529e-05, -8.973479270935059e-05, -8.198991417884827e-05, -7.424503564834595e-05, -6.650015711784363e-05, -5.875527858734131e-05, -5.101040005683899e-05, -4.326552152633667e-05, -3.552064299583435e-05, -2.777576446533203e-05, -2.0030885934829712e-05, -1.2286007404327393e-05, -4.541128873825073e-06, 3.203749656677246e-06, 1.0948628187179565e-05, 1.8693506717681885e-05, 2.6438385248184204e-05, 3.4183263778686523e-05, 4.192814230918884e-05, 4.967302083969116e-05, 5.741789937019348e-05, 6.51627779006958e-05, 7.290765643119812e-05, 8.065253496170044e-05, 8.839741349220276e-05, 9.614229202270508e-05, 0.0001038871705532074, 0.00011163204908370972, 0.00011937692761421204, 0.00012712180614471436, 0.00013486668467521667, 0.000142611563205719, 0.0001503564417362213, 0.00015810132026672363, 0.00016584619879722595, 0.00017359107732772827, 0.0001813359558582306, 0.0001890808343887329, 0.00019682571291923523, 0.00020457059144973755, 0.00021231546998023987, 0.0002200603485107422]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 3.0, 13.0, 27.0, 37.0, 54.0, 115.0, 120.0, 304.0, 506.0, 975.0, 1814.0, 4063.0, 11049.0, 32840.0, 207956.0, 664374.0, 91111.0, 19737.0, 7566.0, 2844.0, 1436.0, 686.0, 393.0, 215.0, 116.0, 66.0, 48.0, 23.0, 16.0, 17.0, 9.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.6226043701171875e-05, -2.5482848286628723e-05, -2.473965287208557e-05, -2.399645745754242e-05, -2.3253262042999268e-05, -2.2510066628456116e-05, -2.1766871213912964e-05, -2.1023675799369812e-05, -2.028048038482666e-05, -1.9537284970283508e-05, -1.8794089555740356e-05, -1.8050894141197205e-05, -1.7307698726654053e-05, -1.65645033121109e-05, -1.582130789756775e-05, -1.5078112483024597e-05, -1.4334917068481445e-05, -1.3591721653938293e-05, -1.2848526239395142e-05, -1.210533082485199e-05, -1.1362135410308838e-05, -1.0618939995765686e-05, -9.875744581222534e-06, -9.132549166679382e-06, -8.38935375213623e-06, -7.646158337593079e-06, -6.902962923049927e-06, -6.159767508506775e-06, -5.416572093963623e-06, -4.673376679420471e-06, -3.930181264877319e-06, -3.1869858503341675e-06, -2.4437904357910156e-06, -1.7005950212478638e-06, -9.57399606704712e-07, -2.1420419216156006e-07, 5.289912223815918e-07, 1.2721866369247437e-06, 2.0153820514678955e-06, 2.7585774660110474e-06, 3.5017728805541992e-06, 4.244968295097351e-06, 4.988163709640503e-06, 5.731359124183655e-06, 6.474554538726807e-06, 7.2177499532699585e-06, 7.96094536781311e-06, 8.704140782356262e-06, 9.447336196899414e-06, 1.0190531611442566e-05, 1.0933727025985718e-05, 1.167692244052887e-05, 1.2420117855072021e-05, 1.3163313269615173e-05, 1.3906508684158325e-05, 1.4649704098701477e-05, 1.539289951324463e-05, 1.613609492778778e-05, 1.6879290342330933e-05, 1.7622485756874084e-05, 1.8365681171417236e-05, 1.9108876585960388e-05, 1.985207200050354e-05, 2.0595267415046692e-05, 2.1338462829589844e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 4.0, 4.0, 6.0, 11.0, 19.0, 4.0, 22.0, 34.0, 74.0, 115.0, 67.0, 201.0, 161.0, 95.0, 29.0, 39.0, 37.0, 17.0, 13.0, 10.0, 4.0, 8.0, 9.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.039836883544922e-06, -2.9336661100387573e-06, -2.8274953365325928e-06, -2.7213245630264282e-06, -2.6151537895202637e-06, -2.508983016014099e-06, -2.4028122425079346e-06, -2.29664146900177e-06, -2.1904706954956055e-06, -2.084299921989441e-06, -1.9781291484832764e-06, -1.8719583749771118e-06, -1.7657876014709473e-06, -1.6596168279647827e-06, -1.5534460544586182e-06, -1.4472752809524536e-06, -1.341104507446289e-06, -1.2349337339401245e-06, -1.12876296043396e-06, -1.0225921869277954e-06, -9.164214134216309e-07, -8.102506399154663e-07, -7.040798664093018e-07, -5.979090929031372e-07, -4.917383193969727e-07, -3.855675458908081e-07, -2.7939677238464355e-07, -1.73225998878479e-07, -6.705522537231445e-08, 3.91155481338501e-08, 1.4528632164001465e-07, 2.514570951461792e-07, 3.5762786865234375e-07, 4.637986421585083e-07, 5.699694156646729e-07, 6.761401891708374e-07, 7.82310962677002e-07, 8.884817361831665e-07, 9.94652509689331e-07, 1.1008232831954956e-06, 1.2069940567016602e-06, 1.3131648302078247e-06, 1.4193356037139893e-06, 1.5255063772201538e-06, 1.6316771507263184e-06, 1.737847924232483e-06, 1.8440186977386475e-06, 1.950189471244812e-06, 2.0563602447509766e-06, 2.162531018257141e-06, 2.2687017917633057e-06, 2.3748725652694702e-06, 2.4810433387756348e-06, 2.5872141122817993e-06, 2.693384885787964e-06, 2.7995556592941284e-06, 2.905726432800293e-06, 3.0118972063064575e-06, 3.118067979812622e-06, 3.2242387533187866e-06, 3.330409526824951e-06, 3.4365803003311157e-06, 3.5427510738372803e-06, 3.648921847343445e-06, 3.7550926208496094e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 7.0, 13.0, 18.0, 29.0, 42.0, 49.0, 97.0, 138.0, 225.0, 350.0, 599.0, 1012.0, 1915.0, 3809.0, 8270.0, 19756.0, 57276.0, 264281.0, 537773.0, 105889.0, 26363.0, 10371.0, 4743.0, 2348.0, 1251.0, 753.0, 442.0, 262.0, 163.0, 94.0, 54.0, 38.0, 27.0, 27.0, 11.0, 5.0, 12.0, 7.0, 8.0, 4.0, 3.0, 5.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3053417205810547e-05, -1.2634322047233582e-05, -1.2215226888656616e-05, -1.1796131730079651e-05, -1.1377036571502686e-05, -1.095794141292572e-05, -1.0538846254348755e-05, -1.011975109577179e-05, -9.700655937194824e-06, -9.281560778617859e-06, -8.862465620040894e-06, -8.443370461463928e-06, -8.024275302886963e-06, -7.6051801443099976e-06, -7.186084985733032e-06, -6.766989827156067e-06, -6.3478946685791016e-06, -5.928799510002136e-06, -5.509704351425171e-06, -5.0906091928482056e-06, -4.67151403427124e-06, -4.252418875694275e-06, -3.8333237171173096e-06, -3.4142285585403442e-06, -2.995133399963379e-06, -2.5760382413864136e-06, -2.1569430828094482e-06, -1.737847924232483e-06, -1.3187527656555176e-06, -8.996576070785522e-07, -4.805624485015869e-07, -6.146728992462158e-08, 3.5762786865234375e-07, 7.767230272293091e-07, 1.1958181858062744e-06, 1.6149133443832397e-06, 2.034008502960205e-06, 2.4531036615371704e-06, 2.8721988201141357e-06, 3.291293978691101e-06, 3.7103891372680664e-06, 4.129484295845032e-06, 4.548579454421997e-06, 4.967674612998962e-06, 5.386769771575928e-06, 5.805864930152893e-06, 6.224960088729858e-06, 6.644055247306824e-06, 7.063150405883789e-06, 7.482245564460754e-06, 7.90134072303772e-06, 8.320435881614685e-06, 8.73953104019165e-06, 9.158626198768616e-06, 9.577721357345581e-06, 9.996816515922546e-06, 1.0415911674499512e-05, 1.0835006833076477e-05, 1.1254101991653442e-05, 1.1673197150230408e-05, 1.2092292308807373e-05, 1.2511387467384338e-05, 1.2930482625961304e-05, 1.3349577784538269e-05, 1.3768672943115234e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 7.0, 2.0, 3.0, 5.0, 3.0, 22.0, 5.0, 25.0, 24.0, 18.0, 40.0, 17.0, 58.0, 47.0, 94.0, 114.0, 56.0, 107.0, 48.0, 69.0, 24.0, 56.0, 37.0, 23.0, 25.0, 9.0, 20.0, 15.0, 2.0, 9.0, 1.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.159046173095703e-06, -3.06498259305954e-06, -2.9709190130233765e-06, -2.876855432987213e-06, -2.78279185295105e-06, -2.6887282729148865e-06, -2.594664692878723e-06, -2.50060111284256e-06, -2.4065375328063965e-06, -2.312473952770233e-06, -2.21841037273407e-06, -2.1243467926979065e-06, -2.030283212661743e-06, -1.93621963262558e-06, -1.8421560525894165e-06, -1.7480924725532532e-06, -1.6540288925170898e-06, -1.5599653124809265e-06, -1.4659017324447632e-06, -1.3718381524085999e-06, -1.2777745723724365e-06, -1.1837109923362732e-06, -1.0896474123001099e-06, -9.955838322639465e-07, -9.015202522277832e-07, -8.074566721916199e-07, -7.133930921554565e-07, -6.193295121192932e-07, -5.252659320831299e-07, -4.3120235204696655e-07, -3.371387720108032e-07, -2.430751919746399e-07, -1.4901161193847656e-07, -5.494803190231323e-08, 3.91155481338501e-08, 1.3317912817001343e-07, 2.2724270820617676e-07, 3.213062882423401e-07, 4.153698682785034e-07, 5.094334483146667e-07, 6.034970283508301e-07, 6.975606083869934e-07, 7.916241884231567e-07, 8.856877684593201e-07, 9.797513484954834e-07, 1.0738149285316467e-06, 1.16787850856781e-06, 1.2619420886039734e-06, 1.3560056686401367e-06, 1.4500692486763e-06, 1.5441328287124634e-06, 1.6381964087486267e-06, 1.73225998878479e-06, 1.8263235688209534e-06, 1.9203871488571167e-06, 2.01445072889328e-06, 2.1085143089294434e-06, 2.2025778889656067e-06, 2.29664146900177e-06, 2.3907050490379333e-06, 2.4847686290740967e-06, 2.57883220911026e-06, 2.6728957891464233e-06, 2.7669593691825867e-06, 2.86102294921875e-06]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 10.0, 7.0, 32.0, 52.0, 139.0, 268.0, 279.0, 113.0, 50.0, 33.0, 10.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008885014103725553, -0.0008461306570097804, -0.0008037598454393446, -0.0007613890920765698, -0.000719018338713795, -0.0006766475271433592, -0.0006342767737805843, -0.0005919060204178095, -0.0005495352670550346, -0.0005071645136922598, -0.0004647937312256545, -0.0004224229487590492, -0.00038005219539627433, -0.000337681412929669, -0.0002953106304630637, -0.00025293987710028887, -0.0002105690655298531, -0.00016819829761516303, -0.00012582752970047295, -8.345674723386765e-05, -4.108597931917757e-05, 1.2847885955125093e-06, 4.3655571062117815e-05, 8.602632442489266e-05, 0.00012839710689149797, 0.00017076787480618805, 0.00021313864272087812, 0.00025550942518748343, 0.00029788020765408874, 0.0003402509610168636, 0.0003826217434834689, 0.00042499249684624374, 0.00046736327931284904, 0.0005097340326756239, 0.0005521048442460597, 0.0005944755976088345, 0.0006368463509716094, 0.0006792171625420451, 0.00072158791590482, 0.0007639586692675948, 0.0008063294226303697, 0.0008487001759931445, 0.0008910709875635803, 0.0009334417409263551, 0.00097581249428913, 0.0010181833058595657, 0.0010605540592223406, 0.0011029248125851154, 0.0011452955659478903, 0.0011876663193106651, 0.00123003707267344, 0.0012724078260362148, 0.0013147786958143115, 0.0013571494491770864, 0.0013995202025398612, 0.001441890955902636, 0.0014842618256807327, 0.0015266325790435076, 0.0015690033324062824, 0.0016113740857690573, 0.001653744955547154, 0.0016961157089099288, 0.0017384864622727036, 0.0017808572156354785, 0.0018232279689982533]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 9.0, 5.0, 13.0, 6.0, 12.0, 16.0, 18.0, 14.0, 15.0, 15.0, 25.0, 24.0, 33.0, 36.0, 38.0, 34.0, 24.0, 36.0, 50.0, 37.0, 41.0, 30.0, 34.0, 25.0, 40.0, 33.0, 32.0, 36.0, 29.0, 32.0, 29.0, 22.0, 16.0, 21.0, 18.0, 15.0, 13.0, 11.0, 12.0, 7.0, 8.0, 10.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0002719314943533391, -0.0002634515112731606, -0.0002549715281929821, -0.0002464915451128036, -0.00023801156203262508, -0.00022953157895244658, -0.00022105158132035285, -0.00021257159824017435, -0.00020409161515999585, -0.00019561163207981735, -0.00018713164899963886, -0.00017865166591946036, -0.00017017166828736663, -0.00016169168520718813, -0.00015321170212700963, -0.00014473171904683113, -0.00013625173596665263, -0.00012777175288647413, -0.00011929176980629563, -0.00011081177945015952, -0.00010233179636998102, -9.385181328980252e-05, -8.537182293366641e-05, -7.689183985348791e-05, -6.841185677330941e-05, -5.993187369313091e-05, -5.1451886974973604e-05, -4.29719002568163e-05, -3.44919171766378e-05, -2.60119340964593e-05, -1.7531947378301993e-05, -9.051960660144687e-06, -5.720066837966442e-07, 7.907978215371259e-06, 1.638796311453916e-05, 2.4867948013707064e-05, 3.334793291287497e-05, 4.1827915993053466e-05, 5.030790271121077e-05, 5.878788942936808e-05, 6.726787250954658e-05, 7.574785558972508e-05, 8.422783866990358e-05, 9.270782902603969e-05, 0.00010118781210621819, 0.00010966779518639669, 0.0001181477855425328, 0.0001266277686227113, 0.0001351077517028898, 0.0001435877347830683, 0.0001520677178632468, 0.0001605477009434253, 0.0001690276840236038, 0.0001775076671037823, 0.00018598766473587602, 0.00019446764781605452, 0.00020294763089623302, 0.00021142761397641152, 0.00021990759705659002, 0.00022838758013676852, 0.00023686757776886225, 0.00024534756084904075, 0.00025382754392921925, 0.00026230752700939775, 0.00027078751008957624]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 10.0, 7.0, 13.0, 17.0, 12.0, 25.0, 31.0, 40.0, 41.0, 54.0, 84.0, 119.0, 147.0, 218.0, 332.0, 458.0, 685.0, 1144.0, 1971.0, 3509.0, 15267.0, 3916857.0, 240247.0, 6037.0, 2667.0, 1444.0, 947.0, 547.0, 376.0, 266.0, 192.0, 117.0, 94.0, 78.0, 39.0, 40.0, 25.0, 27.0, 22.0, 14.0, 11.0, 12.0, 7.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0010137557983398438, -0.0009818673133850098, -0.0009499788284301758, -0.0009180903434753418, -0.0008862018585205078, -0.0008543133735656738, -0.0008224248886108398, -0.0007905364036560059, -0.0007586479187011719, -0.0007267594337463379, -0.0006948709487915039, -0.0006629824638366699, -0.0006310939788818359, -0.000599205493927002, -0.000567317008972168, -0.000535428524017334, -0.0005035400390625, -0.000471651554107666, -0.00043976306915283203, -0.00040787458419799805, -0.00037598609924316406, -0.0003440976142883301, -0.0003122091293334961, -0.0002803206443786621, -0.0002484321594238281, -0.00021654367446899414, -0.00018465518951416016, -0.00015276670455932617, -0.00012087821960449219, -8.89897346496582e-05, -5.710124969482422e-05, -2.5212764739990234e-05, 6.67572021484375e-06, 3.8564205169677734e-05, 7.045269012451172e-05, 0.0001023411750793457, 0.0001342296600341797, 0.00016611814498901367, 0.00019800662994384766, 0.00022989511489868164, 0.0002617835998535156, 0.0002936720848083496, 0.0003255605697631836, 0.0003574490547180176, 0.00038933753967285156, 0.00042122602462768555, 0.00045311450958251953, 0.0004850029945373535, 0.0005168914794921875, 0.0005487799644470215, 0.0005806684494018555, 0.0006125569343566895, 0.0006444454193115234, 0.0006763339042663574, 0.0007082223892211914, 0.0007401108741760254, 0.0007719993591308594, 0.0008038878440856934, 0.0008357763290405273, 0.0008676648139953613, 0.0008995532989501953, 0.0009314417839050293, 0.0009633302688598633, 0.0009952187538146973, 0.0010271072387695312]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 6.0, 12.0, 8.0, 8.0, 16.0, 9.0, 11.0, 17.0, 18.0, 25.0, 19.0, 37.0, 27.0, 20.0, 33.0, 31.0, 38.0, 35.0, 34.0, 32.0, 43.0, 34.0, 38.0, 38.0, 26.0, 36.0, 28.0, 47.0, 30.0, 29.0, 16.0, 21.0, 24.0, 19.0, 23.0, 14.0, 17.0, 12.0, 14.0, 7.0, 7.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.00022161006927490234, -0.00021473877131938934, -0.00020786747336387634, -0.00020099617540836334, -0.00019412487745285034, -0.00018725357949733734, -0.00018038228154182434, -0.00017351098358631134, -0.00016663968563079834, -0.00015976838767528534, -0.00015289708971977234, -0.00014602579176425934, -0.00013915449380874634, -0.00013228319585323334, -0.00012541189789772034, -0.00011854059994220734, -0.00011166930198669434, -0.00010479800403118134, -9.792670607566833e-05, -9.105540812015533e-05, -8.418411016464233e-05, -7.731281220912933e-05, -7.044151425361633e-05, -6.357021629810333e-05, -5.669891834259033e-05, -4.982762038707733e-05, -4.295632243156433e-05, -3.608502447605133e-05, -2.921372652053833e-05, -2.234242856502533e-05, -1.547113060951233e-05, -8.599832653999329e-06, -1.7285346984863281e-06, 5.142763257026672e-06, 1.2014061212539673e-05, 1.8885359168052673e-05, 2.5756657123565674e-05, 3.2627955079078674e-05, 3.9499253034591675e-05, 4.6370550990104675e-05, 5.3241848945617676e-05, 6.0113146901130676e-05, 6.698444485664368e-05, 7.385574281215668e-05, 8.072704076766968e-05, 8.759833872318268e-05, 9.446963667869568e-05, 0.00010134093463420868, 0.00010821223258972168, 0.00011508353054523468, 0.00012195482850074768, 0.00012882612645626068, 0.00013569742441177368, 0.00014256872236728668, 0.00014944002032279968, 0.00015631131827831268, 0.00016318261623382568, 0.00017005391418933868, 0.00017692521214485168, 0.00018379651010036469, 0.00019066780805587769, 0.00019753910601139069, 0.0002044104039669037, 0.0002112817019224167, 0.0002181529998779297]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 9.0, 10.0, 16.0, 32.0, 48.0, 117.0, 248.0, 445.0, 931.0, 2109.0, 6456.0, 38780.0, 4094647.0, 39962.0, 6481.0, 2193.0, 898.0, 437.0, 205.0, 96.0, 55.0, 34.0, 13.0, 12.0, 16.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017852783203125, -0.0017303526401519775, -0.001675426959991455, -0.0016205012798309326, -0.0015655755996704102, -0.0015106499195098877, -0.0014557242393493652, -0.0014007985591888428, -0.0013458728790283203, -0.0012909471988677979, -0.0012360215187072754, -0.001181095838546753, -0.0011261701583862305, -0.001071244478225708, -0.0010163187980651855, -0.0009613931179046631, -0.0009064674377441406, -0.0008515417575836182, -0.0007966160774230957, -0.0007416903972625732, -0.0006867647171020508, -0.0006318390369415283, -0.0005769133567810059, -0.0005219876766204834, -0.00046706199645996094, -0.0004121363162994385, -0.000357210636138916, -0.00030228495597839355, -0.0002473592758178711, -0.00019243359565734863, -0.00013750791549682617, -8.258223533630371e-05, -2.765655517578125e-05, 2.726912498474121e-05, 8.219480514526367e-05, 0.00013712048530578613, 0.0001920461654663086, 0.00024697184562683105, 0.0003018975257873535, 0.000356823205947876, 0.00041174888610839844, 0.0004666745662689209, 0.0005216002464294434, 0.0005765259265899658, 0.0006314516067504883, 0.0006863772869110107, 0.0007413029670715332, 0.0007962286472320557, 0.0008511543273925781, 0.0009060800075531006, 0.000961005687713623, 0.0010159313678741455, 0.001070857048034668, 0.0011257827281951904, 0.0011807084083557129, 0.0012356340885162354, 0.0012905597686767578, 0.0013454854488372803, 0.0014004111289978027, 0.0014553368091583252, 0.0015102624893188477, 0.0015651881694793701, 0.0016201138496398926, 0.001675039529800415, 0.0017299652099609375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 14.0, 34.0, 73.0, 205.0, 1190.0, 2146.0, 217.0, 74.0, 26.0, 15.0, 11.0, 9.0, 8.0, 9.0, 9.0, 1.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00018334388732910156, -0.00017702579498291016, -0.00017070770263671875, -0.00016438961029052734, -0.00015807151794433594, -0.00015175342559814453, -0.00014543533325195312, -0.00013911724090576172, -0.0001327991485595703, -0.0001264810562133789, -0.0001201629638671875, -0.0001138448715209961, -0.00010752677917480469, -0.00010120868682861328, -9.489059448242188e-05, -8.857250213623047e-05, -8.225440979003906e-05, -7.593631744384766e-05, -6.961822509765625e-05, -6.330013275146484e-05, -5.698204040527344e-05, -5.066394805908203e-05, -4.4345855712890625e-05, -3.802776336669922e-05, -3.170967102050781e-05, -2.5391578674316406e-05, -1.9073486328125e-05, -1.2755393981933594e-05, -6.4373016357421875e-06, -1.1920928955078125e-07, 6.198883056640625e-06, 1.2516975402832031e-05, 1.8835067749023438e-05, 2.5153160095214844e-05, 3.147125244140625e-05, 3.7789344787597656e-05, 4.410743713378906e-05, 5.042552947998047e-05, 5.6743621826171875e-05, 6.306171417236328e-05, 6.937980651855469e-05, 7.56978988647461e-05, 8.20159912109375e-05, 8.83340835571289e-05, 9.465217590332031e-05, 0.00010097026824951172, 0.00010728836059570312, 0.00011360645294189453, 0.00011992454528808594, 0.00012624263763427734, 0.00013256072998046875, 0.00013887882232666016, 0.00014519691467285156, 0.00015151500701904297, 0.00015783309936523438, 0.00016415119171142578, 0.0001704692840576172, 0.0001767873764038086, 0.00018310546875, 0.0001894235610961914, 0.0001957416534423828, 0.00020205974578857422, 0.00020837783813476562, 0.00021469593048095703, 0.00022101402282714844]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 7.0, 13.0, 20.0, 43.0, 61.0, 134.0, 257.0, 191.0, 105.0, 66.0, 40.0, 25.0, 10.0, 10.0, 8.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009001243161037564, -0.0008757165633141994, -0.0008513088687323034, -0.0008269011159427464, -0.0008024933631531894, -0.0007780856685712934, -0.0007536779157817364, -0.0007292701629921794, -0.0007048624102026224, -0.0006804546574130654, -0.0006560469628311694, -0.0006316392100416124, -0.0006072314572520554, -0.0005828237626701593, -0.0005584160098806024, -0.0005340082570910454, -0.0005096005625091493, -0.0004851928388234228, -0.0004607850860338658, -0.0004363773623481393, -0.0004119696095585823, -0.0003875618858728558, -0.00036315416218712926, -0.0003387464093975723, -0.00031433868571184576, -0.00028993096202611923, -0.00026552320923656225, -0.00024111548555083573, -0.00021670774731319398, -0.00019230000907555223, -0.0001678922853898257, -0.00014348454715218395, -0.0001190768089145422, -9.466907067690045e-05, -7.026133971521631e-05, -4.585360875353217e-05, -2.144587051589042e-05, 2.9618677217513323e-06, 2.7369591407477856e-05, 5.177732964511961e-05, 7.618506788276136e-05, 0.00010059280612040311, 0.00012500054435804486, 0.00014940826804377139, 0.00017381600628141314, 0.0001982237445190549, 0.0002226314682047814, 0.00024703919189050794, 0.0002714469446800649, 0.00029585466836579144, 0.0003202624211553484, 0.00034467014484107494, 0.0003690778976306319, 0.00039348562131635845, 0.00041789334500208497, 0.00044230109779164195, 0.0004667088214773685, 0.000491116545163095, 0.000515524297952652, 0.000539932050742209, 0.000564339745324105, 0.000588747498113662, 0.0006131551926955581, 0.000637562945485115, 0.000661970698274672]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 4.0, 7.0, 6.0, 8.0, 10.0, 16.0, 15.0, 21.0, 18.0, 30.0, 23.0, 23.0, 33.0, 24.0, 35.0, 33.0, 28.0, 53.0, 35.0, 47.0, 38.0, 45.0, 35.0, 45.0, 35.0, 39.0, 31.0, 36.0, 32.0, 26.0, 20.0, 20.0, 29.0, 17.0, 17.0, 11.0, 13.0, 6.0, 8.0, 7.0, 7.0, 4.0, 2.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002236159925814718, -0.00021612594719044864, -0.00020863588724751025, -0.0002011458418564871, -0.0001936557819135487, -0.00018616573652252555, -0.0001786756911315024, -0.00017118564574047923, -0.00016369558579754084, -0.00015620554040651768, -0.0001487154804635793, -0.00014122543507255614, -0.00013373538968153298, -0.0001262453297385946, -0.00011875528434757143, -0.00011126523168059066, -0.00010377517901360989, -9.628512634662911e-05, -8.879507367964834e-05, -8.130502828862518e-05, -7.381497562164441e-05, -6.632492295466363e-05, -5.883487392566167e-05, -5.13448248966597e-05, -4.385477222967893e-05, -3.6364719562698156e-05, -2.887467053369619e-05, -2.138461968570482e-05, -1.389456883771345e-05, -6.404516170732677e-06, 1.0855328582692891e-06, 8.575581887271255e-06, 1.606563455425203e-05, 2.3555685402243398e-05, 3.104573625023477e-05, 3.8535785279236734e-05, 4.602583794621751e-05, 5.351589061319828e-05, 6.1005939642200246e-05, 6.849598867120221e-05, 7.598604133818299e-05, 8.347609400516376e-05, 9.096614667214453e-05, 9.845619206316769e-05, 0.00010594624473014846, 0.00011343629739712924, 0.0001209263427881524, 0.00012841640273109078, 0.00013590644812211394, 0.0001433964935131371, 0.0001508865534560755, 0.00015837659884709865, 0.00016586665879003704, 0.0001733567041810602, 0.00018084674957208335, 0.0001883367949631065, 0.0001958268549060449, 0.00020331690029706806, 0.00021080696024000645, 0.0002182970056310296, 0.00022578705102205276, 0.00023327711096499115, 0.0002407671563560143, 0.0002482572162989527, 0.00025574726168997586]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 7.0, 6.0, 10.0, 12.0, 19.0, 23.0, 25.0, 39.0, 48.0, 62.0, 83.0, 115.0, 174.0, 265.0, 346.0, 602.0, 881.0, 1548.0, 2556.0, 4471.0, 8744.0, 18647.0, 42590.0, 108357.0, 312654.0, 341896.0, 117797.0, 45295.0, 19894.0, 9490.0, 4843.0, 2730.0, 1519.0, 944.0, 567.0, 397.0, 287.0, 171.0, 131.0, 86.0, 62.0, 48.0, 37.0, 15.0, 21.0, 9.0, 14.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0], "bins": [-0.00033593177795410156, -0.00032661110162734985, -0.00031729042530059814, -0.00030796974897384644, -0.0002986490726470947, -0.000289328396320343, -0.0002800077199935913, -0.0002706870436668396, -0.0002613663673400879, -0.0002520456910133362, -0.00024272501468658447, -0.00023340433835983276, -0.00022408366203308105, -0.00021476298570632935, -0.00020544230937957764, -0.00019612163305282593, -0.00018680095672607422, -0.0001774802803993225, -0.0001681596040725708, -0.0001588389277458191, -0.00014951825141906738, -0.00014019757509231567, -0.00013087689876556396, -0.00012155622243881226, -0.00011223554611206055, -0.00010291486978530884, -9.359419345855713e-05, -8.427351713180542e-05, -7.495284080505371e-05, -6.5632164478302e-05, -5.631148815155029e-05, -4.6990811824798584e-05, -3.7670135498046875e-05, -2.8349459171295166e-05, -1.9028782844543457e-05, -9.708106517791748e-06, -3.8743019104003906e-07, 8.93324613571167e-06, 1.825392246246338e-05, 2.7574598789215088e-05, 3.68952751159668e-05, 4.6215951442718506e-05, 5.5536627769470215e-05, 6.485730409622192e-05, 7.417798042297363e-05, 8.349865674972534e-05, 9.281933307647705e-05, 0.00010214000940322876, 0.00011146068572998047, 0.00012078136205673218, 0.0001301020383834839, 0.0001394227147102356, 0.0001487433910369873, 0.00015806406736373901, 0.00016738474369049072, 0.00017670542001724243, 0.00018602609634399414, 0.00019534677267074585, 0.00020466744899749756, 0.00021398812532424927, 0.00022330880165100098, 0.00023262947797775269, 0.0002419501543045044, 0.0002512708306312561, 0.0002605915069580078]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 5.0, 10.0, 15.0, 13.0, 18.0, 16.0, 25.0, 31.0, 21.0, 27.0, 28.0, 27.0, 29.0, 36.0, 35.0, 47.0, 40.0, 51.0, 41.0, 50.0, 36.0, 36.0, 34.0, 39.0, 38.0, 21.0, 29.0, 24.0, 28.0, 22.0, 19.0, 25.0, 12.0, 10.0, 10.0, 11.0, 8.0, 9.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022149085998535156, -0.0002137012779712677, -0.00020591169595718384, -0.00019812211394309998, -0.0001903325319290161, -0.00018254294991493225, -0.0001747533679008484, -0.00016696378588676453, -0.00015917420387268066, -0.0001513846218585968, -0.00014359503984451294, -0.00013580545783042908, -0.00012801587581634521, -0.00012022629380226135, -0.00011243671178817749, -0.00010464712977409363, -9.685754776000977e-05, -8.90679657459259e-05, -8.127838373184204e-05, -7.348880171775818e-05, -6.569921970367432e-05, -5.7909637689590454e-05, -5.012005567550659e-05, -4.233047366142273e-05, -3.454089164733887e-05, -2.6751309633255005e-05, -1.8961727619171143e-05, -1.117214560508728e-05, -3.382563591003418e-06, 4.407018423080444e-06, 1.2196600437164307e-05, 1.998618245124817e-05, 2.777576446533203e-05, 3.5565346479415894e-05, 4.3354928493499756e-05, 5.114451050758362e-05, 5.893409252166748e-05, 6.672367453575134e-05, 7.45132565498352e-05, 8.230283856391907e-05, 9.009242057800293e-05, 9.788200259208679e-05, 0.00010567158460617065, 0.00011346116662025452, 0.00012125074863433838, 0.00012904033064842224, 0.0001368299126625061, 0.00014461949467658997, 0.00015240907669067383, 0.0001601986587047577, 0.00016798824071884155, 0.00017577782273292542, 0.00018356740474700928, 0.00019135698676109314, 0.000199146568775177, 0.00020693615078926086, 0.00021472573280334473, 0.0002225153148174286, 0.00023030489683151245, 0.0002380944788455963, 0.0002458840608596802, 0.00025367364287376404, 0.0002614632248878479, 0.00026925280690193176, 0.0002770423889160156]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 7.0, 8.0, 11.0, 16.0, 25.0, 27.0, 34.0, 36.0, 58.0, 88.0, 93.0, 121.0, 229.0, 239.0, 421.0, 658.0, 991.0, 1641.0, 2689.0, 4846.0, 9704.0, 21204.0, 55336.0, 209052.0, 552098.0, 118609.0, 37428.0, 15476.0, 7307.0, 3971.0, 2185.0, 1283.0, 831.0, 554.0, 350.0, 257.0, 173.0, 109.0, 80.0, 80.0, 54.0, 38.0, 29.0, 22.0, 26.0, 12.0, 10.0, 11.0, 4.0, 4.0, 5.0, 3.0, 4.0, 2.0, 0.0, 3.0], "bins": [-0.0003349781036376953, -0.0003246106207370758, -0.0003142431378364563, -0.0003038756549358368, -0.0002935081720352173, -0.0002831406891345978, -0.00027277320623397827, -0.00026240572333335876, -0.00025203824043273926, -0.00024167075753211975, -0.00023130327463150024, -0.00022093579173088074, -0.00021056830883026123, -0.00020020082592964172, -0.00018983334302902222, -0.0001794658601284027, -0.0001690983772277832, -0.0001587308943271637, -0.0001483634114265442, -0.00013799592852592468, -0.00012762844562530518, -0.00011726096272468567, -0.00010689347982406616, -9.652599692344666e-05, -8.615851402282715e-05, -7.579103112220764e-05, -6.542354822158813e-05, -5.505606532096863e-05, -4.468858242034912e-05, -3.4321099519729614e-05, -2.3953616619110107e-05, -1.35861337184906e-05, -3.2186508178710938e-06, 7.148832082748413e-06, 1.751631498336792e-05, 2.7883797883987427e-05, 3.8251280784606934e-05, 4.861876368522644e-05, 5.898624658584595e-05, 6.935372948646545e-05, 7.972121238708496e-05, 9.008869528770447e-05, 0.00010045617818832397, 0.00011082366108894348, 0.00012119114398956299, 0.0001315586268901825, 0.000141926109790802, 0.0001522935926914215, 0.00016266107559204102, 0.00017302855849266052, 0.00018339604139328003, 0.00019376352429389954, 0.00020413100719451904, 0.00021449849009513855, 0.00022486597299575806, 0.00023523345589637756, 0.00024560093879699707, 0.0002559684216976166, 0.0002663359045982361, 0.0002767033874988556, 0.0002870708703994751, 0.0002974383533000946, 0.0003078058362007141, 0.0003181733191013336, 0.0003285408020019531]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [6.0, 0.0, 3.0, 3.0, 2.0, 4.0, 9.0, 10.0, 12.0, 12.0, 9.0, 10.0, 10.0, 20.0, 13.0, 24.0, 31.0, 34.0, 27.0, 25.0, 41.0, 37.0, 50.0, 35.0, 43.0, 40.0, 54.0, 49.0, 32.0, 43.0, 39.0, 32.0, 25.0, 34.0, 27.0, 25.0, 17.0, 21.0, 12.0, 21.0, 17.0, 14.0, 13.0, 3.0, 6.0, 8.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013065338134765625, -0.00012562982738018036, -0.00012060627341270447, -0.00011558271944522858, -0.00011055916547775269, -0.0001055356115102768, -0.0001005120575428009, -9.548850357532501e-05, -9.046494960784912e-05, -8.544139564037323e-05, -8.041784167289734e-05, -7.539428770542145e-05, -7.037073373794556e-05, -6.534717977046967e-05, -6.0323625802993774e-05, -5.530007183551788e-05, -5.027651786804199e-05, -4.52529639005661e-05, -4.022940993309021e-05, -3.520585596561432e-05, -3.0182301998138428e-05, -2.5158748030662537e-05, -2.0135194063186646e-05, -1.5111640095710754e-05, -1.0088086128234863e-05, -5.064532160758972e-06, -4.0978193283081055e-08, 4.98257577419281e-06, 1.0006129741668701e-05, 1.5029683709144592e-05, 2.0053237676620483e-05, 2.5076791644096375e-05, 3.0100345611572266e-05, 3.512389957904816e-05, 4.014745354652405e-05, 4.517100751399994e-05, 5.019456148147583e-05, 5.521811544895172e-05, 6.024166941642761e-05, 6.52652233839035e-05, 7.02887773513794e-05, 7.531233131885529e-05, 8.033588528633118e-05, 8.535943925380707e-05, 9.038299322128296e-05, 9.540654718875885e-05, 0.00010043010115623474, 0.00010545365512371063, 0.00011047720909118652, 0.00011550076305866241, 0.0001205243170261383, 0.0001255478709936142, 0.0001305714249610901, 0.00013559497892856598, 0.00014061853289604187, 0.00014564208686351776, 0.00015066564083099365, 0.00015568919479846954, 0.00016071274876594543, 0.00016573630273342133, 0.00017075985670089722, 0.0001757834106683731, 0.000180806964635849, 0.0001858305186033249, 0.00019085407257080078]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 9.0, 17.0, 10.0, 16.0, 23.0, 36.0, 38.0, 56.0, 78.0, 108.0, 159.0, 237.0, 342.0, 565.0, 811.0, 1396.0, 2461.0, 5331.0, 12999.0, 42846.0, 633891.0, 292293.0, 33381.0, 10877.0, 4552.0, 2359.0, 1320.0, 734.0, 483.0, 329.0, 243.0, 147.0, 116.0, 80.0, 50.0, 49.0, 22.0, 21.0, 12.0, 16.0, 12.0, 6.0, 5.0, 7.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.797645568847656e-05, -8.521974086761475e-05, -8.246302604675293e-05, -7.970631122589111e-05, -7.69495964050293e-05, -7.419288158416748e-05, -7.143616676330566e-05, -6.867945194244385e-05, -6.592273712158203e-05, -6.316602230072021e-05, -6.04093074798584e-05, -5.765259265899658e-05, -5.4895877838134766e-05, -5.213916301727295e-05, -4.938244819641113e-05, -4.6625733375549316e-05, -4.38690185546875e-05, -4.1112303733825684e-05, -3.835558891296387e-05, -3.559887409210205e-05, -3.2842159271240234e-05, -3.0085444450378418e-05, -2.73287296295166e-05, -2.4572014808654785e-05, -2.181529998779297e-05, -1.9058585166931152e-05, -1.6301870346069336e-05, -1.354515552520752e-05, -1.0788440704345703e-05, -8.031725883483887e-06, -5.27501106262207e-06, -2.518296241760254e-06, 2.384185791015625e-07, 2.995133399963379e-06, 5.751848220825195e-06, 8.508563041687012e-06, 1.1265277862548828e-05, 1.4021992683410645e-05, 1.677870750427246e-05, 1.9535422325134277e-05, 2.2292137145996094e-05, 2.504885196685791e-05, 2.7805566787719727e-05, 3.056228160858154e-05, 3.331899642944336e-05, 3.6075711250305176e-05, 3.883242607116699e-05, 4.158914089202881e-05, 4.4345855712890625e-05, 4.710257053375244e-05, 4.985928535461426e-05, 5.2616000175476074e-05, 5.537271499633789e-05, 5.812942981719971e-05, 6.0886144638061523e-05, 6.364285945892334e-05, 6.639957427978516e-05, 6.915628910064697e-05, 7.191300392150879e-05, 7.46697187423706e-05, 7.742643356323242e-05, 8.018314838409424e-05, 8.293986320495605e-05, 8.569657802581787e-05, 8.845329284667969e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 3.0, 13.0, 13.0, 10.0, 14.0, 13.0, 19.0, 19.0, 16.0, 31.0, 58.0, 65.0, 49.0, 73.0, 126.0, 98.0, 69.0, 65.0, 53.0, 32.0, 35.0, 27.0, 13.0, 14.0, 18.0, 6.0, 12.0, 8.0, 9.0, 5.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-06, -8.089467883110046e-06, -7.834285497665405e-06, -7.579103112220764e-06, -7.323920726776123e-06, -7.068738341331482e-06, -6.813555955886841e-06, -6.5583735704422e-06, -6.303191184997559e-06, -6.0480087995529175e-06, -5.792826414108276e-06, -5.537644028663635e-06, -5.282461643218994e-06, -5.027279257774353e-06, -4.772096872329712e-06, -4.516914486885071e-06, -4.26173210144043e-06, -4.0065497159957886e-06, -3.7513673305511475e-06, -3.4961849451065063e-06, -3.2410025596618652e-06, -2.985820174217224e-06, -2.730637788772583e-06, -2.475455403327942e-06, -2.2202730178833008e-06, -1.9650906324386597e-06, -1.7099082469940186e-06, -1.4547258615493774e-06, -1.1995434761047363e-06, -9.443610906600952e-07, -6.891787052154541e-07, -4.33996319770813e-07, -1.7881393432617188e-07, 7.636845111846924e-08, 3.3155083656311035e-07, 5.867332220077515e-07, 8.419156074523926e-07, 1.0970979928970337e-06, 1.3522803783416748e-06, 1.607462763786316e-06, 1.862645149230957e-06, 2.117827534675598e-06, 2.3730099201202393e-06, 2.6281923055648804e-06, 2.8833746910095215e-06, 3.1385570764541626e-06, 3.3937394618988037e-06, 3.648921847343445e-06, 3.904104232788086e-06, 4.159286618232727e-06, 4.414469003677368e-06, 4.669651389122009e-06, 4.92483377456665e-06, 5.1800161600112915e-06, 5.435198545455933e-06, 5.690380930900574e-06, 5.945563316345215e-06, 6.200745701789856e-06, 6.455928087234497e-06, 6.711110472679138e-06, 6.966292858123779e-06, 7.22147524356842e-06, 7.4766576290130615e-06, 7.731840014457703e-06, 7.987022399902344e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 9.0, 7.0, 2.0, 13.0, 26.0, 24.0, 44.0, 113.0, 188.0, 436.0, 843.0, 2103.0, 6637.0, 35843.0, 774360.0, 202794.0, 18158.0, 4163.0, 1488.0, 632.0, 313.0, 134.0, 75.0, 59.0, 23.0, 16.0, 16.0, 9.0, 5.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014328956604003906, -0.00013831816613674164, -0.00013334676623344421, -0.0001283753663301468, -0.00012340396642684937, -0.00011843256652355194, -0.00011346116662025452, -0.00010848976671695709, -0.00010351836681365967, -9.854696691036224e-05, -9.357556700706482e-05, -8.86041671037674e-05, -8.363276720046997e-05, -7.866136729717255e-05, -7.368996739387512e-05, -6.87185674905777e-05, -6.374716758728027e-05, -5.877576768398285e-05, -5.3804367780685425e-05, -4.8832967877388e-05, -4.3861567974090576e-05, -3.889016807079315e-05, -3.391876816749573e-05, -2.8947368264198303e-05, -2.397596836090088e-05, -1.9004568457603455e-05, -1.403316855430603e-05, -9.061768651008606e-06, -4.090368747711182e-06, 8.810311555862427e-07, 5.852431058883667e-06, 1.0823830962181091e-05, 1.5795230865478516e-05, 2.076663076877594e-05, 2.5738030672073364e-05, 3.070943057537079e-05, 3.568083047866821e-05, 4.065223038196564e-05, 4.562363028526306e-05, 5.0595030188560486e-05, 5.556643009185791e-05, 6.0537829995155334e-05, 6.550922989845276e-05, 7.048062980175018e-05, 7.545202970504761e-05, 8.042342960834503e-05, 8.539482951164246e-05, 9.036622941493988e-05, 9.53376293182373e-05, 0.00010030902922153473, 0.00010528042912483215, 0.00011025182902812958, 0.000115223228931427, 0.00012019462883472443, 0.00012516602873802185, 0.00013013742864131927, 0.0001351088285446167, 0.00014008022844791412, 0.00014505162835121155, 0.00015002302825450897, 0.0001549944281578064, 0.00015996582806110382, 0.00016493722796440125, 0.00016990862786769867, 0.0001748800277709961]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 8.0, 9.0, 11.0, 14.0, 17.0, 28.0, 34.0, 57.0, 78.0, 146.0, 220.0, 120.0, 61.0, 52.0, 26.0, 20.0, 33.0, 11.0, 16.0, 8.0, 5.0, 7.0, 7.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6450881958007812e-05, -1.587066799402237e-05, -1.5290454030036926e-05, -1.4710240066051483e-05, -1.413002610206604e-05, -1.3549812138080597e-05, -1.2969598174095154e-05, -1.238938421010971e-05, -1.1809170246124268e-05, -1.1228956282138824e-05, -1.0648742318153381e-05, -1.0068528354167938e-05, -9.488314390182495e-06, -8.908100426197052e-06, -8.327886462211609e-06, -7.747672498226166e-06, -7.167458534240723e-06, -6.5872445702552795e-06, -6.0070306062698364e-06, -5.426816642284393e-06, -4.84660267829895e-06, -4.266388714313507e-06, -3.686174750328064e-06, -3.105960786342621e-06, -2.5257468223571777e-06, -1.9455328583717346e-06, -1.3653188943862915e-06, -7.851049304008484e-07, -2.0489096641540527e-07, 3.7532299757003784e-07, 9.55536961555481e-07, 1.535750925540924e-06, 2.115964889526367e-06, 2.6961788535118103e-06, 3.2763928174972534e-06, 3.8566067814826965e-06, 4.43682074546814e-06, 5.017034709453583e-06, 5.597248673439026e-06, 6.177462637424469e-06, 6.757676601409912e-06, 7.337890565395355e-06, 7.918104529380798e-06, 8.498318493366241e-06, 9.078532457351685e-06, 9.658746421337128e-06, 1.023896038532257e-05, 1.0819174349308014e-05, 1.1399388313293457e-05, 1.19796022772789e-05, 1.2559816241264343e-05, 1.3140030205249786e-05, 1.372024416923523e-05, 1.4300458133220673e-05, 1.4880672097206116e-05, 1.546088606119156e-05, 1.6041100025177002e-05, 1.6621313989162445e-05, 1.7201527953147888e-05, 1.778174191713333e-05, 1.8361955881118774e-05, 1.8942169845104218e-05, 1.952238380908966e-05, 2.0102597773075104e-05, 2.0682811737060547e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 4.0, 4.0, 14.0, 28.0, 21.0, 49.0, 85.0, 164.0, 217.0, 157.0, 98.0, 55.0, 38.0, 24.0, 16.0, 9.0, 8.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008250455721281469, -0.0008036580984480679, -0.0007822706829756498, -0.0007608832092955709, -0.0007394957356154919, -0.0007181082619354129, -0.0006967208464629948, -0.0006753333727829158, -0.0006539459573104978, -0.0006325584836304188, -0.0006111710681580007, -0.0005897835944779217, -0.0005683961207978427, -0.0005470087053254247, -0.0005256212316453457, -0.0005042337579652667, -0.0004828462842851877, -0.0004614588397089392, -0.0004400713660288602, -0.0004186839214526117, -0.0003972964477725327, -0.0003759090031962842, -0.00035452155862003565, -0.00033313408493995667, -0.00031174664036370814, -0.0002903591957874596, -0.00026897172210738063, -0.0002475842775311321, -0.00022619681840296835, -0.0002048093592748046, -0.00018342191469855607, -0.0001620344555703923, -0.00014064693823456764, -0.00011925947910640389, -9.787202725419775e-05, -7.64845754019916e-05, -5.509711627382785e-05, -3.3709657145664096e-05, -1.232221256941557e-05, 9.065246558748186e-06, 3.045270568691194e-05, 5.184016117709689e-05, 7.322761666728184e-05, 9.461506851948798e-05, 0.00011600252764765173, 0.0001373899867758155, 0.000158777431352064, 0.00018016489048022777, 0.00020155234960839152, 0.00022293980873655528, 0.00024432726786471903, 0.00026571471244096756, 0.00028710218612104654, 0.00030848963069729507, 0.0003298770752735436, 0.0003512645489536226, 0.0003726519935298711, 0.00039403943810611963, 0.0004154269117861986, 0.00043681435636244714, 0.00045820180093869567, 0.00047958927461877465, 0.0005009766900911927, 0.0005223641637712717, 0.0005437516374513507]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 2.0, 7.0, 6.0, 5.0, 12.0, 16.0, 17.0, 20.0, 22.0, 27.0, 23.0, 25.0, 33.0, 24.0, 37.0, 27.0, 38.0, 45.0, 35.0, 42.0, 39.0, 45.0, 44.0, 37.0, 34.0, 39.0, 34.0, 31.0, 30.0, 31.0, 15.0, 23.0, 27.0, 20.0, 15.0, 16.0, 9.0, 11.0, 5.0, 7.0, 7.0, 4.0, 2.0, 6.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002123525191564113, -0.00020520288671832532, -0.00019805325428023934, -0.00019090362184215337, -0.0001837539894040674, -0.00017660435696598142, -0.00016945472452789545, -0.00016230509208980948, -0.0001551554596517235, -0.00014800582721363753, -0.00014085619477555156, -0.00013370656233746558, -0.0001265569298993796, -0.00011940729746129364, -0.00011225766502320766, -0.00010510803258512169, -9.795840014703572e-05, -9.080876770894974e-05, -8.365913527086377e-05, -7.65095028327778e-05, -6.935987039469182e-05, -6.221023795660585e-05, -5.506060551851988e-05, -4.7910973080433905e-05, -4.076134064234793e-05, -3.361170820426196e-05, -2.6462075766175985e-05, -1.9312443328090012e-05, -1.2162810890004039e-05, -5.0131784519180655e-06, 2.1364539861679077e-06, 9.286086424253881e-06, 1.6435718862339854e-05, 2.3585351300425828e-05, 3.07349837385118e-05, 3.7884616176597774e-05, 4.503424861468375e-05, 5.218388105276972e-05, 5.9333513490855694e-05, 6.648314592894167e-05, 7.363277836702764e-05, 8.078241080511361e-05, 8.793204324319959e-05, 9.508167568128556e-05, 0.00010223130811937153, 0.0001093809405574575, 0.00011653057299554348, 0.00012368020543362945, 0.00013082983787171543, 0.0001379794703098014, 0.00014512910274788737, 0.00015227873518597335, 0.00015942836762405932, 0.0001665780000621453, 0.00017372763250023127, 0.00018087726493831724, 0.0001880268973764032, 0.00019517652981448919, 0.00020232616225257516, 0.00020947579469066113, 0.0002166254271287471, 0.00022377505956683308, 0.00023092469200491905, 0.00023807432444300503, 0.000245223956881091]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 9.0, 8.0, 10.0, 17.0, 26.0, 34.0, 41.0, 71.0, 99.0, 166.0, 219.0, 320.0, 435.0, 699.0, 1074.0, 1479.0, 2342.0, 3661.0, 5811.0, 9211.0, 14793.0, 24586.0, 41549.0, 72857.0, 137408.0, 263402.0, 213648.0, 107785.0, 58001.0, 34191.0, 20537.0, 12442.0, 7590.0, 4854.0, 3125.0, 2011.0, 1354.0, 833.0, 598.0, 410.0, 252.0, 165.0, 114.0, 108.0, 68.0, 50.0, 25.0, 19.0, 21.0, 12.0, 6.0, 3.0, 9.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0005478858947753906, -0.0005311891436576843, -0.000514492392539978, -0.0004977956414222717, -0.00048109889030456543, -0.00046440213918685913, -0.00044770538806915283, -0.00043100863695144653, -0.00041431188583374023, -0.00039761513471603394, -0.00038091838359832764, -0.00036422163248062134, -0.00034752488136291504, -0.00033082813024520874, -0.00031413137912750244, -0.00029743462800979614, -0.00028073787689208984, -0.00026404112577438354, -0.00024734437465667725, -0.00023064762353897095, -0.00021395087242126465, -0.00019725412130355835, -0.00018055737018585205, -0.00016386061906814575, -0.00014716386795043945, -0.00013046711683273315, -0.00011377036571502686, -9.707361459732056e-05, -8.037686347961426e-05, -6.368011236190796e-05, -4.698336124420166e-05, -3.028661012649536e-05, -1.3589859008789062e-05, 3.1068921089172363e-06, 1.9803643226623535e-05, 3.6500394344329834e-05, 5.319714546203613e-05, 6.989389657974243e-05, 8.659064769744873e-05, 0.00010328739881515503, 0.00011998414993286133, 0.00013668090105056763, 0.00015337765216827393, 0.00017007440328598022, 0.00018677115440368652, 0.00020346790552139282, 0.00022016465663909912, 0.00023686140775680542, 0.0002535581588745117, 0.000270254909992218, 0.0002869516611099243, 0.0003036484122276306, 0.0003203451633453369, 0.0003370419144630432, 0.0003537386655807495, 0.0003704354166984558, 0.0003871321678161621, 0.0004038289189338684, 0.0004205256700515747, 0.000437222421169281, 0.0004539191722869873, 0.0004706159234046936, 0.0004873126745223999, 0.0005040094256401062, 0.0005207061767578125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 6.0, 9.0, 8.0, 9.0, 12.0, 12.0, 21.0, 16.0, 34.0, 32.0, 30.0, 31.0, 33.0, 39.0, 34.0, 45.0, 53.0, 50.0, 52.0, 50.0, 37.0, 35.0, 42.0, 43.0, 29.0, 41.0, 24.0, 13.0, 30.0, 29.0, 18.0, 15.0, 12.0, 14.0, 9.0, 7.0, 6.0, 6.0, 4.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00020873546600341797, -0.0002020653337240219, -0.00019539520144462585, -0.0001887250691652298, -0.00018205493688583374, -0.00017538480460643768, -0.00016871467232704163, -0.00016204454004764557, -0.0001553744077682495, -0.00014870427548885345, -0.0001420341432094574, -0.00013536401093006134, -0.00012869387865066528, -0.00012202374637126923, -0.00011535361409187317, -0.00010868348181247711, -0.00010201334953308105, -9.5343217253685e-05, -8.867308497428894e-05, -8.200295269489288e-05, -7.533282041549683e-05, -6.866268813610077e-05, -6.199255585670471e-05, -5.5322423577308655e-05, -4.86522912979126e-05, -4.198215901851654e-05, -3.5312026739120483e-05, -2.8641894459724426e-05, -2.197176218032837e-05, -1.5301629900932312e-05, -8.631497621536255e-06, -1.9613653421401978e-06, 4.708766937255859e-06, 1.1378899216651917e-05, 1.8049031496047974e-05, 2.471916377544403e-05, 3.138929605484009e-05, 3.8059428334236145e-05, 4.47295606136322e-05, 5.139969289302826e-05, 5.8069825172424316e-05, 6.473995745182037e-05, 7.141008973121643e-05, 7.808022201061249e-05, 8.475035429000854e-05, 9.14204865694046e-05, 9.809061884880066e-05, 0.00010476075112819672, 0.00011143088340759277, 0.00011810101568698883, 0.0001247711479663849, 0.00013144128024578094, 0.000138111412525177, 0.00014478154480457306, 0.00015145167708396912, 0.00015812180936336517, 0.00016479194164276123, 0.0001714620739221573, 0.00017813220620155334, 0.0001848023384809494, 0.00019147247076034546, 0.00019814260303974152, 0.00020481273531913757, 0.00021148286759853363, 0.0002181529998779297]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 9.0, 11.0, 12.0, 27.0, 32.0, 47.0, 57.0, 84.0, 156.0, 223.0, 390.0, 620.0, 1104.0, 2065.0, 3985.0, 8385.0, 17323.0, 39789.0, 103982.0, 320190.0, 352014.0, 117207.0, 43396.0, 18966.0, 8956.0, 4396.0, 2189.0, 1212.0, 629.0, 349.0, 262.0, 164.0, 88.0, 75.0, 47.0, 35.0, 34.0, 13.0, 10.0, 5.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0007834434509277344, -0.0007573738694190979, -0.0007313042879104614, -0.000705234706401825, -0.0006791651248931885, -0.000653095543384552, -0.0006270259618759155, -0.000600956380367279, -0.0005748867988586426, -0.0005488172173500061, -0.0005227476358413696, -0.0004966780543327332, -0.0004706084728240967, -0.0004445388913154602, -0.00041846930980682373, -0.00039239972829818726, -0.0003663301467895508, -0.0003402605652809143, -0.00031419098377227783, -0.00028812140226364136, -0.0002620518207550049, -0.0002359822392463684, -0.00020991265773773193, -0.00018384307622909546, -0.00015777349472045898, -0.0001317039132118225, -0.00010563433170318604, -7.956475019454956e-05, -5.3495168685913086e-05, -2.742558717727661e-05, -1.3560056686401367e-06, 2.4713575839996338e-05, 5.078315734863281e-05, 7.685273885726929e-05, 0.00010292232036590576, 0.00012899190187454224, 0.0001550614833831787, 0.00018113106489181519, 0.00020720064640045166, 0.00023327022790908813, 0.0002593398094177246, 0.0002854093909263611, 0.00031147897243499756, 0.00033754855394363403, 0.0003636181354522705, 0.000389687716960907, 0.00041575729846954346, 0.00044182687997817993, 0.0004678964614868164, 0.0004939660429954529, 0.0005200356245040894, 0.0005461052060127258, 0.0005721747875213623, 0.0005982443690299988, 0.0006243139505386353, 0.0006503835320472717, 0.0006764531135559082, 0.0007025226950645447, 0.0007285922765731812, 0.0007546618580818176, 0.0007807314395904541, 0.0008068010210990906, 0.000832870602607727, 0.0008589401841163635, 0.000885009765625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 8.0, 5.0, 5.0, 10.0, 11.0, 15.0, 24.0, 24.0, 18.0, 20.0, 33.0, 37.0, 46.0, 53.0, 50.0, 66.0, 39.0, 54.0, 43.0, 46.0, 46.0, 48.0, 47.0, 34.0, 35.0, 42.0, 24.0, 27.0, 18.0, 28.0, 10.0, 7.0, 9.0, 7.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0002193450927734375, -0.00021308660507202148, -0.00020682811737060547, -0.00020056962966918945, -0.00019431114196777344, -0.00018805265426635742, -0.0001817941665649414, -0.0001755356788635254, -0.00016927719116210938, -0.00016301870346069336, -0.00015676021575927734, -0.00015050172805786133, -0.0001442432403564453, -0.0001379847526550293, -0.00013172626495361328, -0.00012546777725219727, -0.00011920928955078125, -0.00011295080184936523, -0.00010669231414794922, -0.0001004338264465332, -9.417533874511719e-05, -8.791685104370117e-05, -8.165836334228516e-05, -7.539987564086914e-05, -6.914138793945312e-05, -6.288290023803711e-05, -5.6624412536621094e-05, -5.036592483520508e-05, -4.410743713378906e-05, -3.784894943237305e-05, -3.159046173095703e-05, -2.5331974029541016e-05, -1.9073486328125e-05, -1.2814998626708984e-05, -6.556510925292969e-06, -2.980232238769531e-07, 5.9604644775390625e-06, 1.2218952178955078e-05, 1.8477439880371094e-05, 2.473592758178711e-05, 3.0994415283203125e-05, 3.725290298461914e-05, 4.3511390686035156e-05, 4.976987838745117e-05, 5.602836608886719e-05, 6.22868537902832e-05, 6.854534149169922e-05, 7.480382919311523e-05, 8.106231689453125e-05, 8.732080459594727e-05, 9.357929229736328e-05, 9.98377799987793e-05, 0.00010609626770019531, 0.00011235475540161133, 0.00011861324310302734, 0.00012487173080444336, 0.00013113021850585938, 0.0001373887062072754, 0.0001436471939086914, 0.00014990568161010742, 0.00015616416931152344, 0.00016242265701293945, 0.00016868114471435547, 0.00017493963241577148, 0.0001811981201171875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 13.0, 11.0, 15.0, 22.0, 37.0, 53.0, 84.0, 149.0, 252.0, 393.0, 741.0, 1290.0, 3130.0, 6610.0, 18259.0, 75077.0, 628652.0, 254525.0, 38445.0, 11586.0, 4560.0, 2016.0, 1084.0, 616.0, 332.0, 240.0, 118.0, 84.0, 54.0, 29.0, 29.0, 12.0, 11.0, 5.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2576580047607422e-05, -1.215469092130661e-05, -1.1732801795005798e-05, -1.1310912668704987e-05, -1.0889023542404175e-05, -1.0467134416103363e-05, -1.0045245289802551e-05, -9.62335616350174e-06, -9.201467037200928e-06, -8.779577910900116e-06, -8.357688784599304e-06, -7.935799658298492e-06, -7.513910531997681e-06, -7.092021405696869e-06, -6.670132279396057e-06, -6.248243153095245e-06, -5.826354026794434e-06, -5.404464900493622e-06, -4.98257577419281e-06, -4.560686647891998e-06, -4.1387975215911865e-06, -3.7169083952903748e-06, -3.295019268989563e-06, -2.8731301426887512e-06, -2.4512410163879395e-06, -2.0293518900871277e-06, -1.607462763786316e-06, -1.1855736374855042e-06, -7.636845111846924e-07, -3.417953848838806e-07, 8.009374141693115e-08, 5.019828677177429e-07, 9.238719940185547e-07, 1.3457611203193665e-06, 1.7676502466201782e-06, 2.18953937292099e-06, 2.6114284992218018e-06, 3.0333176255226135e-06, 3.4552067518234253e-06, 3.877095878124237e-06, 4.298985004425049e-06, 4.720874130725861e-06, 5.142763257026672e-06, 5.564652383327484e-06, 5.986541509628296e-06, 6.408430635929108e-06, 6.8303197622299194e-06, 7.252208888530731e-06, 7.674098014831543e-06, 8.095987141132355e-06, 8.517876267433167e-06, 8.939765393733978e-06, 9.36165452003479e-06, 9.783543646335602e-06, 1.0205432772636414e-05, 1.0627321898937225e-05, 1.1049211025238037e-05, 1.1471100151538849e-05, 1.189298927783966e-05, 1.2314878404140472e-05, 1.2736767530441284e-05, 1.3158656656742096e-05, 1.3580545783042908e-05, 1.400243490934372e-05, 1.4424324035644531e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 7.0, 9.0, 14.0, 15.0, 23.0, 29.0, 27.0, 115.0, 110.0, 118.0, 219.0, 82.0, 72.0, 61.0, 16.0, 28.0, 11.0, 6.0, 13.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.682209014892578e-06, -2.6011839509010315e-06, -2.520158886909485e-06, -2.4391338229179382e-06, -2.3581087589263916e-06, -2.277083694934845e-06, -2.1960586309432983e-06, -2.1150335669517517e-06, -2.034008502960205e-06, -1.9529834389686584e-06, -1.8719583749771118e-06, -1.7909333109855652e-06, -1.7099082469940186e-06, -1.628883183002472e-06, -1.5478581190109253e-06, -1.4668330550193787e-06, -1.385807991027832e-06, -1.3047829270362854e-06, -1.2237578630447388e-06, -1.1427327990531921e-06, -1.0617077350616455e-06, -9.806826710700989e-07, -8.996576070785522e-07, -8.186325430870056e-07, -7.37607479095459e-07, -6.565824151039124e-07, -5.755573511123657e-07, -4.945322871208191e-07, -4.1350722312927246e-07, -3.3248215913772583e-07, -2.514570951461792e-07, -1.7043203115463257e-07, -8.940696716308594e-08, -8.381903171539307e-09, 7.264316082000732e-08, 1.5366822481155396e-07, 2.3469328880310059e-07, 3.157183527946472e-07, 3.9674341678619385e-07, 4.777684807777405e-07, 5.587935447692871e-07, 6.398186087608337e-07, 7.208436727523804e-07, 8.01868736743927e-07, 8.828938007354736e-07, 9.639188647270203e-07, 1.044943928718567e-06, 1.1259689927101135e-06, 1.2069940567016602e-06, 1.2880191206932068e-06, 1.3690441846847534e-06, 1.4500692486763e-06, 1.5310943126678467e-06, 1.6121193766593933e-06, 1.69314444065094e-06, 1.7741695046424866e-06, 1.8551945686340332e-06, 1.93621963262558e-06, 2.0172446966171265e-06, 2.098269760608673e-06, 2.1792948246002197e-06, 2.2603198885917664e-06, 2.341344952583313e-06, 2.4223700165748596e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 6.0, 8.0, 6.0, 10.0, 9.0, 15.0, 37.0, 43.0, 57.0, 92.0, 158.0, 289.0, 399.0, 654.0, 1128.0, 2164.0, 5655.0, 13066.0, 46001.0, 359645.0, 549040.0, 46337.0, 12996.0, 5064.0, 2441.0, 1480.0, 617.0, 419.0, 231.0, 204.0, 97.0, 55.0, 41.0, 28.0, 19.0, 9.0, 9.0, 8.0, 8.0, 4.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.33514404296875e-05, -1.298077404499054e-05, -1.2610107660293579e-05, -1.2239441275596619e-05, -1.1868774890899658e-05, -1.1498108506202698e-05, -1.1127442121505737e-05, -1.0756775736808777e-05, -1.0386109352111816e-05, -1.0015442967414856e-05, -9.644776582717896e-06, -9.274110198020935e-06, -8.903443813323975e-06, -8.532777428627014e-06, -8.162111043930054e-06, -7.791444659233093e-06, -7.420778274536133e-06, -7.050111889839172e-06, -6.679445505142212e-06, -6.3087791204452515e-06, -5.938112735748291e-06, -5.5674463510513306e-06, -5.19677996635437e-06, -4.82611358165741e-06, -4.455447196960449e-06, -4.084780812263489e-06, -3.7141144275665283e-06, -3.343448042869568e-06, -2.9727816581726074e-06, -2.602115273475647e-06, -2.2314488887786865e-06, -1.860782504081726e-06, -1.4901161193847656e-06, -1.1194497346878052e-06, -7.487833499908447e-07, -3.781169652938843e-07, -7.450580596923828e-09, 3.632158041000366e-07, 7.338821887969971e-07, 1.1045485734939575e-06, 1.475214958190918e-06, 1.8458813428878784e-06, 2.216547727584839e-06, 2.5872141122817993e-06, 2.9578804969787598e-06, 3.3285468816757202e-06, 3.6992132663726807e-06, 4.069879651069641e-06, 4.4405460357666016e-06, 4.811212420463562e-06, 5.1818788051605225e-06, 5.552545189857483e-06, 5.923211574554443e-06, 6.293877959251404e-06, 6.664544343948364e-06, 7.035210728645325e-06, 7.405877113342285e-06, 7.776543498039246e-06, 8.147209882736206e-06, 8.517876267433167e-06, 8.888542652130127e-06, 9.259209036827087e-06, 9.629875421524048e-06, 1.0000541806221008e-05, 1.0371208190917969e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 9.0, 5.0, 12.0, 11.0, 7.0, 31.0, 26.0, 72.0, 53.0, 66.0, 173.0, 86.0, 148.0, 64.0, 62.0, 66.0, 16.0, 32.0, 11.0, 11.0, 7.0, 7.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-06, -2.300366759300232e-06, -2.216547727584839e-06, -2.132728695869446e-06, -2.0489096641540527e-06, -1.9650906324386597e-06, -1.8812716007232666e-06, -1.7974525690078735e-06, -1.7136335372924805e-06, -1.6298145055770874e-06, -1.5459954738616943e-06, -1.4621764421463013e-06, -1.3783574104309082e-06, -1.2945383787155151e-06, -1.210719347000122e-06, -1.126900315284729e-06, -1.043081283569336e-06, -9.592622518539429e-07, -8.754432201385498e-07, -7.916241884231567e-07, -7.078051567077637e-07, -6.239861249923706e-07, -5.401670932769775e-07, -4.5634806156158447e-07, -3.725290298461914e-07, -2.8870999813079834e-07, -2.0489096641540527e-07, -1.210719347000122e-07, -3.725290298461914e-08, 4.6566128730773926e-08, 1.30385160446167e-07, 2.1420419216156006e-07, 2.980232238769531e-07, 3.818422555923462e-07, 4.6566128730773926e-07, 5.494803190231323e-07, 6.332993507385254e-07, 7.171183824539185e-07, 8.009374141693115e-07, 8.847564458847046e-07, 9.685754776000977e-07, 1.0523945093154907e-06, 1.1362135410308838e-06, 1.2200325727462769e-06, 1.30385160446167e-06, 1.387670636177063e-06, 1.471489667892456e-06, 1.5553086996078491e-06, 1.6391277313232422e-06, 1.7229467630386353e-06, 1.8067657947540283e-06, 1.8905848264694214e-06, 1.9744038581848145e-06, 2.0582228899002075e-06, 2.1420419216156006e-06, 2.2258609533309937e-06, 2.3096799850463867e-06, 2.3934990167617798e-06, 2.477318048477173e-06, 2.561137080192566e-06, 2.644956111907959e-06, 2.728775143623352e-06, 2.812594175338745e-06, 2.896413207054138e-06, 2.9802322387695312e-06]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 9.0, 9.0, 22.0, 30.0, 38.0, 59.0, 121.0, 211.0, 188.0, 117.0, 79.0, 47.0, 28.0, 15.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000603570428211242, -0.000587223912589252, -0.0005708773387596011, -0.0005545308231376112, -0.0005381842493079603, -0.0005218377336859703, -0.0005054911598563194, -0.0004891446442343295, -0.00047279809950850904, -0.0004564515547826886, -0.0004401050100568682, -0.0004237584653310478, -0.0004074119497090578, -0.00039106537587940693, -0.00037471886025741696, -0.00035837231553159654, -0.0003420257708057761, -0.0003256792260799557, -0.0003093326813541353, -0.00029298613662831485, -0.00027663959190249443, -0.00026029307628050447, -0.00024394653155468404, -0.00022759998682886362, -0.0002112534421030432, -0.00019490689737722278, -0.00017856035265140235, -0.00016221382247749716, -0.00014586727775167674, -0.00012952073302585632, -0.00011317419557599351, -9.68276581261307e-05, -8.048111340031028e-05, -6.413456867448986e-05, -4.778803122462705e-05, -3.144149013678543e-05, -1.5094949048943818e-05, 1.2515956768766046e-06, 1.7598133126739413e-05, 3.394467057660222e-05, 5.029121530242264e-05, 6.663776002824306e-05, 8.298429747810587e-05, 9.933083492796868e-05, 0.0001156773796537891, 0.00013202392437960953, 0.00014837045455351472, 0.00016471699927933514, 0.00018106354400515556, 0.00019741008873097599, 0.0002137566334567964, 0.0002301031636307016, 0.00024644972290843725, 0.0002627962385304272, 0.00027914278325624764, 0.00029548932798206806, 0.0003118358727078885, 0.0003281824174337089, 0.00034452896215952933, 0.00036087550688534975, 0.0003772220225073397, 0.0003935685963369906, 0.00040991511195898056, 0.000426261656684801, 0.0004426082014106214]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 6.0, 5.0, 2.0, 9.0, 9.0, 15.0, 14.0, 14.0, 15.0, 16.0, 17.0, 24.0, 26.0, 37.0, 47.0, 36.0, 39.0, 29.0, 41.0, 42.0, 40.0, 40.0, 39.0, 36.0, 27.0, 45.0, 36.0, 34.0, 31.0, 31.0, 23.0, 32.0, 11.0, 26.0, 14.0, 18.0, 11.0, 17.0, 9.0, 2.0, 9.0, 4.0, 3.0, 5.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00017329395632259548, -0.0001675445819273591, -0.00016179522208403796, -0.0001560458476888016, -0.00015029648784548044, -0.00014454711345024407, -0.0001387977390550077, -0.00013304836465977132, -0.00012729900481645018, -0.00012154963769717142, -0.00011580027057789266, -0.00011005089618265629, -0.00010430152906337753, -9.855216194409877e-05, -9.28027875488624e-05, -8.705342042958364e-05, -8.130405331030488e-05, -7.555468619102612e-05, -6.980531907174736e-05, -6.405594467651099e-05, -5.830657755723223e-05, -5.255721043795347e-05, -4.6807839680695906e-05, -4.105846892343834e-05, -3.530910180415958e-05, -2.955973286589142e-05, -2.3810363927623257e-05, -1.8060994989355095e-05, -1.2311626051086932e-05, -6.56225711281877e-06, -8.128881745506078e-07, 4.936482582706958e-06, 1.0685849701985717e-05, 1.643521864025388e-05, 2.218458757852204e-05, 2.7933956516790204e-05, 3.3683325455058366e-05, 3.9432692574337125e-05, 4.518206333159469e-05, 5.0931434088852257e-05, 5.6680801208131015e-05, 6.243016832740977e-05, 6.817953544668853e-05, 7.39289098419249e-05, 7.967827696120366e-05, 8.542764408048242e-05, 9.11770184757188e-05, 9.692638559499756e-05, 0.00010267575271427631, 0.00010842511983355507, 0.00011417448695283383, 0.0001199238613480702, 0.00012567322119139135, 0.00013142259558662772, 0.0001371719699818641, 0.00014292134437710047, 0.0001486707042204216, 0.00015442007861565799, 0.00016016943845897913, 0.0001659188128542155, 0.00017166818724945188, 0.00017741754709277302, 0.0001831669214880094, 0.00018891628133133054, 0.0001946656557265669]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 4.0, 13.0, 10.0, 14.0, 20.0, 19.0, 24.0, 23.0, 17.0, 39.0, 40.0, 51.0, 79.0, 83.0, 104.0, 136.0, 169.0, 253.0, 320.0, 408.0, 553.0, 828.0, 1101.0, 1762.0, 5713.0, 67211.0, 3927051.0, 170583.0, 11066.0, 1918.0, 1248.0, 839.0, 602.0, 421.0, 379.0, 222.0, 201.0, 157.0, 128.0, 84.0, 94.0, 80.0, 50.0, 32.0, 23.0, 21.0, 18.0, 18.0, 14.0, 10.0, 8.0, 9.0, 11.0, 4.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003235340118408203, -0.00031224265694618225, -0.0003009513020515442, -0.00028965994715690613, -0.00027836859226226807, -0.00026707723736763, -0.00025578588247299194, -0.0002444945275783539, -0.00023320317268371582, -0.00022191181778907776, -0.0002106204628944397, -0.00019932910799980164, -0.00018803775310516357, -0.0001767463982105255, -0.00016545504331588745, -0.0001541636884212494, -0.00014287233352661133, -0.00013158097863197327, -0.0001202896237373352, -0.00010899826884269714, -9.770691394805908e-05, -8.641555905342102e-05, -7.512420415878296e-05, -6.38328492641449e-05, -5.2541494369506836e-05, -4.1250139474868774e-05, -2.9958784580230713e-05, -1.866742968559265e-05, -7.37607479095459e-06, 3.915280103683472e-06, 1.5206634998321533e-05, 2.6497989892959595e-05, 3.7789344787597656e-05, 4.908069968223572e-05, 6.037205457687378e-05, 7.166340947151184e-05, 8.29547643661499e-05, 9.424611926078796e-05, 0.00010553747415542603, 0.00011682882905006409, 0.00012812018394470215, 0.0001394115388393402, 0.00015070289373397827, 0.00016199424862861633, 0.0001732856035232544, 0.00018457695841789246, 0.00019586831331253052, 0.00020715966820716858, 0.00021845102310180664, 0.0002297423779964447, 0.00024103373289108276, 0.0002523250877857208, 0.0002636164426803589, 0.00027490779757499695, 0.000286199152469635, 0.00029749050736427307, 0.00030878186225891113, 0.0003200732171535492, 0.00033136457204818726, 0.0003426559269428253, 0.0003539472818374634, 0.00036523863673210144, 0.0003765299916267395, 0.00038782134652137756, 0.0003991127014160156]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 0.0, 5.0, 3.0, 4.0, 1.0, 4.0, 2.0, 8.0, 7.0, 15.0, 10.0, 11.0, 7.0, 13.0, 22.0, 30.0, 29.0, 35.0, 36.0, 42.0, 45.0, 37.0, 41.0, 45.0, 39.0, 39.0, 45.0, 39.0, 46.0, 31.0, 39.0, 41.0, 32.0, 31.0, 26.0, 27.0, 17.0, 16.0, 17.0, 18.0, 11.0, 6.0, 11.0, 5.0, 3.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00016629695892333984, -0.0001606512814760208, -0.00015500560402870178, -0.00014935992658138275, -0.00014371424913406372, -0.0001380685716867447, -0.00013242289423942566, -0.00012677721679210663, -0.0001211315393447876, -0.00011548586189746857, -0.00010984018445014954, -0.0001041945070028305, -9.854882955551147e-05, -9.290315210819244e-05, -8.725747466087341e-05, -8.161179721355438e-05, -7.596611976623535e-05, -7.032044231891632e-05, -6.467476487159729e-05, -5.902908742427826e-05, -5.338340997695923e-05, -4.77377325296402e-05, -4.209205508232117e-05, -3.6446377635002136e-05, -3.0800700187683105e-05, -2.5155022740364075e-05, -1.9509345293045044e-05, -1.3863667845726013e-05, -8.217990398406982e-06, -2.5723129510879517e-06, 3.073364496231079e-06, 8.71904194355011e-06, 1.436471939086914e-05, 2.001039683818817e-05, 2.5656074285507202e-05, 3.130175173282623e-05, 3.6947429180145264e-05, 4.2593106627464294e-05, 4.8238784074783325e-05, 5.3884461522102356e-05, 5.953013896942139e-05, 6.517581641674042e-05, 7.082149386405945e-05, 7.646717131137848e-05, 8.211284875869751e-05, 8.775852620601654e-05, 9.340420365333557e-05, 9.90498811006546e-05, 0.00010469555854797363, 0.00011034123599529266, 0.0001159869134426117, 0.00012163259088993073, 0.00012727826833724976, 0.0001329239457845688, 0.00013856962323188782, 0.00014421530067920685, 0.00014986097812652588, 0.0001555066555738449, 0.00016115233302116394, 0.00016679801046848297, 0.000172443687915802, 0.00017808936536312103, 0.00018373504281044006, 0.0001893807202577591, 0.00019502639770507812]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 10.0, 14.0, 24.0, 43.0, 84.0, 138.0, 314.0, 897.0, 3626.0, 960273.0, 3223568.0, 3753.0, 900.0, 311.0, 154.0, 77.0, 42.0, 17.0, 24.0, 10.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019989013671875, -0.001947656273841858, -0.0018964111804962158, -0.0018451660871505737, -0.0017939209938049316, -0.0017426759004592896, -0.0016914308071136475, -0.0016401857137680054, -0.0015889406204223633, -0.0015376955270767212, -0.001486450433731079, -0.001435205340385437, -0.001383960247039795, -0.0013327151536941528, -0.0012814700603485107, -0.0012302249670028687, -0.0011789798736572266, -0.0011277347803115845, -0.0010764896869659424, -0.0010252445936203003, -0.0009739995002746582, -0.0009227544069290161, -0.000871509313583374, -0.0008202642202377319, -0.0007690191268920898, -0.0007177740335464478, -0.0006665289402008057, -0.0006152838468551636, -0.0005640387535095215, -0.0005127936601638794, -0.0004615485668182373, -0.0004103034734725952, -0.0003590583801269531, -0.00030781328678131104, -0.00025656819343566895, -0.00020532310009002686, -0.00015407800674438477, -0.00010283291339874268, -5.1587820053100586e-05, -3.427267074584961e-07, 5.0902366638183594e-05, 0.00010214745998382568, 0.00015339255332946777, 0.00020463764667510986, 0.00025588274002075195, 0.00030712783336639404, 0.00035837292671203613, 0.0004096180200576782, 0.0004608631134033203, 0.0005121082067489624, 0.0005633533000946045, 0.0006145983934402466, 0.0006658434867858887, 0.0007170885801315308, 0.0007683336734771729, 0.0008195787668228149, 0.000870823860168457, 0.0009220689535140991, 0.0009733140468597412, 0.0010245591402053833, 0.0010758042335510254, 0.0011270493268966675, 0.0011782944202423096, 0.0012295395135879517, 0.0012807846069335938]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 31.0, 102.0, 1243.0, 2533.0, 108.0, 20.0, 11.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014412403106689453, -0.00013836286962032318, -0.00013260170817375183, -0.00012684054672718048, -0.00012107938528060913, -0.00011531822383403778, -0.00010955706238746643, -0.00010379590094089508, -9.803473949432373e-05, -9.227357804775238e-05, -8.651241660118103e-05, -8.075125515460968e-05, -7.499009370803833e-05, -6.922893226146698e-05, -6.346777081489563e-05, -5.770660936832428e-05, -5.194544792175293e-05, -4.618428647518158e-05, -4.042312502861023e-05, -3.466196358203888e-05, -2.890080213546753e-05, -2.313964068889618e-05, -1.737847924232483e-05, -1.1617317795753479e-05, -5.856156349182129e-06, -9.499490261077881e-08, 5.666166543960571e-06, 1.1427327990531921e-05, 1.718848943710327e-05, 2.294965088367462e-05, 2.871081233024597e-05, 3.447197377681732e-05, 4.023313522338867e-05, 4.599429666996002e-05, 5.175545811653137e-05, 5.751661956310272e-05, 6.327778100967407e-05, 6.903894245624542e-05, 7.480010390281677e-05, 8.056126534938812e-05, 8.632242679595947e-05, 9.208358824253082e-05, 9.784474968910217e-05, 0.00010360591113567352, 0.00010936707258224487, 0.00011512823402881622, 0.00012088939547538757, 0.00012665055692195892, 0.00013241171836853027, 0.00013817287981510162, 0.00014393404126167297, 0.00014969520270824432, 0.00015545636415481567, 0.00016121752560138702, 0.00016697868704795837, 0.00017273984849452972, 0.00017850100994110107, 0.00018426217138767242, 0.00019002333283424377, 0.00019578449428081512, 0.00020154565572738647, 0.00020730681717395782, 0.00021306797862052917, 0.00021882914006710052, 0.00022459030151367188]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 7.0, 7.0, 9.0, 18.0, 31.0, 33.0, 50.0, 83.0, 125.0, 191.0, 138.0, 94.0, 55.0, 49.0, 32.0, 20.0, 14.0, 9.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0004160069511272013, -0.0004049281124025583, -0.00039384927367791533, -0.0003827704058494419, -0.0003716915671247989, -0.0003606127284001559, -0.0003495338896755129, -0.00033845502184703946, -0.00032737618312239647, -0.0003162973443977535, -0.0003052185056731105, -0.00029413963784463704, -0.00028306079911999404, -0.00027198196039535105, -0.00026090312167070806, -0.0002498242538422346, -0.00023874542966950685, -0.00022766659094486386, -0.00021658773766830564, -0.00020550889894366264, -0.00019443004566710442, -0.00018335120694246143, -0.0001722723536659032, -0.00016119351494126022, -0.00015011467621661723, -0.00013903583749197423, -0.00012795698421541601, -0.00011687814549077302, -0.0001057992922142148, -9.472045348957181e-05, -8.36416074889712e-05, -7.25627614883706e-05, -6.148390821181238e-05, -5.040506221121177e-05, -3.9326216210611165e-05, -2.8247373847989365e-05, -1.716852784738876e-05, -6.089681846788153e-06, 4.989160515833646e-06, 1.6068006516434252e-05, 2.714685251703486e-05, 3.8225698517635465e-05, 4.930454451823607e-05, 6.038338688085787e-05, 7.146222924347967e-05, 8.254108252003789e-05, 9.361992124468088e-05, 0.00010469876724528149, 0.0001157776132458821, 0.00012685645197052509, 0.0001379353052470833, 0.0001490141439717263, 0.00016009299724828452, 0.0001711718359729275, 0.00018225068924948573, 0.00019332952797412872, 0.00020440836669877172, 0.0002154872054234147, 0.00022656605869997293, 0.00023764489742461592, 0.00024872375070117414, 0.00025980258942581713, 0.0002708814281504601, 0.00028196029597893357, 0.00029303913470357656]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 3.0, 4.0, 11.0, 7.0, 12.0, 7.0, 15.0, 16.0, 25.0, 23.0, 20.0, 41.0, 33.0, 23.0, 33.0, 43.0, 38.0, 46.0, 55.0, 47.0, 25.0, 50.0, 57.0, 53.0, 37.0, 22.0, 39.0, 29.0, 32.0, 25.0, 22.0, 19.0, 19.0, 16.0, 8.0, 6.0, 10.0, 5.0, 3.0, 5.0, 3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00018155160068999976, -0.000176026311237365, -0.00017050102178473026, -0.0001649757323320955, -0.00015945045743137598, -0.00015392516797874123, -0.00014839987852610648, -0.00014287458907347172, -0.00013734929962083697, -0.00013182401016820222, -0.00012629872071556747, -0.00012077343853889033, -0.00011524814908625558, -0.00010972286690957844, -0.00010419757745694369, -9.867228800430894e-05, -9.31470058276318e-05, -8.762171637499705e-05, -8.209643419831991e-05, -7.657114474568516e-05, -7.104585529305041e-05, -6.552056584041566e-05, -5.999528366373852e-05, -5.446999421110377e-05, -4.894470839644782e-05, -4.341942258179188e-05, -3.7894133129157126e-05, -3.236884731450118e-05, -2.6843559680855833e-05, -2.1318272047210485e-05, -1.579298623255454e-05, -1.0267696779919788e-05, -4.7424109652638435e-06, 7.828762136341538e-07, 6.308163392532151e-06, 1.1833450116682798e-05, 1.7358737750328146e-05, 2.2884025383973494e-05, 2.840931119862944e-05, 3.393460065126419e-05, 3.9459886465920135e-05, 4.498517228057608e-05, 5.051046173321083e-05, 5.6035747547866777e-05, 6.156103336252272e-05, 6.708632281515747e-05, 7.261161226779222e-05, 7.813690172042698e-05, 8.366218389710411e-05, 8.918747334973887e-05, 9.4712755526416e-05, 0.00010023804497905076, 0.00010576333443168551, 0.00011128862388432026, 0.0001168139060609974, 0.00012233920278958976, 0.00012786447769030929, 0.00013338976714294404, 0.0001389150565955788, 0.0001444403314962983, 0.00014996562094893306, 0.00015549091040156782, 0.00016101619985420257, 0.00016654148930683732, 0.00017206677875947207]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 4.0, 5.0, 13.0, 15.0, 21.0, 40.0, 51.0, 93.0, 134.0, 202.0, 340.0, 567.0, 1043.0, 1719.0, 3427.0, 6730.0, 15007.0, 36263.0, 103467.0, 340742.0, 360535.0, 109064.0, 38588.0, 15421.0, 7183.0, 3466.0, 1886.0, 957.0, 594.0, 334.0, 249.0, 128.0, 108.0, 35.0, 37.0, 20.0, 17.0, 8.0, 15.0, 4.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024020671844482422, -0.00023220665752887726, -0.0002242065966129303, -0.00021620653569698334, -0.00020820647478103638, -0.00020020641386508942, -0.00019220635294914246, -0.0001842062920331955, -0.00017620623111724854, -0.00016820617020130157, -0.00016020610928535461, -0.00015220604836940765, -0.0001442059874534607, -0.00013620592653751373, -0.00012820586562156677, -0.00012020580470561981, -0.00011220574378967285, -0.00010420568287372589, -9.620562195777893e-05, -8.820556104183197e-05, -8.020550012588501e-05, -7.220543920993805e-05, -6.420537829399109e-05, -5.620531737804413e-05, -4.820525646209717e-05, -4.020519554615021e-05, -3.220513463020325e-05, -2.4205073714256287e-05, -1.6205012798309326e-05, -8.204951882362366e-06, -2.0489096641540527e-07, 7.795169949531555e-06, 1.5795230865478516e-05, 2.3795291781425476e-05, 3.1795352697372437e-05, 3.97954136133194e-05, 4.779547452926636e-05, 5.579553544521332e-05, 6.379559636116028e-05, 7.179565727710724e-05, 7.97957181930542e-05, 8.779577910900116e-05, 9.579584002494812e-05, 0.00010379590094089508, 0.00011179596185684204, 0.000119796022772789, 0.00012779608368873596, 0.00013579614460468292, 0.00014379620552062988, 0.00015179626643657684, 0.0001597963273525238, 0.00016779638826847076, 0.00017579644918441772, 0.00018379651010036469, 0.00019179657101631165, 0.0001997966319322586, 0.00020779669284820557, 0.00021579675376415253, 0.0002237968146800995, 0.00023179687559604645, 0.0002397969365119934, 0.00024779699742794037, 0.00025579705834388733, 0.0002637971192598343, 0.00027179718017578125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0, 8.0, 3.0, 5.0, 8.0, 9.0, 7.0, 13.0, 15.0, 24.0, 20.0, 29.0, 22.0, 31.0, 37.0, 34.0, 40.0, 42.0, 35.0, 39.0, 56.0, 42.0, 47.0, 63.0, 51.0, 52.0, 37.0, 33.0, 24.0, 30.0, 34.0, 19.0, 15.0, 14.0, 13.0, 9.0, 5.0, 8.0, 9.0, 0.0, 6.0, 4.0, 4.0, 3.0, 0.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001862049102783203, -0.0001804400235414505, -0.0001746751368045807, -0.00016891025006771088, -0.00016314536333084106, -0.00015738047659397125, -0.00015161558985710144, -0.00014585070312023163, -0.00014008581638336182, -0.000134320929646492, -0.0001285560429096222, -0.00012279115617275238, -0.00011702626943588257, -0.00011126138269901276, -0.00010549649596214294, -9.973160922527313e-05, -9.396672248840332e-05, -8.820183575153351e-05, -8.24369490146637e-05, -7.667206227779388e-05, -7.090717554092407e-05, -6.514228880405426e-05, -5.937740206718445e-05, -5.3612515330314636e-05, -4.7847628593444824e-05, -4.208274185657501e-05, -3.63178551197052e-05, -3.055296838283539e-05, -2.4788081645965576e-05, -1.9023194909095764e-05, -1.3258308172225952e-05, -7.49342143535614e-06, -1.7285346984863281e-06, 4.036352038383484e-06, 9.801238775253296e-06, 1.5566125512123108e-05, 2.133101224899292e-05, 2.7095898985862732e-05, 3.2860785722732544e-05, 3.8625672459602356e-05, 4.439055919647217e-05, 5.015544593334198e-05, 5.592033267021179e-05, 6.16852194070816e-05, 6.745010614395142e-05, 7.321499288082123e-05, 7.897987961769104e-05, 8.474476635456085e-05, 9.050965309143066e-05, 9.627453982830048e-05, 0.00010203942656517029, 0.0001078043133020401, 0.00011356920003890991, 0.00011933408677577972, 0.00012509897351264954, 0.00013086386024951935, 0.00013662874698638916, 0.00014239363372325897, 0.00014815852046012878, 0.0001539234071969986, 0.0001596882939338684, 0.00016545318067073822, 0.00017121806740760803, 0.00017698295414447784, 0.00018274784088134766]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 11.0, 16.0, 24.0, 33.0, 35.0, 68.0, 87.0, 154.0, 314.0, 527.0, 1037.0, 1948.0, 4394.0, 11381.0, 39571.0, 283537.0, 620381.0, 59024.0, 15298.0, 5599.0, 2442.0, 1216.0, 594.0, 338.0, 167.0, 110.0, 69.0, 45.0, 38.0, 22.0, 12.0, 15.0, 11.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004150867462158203, -0.0004021674394607544, -0.0003892481327056885, -0.00037632882595062256, -0.00036340951919555664, -0.0003504902124404907, -0.0003375709056854248, -0.0003246515989303589, -0.00031173229217529297, -0.00029881298542022705, -0.00028589367866516113, -0.0002729743719100952, -0.0002600550651550293, -0.0002471357583999634, -0.00023421645164489746, -0.00022129714488983154, -0.00020837783813476562, -0.0001954585313796997, -0.0001825392246246338, -0.00016961991786956787, -0.00015670061111450195, -0.00014378130435943604, -0.00013086199760437012, -0.0001179426908493042, -0.00010502338409423828, -9.210407733917236e-05, -7.918477058410645e-05, -6.626546382904053e-05, -5.334615707397461e-05, -4.042685031890869e-05, -2.7507543563842773e-05, -1.4588236808776855e-05, -1.6689300537109375e-06, 1.125037670135498e-05, 2.41696834564209e-05, 3.7088990211486816e-05, 5.0008296966552734e-05, 6.292760372161865e-05, 7.584691047668457e-05, 8.876621723175049e-05, 0.0001016855239868164, 0.00011460483074188232, 0.00012752413749694824, 0.00014044344425201416, 0.00015336275100708008, 0.000166282057762146, 0.00017920136451721191, 0.00019212067127227783, 0.00020503997802734375, 0.00021795928478240967, 0.00023087859153747559, 0.0002437978982925415, 0.0002567172050476074, 0.00026963651180267334, 0.00028255581855773926, 0.0002954751253128052, 0.0003083944320678711, 0.000321313738822937, 0.00033423304557800293, 0.00034715235233306885, 0.00036007165908813477, 0.0003729909658432007, 0.0003859102725982666, 0.0003988295793533325, 0.00041174888610839844]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 8.0, 7.0, 6.0, 12.0, 7.0, 13.0, 12.0, 14.0, 26.0, 19.0, 24.0, 32.0, 35.0, 41.0, 45.0, 39.0, 53.0, 48.0, 36.0, 45.0, 59.0, 56.0, 36.0, 34.0, 35.0, 32.0, 54.0, 27.0, 22.0, 17.0, 13.0, 20.0, 13.0, 8.0, 8.0, 8.0, 14.0, 7.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00011628866195678711, -0.00011256430298089981, -0.00010883994400501251, -0.00010511558502912521, -0.00010139122605323792, -9.766686707735062e-05, -9.394250810146332e-05, -9.021814912557602e-05, -8.649379014968872e-05, -8.276943117380142e-05, -7.904507219791412e-05, -7.532071322202682e-05, -7.159635424613953e-05, -6.787199527025223e-05, -6.414763629436493e-05, -6.042327731847763e-05, -5.669891834259033e-05, -5.2974559366703033e-05, -4.9250200390815735e-05, -4.5525841414928436e-05, -4.180148243904114e-05, -3.807712346315384e-05, -3.435276448726654e-05, -3.062840551137924e-05, -2.6904046535491943e-05, -2.3179687559604645e-05, -1.9455328583717346e-05, -1.5730969607830048e-05, -1.2006610631942749e-05, -8.28225165605545e-06, -4.557892680168152e-06, -8.335337042808533e-07, 2.8908252716064453e-06, 6.615184247493744e-06, 1.0339543223381042e-05, 1.4063902199268341e-05, 1.778826117515564e-05, 2.1512620151042938e-05, 2.5236979126930237e-05, 2.8961338102817535e-05, 3.2685697078704834e-05, 3.641005605459213e-05, 4.013441503047943e-05, 4.385877400636673e-05, 4.758313298225403e-05, 5.130749195814133e-05, 5.5031850934028625e-05, 5.8756209909915924e-05, 6.248056888580322e-05, 6.620492786169052e-05, 6.992928683757782e-05, 7.365364581346512e-05, 7.737800478935242e-05, 8.110236376523972e-05, 8.482672274112701e-05, 8.855108171701431e-05, 9.227544069290161e-05, 9.599979966878891e-05, 9.972415864467621e-05, 0.00010344851762056351, 0.0001071728765964508, 0.0001108972355723381, 0.0001146215945482254, 0.0001183459535241127, 0.0001220703125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 11.0, 22.0, 29.0, 40.0, 50.0, 79.0, 100.0, 139.0, 273.0, 439.0, 717.0, 1050.0, 1866.0, 3367.0, 6326.0, 13532.0, 39015.0, 529125.0, 387152.0, 37489.0, 13691.0, 6010.0, 3316.0, 1796.0, 1037.0, 652.0, 451.0, 242.0, 175.0, 107.0, 70.0, 60.0, 44.0, 23.0, 12.0, 16.0, 13.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.158517837524414e-05, -6.919726729393005e-05, -6.680935621261597e-05, -6.442144513130188e-05, -6.203353404998779e-05, -5.9645622968673706e-05, -5.725771188735962e-05, -5.486980080604553e-05, -5.2481889724731445e-05, -5.009397864341736e-05, -4.770606756210327e-05, -4.5318156480789185e-05, -4.29302453994751e-05, -4.054233431816101e-05, -3.8154423236846924e-05, -3.576651215553284e-05, -3.337860107421875e-05, -3.099068999290466e-05, -2.8602778911590576e-05, -2.621486783027649e-05, -2.3826956748962402e-05, -2.1439045667648315e-05, -1.905113458633423e-05, -1.666322350502014e-05, -1.4275312423706055e-05, -1.1887401342391968e-05, -9.499490261077881e-06, -7.111579179763794e-06, -4.723668098449707e-06, -2.33575701713562e-06, 5.21540641784668e-08, 2.4400651454925537e-06, 4.827976226806641e-06, 7.2158873081207275e-06, 9.603798389434814e-06, 1.1991709470748901e-05, 1.4379620552062988e-05, 1.6767531633377075e-05, 1.9155442714691162e-05, 2.154335379600525e-05, 2.3931264877319336e-05, 2.6319175958633423e-05, 2.870708703994751e-05, 3.10949981212616e-05, 3.3482909202575684e-05, 3.587082028388977e-05, 3.825873136520386e-05, 4.0646642446517944e-05, 4.303455352783203e-05, 4.542246460914612e-05, 4.7810375690460205e-05, 5.019828677177429e-05, 5.258619785308838e-05, 5.4974108934402466e-05, 5.736202001571655e-05, 5.974993109703064e-05, 6.213784217834473e-05, 6.452575325965881e-05, 6.69136643409729e-05, 6.930157542228699e-05, 7.168948650360107e-05, 7.407739758491516e-05, 7.646530866622925e-05, 7.885321974754333e-05, 8.124113082885742e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 3.0, 8.0, 6.0, 5.0, 8.0, 10.0, 14.0, 15.0, 16.0, 24.0, 30.0, 28.0, 33.0, 52.0, 61.0, 48.0, 93.0, 114.0, 89.0, 46.0, 40.0, 50.0, 40.0, 24.0, 20.0, 18.0, 16.0, 14.0, 13.0, 11.0, 6.0, 10.0, 9.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0], "bins": [-6.973743438720703e-06, -6.749294698238373e-06, -6.5248459577560425e-06, -6.300397217273712e-06, -6.075948476791382e-06, -5.8514997363090515e-06, -5.627050995826721e-06, -5.402602255344391e-06, -5.1781535148620605e-06, -4.95370477437973e-06, -4.7292560338974e-06, -4.50480729341507e-06, -4.280358552932739e-06, -4.055909812450409e-06, -3.831461071968079e-06, -3.6070123314857483e-06, -3.382563591003418e-06, -3.1581148505210876e-06, -2.9336661100387573e-06, -2.709217369556427e-06, -2.4847686290740967e-06, -2.2603198885917664e-06, -2.035871148109436e-06, -1.8114224076271057e-06, -1.5869736671447754e-06, -1.362524926662445e-06, -1.1380761861801147e-06, -9.136274456977844e-07, -6.891787052154541e-07, -4.647299647331238e-07, -2.4028122425079346e-07, -1.5832483768463135e-08, 2.086162567138672e-07, 4.330649971961975e-07, 6.575137376785278e-07, 8.819624781608582e-07, 1.1064112186431885e-06, 1.3308599591255188e-06, 1.5553086996078491e-06, 1.7797574400901794e-06, 2.0042061805725098e-06, 2.22865492105484e-06, 2.4531036615371704e-06, 2.6775524020195007e-06, 2.902001142501831e-06, 3.1264498829841614e-06, 3.3508986234664917e-06, 3.575347363948822e-06, 3.7997961044311523e-06, 4.024244844913483e-06, 4.248693585395813e-06, 4.473142325878143e-06, 4.697591066360474e-06, 4.922039806842804e-06, 5.146488547325134e-06, 5.370937287807465e-06, 5.595386028289795e-06, 5.819834768772125e-06, 6.0442835092544556e-06, 6.268732249736786e-06, 6.493180990219116e-06, 6.7176297307014465e-06, 6.942078471183777e-06, 7.166527211666107e-06, 7.3909759521484375e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 6.0, 3.0, 5.0, 9.0, 14.0, 23.0, 25.0, 36.0, 49.0, 72.0, 120.0, 228.0, 387.0, 631.0, 1278.0, 2771.0, 5888.0, 14408.0, 39658.0, 150934.0, 699840.0, 85660.0, 27246.0, 10373.0, 4359.0, 2165.0, 1050.0, 513.0, 300.0, 176.0, 106.0, 67.0, 34.0, 38.0, 23.0, 12.0, 14.0, 13.0, 8.0, 2.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00010436773300170898, -0.00010132696479558945, -9.828619658946991e-05, -9.524542838335037e-05, -9.220466017723083e-05, -8.91638919711113e-05, -8.612312376499176e-05, -8.308235555887222e-05, -8.004158735275269e-05, -7.700081914663315e-05, -7.396005094051361e-05, -7.091928273439407e-05, -6.787851452827454e-05, -6.4837746322155e-05, -6.179697811603546e-05, -5.8756209909915924e-05, -5.571544170379639e-05, -5.267467349767685e-05, -4.963390529155731e-05, -4.6593137085437775e-05, -4.355236887931824e-05, -4.05116006731987e-05, -3.747083246707916e-05, -3.4430064260959625e-05, -3.138929605484009e-05, -2.834852784872055e-05, -2.5307759642601013e-05, -2.2266991436481476e-05, -1.922622323036194e-05, -1.61854550242424e-05, -1.3144686818122864e-05, -1.0103918612003326e-05, -7.063150405883789e-06, -4.022382199764252e-06, -9.816139936447144e-07, 2.059154212474823e-06, 5.09992241859436e-06, 8.140690624713898e-06, 1.1181458830833435e-05, 1.4222227036952972e-05, 1.726299524307251e-05, 2.0303763449192047e-05, 2.3344531655311584e-05, 2.6385299861431122e-05, 2.942606806755066e-05, 3.2466836273670197e-05, 3.5507604479789734e-05, 3.854837268590927e-05, 4.158914089202881e-05, 4.4629909098148346e-05, 4.767067730426788e-05, 5.071144551038742e-05, 5.375221371650696e-05, 5.6792981922626495e-05, 5.983375012874603e-05, 6.287451833486557e-05, 6.591528654098511e-05, 6.895605474710464e-05, 7.199682295322418e-05, 7.503759115934372e-05, 7.807835936546326e-05, 8.11191275715828e-05, 8.415989577770233e-05, 8.720066398382187e-05, 9.02414321899414e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 3.0, 11.0, 19.0, 17.0, 17.0, 22.0, 16.0, 27.0, 30.0, 28.0, 42.0, 58.0, 128.0, 181.0, 90.0, 48.0, 44.0, 20.0, 24.0, 31.0, 20.0, 21.0, 14.0, 13.0, 16.0, 3.0, 5.0, 5.0, 5.0, 6.0, 7.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.633167266845703e-05, -1.5855766832828522e-05, -1.5379860997200012e-05, -1.4903955161571503e-05, -1.4428049325942993e-05, -1.3952143490314484e-05, -1.3476237654685974e-05, -1.3000331819057465e-05, -1.2524425983428955e-05, -1.2048520147800446e-05, -1.1572614312171936e-05, -1.1096708476543427e-05, -1.0620802640914917e-05, -1.0144896805286407e-05, -9.668990969657898e-06, -9.193085134029388e-06, -8.717179298400879e-06, -8.24127346277237e-06, -7.76536762714386e-06, -7.28946179151535e-06, -6.813555955886841e-06, -6.337650120258331e-06, -5.861744284629822e-06, -5.385838449001312e-06, -4.909932613372803e-06, -4.434026777744293e-06, -3.958120942115784e-06, -3.482215106487274e-06, -3.0063092708587646e-06, -2.530403435230255e-06, -2.0544975996017456e-06, -1.578591763973236e-06, -1.1026859283447266e-06, -6.26780092716217e-07, -1.5087425708770752e-07, 3.25031578540802e-07, 8.009374141693115e-07, 1.276843249797821e-06, 1.7527490854263306e-06, 2.22865492105484e-06, 2.7045607566833496e-06, 3.180466592311859e-06, 3.6563724279403687e-06, 4.132278263568878e-06, 4.608184099197388e-06, 5.084089934825897e-06, 5.559995770454407e-06, 6.035901606082916e-06, 6.511807441711426e-06, 6.987713277339935e-06, 7.463619112968445e-06, 7.939524948596954e-06, 8.415430784225464e-06, 8.891336619853973e-06, 9.367242455482483e-06, 9.843148291110992e-06, 1.0319054126739502e-05, 1.0794959962368011e-05, 1.1270865797996521e-05, 1.174677163362503e-05, 1.222267746925354e-05, 1.269858330488205e-05, 1.3174489140510559e-05, 1.3650394976139069e-05, 1.4126300811767578e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 5.0, 2.0, 7.0, 10.0, 12.0, 18.0, 26.0, 35.0, 43.0, 72.0, 75.0, 163.0, 168.0, 112.0, 65.0, 45.0, 41.0, 39.0, 14.0, 10.0, 10.0, 10.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038569551543332636, -0.0003755490470211953, -0.0003654026077128947, -0.0003552561393007636, -0.000345109699992463, -0.0003349632315803319, -0.0003248167922720313, -0.00031467032385990024, -0.00030452385544776917, -0.0002943773870356381, -0.0002842309477273375, -0.0002740844793152064, -0.0002639380400069058, -0.0002537915715947747, -0.00024364511773455888, -0.00023349866387434304, -0.0002233522100141272, -0.00021320575615391135, -0.0002030593022936955, -0.00019291284843347967, -0.0001827663800213486, -0.00017261992616113275, -0.0001624734723009169, -0.00015232700388878584, -0.00014218056458048522, -0.00013203411072026938, -0.00012188764958409593, -0.00011174119572388008, -0.00010159473458770663, -9.144828072749078e-05, -8.130182686727494e-05, -7.115536573110148e-05, -6.1008904594928026e-05, -5.0862447096733376e-05, -4.0715989598538727e-05, -3.0569535738322884e-05, -2.0423078240128234e-05, -1.0276620741933584e-05, -1.301668817177415e-07, 1.0016294254455715e-05, 2.0162748114671558e-05, 3.0309205612866208e-05, 4.045566311106086e-05, 5.06021169712767e-05, 6.074857446947135e-05, 7.0895031967666e-05, 8.104148582788184e-05, 9.11879469640553e-05, 0.00010133440082427114, 0.00011148085468448699, 0.00012162731582066044, 0.00013177376240491867, 0.00014192023081704974, 0.00015206668467726558, 0.00016221313853748143, 0.0001723596069496125, 0.0001825060462579131, 0.00019265250011812896, 0.0002027989539783448, 0.00021294542239047587, 0.0002230918762506917, 0.00023323833011090755, 0.0002433847839711234, 0.00025353123783133924, 0.0002636777062434703]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 5.0, 4.0, 2.0, 5.0, 13.0, 4.0, 12.0, 15.0, 12.0, 16.0, 27.0, 22.0, 25.0, 41.0, 29.0, 30.0, 32.0, 38.0, 43.0, 36.0, 57.0, 41.0, 44.0, 44.0, 50.0, 52.0, 30.0, 36.0, 29.0, 34.0, 33.0, 16.0, 22.0, 19.0, 22.0, 14.0, 7.0, 10.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0001703154412098229, -0.00016509677516296506, -0.00015987810911610723, -0.0001546594430692494, -0.00014944077702239156, -0.00014422211097553372, -0.0001390034449286759, -0.00013378477888181806, -0.00012856611283496022, -0.0001233474467881024, -0.00011812878074124455, -0.00011291011469438672, -0.00010769144864752889, -0.00010247278260067105, -9.725411655381322e-05, -9.203545050695539e-05, -8.681678446009755e-05, -8.159811841323972e-05, -7.637945236638188e-05, -7.116078631952405e-05, -6.594212027266622e-05, -6.072345422580838e-05, -5.550478817895055e-05, -5.0286122132092714e-05, -4.506745608523488e-05, -3.9848790038377047e-05, -3.463012399151921e-05, -2.941145794466138e-05, -2.4192791897803545e-05, -1.897412585094571e-05, -1.3755459804087877e-05, -8.536793757230043e-06, -3.318113158456981e-06, 1.9005528884008527e-06, 7.1192189352586865e-06, 1.233788498211652e-05, 1.7556551028974354e-05, 2.2775217075832188e-05, 2.7993883122690022e-05, 3.3212549169547856e-05, 3.843121521640569e-05, 4.3649881263263524e-05, 4.886854731012136e-05, 5.408721335697919e-05, 5.9305879403837025e-05, 6.452454545069486e-05, 6.974321149755269e-05, 7.496187754441053e-05, 8.018054359126836e-05, 8.53992096381262e-05, 9.061787568498403e-05, 9.583654173184186e-05, 0.0001010552077786997, 0.00010627387382555753, 0.00011149253987241536, 0.0001167112059192732, 0.00012192987196613103, 0.00012714853801298887, 0.0001323672040598467, 0.00013758587010670453, 0.00014280453615356237, 0.0001480232022004202, 0.00015324186824727803, 0.00015846053429413587, 0.0001636792003409937]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 9.0, 8.0, 18.0, 20.0, 24.0, 34.0, 57.0, 88.0, 130.0, 178.0, 251.0, 364.0, 535.0, 758.0, 1039.0, 1604.0, 2326.0, 3469.0, 5337.0, 8053.0, 12836.0, 20835.0, 34113.0, 60456.0, 113702.0, 223179.0, 251108.0, 135003.0, 69236.0, 39315.0, 23260.0, 14177.0, 9001.0, 5996.0, 3790.0, 2548.0, 1792.0, 1201.0, 823.0, 589.0, 417.0, 290.0, 165.0, 137.0, 88.0, 73.0, 35.0, 40.0, 21.0, 16.0, 8.0, 4.0, 1.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003800392150878906, -0.00036782771348953247, -0.0003556162118911743, -0.00034340471029281616, -0.000331193208694458, -0.00031898170709609985, -0.0003067702054977417, -0.00029455870389938354, -0.0002823472023010254, -0.00027013570070266724, -0.0002579241991043091, -0.00024571269750595093, -0.00023350119590759277, -0.00022128969430923462, -0.00020907819271087646, -0.0001968666911125183, -0.00018465518951416016, -0.000172443687915802, -0.00016023218631744385, -0.0001480206847190857, -0.00013580918312072754, -0.00012359768152236938, -0.00011138617992401123, -9.917467832565308e-05, -8.696317672729492e-05, -7.475167512893677e-05, -6.254017353057861e-05, -5.032867193222046e-05, -3.8117170333862305e-05, -2.590566873550415e-05, -1.3694167137145996e-05, -1.4826655387878418e-06, 1.0728836059570312e-05, 2.2940337657928467e-05, 3.515183925628662e-05, 4.7363340854644775e-05, 5.957484245300293e-05, 7.178634405136108e-05, 8.399784564971924e-05, 9.620934724807739e-05, 0.00010842084884643555, 0.0001206323504447937, 0.00013284385204315186, 0.00014505535364151, 0.00015726685523986816, 0.00016947835683822632, 0.00018168985843658447, 0.00019390136003494263, 0.00020611286163330078, 0.00021832436323165894, 0.0002305358648300171, 0.00024274736642837524, 0.0002549588680267334, 0.00026717036962509155, 0.0002793818712234497, 0.00029159337282180786, 0.000303804874420166, 0.00031601637601852417, 0.0003282278776168823, 0.0003404393792152405, 0.00035265088081359863, 0.0003648623824119568, 0.00037707388401031494, 0.0003892853856086731, 0.00040149688720703125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 1.0, 9.0, 5.0, 10.0, 10.0, 11.0, 12.0, 13.0, 9.0, 21.0, 32.0, 32.0, 38.0, 27.0, 34.0, 41.0, 45.0, 44.0, 43.0, 59.0, 37.0, 55.0, 46.0, 41.0, 42.0, 40.0, 45.0, 32.0, 28.0, 22.0, 18.0, 21.0, 19.0, 8.0, 10.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00016355514526367188, -0.00015843287110328674, -0.0001533105969429016, -0.00014818832278251648, -0.00014306604862213135, -0.00013794377446174622, -0.00013282150030136108, -0.00012769922614097595, -0.00012257695198059082, -0.00011745467782020569, -0.00011233240365982056, -0.00010721012949943542, -0.00010208785533905029, -9.696558117866516e-05, -9.184330701828003e-05, -8.67210328578949e-05, -8.159875869750977e-05, -7.647648453712463e-05, -7.13542103767395e-05, -6.623193621635437e-05, -6.110966205596924e-05, -5.5987387895584106e-05, -5.0865113735198975e-05, -4.574283957481384e-05, -4.062056541442871e-05, -3.549829125404358e-05, -3.0376017093658447e-05, -2.5253742933273315e-05, -2.0131468772888184e-05, -1.5009194612503052e-05, -9.88692045211792e-06, -4.764646291732788e-06, 3.5762786865234375e-07, 5.479902029037476e-06, 1.0602176189422607e-05, 1.572445034980774e-05, 2.084672451019287e-05, 2.5968998670578003e-05, 3.1091272830963135e-05, 3.6213546991348267e-05, 4.13358211517334e-05, 4.645809531211853e-05, 5.158036947250366e-05, 5.6702643632888794e-05, 6.182491779327393e-05, 6.694719195365906e-05, 7.206946611404419e-05, 7.719174027442932e-05, 8.231401443481445e-05, 8.743628859519958e-05, 9.255856275558472e-05, 9.768083691596985e-05, 0.00010280311107635498, 0.00010792538523674011, 0.00011304765939712524, 0.00011816993355751038, 0.0001232922077178955, 0.00012841448187828064, 0.00013353675603866577, 0.0001386590301990509, 0.00014378130435943604, 0.00014890357851982117, 0.0001540258526802063, 0.00015914812684059143, 0.00016427040100097656]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 18.0, 12.0, 20.0, 39.0, 51.0, 86.0, 129.0, 220.0, 380.0, 625.0, 1178.0, 2071.0, 3921.0, 7847.0, 15563.0, 34285.0, 83942.0, 269379.0, 402544.0, 133790.0, 49029.0, 21484.0, 10464.0, 5184.0, 2796.0, 1495.0, 816.0, 471.0, 266.0, 151.0, 96.0, 63.0, 42.0, 25.0, 20.0, 7.0, 10.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006375312805175781, -0.0006194263696670532, -0.0006013214588165283, -0.0005832165479660034, -0.0005651116371154785, -0.0005470067262649536, -0.0005289018154144287, -0.0005107969045639038, -0.0004926919937133789, -0.000474587082862854, -0.0004564821720123291, -0.0004383772611618042, -0.0004202723503112793, -0.0004021674394607544, -0.0003840625286102295, -0.0003659576177597046, -0.0003478527069091797, -0.0003297477960586548, -0.0003116428852081299, -0.000293537974357605, -0.0002754330635070801, -0.0002573281526565552, -0.00023922324180603027, -0.00022111833095550537, -0.00020301342010498047, -0.00018490850925445557, -0.00016680359840393066, -0.00014869868755340576, -0.00013059377670288086, -0.00011248886585235596, -9.438395500183105e-05, -7.627904415130615e-05, -5.817413330078125e-05, -4.006922245025635e-05, -2.1964311599731445e-05, -3.859400749206543e-06, 1.424551010131836e-05, 3.235042095184326e-05, 5.0455331802368164e-05, 6.856024265289307e-05, 8.666515350341797e-05, 0.00010477006435394287, 0.00012287497520446777, 0.00014097988605499268, 0.00015908479690551758, 0.00017718970775604248, 0.00019529461860656738, 0.00021339952945709229, 0.0002315044403076172, 0.0002496093511581421, 0.000267714262008667, 0.0002858191728591919, 0.0003039240837097168, 0.0003220289945602417, 0.0003401339054107666, 0.0003582388162612915, 0.0003763437271118164, 0.0003944486379623413, 0.0004125535488128662, 0.0004306584596633911, 0.000448763370513916, 0.0004668682813644409, 0.0004849731922149658, 0.0005030781030654907, 0.0005211830139160156]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 4.0, 7.0, 6.0, 11.0, 10.0, 12.0, 13.0, 18.0, 21.0, 23.0, 20.0, 40.0, 34.0, 36.0, 43.0, 44.0, 50.0, 40.0, 46.0, 41.0, 42.0, 43.0, 39.0, 46.0, 32.0, 43.0, 27.0, 29.0, 24.0, 17.0, 28.0, 21.0, 19.0, 13.0, 8.0, 11.0, 8.0, 8.0, 5.0, 3.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011587142944335938, -0.00011187605559825897, -0.00010788068175315857, -0.00010388530790805817, -9.988993406295776e-05, -9.589456021785736e-05, -9.189918637275696e-05, -8.790381252765656e-05, -8.390843868255615e-05, -7.991306483745575e-05, -7.591769099235535e-05, -7.192231714725494e-05, -6.792694330215454e-05, -6.393156945705414e-05, -5.9936195611953735e-05, -5.594082176685333e-05, -5.194544792175293e-05, -4.795007407665253e-05, -4.3954700231552124e-05, -3.995932638645172e-05, -3.596395254135132e-05, -3.1968578696250916e-05, -2.7973204851150513e-05, -2.397783100605011e-05, -1.9982457160949707e-05, -1.5987083315849304e-05, -1.1991709470748901e-05, -7.996335625648499e-06, -4.000961780548096e-06, -5.587935447692871e-09, 3.98978590965271e-06, 7.985159754753113e-06, 1.1980533599853516e-05, 1.597590744495392e-05, 1.997128129005432e-05, 2.3966655135154724e-05, 2.7962028980255127e-05, 3.195740282535553e-05, 3.595277667045593e-05, 3.9948150515556335e-05, 4.394352436065674e-05, 4.793889820575714e-05, 5.1934272050857544e-05, 5.592964589595795e-05, 5.992501974105835e-05, 6.392039358615875e-05, 6.791576743125916e-05, 7.191114127635956e-05, 7.590651512145996e-05, 7.990188896656036e-05, 8.389726281166077e-05, 8.789263665676117e-05, 9.188801050186157e-05, 9.588338434696198e-05, 9.987875819206238e-05, 0.00010387413203716278, 0.00010786950588226318, 0.00011186487972736359, 0.00011586025357246399, 0.00011985562741756439, 0.0001238510012626648, 0.0001278463751077652, 0.0001318417489528656, 0.000135837122797966, 0.0001398324966430664]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 9.0, 12.0, 12.0, 32.0, 36.0, 47.0, 88.0, 174.0, 333.0, 614.0, 1213.0, 2542.0, 8123.0, 24608.0, 126867.0, 718716.0, 133142.0, 20246.0, 6625.0, 2585.0, 1255.0, 514.0, 309.0, 174.0, 110.0, 60.0, 41.0, 20.0, 15.0, 7.0, 8.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-05, -9.700655937194824e-06, -9.268522262573242e-06, -8.83638858795166e-06, -8.404254913330078e-06, -7.972121238708496e-06, -7.539987564086914e-06, -7.107853889465332e-06, -6.67572021484375e-06, -6.243586540222168e-06, -5.811452865600586e-06, -5.379319190979004e-06, -4.947185516357422e-06, -4.51505184173584e-06, -4.082918167114258e-06, -3.6507844924926758e-06, -3.2186508178710938e-06, -2.7865171432495117e-06, -2.3543834686279297e-06, -1.9222497940063477e-06, -1.4901161193847656e-06, -1.0579824447631836e-06, -6.258487701416016e-07, -1.9371509552001953e-07, 2.384185791015625e-07, 6.705522537231445e-07, 1.1026859283447266e-06, 1.5348196029663086e-06, 1.9669532775878906e-06, 2.3990869522094727e-06, 2.8312206268310547e-06, 3.2633543014526367e-06, 3.6954879760742188e-06, 4.127621650695801e-06, 4.559755325317383e-06, 4.991888999938965e-06, 5.424022674560547e-06, 5.856156349182129e-06, 6.288290023803711e-06, 6.720423698425293e-06, 7.152557373046875e-06, 7.584691047668457e-06, 8.016824722290039e-06, 8.448958396911621e-06, 8.881092071533203e-06, 9.313225746154785e-06, 9.745359420776367e-06, 1.017749309539795e-05, 1.0609626770019531e-05, 1.1041760444641113e-05, 1.1473894119262695e-05, 1.1906027793884277e-05, 1.233816146850586e-05, 1.2770295143127441e-05, 1.3202428817749023e-05, 1.3634562492370605e-05, 1.4066696166992188e-05, 1.449882984161377e-05, 1.4930963516235352e-05, 1.5363097190856934e-05, 1.5795230865478516e-05, 1.6227364540100098e-05, 1.665949821472168e-05, 1.7091631889343262e-05, 1.7523765563964844e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 8.0, 6.0, 4.0, 8.0, 4.0, 30.0, 16.0, 22.0, 84.0, 54.0, 103.0, 292.0, 118.0, 144.0, 36.0, 16.0, 30.0, 7.0, 8.0, 8.0, 2.0, 4.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.337860107421875e-06, -3.255903720855713e-06, -3.1739473342895508e-06, -3.0919909477233887e-06, -3.0100345611572266e-06, -2.9280781745910645e-06, -2.8461217880249023e-06, -2.7641654014587402e-06, -2.682209014892578e-06, -2.600252628326416e-06, -2.518296241760254e-06, -2.436339855194092e-06, -2.3543834686279297e-06, -2.2724270820617676e-06, -2.1904706954956055e-06, -2.1085143089294434e-06, -2.0265579223632812e-06, -1.944601535797119e-06, -1.862645149230957e-06, -1.780688762664795e-06, -1.6987323760986328e-06, -1.6167759895324707e-06, -1.5348196029663086e-06, -1.4528632164001465e-06, -1.3709068298339844e-06, -1.2889504432678223e-06, -1.2069940567016602e-06, -1.125037670135498e-06, -1.043081283569336e-06, -9.611248970031738e-07, -8.791685104370117e-07, -7.972121238708496e-07, -7.152557373046875e-07, -6.332993507385254e-07, -5.513429641723633e-07, -4.6938657760620117e-07, -3.8743019104003906e-07, -3.0547380447387695e-07, -2.2351741790771484e-07, -1.4156103134155273e-07, -5.960464477539063e-08, 2.2351741790771484e-08, 1.043081283569336e-07, 1.862645149230957e-07, 2.682209014892578e-07, 3.501772880554199e-07, 4.3213367462158203e-07, 5.140900611877441e-07, 5.960464477539062e-07, 6.780028343200684e-07, 7.599592208862305e-07, 8.419156074523926e-07, 9.238719940185547e-07, 1.0058283805847168e-06, 1.087784767150879e-06, 1.169741153717041e-06, 1.2516975402832031e-06, 1.3336539268493652e-06, 1.4156103134155273e-06, 1.4975666999816895e-06, 1.5795230865478516e-06, 1.6614794731140137e-06, 1.7434358596801758e-06, 1.8253922462463379e-06, 1.9073486328125e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 3.0, 5.0, 4.0, 14.0, 18.0, 27.0, 28.0, 74.0, 84.0, 217.0, 365.0, 1117.0, 3183.0, 16506.0, 160734.0, 819611.0, 36620.0, 6984.0, 1809.0, 584.0, 258.0, 112.0, 59.0, 49.0, 37.0, 21.0, 8.0, 7.0, 10.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.288818359375e-05, -2.2319145500659943e-05, -2.1750107407569885e-05, -2.1181069314479828e-05, -2.061203122138977e-05, -2.0042993128299713e-05, -1.9473955035209656e-05, -1.89049169421196e-05, -1.833587884902954e-05, -1.7766840755939484e-05, -1.7197802662849426e-05, -1.662876456975937e-05, -1.605972647666931e-05, -1.5490688383579254e-05, -1.4921650290489197e-05, -1.435261219739914e-05, -1.3783574104309082e-05, -1.3214536011219025e-05, -1.2645497918128967e-05, -1.207645982503891e-05, -1.1507421731948853e-05, -1.0938383638858795e-05, -1.0369345545768738e-05, -9.80030745267868e-06, -9.231269359588623e-06, -8.662231266498566e-06, -8.093193173408508e-06, -7.524155080318451e-06, -6.9551169872283936e-06, -6.386078894138336e-06, -5.817040801048279e-06, -5.2480027079582214e-06, -4.678964614868164e-06, -4.109926521778107e-06, -3.5408884286880493e-06, -2.971850335597992e-06, -2.4028122425079346e-06, -1.8337741494178772e-06, -1.2647360563278198e-06, -6.956979632377625e-07, -1.2665987014770508e-07, 4.423782229423523e-07, 1.0114163160324097e-06, 1.580454409122467e-06, 2.1494925022125244e-06, 2.7185305953025818e-06, 3.287568688392639e-06, 3.8566067814826965e-06, 4.425644874572754e-06, 4.994682967662811e-06, 5.563721060752869e-06, 6.132759153842926e-06, 6.701797246932983e-06, 7.270835340023041e-06, 7.839873433113098e-06, 8.408911526203156e-06, 8.977949619293213e-06, 9.54698771238327e-06, 1.0116025805473328e-05, 1.0685063898563385e-05, 1.1254101991653442e-05, 1.18231400847435e-05, 1.2392178177833557e-05, 1.2961216270923615e-05, 1.3530254364013672e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 10.0, 12.0, 18.0, 29.0, 20.0, 65.0, 109.0, 184.0, 87.0, 171.0, 123.0, 69.0, 21.0, 28.0, 25.0, 8.0, 3.0, 6.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.1597370505332947e-06, -2.0544975996017456e-06, -1.9492581486701965e-06, -1.8440186977386475e-06, -1.7387792468070984e-06, -1.6335397958755493e-06, -1.5283003449440002e-06, -1.4230608940124512e-06, -1.317821443080902e-06, -1.212581992149353e-06, -1.107342541217804e-06, -1.0021030902862549e-06, -8.968636393547058e-07, -7.916241884231567e-07, -6.863847374916077e-07, -5.811452865600586e-07, -4.759058356285095e-07, -3.7066638469696045e-07, -2.654269337654114e-07, -1.601874828338623e-07, -5.494803190231323e-08, 5.029141902923584e-08, 1.555308699607849e-07, 2.60770320892334e-07, 3.6600977182388306e-07, 4.7124922275543213e-07, 5.764886736869812e-07, 6.817281246185303e-07, 7.869675755500793e-07, 8.922070264816284e-07, 9.974464774131775e-07, 1.1026859283447266e-06, 1.2079253792762756e-06, 1.3131648302078247e-06, 1.4184042811393738e-06, 1.5236437320709229e-06, 1.628883183002472e-06, 1.734122633934021e-06, 1.83936208486557e-06, 1.944601535797119e-06, 2.0498409867286682e-06, 2.1550804376602173e-06, 2.2603198885917664e-06, 2.3655593395233154e-06, 2.4707987904548645e-06, 2.5760382413864136e-06, 2.6812776923179626e-06, 2.7865171432495117e-06, 2.891756594181061e-06, 2.99699604511261e-06, 3.102235496044159e-06, 3.207474946975708e-06, 3.312714397907257e-06, 3.417953848838806e-06, 3.5231932997703552e-06, 3.6284327507019043e-06, 3.7336722016334534e-06, 3.8389116525650024e-06, 3.9441511034965515e-06, 4.049390554428101e-06, 4.15463000535965e-06, 4.259869456291199e-06, 4.365108907222748e-06, 4.470348358154297e-06]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 9.0, 23.0, 22.0, 64.0, 148.0, 342.0, 206.0, 93.0, 46.0, 21.0, 17.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0009792015189304948, -0.0009591109119355679, -0.0009390203049406409, -0.000918929697945714, -0.000898839149158448, -0.000878748542163521, -0.0008586579351685941, -0.0008385673281736672, -0.0008184767211787403, -0.0007983861141838133, -0.0007782955071888864, -0.0007582049584016204, -0.0007381143514066935, -0.0007180237444117665, -0.0006979331374168396, -0.0006778425304219127, -0.0006577519234269857, -0.0006376613164320588, -0.0006175707094371319, -0.000597480102442205, -0.0005773895536549389, -0.000557298946660012, -0.0005372083396650851, -0.0005171177326701581, -0.0004970271838828921, -0.0004769365768879652, -0.00045684599899686873, -0.0004367553920019418, -0.00041666478500701487, -0.0003965742071159184, -0.00037648360012099147, -0.00035639299312606454, -0.00033630241523496807, -0.00031621180824004114, -0.00029612123034894466, -0.00027603062335401773, -0.0002559400163590908, -0.0002358494239160791, -0.0002157588314730674, -0.00019566822447814047, -0.00017557763203512877, -0.00015548703959211707, -0.00013539643259719014, -0.00011530584015417844, -9.521524043520913e-05, -7.512464071623981e-05, -5.503404827322811e-05, -3.494344127830118e-05, -1.4852848835289478e-05, 5.2377490646904334e-06, 2.5328346964670345e-05, 4.541894304566085e-05, 6.550954276463017e-05, 8.560014248359948e-05, 0.00010569073492661119, 0.00012578134192153811, 0.00014587193436454982, 0.00016596252680756152, 0.00018605313380248845, 0.00020614372624550015, 0.00022623431868851185, 0.0002463249256834388, 0.0002664155326783657, 0.00028650613967329264, 0.0003065967175643891]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 12.0, 3.0, 12.0, 12.0, 8.0, 15.0, 18.0, 19.0, 18.0, 23.0, 24.0, 32.0, 31.0, 26.0, 38.0, 36.0, 46.0, 27.0, 50.0, 42.0, 43.0, 45.0, 36.0, 36.0, 43.0, 29.0, 29.0, 36.0, 29.0, 25.0, 26.0, 18.0, 16.0, 11.0, 12.0, 7.0, 8.0, 10.0, 10.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00013219415268395096, -0.00012783669808413833, -0.0001234792434843257, -0.00011912178888451308, -0.00011476432700874284, -0.00011040687240893021, -0.00010604941780911759, -0.00010169196320930496, -9.733450133353472e-05, -9.297704673372209e-05, -8.861959213390946e-05, -8.426213753409684e-05, -7.99046756583266e-05, -7.554722105851397e-05, -7.118976645870134e-05, -6.683231185888872e-05, -6.247485725907609e-05, -5.811740265926346e-05, -5.375994442147203e-05, -4.94024898216594e-05, -4.504503158386797e-05, -4.068757698405534e-05, -3.6330122384242713e-05, -3.197266778443009e-05, -2.7615209546638653e-05, -2.3257753127836622e-05, -1.8900296709034592e-05, -1.4542842109221965e-05, -1.0185385690419935e-05, -5.827929271617904e-06, -1.4704746718052775e-06, 2.886981746996753e-06, 7.244438165798783e-06, 1.1601894584600814e-05, 1.5959351003402844e-05, 2.031680560321547e-05, 2.46742620220175e-05, 2.903171844081953e-05, 3.338917304063216e-05, 3.7746627640444785e-05, 4.210408587823622e-05, 4.6461540478048846e-05, 5.081899871584028e-05, 5.517645331565291e-05, 5.9533907915465534e-05, 6.389136251527816e-05, 6.824881711509079e-05, 7.260627899086103e-05, 7.696373359067366e-05, 8.132118819048628e-05, 8.567864279029891e-05, 9.003610466606915e-05, 9.439355926588178e-05, 9.87510138656944e-05, 0.00010310846846550703, 0.00010746592306531966, 0.00011182337766513228, 0.00011618083226494491, 0.00012053828686475754, 0.00012489574146457016, 0.0001292531960643828, 0.00013361065066419542, 0.00013796810526400805, 0.0001423255744157359, 0.00014668302901554853]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 6.0, 15.0, 16.0, 24.0, 27.0, 30.0, 43.0, 88.0, 89.0, 127.0, 163.0, 233.0, 345.0, 571.0, 1285.0, 18106.0, 3975538.0, 190803.0, 4430.0, 881.0, 479.0, 246.0, 196.0, 150.0, 106.0, 66.0, 55.0, 37.0, 30.0, 27.0, 14.0, 14.0, 8.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036072731018066406, -0.0003486163914203644, -0.0003365054726600647, -0.000324394553899765, -0.00031228363513946533, -0.00030017271637916565, -0.00028806179761886597, -0.0002759508788585663, -0.0002638399600982666, -0.0002517290413379669, -0.00023961812257766724, -0.00022750720381736755, -0.00021539628505706787, -0.0002032853662967682, -0.0001911744475364685, -0.00017906352877616882, -0.00016695261001586914, -0.00015484169125556946, -0.00014273077249526978, -0.0001306198537349701, -0.00011850893497467041, -0.00010639801621437073, -9.428709745407104e-05, -8.217617869377136e-05, -7.006525993347168e-05, -5.7954341173172e-05, -4.5843422412872314e-05, -3.373250365257263e-05, -2.162158489227295e-05, -9.510666131973267e-06, 2.600252628326416e-06, 1.4711171388626099e-05, 2.682209014892578e-05, 3.8933008909225464e-05, 5.1043927669525146e-05, 6.315484642982483e-05, 7.526576519012451e-05, 8.73766839504242e-05, 9.948760271072388e-05, 0.00011159852147102356, 0.00012370944023132324, 0.00013582035899162292, 0.0001479312777519226, 0.0001600421965122223, 0.00017215311527252197, 0.00018426403403282166, 0.00019637495279312134, 0.00020848587155342102, 0.0002205967903137207, 0.00023270770907402039, 0.00024481862783432007, 0.00025692954659461975, 0.00026904046535491943, 0.0002811513841152191, 0.0002932623028755188, 0.0003053732216358185, 0.00031748414039611816, 0.00032959505915641785, 0.00034170597791671753, 0.0003538168966770172, 0.0003659278154373169, 0.0003780387341976166, 0.00039014965295791626, 0.00040226057171821594, 0.0004143714904785156]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 8.0, 14.0, 7.0, 12.0, 9.0, 18.0, 19.0, 15.0, 14.0, 26.0, 31.0, 27.0, 38.0, 35.0, 43.0, 33.0, 42.0, 55.0, 53.0, 42.0, 40.0, 47.0, 46.0, 48.0, 39.0, 31.0, 24.0, 35.0, 17.0, 25.0, 13.0, 18.0, 15.0, 10.0, 9.0, 9.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013494491577148438, -0.00013041868805885315, -0.00012589246034622192, -0.0001213662326335907, -0.00011684000492095947, -0.00011231377720832825, -0.00010778754949569702, -0.0001032613217830658, -9.873509407043457e-05, -9.420886635780334e-05, -8.968263864517212e-05, -8.51564109325409e-05, -8.063018321990967e-05, -7.610395550727844e-05, -7.157772779464722e-05, -6.705150008201599e-05, -6.252527236938477e-05, -5.799904465675354e-05, -5.3472816944122314e-05, -4.894658923149109e-05, -4.442036151885986e-05, -3.989413380622864e-05, -3.536790609359741e-05, -3.0841678380966187e-05, -2.631545066833496e-05, -2.1789222955703735e-05, -1.726299524307251e-05, -1.2736767530441284e-05, -8.210539817810059e-06, -3.684312105178833e-06, 8.419156074523926e-07, 5.368143320083618e-06, 9.894371032714844e-06, 1.442059874534607e-05, 1.8946826457977295e-05, 2.347305417060852e-05, 2.7999281883239746e-05, 3.252550959587097e-05, 3.70517373085022e-05, 4.157796502113342e-05, 4.610419273376465e-05, 5.0630420446395874e-05, 5.51566481590271e-05, 5.9682875871658325e-05, 6.420910358428955e-05, 6.873533129692078e-05, 7.3261559009552e-05, 7.778778672218323e-05, 8.231401443481445e-05, 8.684024214744568e-05, 9.13664698600769e-05, 9.589269757270813e-05, 0.00010041892528533936, 0.00010494515299797058, 0.0001094713807106018, 0.00011399760842323303, 0.00011852383613586426, 0.00012305006384849548, 0.0001275762915611267, 0.00013210251927375793, 0.00013662874698638916, 0.00014115497469902039, 0.0001456812024116516, 0.00015020743012428284, 0.00015473365783691406]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 3.0, 16.0, 33.0, 39.0, 99.0, 232.0, 626.0, 2221.0, 45192.0, 4139156.0, 4987.0, 1015.0, 362.0, 148.0, 62.0, 32.0, 28.0, 5.0, 7.0, 6.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012826919555664062, -0.0012499913573265076, -0.0012172907590866089, -0.0011845901608467102, -0.0011518895626068115, -0.0011191889643669128, -0.0010864883661270142, -0.0010537877678871155, -0.0010210871696472168, -0.0009883865714073181, -0.0009556859731674194, -0.0009229853749275208, -0.0008902847766876221, -0.0008575841784477234, -0.0008248835802078247, -0.000792182981967926, -0.0007594823837280273, -0.0007267817854881287, -0.00069408118724823, -0.0006613805890083313, -0.0006286799907684326, -0.0005959793925285339, -0.0005632787942886353, -0.0005305781960487366, -0.0004978775978088379, -0.0004651769995689392, -0.00043247640132904053, -0.00039977580308914185, -0.00036707520484924316, -0.0003343746066093445, -0.0003016740083694458, -0.0002689734101295471, -0.00023627281188964844, -0.00020357221364974976, -0.00017087161540985107, -0.0001381710171699524, -0.00010547041893005371, -7.276982069015503e-05, -4.006922245025635e-05, -7.368624210357666e-06, 2.5331974029541016e-05, 5.80325722694397e-05, 9.073317050933838e-05, 0.00012343376874923706, 0.00015613436698913574, 0.00018883496522903442, 0.0002215355634689331, 0.0002542361617088318, 0.00028693675994873047, 0.00031963735818862915, 0.00035233795642852783, 0.0003850385546684265, 0.0004177391529083252, 0.0004504397511482239, 0.00048314034938812256, 0.0005158409476280212, 0.0005485415458679199, 0.0005812421441078186, 0.0006139427423477173, 0.000646643340587616, 0.0006793439388275146, 0.0007120445370674133, 0.000744745135307312, 0.0007774457335472107, 0.0008101463317871094]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 14.0, 34.0, 144.0, 697.0, 2926.0, 159.0, 67.0, 14.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.659196853637695e-05, -7.341336458921432e-05, -7.02347606420517e-05, -6.705615669488907e-05, -6.387755274772644e-05, -6.069894880056381e-05, -5.7520344853401184e-05, -5.4341740906238556e-05, -5.116313695907593e-05, -4.79845330119133e-05, -4.480592906475067e-05, -4.162732511758804e-05, -3.8448721170425415e-05, -3.527011722326279e-05, -3.209151327610016e-05, -2.891290932893753e-05, -2.5734305381774902e-05, -2.2555701434612274e-05, -1.9377097487449646e-05, -1.6198493540287018e-05, -1.301988959312439e-05, -9.841285645961761e-06, -6.662681698799133e-06, -3.484077751636505e-06, -3.0547380447387695e-07, 2.8731301426887512e-06, 6.051734089851379e-06, 9.230338037014008e-06, 1.2408941984176636e-05, 1.5587545931339264e-05, 1.8766149878501892e-05, 2.194475382566452e-05, 2.512335777282715e-05, 2.8301961719989777e-05, 3.1480565667152405e-05, 3.465916961431503e-05, 3.783777356147766e-05, 4.101637750864029e-05, 4.419498145580292e-05, 4.7373585402965546e-05, 5.0552189350128174e-05, 5.37307932972908e-05, 5.690939724445343e-05, 6.008800119161606e-05, 6.326660513877869e-05, 6.644520908594131e-05, 6.962381303310394e-05, 7.280241698026657e-05, 7.59810209274292e-05, 7.915962487459183e-05, 8.233822882175446e-05, 8.551683276891708e-05, 8.869543671607971e-05, 9.187404066324234e-05, 9.505264461040497e-05, 9.82312485575676e-05, 0.00010140985250473022, 0.00010458845645189285, 0.00010776706039905548, 0.00011094566434621811, 0.00011412426829338074, 0.00011730287224054337, 0.000120481476187706, 0.00012366008013486862, 0.00012683868408203125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 11.0, 13.0, 14.0, 41.0, 61.0, 120.0, 235.0, 232.0, 113.0, 62.0, 36.0, 20.0, 13.0, 6.0, 8.0, 5.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005174302496016026, -0.00050449522677809, -0.0004915602039545774, -0.0004786251811310649, -0.00046569015830755234, -0.0004527551354840398, -0.00043982011266052723, -0.0004268850898370147, -0.0004139500670135021, -0.00040101504418998957, -0.000388080021366477, -0.00037514499854296446, -0.0003622099757194519, -0.00034927495289593935, -0.0003363399300724268, -0.00032340490724891424, -0.00031046991352923214, -0.0002975348907057196, -0.00028459986788220704, -0.0002716648450586945, -0.00025872982223518193, -0.0002457947994116694, -0.00023285979114007205, -0.0002199247683165595, -0.00020698974549304694, -0.00019405472266953439, -0.00018111969984602183, -0.0001681846915744245, -0.00015524966875091195, -0.0001423146459273994, -0.00012937962310388684, -0.00011644460028037429, -0.00010350957745686173, -9.057455463334918e-05, -7.763953180983663e-05, -6.470451626228169e-05, -5.176949343876913e-05, -3.883447061525658e-05, -2.5899455067701638e-05, -1.2964432244189084e-05, -2.9409420676529408e-08, 1.2905611583846621e-05, 2.5840632588369772e-05, 3.877565177390352e-05, 5.171067459741607e-05, 6.464569742092863e-05, 7.758071296848357e-05, 9.051573579199612e-05, 0.00010345075861550868, 0.00011638578143902123, 0.00012932080426253378, 0.00014225582708604634, 0.0001551908499095589, 0.00016812587273307145, 0.00018106088100466877, 0.00019399590382818133, 0.00020693092665169388, 0.00021986594947520643, 0.000232800972298719, 0.0002457359805703163, 0.00025867100339382887, 0.0002716060262173414, 0.000284541049040854, 0.00029747607186436653, 0.0003104110946878791]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 2.0, 5.0, 6.0, 9.0, 14.0, 9.0, 12.0, 20.0, 19.0, 15.0, 20.0, 16.0, 28.0, 32.0, 35.0, 42.0, 27.0, 45.0, 39.0, 35.0, 46.0, 45.0, 52.0, 29.0, 32.0, 46.0, 43.0, 23.0, 40.0, 35.0, 35.0, 23.0, 21.0, 19.0, 18.0, 14.0, 5.0, 8.0, 10.0, 4.0, 6.0, 1.0, 7.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00013017424498684704, -0.00012600065383594483, -0.00012182707723695785, -0.00011765349336201325, -0.00011347990948706865, -0.00010930631833616644, -0.00010513273446122184, -0.00010095915058627725, -9.678556671133265e-05, -9.261198283638805e-05, -8.843839896144345e-05, -8.426481508649886e-05, -8.009122393559664e-05, -7.591764733660966e-05, -7.174405618570745e-05, -6.757047231076285e-05, -6.339688843581825e-05, -5.922330456087366e-05, -5.504972068592906e-05, -5.0876133173005655e-05, -4.670254929806106e-05, -4.252896542311646e-05, -3.8355377910193056e-05, -3.418179403524846e-05, -3.000821016030386e-05, -2.5834626285359263e-05, -2.1661040591425262e-05, -1.748745489749126e-05, -1.3313871022546664e-05, -9.140287147602066e-06, -4.966701453668065e-06, -7.931157597340643e-07, 3.3804826671257615e-06, 7.554067451565061e-06, 1.172765223600436e-05, 1.590123792993836e-05, 2.007482180488296e-05, 2.4248405679827556e-05, 2.8421991373761557e-05, 3.259557706769556e-05, 3.6769160942640156e-05, 4.094274481758475e-05, 4.511632869252935e-05, 4.9289916205452755e-05, 5.346350008039735e-05, 5.763708395534195e-05, 6.181067146826535e-05, 6.598425534320995e-05, 7.015783921815455e-05, 7.433142309309915e-05, 7.850500696804374e-05, 8.267859084298834e-05, 8.685217471793294e-05, 9.102576586883515e-05, 9.519934974377975e-05, 9.937293361872435e-05, 0.00010354651749366894, 0.00010772010136861354, 0.00011189368524355814, 0.00011606726911850274, 0.00012024086026940495, 0.00012441443686839193, 0.00012858802801929414, 0.00013276160461828113, 0.00013693519576918334]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 17.0, 12.0, 29.0, 42.0, 44.0, 58.0, 84.0, 131.0, 138.0, 231.0, 314.0, 442.0, 716.0, 987.0, 1538.0, 2344.0, 3704.0, 5939.0, 9991.0, 17275.0, 31505.0, 61155.0, 127452.0, 287472.0, 258724.0, 113750.0, 55267.0, 28423.0, 15755.0, 9292.0, 5512.0, 3457.0, 2183.0, 1484.0, 969.0, 609.0, 451.0, 297.0, 204.0, 160.0, 109.0, 85.0, 53.0, 38.0, 35.0, 16.0, 9.0, 16.0, 13.0, 6.0, 5.0, 6.0, 2.0, 1.0, 2.0], "bins": [-0.00012195110321044922, -0.00011824723333120346, -0.0001145433634519577, -0.00011083949357271194, -0.00010713562369346619, -0.00010343175381422043, -9.972788393497467e-05, -9.602401405572891e-05, -9.232014417648315e-05, -8.86162742972374e-05, -8.491240441799164e-05, -8.120853453874588e-05, -7.750466465950012e-05, -7.380079478025436e-05, -7.00969249010086e-05, -6.639305502176285e-05, -6.268918514251709e-05, -5.898531526327133e-05, -5.5281445384025574e-05, -5.1577575504779816e-05, -4.787370562553406e-05, -4.41698357462883e-05, -4.046596586704254e-05, -3.6762095987796783e-05, -3.3058226108551025e-05, -2.9354356229305267e-05, -2.565048635005951e-05, -2.194661647081375e-05, -1.8242746591567993e-05, -1.4538876712322235e-05, -1.0835006833076477e-05, -7.131136953830719e-06, -3.427267074584961e-06, 2.766028046607971e-07, 3.980472683906555e-06, 7.684342563152313e-06, 1.1388212442398071e-05, 1.509208232164383e-05, 1.8795952200889587e-05, 2.2499822080135345e-05, 2.6203691959381104e-05, 2.990756183862686e-05, 3.361143171787262e-05, 3.731530159711838e-05, 4.1019171476364136e-05, 4.4723041355609894e-05, 4.842691123485565e-05, 5.213078111410141e-05, 5.583465099334717e-05, 5.9538520872592926e-05, 6.324239075183868e-05, 6.694626063108444e-05, 7.06501305103302e-05, 7.435400038957596e-05, 7.805787026882172e-05, 8.176174014806747e-05, 8.546561002731323e-05, 8.916947990655899e-05, 9.287334978580475e-05, 9.65772196650505e-05, 0.00010028108954429626, 0.00010398495942354202, 0.00010768882930278778, 0.00011139269918203354, 0.0001150965690612793]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 5.0, 8.0, 7.0, 9.0, 8.0, 11.0, 10.0, 17.0, 11.0, 11.0, 19.0, 19.0, 22.0, 38.0, 33.0, 40.0, 36.0, 41.0, 35.0, 39.0, 39.0, 44.0, 53.0, 39.0, 49.0, 27.0, 34.0, 30.0, 38.0, 26.0, 42.0, 24.0, 18.0, 22.0, 16.0, 16.0, 11.0, 10.0, 7.0, 5.0, 6.0, 4.0, 4.0, 4.0, 0.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0001341104507446289, -0.00013010762631893158, -0.00012610480189323425, -0.00012210197746753693, -0.0001180991530418396, -0.00011409632861614227, -0.00011009350419044495, -0.00010609067976474762, -0.00010208785533905029, -9.808503091335297e-05, -9.408220648765564e-05, -9.007938206195831e-05, -8.607655763626099e-05, -8.207373321056366e-05, -7.807090878486633e-05, -7.4068084359169e-05, -7.006525993347168e-05, -6.606243550777435e-05, -6.205961108207703e-05, -5.80567866563797e-05, -5.405396223068237e-05, -5.0051137804985046e-05, -4.604831337928772e-05, -4.204548895359039e-05, -3.8042664527893066e-05, -3.403984010219574e-05, -3.0037015676498413e-05, -2.6034191250801086e-05, -2.203136682510376e-05, -1.8028542399406433e-05, -1.4025717973709106e-05, -1.002289354801178e-05, -6.020069122314453e-06, -2.0172446966171265e-06, 1.9855797290802e-06, 5.988404154777527e-06, 9.991228580474854e-06, 1.399405300617218e-05, 1.7996877431869507e-05, 2.1999701857566833e-05, 2.600252628326416e-05, 3.0005350708961487e-05, 3.4008175134658813e-05, 3.801099956035614e-05, 4.201382398605347e-05, 4.6016648411750793e-05, 5.001947283744812e-05, 5.402229726314545e-05, 5.8025121688842773e-05, 6.20279461145401e-05, 6.603077054023743e-05, 7.003359496593475e-05, 7.403641939163208e-05, 7.80392438173294e-05, 8.204206824302673e-05, 8.604489266872406e-05, 9.004771709442139e-05, 9.405054152011871e-05, 9.805336594581604e-05, 0.00010205619037151337, 0.0001060590147972107, 0.00011006183922290802, 0.00011406466364860535, 0.00011806748807430267, 0.0001220703125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 11.0, 10.0, 20.0, 36.0, 42.0, 44.0, 66.0, 122.0, 182.0, 284.0, 504.0, 830.0, 1468.0, 2927.0, 5803.0, 13980.0, 37377.0, 157036.0, 650468.0, 122440.0, 31672.0, 11987.0, 5132.0, 2533.0, 1419.0, 800.0, 491.0, 293.0, 184.0, 129.0, 88.0, 51.0, 30.0, 18.0, 25.0, 10.0, 9.0, 13.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00022494792938232422, -0.00021778978407382965, -0.00021063163876533508, -0.00020347349345684052, -0.00019631534814834595, -0.00018915720283985138, -0.0001819990575313568, -0.00017484091222286224, -0.00016768276691436768, -0.0001605246216058731, -0.00015336647629737854, -0.00014620833098888397, -0.0001390501856803894, -0.00013189204037189484, -0.00012473389506340027, -0.0001175757497549057, -0.00011041760444641113, -0.00010325945913791656, -9.6101313829422e-05, -8.894316852092743e-05, -8.178502321243286e-05, -7.46268779039383e-05, -6.746873259544373e-05, -6.031058728694916e-05, -5.315244197845459e-05, -4.599429666996002e-05, -3.8836151361465454e-05, -3.1678006052970886e-05, -2.451986074447632e-05, -1.736171543598175e-05, -1.0203570127487183e-05, -3.0454248189926147e-06, 4.112720489501953e-06, 1.1270865797996521e-05, 1.842901110649109e-05, 2.5587156414985657e-05, 3.2745301723480225e-05, 3.990344703197479e-05, 4.706159234046936e-05, 5.421973764896393e-05, 6.13778829574585e-05, 6.853602826595306e-05, 7.569417357444763e-05, 8.28523188829422e-05, 9.001046419143677e-05, 9.716860949993134e-05, 0.0001043267548084259, 0.00011148490011692047, 0.00011864304542541504, 0.0001258011907339096, 0.00013295933604240417, 0.00014011748135089874, 0.0001472756266593933, 0.00015443377196788788, 0.00016159191727638245, 0.00016875006258487701, 0.00017590820789337158, 0.00018306635320186615, 0.00019022449851036072, 0.00019738264381885529, 0.00020454078912734985, 0.00021169893443584442, 0.000218857079744339, 0.00022601522505283356, 0.00023317337036132812]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 6.0, 14.0, 6.0, 12.0, 9.0, 14.0, 12.0, 17.0, 25.0, 26.0, 24.0, 21.0, 25.0, 33.0, 28.0, 42.0, 33.0, 50.0, 28.0, 32.0, 41.0, 42.0, 35.0, 38.0, 42.0, 33.0, 33.0, 31.0, 30.0, 39.0, 22.0, 17.0, 19.0, 17.0, 16.0, 10.0, 12.0, 10.0, 12.0, 11.0, 3.0, 10.0, 4.0, 1.0, 7.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.855892181396484e-05, -7.619895040988922e-05, -7.38389790058136e-05, -7.147900760173798e-05, -6.911903619766235e-05, -6.675906479358673e-05, -6.439909338951111e-05, -6.203912198543549e-05, -5.967915058135986e-05, -5.731917917728424e-05, -5.495920777320862e-05, -5.2599236369132996e-05, -5.023926496505737e-05, -4.787929356098175e-05, -4.551932215690613e-05, -4.3159350752830505e-05, -4.079937934875488e-05, -3.843940794467926e-05, -3.607943654060364e-05, -3.3719465136528015e-05, -3.135949373245239e-05, -2.899952232837677e-05, -2.6639550924301147e-05, -2.4279579520225525e-05, -2.1919608116149902e-05, -1.955963671207428e-05, -1.7199665307998657e-05, -1.4839693903923035e-05, -1.2479722499847412e-05, -1.011975109577179e-05, -7.759779691696167e-06, -5.3998082876205444e-06, -3.039836883544922e-06, -6.798654794692993e-07, 1.6801059246063232e-06, 4.040077328681946e-06, 6.400048732757568e-06, 8.760020136833191e-06, 1.1119991540908813e-05, 1.3479962944984436e-05, 1.583993434906006e-05, 1.819990575313568e-05, 2.0559877157211304e-05, 2.2919848561286926e-05, 2.527981996536255e-05, 2.763979136943817e-05, 2.9999762773513794e-05, 3.2359734177589417e-05, 3.471970558166504e-05, 3.707967698574066e-05, 3.9439648389816284e-05, 4.179961979389191e-05, 4.415959119796753e-05, 4.651956260204315e-05, 4.8879534006118774e-05, 5.12395054101944e-05, 5.359947681427002e-05, 5.595944821834564e-05, 5.8319419622421265e-05, 6.067939102649689e-05, 6.303936243057251e-05, 6.539933383464813e-05, 6.775930523872375e-05, 7.011927664279938e-05, 7.2479248046875e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 7.0, 11.0, 14.0, 19.0, 18.0, 46.0, 58.0, 77.0, 114.0, 155.0, 168.0, 314.0, 432.0, 701.0, 1032.0, 1735.0, 2936.0, 5453.0, 11221.0, 31169.0, 155469.0, 741207.0, 62211.0, 16943.0, 7187.0, 3786.0, 2037.0, 1355.0, 882.0, 565.0, 359.0, 241.0, 151.0, 138.0, 96.0, 78.0, 50.0, 28.0, 24.0, 15.0, 11.0, 7.0, 7.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.701448440551758e-05, -3.593321889638901e-05, -3.485195338726044e-05, -3.3770687878131866e-05, -3.2689422369003296e-05, -3.1608156859874725e-05, -3.0526891350746155e-05, -2.9445625841617584e-05, -2.8364360332489014e-05, -2.7283094823360443e-05, -2.6201829314231873e-05, -2.5120563805103302e-05, -2.403929829597473e-05, -2.295803278684616e-05, -2.187676727771759e-05, -2.079550176858902e-05, -1.971423625946045e-05, -1.863297075033188e-05, -1.7551705241203308e-05, -1.6470439732074738e-05, -1.5389174222946167e-05, -1.4307908713817596e-05, -1.3226643204689026e-05, -1.2145377695560455e-05, -1.1064112186431885e-05, -9.982846677303314e-06, -8.901581168174744e-06, -7.820315659046173e-06, -6.7390501499176025e-06, -5.657784640789032e-06, -4.5765191316604614e-06, -3.495253622531891e-06, -2.4139881134033203e-06, -1.3327226042747498e-06, -2.514570951461792e-07, 8.298084139823914e-07, 1.911073923110962e-06, 2.9923394322395325e-06, 4.073604941368103e-06, 5.154870450496674e-06, 6.236135959625244e-06, 7.317401468753815e-06, 8.398666977882385e-06, 9.479932487010956e-06, 1.0561197996139526e-05, 1.1642463505268097e-05, 1.2723729014396667e-05, 1.3804994523525238e-05, 1.4886260032653809e-05, 1.596752554178238e-05, 1.704879105091095e-05, 1.813005656003952e-05, 1.921132206916809e-05, 2.029258757829666e-05, 2.1373853087425232e-05, 2.2455118596553802e-05, 2.3536384105682373e-05, 2.4617649614810944e-05, 2.5698915123939514e-05, 2.6780180633068085e-05, 2.7861446142196655e-05, 2.8942711651325226e-05, 3.0023977160453796e-05, 3.110524266958237e-05, 3.218650817871094e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 1.0, 3.0, 1.0, 5.0, 10.0, 9.0, 9.0, 11.0, 10.0, 13.0, 13.0, 13.0, 24.0, 26.0, 29.0, 43.0, 60.0, 83.0, 38.0, 197.0, 68.0, 72.0, 53.0, 21.0, 33.0, 16.0, 27.0, 12.0, 8.0, 9.0, 10.0, 8.0, 12.0, 8.0, 9.0, 2.0, 5.0, 6.0, 3.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125999450683594e-06, -4.957430064678192e-06, -4.7888606786727905e-06, -4.620291292667389e-06, -4.451721906661987e-06, -4.283152520656586e-06, -4.114583134651184e-06, -3.9460137486457825e-06, -3.777444362640381e-06, -3.6088749766349792e-06, -3.4403055906295776e-06, -3.271736204624176e-06, -3.1031668186187744e-06, -2.934597432613373e-06, -2.766028046607971e-06, -2.5974586606025696e-06, -2.428889274597168e-06, -2.2603198885917664e-06, -2.0917505025863647e-06, -1.923181116580963e-06, -1.7546117305755615e-06, -1.58604234457016e-06, -1.4174729585647583e-06, -1.2489035725593567e-06, -1.080334186553955e-06, -9.117648005485535e-07, -7.431954145431519e-07, -5.746260285377502e-07, -4.0605664253234863e-07, -2.3748725652694702e-07, -6.891787052154541e-08, 9.96515154838562e-08, 2.682209014892578e-07, 4.367902874946594e-07, 6.05359673500061e-07, 7.739290595054626e-07, 9.424984455108643e-07, 1.1110678315162659e-06, 1.2796372175216675e-06, 1.448206603527069e-06, 1.6167759895324707e-06, 1.7853453755378723e-06, 1.953914761543274e-06, 2.1224841475486755e-06, 2.291053533554077e-06, 2.4596229195594788e-06, 2.6281923055648804e-06, 2.796761691570282e-06, 2.9653310775756836e-06, 3.133900463581085e-06, 3.302469849586487e-06, 3.4710392355918884e-06, 3.63960862159729e-06, 3.8081780076026917e-06, 3.976747393608093e-06, 4.145316779613495e-06, 4.3138861656188965e-06, 4.482455551624298e-06, 4.6510249376297e-06, 4.819594323635101e-06, 4.988163709640503e-06, 5.1567330956459045e-06, 5.325302481651306e-06, 5.493871867656708e-06, 5.662441253662109e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 1.0, 7.0, 3.0, 5.0, 17.0, 10.0, 17.0, 30.0, 28.0, 64.0, 108.0, 230.0, 553.0, 1325.0, 3813.0, 13765.0, 73582.0, 856210.0, 78832.0, 13497.0, 3969.0, 1379.0, 558.0, 237.0, 110.0, 80.0, 19.0, 26.0, 20.0, 14.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.979703903198242e-05, -6.74314796924591e-05, -6.506592035293579e-05, -6.270036101341248e-05, -6.033480167388916e-05, -5.7969242334365845e-05, -5.560368299484253e-05, -5.3238123655319214e-05, -5.08725643157959e-05, -4.850700497627258e-05, -4.614144563674927e-05, -4.377588629722595e-05, -4.141032695770264e-05, -3.904476761817932e-05, -3.6679208278656006e-05, -3.431364893913269e-05, -3.1948089599609375e-05, -2.958253026008606e-05, -2.7216970920562744e-05, -2.485141158103943e-05, -2.2485852241516113e-05, -2.0120292901992798e-05, -1.7754733562469482e-05, -1.5389174222946167e-05, -1.3023614883422852e-05, -1.0658055543899536e-05, -8.29249620437622e-06, -5.926936864852905e-06, -3.56137752532959e-06, -1.1958181858062744e-06, 1.169741153717041e-06, 3.5353004932403564e-06, 5.900859832763672e-06, 8.266419172286987e-06, 1.0631978511810303e-05, 1.2997537851333618e-05, 1.5363097190856934e-05, 1.772865653038025e-05, 2.0094215869903564e-05, 2.245977520942688e-05, 2.4825334548950195e-05, 2.719089388847351e-05, 2.9556453227996826e-05, 3.192201256752014e-05, 3.428757190704346e-05, 3.665313124656677e-05, 3.901869058609009e-05, 4.13842499256134e-05, 4.374980926513672e-05, 4.6115368604660034e-05, 4.848092794418335e-05, 5.0846487283706665e-05, 5.321204662322998e-05, 5.5577605962753296e-05, 5.794316530227661e-05, 6.030872464179993e-05, 6.267428398132324e-05, 6.503984332084656e-05, 6.740540266036987e-05, 6.977096199989319e-05, 7.21365213394165e-05, 7.450208067893982e-05, 7.686764001846313e-05, 7.923319935798645e-05, 8.159875869750977e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 6.0, 8.0, 13.0, 11.0, 13.0, 18.0, 10.0, 33.0, 25.0, 56.0, 40.0, 94.0, 129.0, 138.0, 103.0, 51.0, 44.0, 47.0, 27.0, 15.0, 12.0, 11.0, 13.0, 11.0, 12.0, 11.0, 3.0, 8.0, 4.0, 4.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.331371307373047e-06, -7.117167115211487e-06, -6.902962923049927e-06, -6.688758730888367e-06, -6.474554538726807e-06, -6.260350346565247e-06, -6.0461461544036865e-06, -5.8319419622421265e-06, -5.617737770080566e-06, -5.403533577919006e-06, -5.189329385757446e-06, -4.975125193595886e-06, -4.760921001434326e-06, -4.546716809272766e-06, -4.332512617111206e-06, -4.118308424949646e-06, -3.904104232788086e-06, -3.689900040626526e-06, -3.475695848464966e-06, -3.2614916563034058e-06, -3.0472874641418457e-06, -2.8330832719802856e-06, -2.6188790798187256e-06, -2.4046748876571655e-06, -2.1904706954956055e-06, -1.9762665033340454e-06, -1.7620623111724854e-06, -1.5478581190109253e-06, -1.3336539268493652e-06, -1.1194497346878052e-06, -9.052455425262451e-07, -6.910413503646851e-07, -4.76837158203125e-07, -2.6263296604156494e-07, -4.842877388000488e-08, 1.6577541828155518e-07, 3.7997961044311523e-07, 5.941838026046753e-07, 8.083879947662354e-07, 1.0225921869277954e-06, 1.2367963790893555e-06, 1.4510005712509155e-06, 1.6652047634124756e-06, 1.8794089555740356e-06, 2.0936131477355957e-06, 2.3078173398971558e-06, 2.522021532058716e-06, 2.736225724220276e-06, 2.950429916381836e-06, 3.164634108543396e-06, 3.378838300704956e-06, 3.593042492866516e-06, 3.807246685028076e-06, 4.021450877189636e-06, 4.235655069351196e-06, 4.449859261512756e-06, 4.664063453674316e-06, 4.8782676458358765e-06, 5.0924718379974365e-06, 5.306676030158997e-06, 5.520880222320557e-06, 5.735084414482117e-06, 5.949288606643677e-06, 6.163492798805237e-06, 6.377696990966797e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 11.0, 9.0, 14.0, 14.0, 32.0, 46.0, 61.0, 96.0, 145.0, 189.0, 114.0, 68.0, 48.0, 34.0, 27.0, 27.0, 12.0, 10.0, 5.0, 4.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023227673955261707, -0.00022406867356039584, -0.00021586062212008983, -0.0002076525561278686, -0.00019944449013564736, -0.00019123643869534135, -0.0001830283727031201, -0.00017482030671089888, -0.00016661224071867764, -0.0001584041747264564, -0.0001501961232861504, -0.00014198805729392916, -0.00013377999130170792, -0.00012557193986140192, -0.00011736387386918068, -0.00010915580787695944, -0.00010094775643665344, -9.273969772038981e-05, -8.453163172816858e-05, -7.632357301190495e-05, -6.811550701968372e-05, -5.99074483034201e-05, -5.1699389587156475e-05, -4.3491327232914045e-05, -3.5283264878671616e-05, -2.7075202524429187e-05, -1.886714198917616e-05, -1.0659081453923136e-05, -2.451019099680707e-06, 5.757043254561722e-06, 1.3965101970825344e-05, 2.2173164325067773e-05, 3.0381226679310203e-05, 3.858928903355263e-05, 4.679735138779506e-05, 5.500541010405868e-05, 6.321347609627992e-05, 7.142153481254354e-05, 7.962959352880716e-05, 8.78376595210284e-05, 9.604571823729202e-05, 0.00010425377695355564, 0.00011246184294577688, 0.0001206699016620405, 0.00012887796037830412, 0.00013708602637052536, 0.0001452940923627466, 0.0001535021438030526, 0.00016171020979527384, 0.00016991827578749508, 0.00017812632722780108, 0.00018633439322002232, 0.00019454245921224356, 0.0002027505252044648, 0.0002109585766447708, 0.00021916664263699204, 0.00022737469407729805, 0.00023558276006951928, 0.0002437908115098253, 0.00025199889205396175, 0.00026020692894235253, 0.00026841499493457377, 0.000276623060926795, 0.00028483112691901624, 0.0002930391929112375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 2.0, 6.0, 2.0, 3.0, 9.0, 9.0, 13.0, 7.0, 14.0, 23.0, 16.0, 15.0, 17.0, 21.0, 25.0, 33.0, 34.0, 44.0, 29.0, 37.0, 39.0, 36.0, 50.0, 47.0, 48.0, 36.0, 30.0, 47.0, 37.0, 32.0, 37.0, 32.0, 37.0, 23.0, 22.0, 17.0, 18.0, 12.0, 7.0, 7.0, 11.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00012131590483477339, -0.00011742755305022001, -0.00011353920126566663, -0.00010965084948111326, -0.00010576249769655988, -0.0001018741459120065, -9.798580140341073e-05, -9.409744234289974e-05, -9.020909783430398e-05, -8.63207460497506e-05, -8.243239426519722e-05, -7.854404248064384e-05, -7.465569069609046e-05, -7.076733891153708e-05, -6.68789871269837e-05, -6.299064261838794e-05, -5.9102283557876945e-05, -5.5213931773323566e-05, -5.132557998877019e-05, -4.743722820421681e-05, -4.354887641966343e-05, -3.966052463511005e-05, -3.577217648853548e-05, -3.18838247039821e-05, -2.799547291942872e-05, -2.4107121134875342e-05, -2.0218769350321963e-05, -1.6330419384757988e-05, -1.244206760020461e-05, -8.55371581565123e-06, -4.665365850087255e-06, -7.770140655338764e-07, 3.1113304430618882e-06, 6.999681772867916e-06, 1.0888033102673944e-05, 1.4776383977732621e-05, 1.8664735762286e-05, 2.255308754683938e-05, 2.6441437512403354e-05, 3.0329789296956733e-05, 3.421814108151011e-05, 3.810649286606349e-05, 4.199484465061687e-05, 4.588319279719144e-05, 4.977154458174482e-05, 5.36598963662982e-05, 5.754824815085158e-05, 6.143659993540496e-05, 6.532495171995834e-05, 6.921330350451171e-05, 7.310165528906509e-05, 7.699000707361847e-05, 8.087835885817185e-05, 8.476671064272523e-05, 8.8655055151321e-05, 9.254341421183199e-05, 9.643175872042775e-05, 0.00010032011050498113, 0.00010420846228953451, 0.00010809681407408789, 0.00011198516585864127, 0.00011587351764319465, 0.00011976186942774802, 0.0001236502139363438, 0.00012753857299685478]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 5.0, 1.0, 2.0, 4.0, 17.0, 25.0, 30.0, 33.0, 46.0, 75.0, 99.0, 124.0, 206.0, 293.0, 426.0, 624.0, 884.0, 1293.0, 1912.0, 2841.0, 4221.0, 6440.0, 10033.0, 15246.0, 24231.0, 39621.0, 67819.0, 122404.0, 216082.0, 222209.0, 127275.0, 71062.0, 41583.0, 25135.0, 15733.0, 10215.0, 6713.0, 4470.0, 2973.0, 1991.0, 1291.0, 881.0, 636.0, 389.0, 311.0, 185.0, 130.0, 92.0, 70.0, 44.0, 38.0, 41.0, 25.0, 16.0, 7.0, 6.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.00025725364685058594, -0.000248689204454422, -0.00024012476205825806, -0.00023156031966209412, -0.00022299587726593018, -0.00021443143486976624, -0.0002058669924736023, -0.00019730255007743835, -0.00018873810768127441, -0.00018017366528511047, -0.00017160922288894653, -0.0001630447804927826, -0.00015448033809661865, -0.0001459158957004547, -0.00013735145330429077, -0.00012878701090812683, -0.00012022256851196289, -0.00011165812611579895, -0.00010309368371963501, -9.452924132347107e-05, -8.596479892730713e-05, -7.740035653114319e-05, -6.883591413497925e-05, -6.027147173881531e-05, -5.170702934265137e-05, -4.314258694648743e-05, -3.4578144550323486e-05, -2.6013702154159546e-05, -1.7449259757995605e-05, -8.884817361831665e-06, -3.203749656677246e-07, 8.244067430496216e-06, 1.6808509826660156e-05, 2.5372952222824097e-05, 3.393739461898804e-05, 4.250183701515198e-05, 5.106627941131592e-05, 5.963072180747986e-05, 6.81951642036438e-05, 7.675960659980774e-05, 8.532404899597168e-05, 9.388849139213562e-05, 0.00010245293378829956, 0.0001110173761844635, 0.00011958181858062744, 0.00012814626097679138, 0.00013671070337295532, 0.00014527514576911926, 0.0001538395881652832, 0.00016240403056144714, 0.00017096847295761108, 0.00017953291535377502, 0.00018809735774993896, 0.0001966618001461029, 0.00020522624254226685, 0.00021379068493843079, 0.00022235512733459473, 0.00023091956973075867, 0.0002394840121269226, 0.00024804845452308655, 0.0002566128969192505, 0.00026517733931541443, 0.00027374178171157837, 0.0002823062241077423, 0.00029087066650390625]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 10.0, 7.0, 9.0, 13.0, 13.0, 12.0, 18.0, 18.0, 20.0, 24.0, 23.0, 33.0, 37.0, 40.0, 41.0, 33.0, 34.0, 52.0, 47.0, 54.0, 47.0, 44.0, 49.0, 40.0, 35.0, 32.0, 37.0, 28.0, 29.0, 27.0, 17.0, 17.0, 15.0, 8.0, 7.0, 10.0, 2.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.00011223554611206055, -0.00010871794074773788, -0.00010520033538341522, -0.00010168273001909256, -9.81651246547699e-05, -9.464751929044724e-05, -9.112991392612457e-05, -8.761230856180191e-05, -8.409470319747925e-05, -8.057709783315659e-05, -7.705949246883392e-05, -7.354188710451126e-05, -7.00242817401886e-05, -6.650667637586594e-05, -6.298907101154327e-05, -5.947146564722061e-05, -5.595386028289795e-05, -5.243625491857529e-05, -4.8918649554252625e-05, -4.540104418992996e-05, -4.18834388256073e-05, -3.836583346128464e-05, -3.4848228096961975e-05, -3.133062273263931e-05, -2.781301736831665e-05, -2.4295412003993988e-05, -2.0777806639671326e-05, -1.7260201275348663e-05, -1.3742595911026001e-05, -1.0224990546703339e-05, -6.707385182380676e-06, -3.189779818058014e-06, 3.2782554626464844e-07, 3.845430910587311e-06, 7.363036274909973e-06, 1.0880641639232635e-05, 1.4398247003555298e-05, 1.791585236787796e-05, 2.1433457732200623e-05, 2.4951063096523285e-05, 2.8468668460845947e-05, 3.198627382516861e-05, 3.550387918949127e-05, 3.9021484553813934e-05, 4.25390899181366e-05, 4.605669528245926e-05, 4.957430064678192e-05, 5.3091906011104584e-05, 5.6609511375427246e-05, 6.012711673974991e-05, 6.364472210407257e-05, 6.716232746839523e-05, 7.06799328327179e-05, 7.419753819704056e-05, 7.771514356136322e-05, 8.123274892568588e-05, 8.475035429000854e-05, 8.826795965433121e-05, 9.178556501865387e-05, 9.530317038297653e-05, 9.88207757472992e-05, 0.00010233838111162186, 0.00010585598647594452, 0.00010937359184026718, 0.00011289119720458984]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 7.0, 1.0, 2.0, 2.0, 5.0, 2.0, 11.0, 12.0, 24.0, 41.0, 69.0, 93.0, 146.0, 260.0, 395.0, 720.0, 1301.0, 2376.0, 4107.0, 7623.0, 14323.0, 27758.0, 58083.0, 135460.0, 343191.0, 260325.0, 99711.0, 44647.0, 22214.0, 11572.0, 6230.0, 3277.0, 1960.0, 1082.0, 620.0, 356.0, 215.0, 125.0, 77.0, 58.0, 31.0, 20.0, 10.0, 6.0, 8.0, 3.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003199577331542969, -0.00030886009335517883, -0.0002977624535560608, -0.00028666481375694275, -0.0002755671739578247, -0.00026446953415870667, -0.0002533718943595886, -0.00024227425456047058, -0.00023117661476135254, -0.0002200789749622345, -0.00020898133516311646, -0.0001978836953639984, -0.00018678605556488037, -0.00017568841576576233, -0.0001645907759666443, -0.00015349313616752625, -0.0001423954963684082, -0.00013129785656929016, -0.00012020021677017212, -0.00010910257697105408, -9.800493717193604e-05, -8.690729737281799e-05, -7.580965757369995e-05, -6.471201777458191e-05, -5.361437797546387e-05, -4.2516738176345825e-05, -3.141909837722778e-05, -2.032145857810974e-05, -9.2238187789917e-06, 1.8738210201263428e-06, 1.2971460819244385e-05, 2.4069100618362427e-05, 3.516674041748047e-05, 4.626438021659851e-05, 5.736202001571655e-05, 6.84596598148346e-05, 7.955729961395264e-05, 9.065493941307068e-05, 0.00010175257921218872, 0.00011285021901130676, 0.0001239478588104248, 0.00013504549860954285, 0.0001461431384086609, 0.00015724077820777893, 0.00016833841800689697, 0.00017943605780601501, 0.00019053369760513306, 0.0002016313374042511, 0.00021272897720336914, 0.00022382661700248718, 0.00023492425680160522, 0.00024602189660072327, 0.0002571195363998413, 0.00026821717619895935, 0.0002793148159980774, 0.00029041245579719543, 0.0003015100955963135, 0.0003126077353954315, 0.00032370537519454956, 0.0003348030149936676, 0.00034590065479278564, 0.0003569982945919037, 0.00036809593439102173, 0.00037919357419013977, 0.0003902912139892578]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 5.0, 3.0, 9.0, 7.0, 15.0, 9.0, 19.0, 17.0, 28.0, 21.0, 23.0, 26.0, 32.0, 31.0, 34.0, 39.0, 50.0, 46.0, 42.0, 41.0, 50.0, 53.0, 38.0, 46.0, 31.0, 41.0, 28.0, 33.0, 26.0, 22.0, 19.0, 20.0, 12.0, 19.0, 18.0, 9.0, 15.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.924173355102539e-05, -9.632576256990433e-05, -9.340979158878326e-05, -9.04938206076622e-05, -8.757784962654114e-05, -8.466187864542007e-05, -8.174590766429901e-05, -7.882993668317795e-05, -7.591396570205688e-05, -7.299799472093582e-05, -7.008202373981476e-05, -6.71660527586937e-05, -6.425008177757263e-05, -6.133411079645157e-05, -5.8418139815330505e-05, -5.550216883420944e-05, -5.258619785308838e-05, -4.9670226871967316e-05, -4.675425589084625e-05, -4.383828490972519e-05, -4.0922313928604126e-05, -3.800634294748306e-05, -3.5090371966362e-05, -3.2174400985240936e-05, -2.9258430004119873e-05, -2.634245902299881e-05, -2.3426488041877747e-05, -2.0510517060756683e-05, -1.759454607963562e-05, -1.4678575098514557e-05, -1.1762604117393494e-05, -8.84663313627243e-06, -5.930662155151367e-06, -3.014691174030304e-06, -9.872019290924072e-08, 2.8172507882118225e-06, 5.733221769332886e-06, 8.649192750453949e-06, 1.1565163731575012e-05, 1.4481134712696075e-05, 1.739710569381714e-05, 2.0313076674938202e-05, 2.3229047656059265e-05, 2.614501863718033e-05, 2.906098961830139e-05, 3.1976960599422455e-05, 3.489293158054352e-05, 3.780890256166458e-05, 4.0724873542785645e-05, 4.364084452390671e-05, 4.655681550502777e-05, 4.9472786486148834e-05, 5.23887574672699e-05, 5.530472844839096e-05, 5.8220699429512024e-05, 6.113667041063309e-05, 6.405264139175415e-05, 6.696861237287521e-05, 6.988458335399628e-05, 7.280055433511734e-05, 7.57165253162384e-05, 7.863249629735947e-05, 8.154846727848053e-05, 8.446443825960159e-05, 8.738040924072266e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 10.0, 20.0, 25.0, 35.0, 53.0, 81.0, 109.0, 232.0, 493.0, 1011.0, 2440.0, 6836.0, 23129.0, 127008.0, 725337.0, 117561.0, 30384.0, 8336.0, 2902.0, 1251.0, 569.0, 285.0, 164.0, 89.0, 53.0, 47.0, 22.0, 21.0, 11.0, 9.0, 8.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0371208190917969e-05, -1.0079704225063324e-05, -9.78820025920868e-06, -9.496696293354034e-06, -9.20519232749939e-06, -8.913688361644745e-06, -8.6221843957901e-06, -8.330680429935455e-06, -8.03917646408081e-06, -7.747672498226166e-06, -7.456168532371521e-06, -7.164664566516876e-06, -6.8731606006622314e-06, -6.581656634807587e-06, -6.290152668952942e-06, -5.998648703098297e-06, -5.707144737243652e-06, -5.4156407713890076e-06, -5.124136805534363e-06, -4.832632839679718e-06, -4.541128873825073e-06, -4.2496249079704285e-06, -3.958120942115784e-06, -3.666616976261139e-06, -3.375113010406494e-06, -3.0836090445518494e-06, -2.7921050786972046e-06, -2.50060111284256e-06, -2.209097146987915e-06, -1.9175931811332703e-06, -1.6260892152786255e-06, -1.3345852494239807e-06, -1.043081283569336e-06, -7.515773177146912e-07, -4.600733518600464e-07, -1.685693860054016e-07, 1.2293457984924316e-07, 4.1443854570388794e-07, 7.059425115585327e-07, 9.974464774131775e-07, 1.2889504432678223e-06, 1.580454409122467e-06, 1.8719583749771118e-06, 2.1634623408317566e-06, 2.4549663066864014e-06, 2.746470272541046e-06, 3.037974238395691e-06, 3.3294782042503357e-06, 3.6209821701049805e-06, 3.912486135959625e-06, 4.20399010181427e-06, 4.495494067668915e-06, 4.7869980335235596e-06, 5.078501999378204e-06, 5.370005965232849e-06, 5.661509931087494e-06, 5.953013896942139e-06, 6.2445178627967834e-06, 6.536021828651428e-06, 6.827525794506073e-06, 7.119029760360718e-06, 7.4105337262153625e-06, 7.702037692070007e-06, 7.993541657924652e-06, 8.285045623779297e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 6.0, 0.0, 11.0, 11.0, 0.0, 19.0, 0.0, 39.0, 59.0, 0.0, 84.0, 162.0, 0.0, 186.0, 170.0, 0.0, 128.0, 62.0, 0.0, 25.0, 0.0, 18.0, 8.0, 0.0, 11.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.366761565208435e-07, -6.984919309616089e-07, -6.603077054023743e-07, -6.221234798431396e-07, -5.83939254283905e-07, -5.457550287246704e-07, -5.075708031654358e-07, -4.6938657760620117e-07, -4.3120235204696655e-07, -3.9301812648773193e-07, -3.548339009284973e-07, -3.166496753692627e-07, -2.784654498100281e-07, -2.4028122425079346e-07, -2.0209699869155884e-07, -1.6391277313232422e-07, -1.257285475730896e-07, -8.754432201385498e-08, -4.936009645462036e-08, -1.1175870895385742e-08, 2.7008354663848877e-08, 6.51925802230835e-08, 1.0337680578231812e-07, 1.4156103134155273e-07, 1.7974525690078735e-07, 2.1792948246002197e-07, 2.561137080192566e-07, 2.942979335784912e-07, 3.3248215913772583e-07, 3.7066638469696045e-07, 4.0885061025619507e-07, 4.470348358154297e-07, 4.852190613746643e-07, 5.234032869338989e-07, 5.615875124931335e-07, 5.997717380523682e-07, 6.379559636116028e-07, 6.761401891708374e-07, 7.14324414730072e-07, 7.525086402893066e-07, 7.906928658485413e-07, 8.288770914077759e-07, 8.670613169670105e-07, 9.052455425262451e-07, 9.434297680854797e-07, 9.816139936447144e-07, 1.019798219203949e-06, 1.0579824447631836e-06, 1.0961666703224182e-06, 1.1343508958816528e-06, 1.1725351214408875e-06, 1.210719347000122e-06, 1.2489035725593567e-06, 1.2870877981185913e-06, 1.325272023677826e-06, 1.3634562492370605e-06, 1.4016404747962952e-06, 1.4398247003555298e-06, 1.4780089259147644e-06, 1.516193151473999e-06, 1.5543773770332336e-06, 1.5925616025924683e-06, 1.6307458281517029e-06, 1.6689300537109375e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 10.0, 8.0, 14.0, 15.0, 30.0, 48.0, 54.0, 83.0, 117.0, 187.0, 283.0, 650.0, 1218.0, 2572.0, 6788.0, 23150.0, 112054.0, 667140.0, 186085.0, 32537.0, 9261.0, 3173.0, 1551.0, 582.0, 319.0, 212.0, 121.0, 90.0, 77.0, 43.0, 29.0, 21.0, 12.0, 4.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.735324859619141e-06, -6.491318345069885e-06, -6.24731183052063e-06, -6.0033053159713745e-06, -5.759298801422119e-06, -5.515292286872864e-06, -5.271285772323608e-06, -5.027279257774353e-06, -4.783272743225098e-06, -4.539266228675842e-06, -4.295259714126587e-06, -4.0512531995773315e-06, -3.807246685028076e-06, -3.563240170478821e-06, -3.3192336559295654e-06, -3.07522714138031e-06, -2.8312206268310547e-06, -2.5872141122817993e-06, -2.343207597732544e-06, -2.0992010831832886e-06, -1.8551945686340332e-06, -1.6111880540847778e-06, -1.3671815395355225e-06, -1.123175024986267e-06, -8.791685104370117e-07, -6.351619958877563e-07, -3.91155481338501e-07, -1.471489667892456e-07, 9.685754776000977e-08, 3.4086406230926514e-07, 5.848705768585205e-07, 8.288770914077759e-07, 1.0728836059570312e-06, 1.3168901205062866e-06, 1.560896635055542e-06, 1.8049031496047974e-06, 2.0489096641540527e-06, 2.292916178703308e-06, 2.5369226932525635e-06, 2.780929207801819e-06, 3.0249357223510742e-06, 3.2689422369003296e-06, 3.512948751449585e-06, 3.7569552659988403e-06, 4.000961780548096e-06, 4.244968295097351e-06, 4.4889748096466064e-06, 4.732981324195862e-06, 4.976987838745117e-06, 5.2209943532943726e-06, 5.465000867843628e-06, 5.709007382392883e-06, 5.953013896942139e-06, 6.197020411491394e-06, 6.441026926040649e-06, 6.685033440589905e-06, 6.92903995513916e-06, 7.1730464696884155e-06, 7.417052984237671e-06, 7.661059498786926e-06, 7.905066013336182e-06, 8.149072527885437e-06, 8.393079042434692e-06, 8.637085556983948e-06, 8.881092071533203e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 11.0, 9.0, 8.0, 14.0, 65.0, 50.0, 84.0, 104.0, 95.0, 116.0, 102.0, 95.0, 76.0, 53.0, 28.0, 33.0, 23.0, 9.0, 11.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.3245811462402344e-06, -2.263113856315613e-06, -2.201646566390991e-06, -2.1401792764663696e-06, -2.078711986541748e-06, -2.0172446966171265e-06, -1.955777406692505e-06, -1.8943101167678833e-06, -1.8328428268432617e-06, -1.7713755369186401e-06, -1.7099082469940186e-06, -1.648440957069397e-06, -1.5869736671447754e-06, -1.5255063772201538e-06, -1.4640390872955322e-06, -1.4025717973709106e-06, -1.341104507446289e-06, -1.2796372175216675e-06, -1.218169927597046e-06, -1.1567026376724243e-06, -1.0952353477478027e-06, -1.0337680578231812e-06, -9.723007678985596e-07, -9.10833477973938e-07, -8.493661880493164e-07, -7.878988981246948e-07, -7.264316082000732e-07, -6.649643182754517e-07, -6.034970283508301e-07, -5.420297384262085e-07, -4.805624485015869e-07, -4.1909515857696533e-07, -3.5762786865234375e-07, -2.9616057872772217e-07, -2.3469328880310059e-07, -1.73225998878479e-07, -1.1175870895385742e-07, -5.029141902923584e-08, 1.1175870895385742e-08, 7.264316082000732e-08, 1.341104507446289e-07, 1.955777406692505e-07, 2.5704503059387207e-07, 3.1851232051849365e-07, 3.7997961044311523e-07, 4.414469003677368e-07, 5.029141902923584e-07, 5.6438148021698e-07, 6.258487701416016e-07, 6.873160600662231e-07, 7.487833499908447e-07, 8.102506399154663e-07, 8.717179298400879e-07, 9.331852197647095e-07, 9.94652509689331e-07, 1.0561197996139526e-06, 1.1175870895385742e-06, 1.1790543794631958e-06, 1.2405216693878174e-06, 1.301988959312439e-06, 1.3634562492370605e-06, 1.4249235391616821e-06, 1.4863908290863037e-06, 1.5478581190109253e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 6.0, 5.0, 12.0, 13.0, 20.0, 24.0, 37.0, 53.0, 102.0, 140.0, 169.0, 150.0, 75.0, 59.0, 35.0, 28.0, 19.0, 15.0, 11.0, 9.0, 3.0, 4.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002981526486109942, -0.00029079453088343143, -0.0002834364422596991, -0.0002760783245321363, -0.00026872020680457354, -0.00026136208907701075, -0.0002540040004532784, -0.00024664588272571564, -0.00023928776499815285, -0.0002319296618225053, -0.0002245715440949425, -0.00021721344091929495, -0.00020985532319173217, -0.0002024972200160846, -0.00019513911684043705, -0.00018778099911287427, -0.0001804228959372267, -0.00017306479276157916, -0.00016570667503401637, -0.00015834857185836881, -0.00015099045413080603, -0.00014363235095515847, -0.0001362742332275957, -0.00012891613005194813, -0.00012155801960034296, -0.00011419990914873779, -0.00010684179869713262, -9.948368824552745e-05, -9.212558506987989e-05, -8.47674673423171e-05, -7.740936416666955e-05, -7.005125371506438e-05, -6.269312871154398e-05, -5.5335018259938806e-05, -4.7976907808333635e-05, -4.061880099470727e-05, -3.32606905431021e-05, -2.590258009149693e-05, -1.8544473277870566e-05, -1.1186362826265395e-05, -3.828252374660224e-06, 3.5298571674502455e-06, 1.0887966709560715e-05, 1.8246075342176482e-05, 2.5604185793781653e-05, 3.2962296245386824e-05, 4.032040305901319e-05, 4.767851351061836e-05, 5.503662396222353e-05, 6.23947344138287e-05, 6.975284486543387e-05, 7.711094804108143e-05, 8.446906576864421e-05, 9.182716894429177e-05, 9.918527939589694e-05, 0.00010654338984750211, 0.00011390150029910728, 0.00012125961075071245, 0.00012861771392636, 0.0001359758316539228, 0.00014333393482957035, 0.00015069205255713314, 0.0001580501557327807, 0.00016540827346034348, 0.00017276637663599104]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 10.0, 10.0, 10.0, 8.0, 9.0, 10.0, 14.0, 16.0, 16.0, 25.0, 32.0, 24.0, 22.0, 40.0, 34.0, 27.0, 45.0, 34.0, 32.0, 37.0, 51.0, 37.0, 36.0, 41.0, 32.0, 31.0, 38.0, 26.0, 30.0, 20.0, 31.0, 29.0, 20.0, 15.0, 15.0, 16.0, 10.0, 10.0, 13.0, 9.0, 3.0, 9.0, 5.0, 2.0, 3.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.876726835500449e-05, -9.56244402914308e-05, -9.248161222785711e-05, -8.933878416428342e-05, -8.619595610070974e-05, -8.305313531309366e-05, -7.991029997356236e-05, -7.676747918594629e-05, -7.36246511223726e-05, -7.048182305879891e-05, -6.733899499522522e-05, -6.419616693165153e-05, -6.105333886807784e-05, -5.791051444248296e-05, -5.4767686378909275e-05, -5.1624861953314394e-05, -4.84820302517619e-05, -4.533920218818821e-05, -4.219637412461452e-05, -3.905354969901964e-05, -3.591072163544595e-05, -3.2767893571872264e-05, -2.9625065508298576e-05, -2.648223926371429e-05, -2.3339411200140603e-05, -2.0196583136566915e-05, -1.705375689198263e-05, -1.3910928828408942e-05, -1.0768101674329955e-05, -7.625274520250969e-06, -4.48244645667728e-06, -1.3396202120929956e-06, 1.8032078514806926e-06, 4.946035005559679e-06, 8.088862159638666e-06, 1.1231690223212354e-05, 1.437451737729134e-05, 1.7517344531370327e-05, 2.0660172594944015e-05, 2.38029988395283e-05, 2.6945826903101988e-05, 3.0088654966675676e-05, 3.323148121125996e-05, 3.637430927483365e-05, 3.951713733840734e-05, 4.2659965401981026e-05, 4.5802793465554714e-05, 4.8945617891149595e-05, 5.2088445954723284e-05, 5.523127401829697e-05, 5.837410208187066e-05, 6.151692650746554e-05, 6.465975457103923e-05, 6.780258263461292e-05, 7.09454106981866e-05, 7.40882387617603e-05, 7.723106682533398e-05, 8.037389488890767e-05, 8.351672295248136e-05, 8.665955101605505e-05, 8.980237907962874e-05, 9.294520714320242e-05, 9.60880279308185e-05, 9.923085599439219e-05, 0.00010237368405796587]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 17.0, 21.0, 23.0, 38.0, 53.0, 58.0, 98.0, 136.0, 184.0, 268.0, 377.0, 514.0, 749.0, 1040.0, 1602.0, 2403.0, 3597.0, 6212.0, 10842.0, 21701.0, 119533.0, 3937847.0, 46171.0, 16372.0, 8745.0, 5251.0, 3251.0, 2153.0, 1443.0, 1024.0, 687.0, 526.0, 391.0, 245.0, 205.0, 138.0, 86.0, 72.0, 48.0, 54.0, 32.0, 19.0, 15.0, 12.0, 10.0, 2.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00032138824462890625, -0.000311143696308136, -0.0003008991479873657, -0.00029065459966659546, -0.0002804100513458252, -0.00027016550302505493, -0.00025992095470428467, -0.0002496764063835144, -0.00023943185806274414, -0.00022918730974197388, -0.0002189427614212036, -0.00020869821310043335, -0.00019845366477966309, -0.00018820911645889282, -0.00017796456813812256, -0.0001677200198173523, -0.00015747547149658203, -0.00014723092317581177, -0.0001369863748550415, -0.00012674182653427124, -0.00011649727821350098, -0.00010625272989273071, -9.600818157196045e-05, -8.576363325119019e-05, -7.551908493041992e-05, -6.527453660964966e-05, -5.5029988288879395e-05, -4.478543996810913e-05, -3.454089164733887e-05, -2.4296343326568604e-05, -1.405179500579834e-05, -3.807246685028076e-06, 6.4373016357421875e-06, 1.668184995651245e-05, 2.6926398277282715e-05, 3.717094659805298e-05, 4.741549491882324e-05, 5.7660043239593506e-05, 6.790459156036377e-05, 7.814913988113403e-05, 8.83936882019043e-05, 9.863823652267456e-05, 0.00010888278484344482, 0.00011912733316421509, 0.00012937188148498535, 0.00013961642980575562, 0.00014986097812652588, 0.00016010552644729614, 0.0001703500747680664, 0.00018059462308883667, 0.00019083917140960693, 0.0002010837197303772, 0.00021132826805114746, 0.00022157281637191772, 0.000231817364692688, 0.00024206191301345825, 0.0002523064613342285, 0.0002625510096549988, 0.00027279555797576904, 0.0002830401062965393, 0.00029328465461730957, 0.00030352920293807983, 0.0003137737512588501, 0.00032401829957962036, 0.0003342628479003906]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 4.0, 9.0, 6.0, 12.0, 13.0, 12.0, 14.0, 15.0, 23.0, 28.0, 23.0, 23.0, 28.0, 36.0, 42.0, 40.0, 54.0, 35.0, 41.0, 34.0, 56.0, 41.0, 44.0, 29.0, 42.0, 26.0, 31.0, 27.0, 27.0, 28.0, 22.0, 17.0, 16.0, 23.0, 8.0, 12.0, 8.0, 8.0, 12.0, 8.0, 5.0, 4.0, 2.0, 7.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.091594696044922e-05, -5.8955512940883636e-05, -5.6995078921318054e-05, -5.503464490175247e-05, -5.307421088218689e-05, -5.111377686262131e-05, -4.9153342843055725e-05, -4.719290882349014e-05, -4.523247480392456e-05, -4.327204078435898e-05, -4.1311606764793396e-05, -3.9351172745227814e-05, -3.739073872566223e-05, -3.543030470609665e-05, -3.346987068653107e-05, -3.1509436666965485e-05, -2.9549002647399902e-05, -2.758856862783432e-05, -2.5628134608268738e-05, -2.3667700588703156e-05, -2.1707266569137573e-05, -1.974683254957199e-05, -1.778639853000641e-05, -1.5825964510440826e-05, -1.3865530490875244e-05, -1.1905096471309662e-05, -9.94466245174408e-06, -7.984228432178497e-06, -6.023794412612915e-06, -4.063360393047333e-06, -2.1029263734817505e-06, -1.424923539161682e-07, 1.817941665649414e-06, 3.7783756852149963e-06, 5.738809704780579e-06, 7.699243724346161e-06, 9.659677743911743e-06, 1.1620111763477325e-05, 1.3580545783042908e-05, 1.554097980260849e-05, 1.7501413822174072e-05, 1.9461847841739655e-05, 2.1422281861305237e-05, 2.338271588087082e-05, 2.53431499004364e-05, 2.7303583920001984e-05, 2.9264017939567566e-05, 3.122445195913315e-05, 3.318488597869873e-05, 3.514531999826431e-05, 3.7105754017829895e-05, 3.906618803739548e-05, 4.102662205696106e-05, 4.298705607652664e-05, 4.4947490096092224e-05, 4.6907924115657806e-05, 4.886835813522339e-05, 5.082879215478897e-05, 5.278922617435455e-05, 5.4749660193920135e-05, 5.671009421348572e-05, 5.86705282330513e-05, 6.063096225261688e-05, 6.259139627218246e-05, 6.455183029174805e-05]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 3.0, 9.0, 8.0, 16.0, 22.0, 24.0, 33.0, 98.0, 148.0, 320.0, 628.0, 1560.0, 4300.0, 14115.0, 91505.0, 4016623.0, 48817.0, 10392.0, 3291.0, 1253.0, 522.0, 266.0, 121.0, 83.0, 40.0, 19.0, 16.0, 16.0, 10.0, 5.0, 3.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006003379821777344, -0.0005828738212585449, -0.0005654096603393555, -0.000547945499420166, -0.0005304813385009766, -0.0005130171775817871, -0.0004955530166625977, -0.0004780888557434082, -0.00046062469482421875, -0.0004431605339050293, -0.00042569637298583984, -0.0004082322120666504, -0.00039076805114746094, -0.0003733038902282715, -0.00035583972930908203, -0.0003383755683898926, -0.0003209114074707031, -0.00030344724655151367, -0.0002859830856323242, -0.00026851892471313477, -0.0002510547637939453, -0.00023359060287475586, -0.0002161264419555664, -0.00019866228103637695, -0.0001811981201171875, -0.00016373395919799805, -0.0001462697982788086, -0.00012880563735961914, -0.00011134147644042969, -9.387731552124023e-05, -7.641315460205078e-05, -5.894899368286133e-05, -4.1484832763671875e-05, -2.4020671844482422e-05, -6.556510925292969e-06, 1.0907649993896484e-05, 2.8371810913085938e-05, 4.583597183227539e-05, 6.330013275146484e-05, 8.07642936706543e-05, 9.822845458984375e-05, 0.0001156926155090332, 0.00013315677642822266, 0.0001506209373474121, 0.00016808509826660156, 0.00018554925918579102, 0.00020301342010498047, 0.00022047758102416992, 0.00023794174194335938, 0.00025540590286254883, 0.0002728700637817383, 0.00029033422470092773, 0.0003077983856201172, 0.00032526254653930664, 0.0003427267074584961, 0.00036019086837768555, 0.000377655029296875, 0.00039511919021606445, 0.0004125833511352539, 0.00043004751205444336, 0.0004475116729736328, 0.00046497583389282227, 0.0004824399948120117, 0.0004999041557312012, 0.0005173683166503906]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 7.0, 8.0, 4.0, 14.0, 13.0, 18.0, 37.0, 50.0, 113.0, 426.0, 2683.0, 404.0, 110.0, 47.0, 31.0, 17.0, 14.0, 12.0, 8.0, 7.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.869699478149414e-05, -4.6620145440101624e-05, -4.4543296098709106e-05, -4.246644675731659e-05, -4.038959741592407e-05, -3.8312748074531555e-05, -3.623589873313904e-05, -3.415904939174652e-05, -3.2082200050354004e-05, -3.0005350708961487e-05, -2.792850136756897e-05, -2.5851652026176453e-05, -2.3774802684783936e-05, -2.169795334339142e-05, -1.96211040019989e-05, -1.7544254660606384e-05, -1.5467405319213867e-05, -1.339055597782135e-05, -1.1313706636428833e-05, -9.236857295036316e-06, -7.160007953643799e-06, -5.083158612251282e-06, -3.0063092708587646e-06, -9.294599294662476e-07, 1.1473894119262695e-06, 3.2242387533187866e-06, 5.301088094711304e-06, 7.377937436103821e-06, 9.454786777496338e-06, 1.1531636118888855e-05, 1.3608485460281372e-05, 1.568533480167389e-05, 1.7762184143066406e-05, 1.9839033484458923e-05, 2.191588282585144e-05, 2.3992732167243958e-05, 2.6069581508636475e-05, 2.8146430850028992e-05, 3.022328019142151e-05, 3.2300129532814026e-05, 3.437697887420654e-05, 3.645382821559906e-05, 3.853067755699158e-05, 4.0607526898384094e-05, 4.268437623977661e-05, 4.476122558116913e-05, 4.6838074922561646e-05, 4.891492426395416e-05, 5.099177360534668e-05, 5.30686229467392e-05, 5.5145472288131714e-05, 5.722232162952423e-05, 5.929917097091675e-05, 6.137602031230927e-05, 6.345286965370178e-05, 6.55297189950943e-05, 6.760656833648682e-05, 6.968341767787933e-05, 7.176026701927185e-05, 7.383711636066437e-05, 7.591396570205688e-05, 7.79908150434494e-05, 8.006766438484192e-05, 8.214451372623444e-05, 8.422136306762695e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 3.0, 13.0, 10.0, 13.0, 15.0, 26.0, 38.0, 59.0, 92.0, 127.0, 198.0, 126.0, 84.0, 62.0, 31.0, 31.0, 17.0, 13.0, 11.0, 8.0, 11.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00022246180742513388, -0.00021735552581958473, -0.0002122492587659508, -0.00020714297716040164, -0.00020203671010676771, -0.00019693042850121856, -0.00019182416144758463, -0.00018671787984203547, -0.00018161159823648632, -0.00017650531663093716, -0.00017139904957730323, -0.00016629276797175407, -0.00016118650091812015, -0.000156080219312571, -0.00015097393770702183, -0.0001458676706533879, -0.00014076140359975398, -0.00013565512199420482, -0.0001305488549405709, -0.00012544257333502173, -0.0001203363062813878, -0.00011523002467583865, -0.00011012375034624711, -0.00010501747601665556, -9.991120168706402e-05, -9.480492735747248e-05, -8.969865302788094e-05, -8.45923786982894e-05, -7.948609709274024e-05, -7.437983003910631e-05, -6.927354843355715e-05, -6.416727410396561e-05, -5.906100705033168e-05, -5.395473272074014e-05, -4.88484583911486e-05, -4.374218042357825e-05, -3.8635906093986705e-05, -3.352963176439516e-05, -2.8423353796824813e-05, -2.331707946723327e-05, -1.8210805137641728e-05, -1.3104529898555484e-05, -7.99825465946924e-06, -2.8919785108882934e-06, 2.214295818703249e-06, 7.320570148294792e-06, 1.2426848115865141e-05, 1.7533122445456684e-05, 2.2639396775048226e-05, 2.774567110463977e-05, 3.285194543423131e-05, 3.795822340180166e-05, 4.30644977313932e-05, 4.8170772060984746e-05, 5.3277050028555095e-05, 5.838332435814664e-05, 6.348959868773818e-05, 6.859587301732972e-05, 7.370214734692127e-05, 7.880842895247042e-05, 8.391469600610435e-05, 8.90209776116535e-05, 9.412725194124505e-05, 9.923352627083659e-05, 0.00010433980060042813]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 6.0, 5.0, 4.0, 7.0, 7.0, 12.0, 5.0, 10.0, 11.0, 18.0, 15.0, 21.0, 18.0, 24.0, 21.0, 31.0, 35.0, 26.0, 33.0, 41.0, 25.0, 32.0, 30.0, 29.0, 44.0, 42.0, 26.0, 36.0, 21.0, 28.0, 28.0, 33.0, 29.0, 26.0, 25.0, 32.0, 25.0, 21.0, 19.0, 11.0, 18.0, 22.0, 11.0, 3.0, 12.0, 5.0, 6.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0], "bins": [-6.571735139004886e-05, -6.366681918734685e-05, -6.161628698464483e-05, -5.956575114396401e-05, -5.7515215303283185e-05, -5.546468310058117e-05, -5.3414150897879153e-05, -5.136361505719833e-05, -4.931307921651751e-05, -4.726254701381549e-05, -4.521201117313467e-05, -4.3161478970432654e-05, -4.111094312975183e-05, -3.9060410927049816e-05, -3.70098787243478e-05, -3.495934288366698e-05, -3.290881068096496e-05, -3.0858278478262946e-05, -2.8807742637582123e-05, -2.6757210434880108e-05, -2.4706674594199285e-05, -2.265614239149727e-05, -2.060560836980585e-05, -1.855507434811443e-05, -1.6504540326423012e-05, -1.4454006304731593e-05, -1.2403472283040173e-05, -1.0352939170843456e-05, -8.302405149152037e-06, -6.2518711274606176e-06, -4.2013380152639e-06, -2.150803993572481e-06, -1.0026997188106179e-07, 1.950263822436682e-06, 4.000797616754426e-06, 6.051331183698494e-06, 8.101865205389913e-06, 1.0152399227081332e-05, 1.220293233927805e-05, 1.4253466360969469e-05, 1.6304000382660888e-05, 1.8354534404352307e-05, 2.0405068426043727e-05, 2.2455602447735146e-05, 2.450613465043716e-05, 2.6556670491117984e-05, 2.860720269382e-05, 3.0657734896522015e-05, 3.270827073720284e-05, 3.4758802939904854e-05, 3.6809338780585676e-05, 3.885987098328769e-05, 4.0910406823968515e-05, 4.296093902667053e-05, 4.501147486735135e-05, 4.706200707005337e-05, 4.9112539272755384e-05, 5.11630714754574e-05, 5.321360731613822e-05, 5.526413951884024e-05, 5.731467535952106e-05, 5.936520756222308e-05, 6.141573976492509e-05, 6.346627196762711e-05, 6.551681144628674e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 9.0, 7.0, 15.0, 25.0, 36.0, 56.0, 81.0, 108.0, 163.0, 204.0, 304.0, 415.0, 601.0, 820.0, 1241.0, 1780.0, 2587.0, 3972.0, 6433.0, 11114.0, 20227.0, 39009.0, 84193.0, 214545.0, 379925.0, 147544.0, 63031.0, 29594.0, 15677.0, 8948.0, 5335.0, 3516.0, 2189.0, 1429.0, 1003.0, 712.0, 489.0, 357.0, 243.0, 184.0, 130.0, 100.0, 66.0, 55.0, 28.0, 17.0, 22.0, 6.0, 6.0, 4.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00010126829147338867, -9.792670607566833e-05, -9.4585120677948e-05, -9.124353528022766e-05, -8.790194988250732e-05, -8.456036448478699e-05, -8.121877908706665e-05, -7.787719368934631e-05, -7.453560829162598e-05, -7.119402289390564e-05, -6.78524374961853e-05, -6.451085209846497e-05, -6.116926670074463e-05, -5.782768130302429e-05, -5.4486095905303955e-05, -5.114451050758362e-05, -4.780292510986328e-05, -4.4461339712142944e-05, -4.111975431442261e-05, -3.777816891670227e-05, -3.4436583518981934e-05, -3.10949981212616e-05, -2.775341272354126e-05, -2.4411827325820923e-05, -2.1070241928100586e-05, -1.772865653038025e-05, -1.4387071132659912e-05, -1.1045485734939575e-05, -7.703900337219238e-06, -4.362314939498901e-06, -1.0207295417785645e-06, 2.3208558559417725e-06, 5.662441253662109e-06, 9.004026651382446e-06, 1.2345612049102783e-05, 1.568719744682312e-05, 1.9028782844543457e-05, 2.2370368242263794e-05, 2.571195363998413e-05, 2.9053539037704468e-05, 3.2395124435424805e-05, 3.573670983314514e-05, 3.907829523086548e-05, 4.2419880628585815e-05, 4.576146602630615e-05, 4.910305142402649e-05, 5.2444636821746826e-05, 5.578622221946716e-05, 5.91278076171875e-05, 6.246939301490784e-05, 6.581097841262817e-05, 6.915256381034851e-05, 7.249414920806885e-05, 7.583573460578918e-05, 7.917732000350952e-05, 8.251890540122986e-05, 8.58604907989502e-05, 8.920207619667053e-05, 9.254366159439087e-05, 9.58852469921112e-05, 9.922683238983154e-05, 0.00010256841778755188, 0.00010591000318527222, 0.00010925158858299255, 0.00011259317398071289]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 8.0, 9.0, 7.0, 7.0, 14.0, 17.0, 20.0, 19.0, 17.0, 16.0, 26.0, 25.0, 32.0, 21.0, 29.0, 29.0, 37.0, 36.0, 28.0, 36.0, 34.0, 39.0, 46.0, 40.0, 26.0, 27.0, 26.0, 40.0, 31.0, 26.0, 23.0, 26.0, 22.0, 30.0, 15.0, 14.0, 15.0, 10.0, 11.0, 11.0, 10.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-6.431341171264648e-05, -6.226636469364166e-05, -6.021931767463684e-05, -5.817227065563202e-05, -5.61252236366272e-05, -5.4078176617622375e-05, -5.2031129598617554e-05, -4.998408257961273e-05, -4.793703556060791e-05, -4.588998854160309e-05, -4.3842941522598267e-05, -4.1795894503593445e-05, -3.974884748458862e-05, -3.77018004655838e-05, -3.565475344657898e-05, -3.360770642757416e-05, -3.1560659408569336e-05, -2.9513612389564514e-05, -2.7466565370559692e-05, -2.541951835155487e-05, -2.337247133255005e-05, -2.1325424313545227e-05, -1.9278377294540405e-05, -1.7231330275535583e-05, -1.5184283256530762e-05, -1.313723623752594e-05, -1.1090189218521118e-05, -9.043142199516296e-06, -6.996095180511475e-06, -4.949048161506653e-06, -2.902001142501831e-06, -8.549541234970093e-07, 1.1920928955078125e-06, 3.2391399145126343e-06, 5.286186933517456e-06, 7.333233952522278e-06, 9.3802809715271e-06, 1.1427327990531921e-05, 1.3474375009536743e-05, 1.5521422028541565e-05, 1.7568469047546387e-05, 1.961551606655121e-05, 2.166256308555603e-05, 2.3709610104560852e-05, 2.5756657123565674e-05, 2.7803704142570496e-05, 2.9850751161575317e-05, 3.189779818058014e-05, 3.394484519958496e-05, 3.599189221858978e-05, 3.8038939237594604e-05, 4.0085986256599426e-05, 4.213303327560425e-05, 4.418008029460907e-05, 4.622712731361389e-05, 4.827417433261871e-05, 5.0321221351623535e-05, 5.236826837062836e-05, 5.441531538963318e-05, 5.6462362408638e-05, 5.850940942764282e-05, 6.0556456446647644e-05, 6.260350346565247e-05, 6.465055048465729e-05, 6.669759750366211e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 10.0, 10.0, 9.0, 9.0, 13.0, 22.0, 47.0, 46.0, 85.0, 114.0, 144.0, 189.0, 354.0, 492.0, 816.0, 1318.0, 2224.0, 4190.0, 8593.0, 22663.0, 88008.0, 712139.0, 152816.0, 31185.0, 11185.0, 5016.0, 2690.0, 1530.0, 898.0, 564.0, 370.0, 250.0, 166.0, 119.0, 84.0, 55.0, 31.0, 29.0, 20.0, 15.0, 16.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020015239715576172, -0.00019362010061740875, -0.00018708780407905579, -0.00018055550754070282, -0.00017402321100234985, -0.0001674909144639969, -0.00016095861792564392, -0.00015442632138729095, -0.000147894024848938, -0.00014136172831058502, -0.00013482943177223206, -0.0001282971352338791, -0.00012176483869552612, -0.00011523254215717316, -0.00010870024561882019, -0.00010216794908046722, -9.563565254211426e-05, -8.910335600376129e-05, -8.257105946540833e-05, -7.603876292705536e-05, -6.950646638870239e-05, -6.297416985034943e-05, -5.644187331199646e-05, -4.9909576773643494e-05, -4.337728023529053e-05, -3.684498369693756e-05, -3.0312687158584595e-05, -2.378039062023163e-05, -1.7248094081878662e-05, -1.0715797543525696e-05, -4.1835010051727295e-06, 2.348795533180237e-06, 8.881092071533203e-06, 1.541338860988617e-05, 2.1945685148239136e-05, 2.8477981686592102e-05, 3.501027822494507e-05, 4.1542574763298035e-05, 4.8074871301651e-05, 5.460716784000397e-05, 6.113946437835693e-05, 6.76717609167099e-05, 7.420405745506287e-05, 8.073635399341583e-05, 8.72686505317688e-05, 9.380094707012177e-05, 0.00010033324360847473, 0.0001068655401468277, 0.00011339783668518066, 0.00011993013322353363, 0.0001264624297618866, 0.00013299472630023956, 0.00013952702283859253, 0.0001460593193769455, 0.00015259161591529846, 0.00015912391245365143, 0.0001656562089920044, 0.00017218850553035736, 0.00017872080206871033, 0.0001852530986070633, 0.00019178539514541626, 0.00019831769168376923, 0.0002048499882221222, 0.00021138228476047516, 0.00021791458129882812]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 5.0, 2.0, 10.0, 12.0, 15.0, 22.0, 21.0, 16.0, 25.0, 35.0, 22.0, 52.0, 30.0, 32.0, 37.0, 35.0, 35.0, 32.0, 39.0, 39.0, 25.0, 35.0, 33.0, 40.0, 49.0, 41.0, 32.0, 37.0, 39.0, 24.0, 24.0, 14.0, 11.0, 16.0, 19.0, 8.0, 11.0, 6.0, 2.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.38690185546875e-05, -4.2370520532131195e-05, -4.087202250957489e-05, -3.9373524487018585e-05, -3.787502646446228e-05, -3.6376528441905975e-05, -3.487803041934967e-05, -3.3379532396793365e-05, -3.188103437423706e-05, -3.0382536351680756e-05, -2.888403832912445e-05, -2.7385540306568146e-05, -2.588704228401184e-05, -2.4388544261455536e-05, -2.289004623889923e-05, -2.1391548216342926e-05, -1.989305019378662e-05, -1.8394552171230316e-05, -1.689605414867401e-05, -1.5397556126117706e-05, -1.3899058103561401e-05, -1.2400560081005096e-05, -1.0902062058448792e-05, -9.403564035892487e-06, -7.905066013336182e-06, -6.406567990779877e-06, -4.908069968223572e-06, -3.409571945667267e-06, -1.911073923110962e-06, -4.12575900554657e-07, 1.085922122001648e-06, 2.584420144557953e-06, 4.082918167114258e-06, 5.581416189670563e-06, 7.079914212226868e-06, 8.578412234783173e-06, 1.0076910257339478e-05, 1.1575408279895782e-05, 1.3073906302452087e-05, 1.4572404325008392e-05, 1.6070902347564697e-05, 1.7569400370121002e-05, 1.9067898392677307e-05, 2.0566396415233612e-05, 2.2064894437789917e-05, 2.3563392460346222e-05, 2.5061890482902527e-05, 2.6560388505458832e-05, 2.8058886528015137e-05, 2.955738455057144e-05, 3.1055882573127747e-05, 3.255438059568405e-05, 3.4052878618240356e-05, 3.555137664079666e-05, 3.7049874663352966e-05, 3.854837268590927e-05, 4.0046870708465576e-05, 4.154536873102188e-05, 4.3043866753578186e-05, 4.454236477613449e-05, 4.6040862798690796e-05, 4.75393608212471e-05, 4.9037858843803406e-05, 5.053635686635971e-05, 5.2034854888916016e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 11.0, 13.0, 18.0, 13.0, 32.0, 36.0, 50.0, 79.0, 138.0, 164.0, 233.0, 418.0, 671.0, 1096.0, 1731.0, 3202.0, 6852.0, 15971.0, 109237.0, 857940.0, 30431.0, 9752.0, 4540.0, 2264.0, 1357.0, 813.0, 512.0, 294.0, 222.0, 154.0, 97.0, 68.0, 47.0, 22.0, 22.0, 12.0, 13.0, 5.0, 6.0, 5.0, 7.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.552436828613281e-05, -3.434903919696808e-05, -3.3173710107803345e-05, -3.199838101863861e-05, -3.082305192947388e-05, -2.9647722840309143e-05, -2.847239375114441e-05, -2.7297064661979675e-05, -2.612173557281494e-05, -2.4946406483650208e-05, -2.3771077394485474e-05, -2.259574830532074e-05, -2.1420419216156006e-05, -2.0245090126991272e-05, -1.9069761037826538e-05, -1.7894431948661804e-05, -1.671910285949707e-05, -1.5543773770332336e-05, -1.4368444681167603e-05, -1.3193115592002869e-05, -1.2017786502838135e-05, -1.0842457413673401e-05, -9.667128324508667e-06, -8.491799235343933e-06, -7.316470146179199e-06, -6.141141057014465e-06, -4.9658119678497314e-06, -3.7904828786849976e-06, -2.6151537895202637e-06, -1.4398247003555298e-06, -2.644956111907959e-07, 9.10833477973938e-07, 2.086162567138672e-06, 3.2614916563034058e-06, 4.43682074546814e-06, 5.6121498346328735e-06, 6.787478923797607e-06, 7.962808012962341e-06, 9.138137102127075e-06, 1.0313466191291809e-05, 1.1488795280456543e-05, 1.2664124369621277e-05, 1.383945345878601e-05, 1.5014782547950745e-05, 1.619011163711548e-05, 1.7365440726280212e-05, 1.8540769815444946e-05, 1.971609890460968e-05, 2.0891427993774414e-05, 2.2066757082939148e-05, 2.3242086172103882e-05, 2.4417415261268616e-05, 2.559274435043335e-05, 2.6768073439598083e-05, 2.7943402528762817e-05, 2.911873161792755e-05, 3.0294060707092285e-05, 3.146938979625702e-05, 3.264471888542175e-05, 3.382004797458649e-05, 3.499537706375122e-05, 3.6170706152915955e-05, 3.734603524208069e-05, 3.852136433124542e-05, 3.9696693420410156e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 8.0, 4.0, 6.0, 5.0, 8.0, 9.0, 14.0, 8.0, 9.0, 26.0, 9.0, 26.0, 29.0, 17.0, 61.0, 19.0, 50.0, 72.0, 39.0, 200.0, 72.0, 31.0, 45.0, 44.0, 14.0, 25.0, 30.0, 2.0, 36.0, 14.0, 2.0, 8.0, 10.0, 6.0, 13.0, 11.0, 5.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4570693969726562e-06, -3.3583492040634155e-06, -3.259629011154175e-06, -3.160908818244934e-06, -3.0621886253356934e-06, -2.9634684324264526e-06, -2.864748239517212e-06, -2.766028046607971e-06, -2.6673078536987305e-06, -2.5685876607894897e-06, -2.469867467880249e-06, -2.3711472749710083e-06, -2.2724270820617676e-06, -2.173706889152527e-06, -2.074986696243286e-06, -1.9762665033340454e-06, -1.8775463104248047e-06, -1.778826117515564e-06, -1.6801059246063232e-06, -1.5813857316970825e-06, -1.4826655387878418e-06, -1.383945345878601e-06, -1.2852251529693604e-06, -1.1865049600601196e-06, -1.087784767150879e-06, -9.890645742416382e-07, -8.903443813323975e-07, -7.916241884231567e-07, -6.92903995513916e-07, -5.941838026046753e-07, -4.954636096954346e-07, -3.9674341678619385e-07, -2.980232238769531e-07, -1.993030309677124e-07, -1.0058283805847168e-07, -1.862645149230957e-09, 9.685754776000977e-08, 1.955777406692505e-07, 2.942979335784912e-07, 3.9301812648773193e-07, 4.917383193969727e-07, 5.904585123062134e-07, 6.891787052154541e-07, 7.878988981246948e-07, 8.866190910339355e-07, 9.853392839431763e-07, 1.084059476852417e-06, 1.1827796697616577e-06, 1.2814998626708984e-06, 1.3802200555801392e-06, 1.4789402484893799e-06, 1.5776604413986206e-06, 1.6763806343078613e-06, 1.775100827217102e-06, 1.8738210201263428e-06, 1.9725412130355835e-06, 2.0712614059448242e-06, 2.169981598854065e-06, 2.2687017917633057e-06, 2.3674219846725464e-06, 2.466142177581787e-06, 2.564862370491028e-06, 2.6635825634002686e-06, 2.7623027563095093e-06, 2.86102294921875e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 6.0, 12.0, 23.0, 14.0, 19.0, 46.0, 78.0, 121.0, 288.0, 684.0, 1882.0, 5725.0, 23458.0, 393534.0, 588644.0, 24745.0, 6109.0, 1829.0, 679.0, 283.0, 131.0, 73.0, 48.0, 27.0, 22.0, 14.0, 10.0, 7.0, 6.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.300210952758789e-05, -6.109382957220078e-05, -5.918554961681366e-05, -5.7277269661426544e-05, -5.536898970603943e-05, -5.346070975065231e-05, -5.15524297952652e-05, -4.964414983987808e-05, -4.773586988449097e-05, -4.582758992910385e-05, -4.3919309973716736e-05, -4.201103001832962e-05, -4.0102750062942505e-05, -3.819447010755539e-05, -3.6286190152168274e-05, -3.437791019678116e-05, -3.246963024139404e-05, -3.056135028600693e-05, -2.8653070330619812e-05, -2.6744790375232697e-05, -2.483651041984558e-05, -2.2928230464458466e-05, -2.101995050907135e-05, -1.9111670553684235e-05, -1.720339059829712e-05, -1.5295110642910004e-05, -1.3386830687522888e-05, -1.1478550732135773e-05, -9.570270776748657e-06, -7.661990821361542e-06, -5.753710865974426e-06, -3.845430910587311e-06, -1.9371509552001953e-06, -2.8870999813079834e-08, 1.8794089555740356e-06, 3.787688910961151e-06, 5.695968866348267e-06, 7.604248821735382e-06, 9.512528777122498e-06, 1.1420808732509613e-05, 1.3329088687896729e-05, 1.5237368643283844e-05, 1.714564859867096e-05, 1.9053928554058075e-05, 2.096220850944519e-05, 2.2870488464832306e-05, 2.477876842021942e-05, 2.6687048375606537e-05, 2.8595328330993652e-05, 3.0503608286380768e-05, 3.241188824176788e-05, 3.4320168197155e-05, 3.6228448152542114e-05, 3.813672810792923e-05, 4.0045008063316345e-05, 4.195328801870346e-05, 4.3861567974090576e-05, 4.576984792947769e-05, 4.767812788486481e-05, 4.958640784025192e-05, 5.149468779563904e-05, 5.3402967751026154e-05, 5.531124770641327e-05, 5.7219527661800385e-05, 5.91278076171875e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 8.0, 2.0, 5.0, 6.0, 5.0, 2.0, 8.0, 5.0, 11.0, 16.0, 14.0, 30.0, 29.0, 29.0, 120.0, 155.0, 220.0, 117.0, 48.0, 36.0, 16.0, 21.0, 12.0, 14.0, 12.0, 12.0, 9.0, 5.0, 7.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.662441253662109e-06, -5.475245416164398e-06, -5.288049578666687e-06, -5.100853741168976e-06, -4.913657903671265e-06, -4.7264620661735535e-06, -4.539266228675842e-06, -4.352070391178131e-06, -4.16487455368042e-06, -3.977678716182709e-06, -3.7904828786849976e-06, -3.6032870411872864e-06, -3.416091203689575e-06, -3.228895366191864e-06, -3.041699528694153e-06, -2.8545036911964417e-06, -2.6673078536987305e-06, -2.4801120162010193e-06, -2.292916178703308e-06, -2.105720341205597e-06, -1.9185245037078857e-06, -1.7313286662101746e-06, -1.5441328287124634e-06, -1.3569369912147522e-06, -1.169741153717041e-06, -9.825453162193298e-07, -7.953494787216187e-07, -6.081536412239075e-07, -4.209578037261963e-07, -2.337619662284851e-07, -4.6566128730773926e-08, 1.4062970876693726e-07, 3.2782554626464844e-07, 5.150213837623596e-07, 7.022172212600708e-07, 8.89413058757782e-07, 1.0766088962554932e-06, 1.2638047337532043e-06, 1.4510005712509155e-06, 1.6381964087486267e-06, 1.8253922462463379e-06, 2.012588083744049e-06, 2.1997839212417603e-06, 2.3869797587394714e-06, 2.5741755962371826e-06, 2.761371433734894e-06, 2.948567271232605e-06, 3.135763108730316e-06, 3.3229589462280273e-06, 3.5101547837257385e-06, 3.6973506212234497e-06, 3.884546458721161e-06, 4.071742296218872e-06, 4.258938133716583e-06, 4.4461339712142944e-06, 4.633329808712006e-06, 4.820525646209717e-06, 5.007721483707428e-06, 5.194917321205139e-06, 5.38211315870285e-06, 5.5693089962005615e-06, 5.756504833698273e-06, 5.943700671195984e-06, 6.130896508693695e-06, 6.318092346191406e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 11.0, 6.0, 6.0, 9.0, 19.0, 13.0, 29.0, 42.0, 52.0, 79.0, 128.0, 155.0, 124.0, 102.0, 56.0, 40.0, 26.0, 24.0, 26.0, 7.0, 13.0, 9.0, 1.0, 4.0, 3.0, 8.0, 2.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014426402049139142, -0.00013996637426316738, -0.00013566872803494334, -0.00013137109635863453, -0.0001270734501304105, -0.00012277580390218645, -0.00011847815767396241, -0.00011418051144573838, -0.00010988287249347195, -0.00010558522626524791, -0.00010128758731298149, -9.698994108475745e-05, -9.269229485653341e-05, -8.839465590426698e-05, -8.409700967604294e-05, -7.979937072377652e-05, -7.550172449555248e-05, -7.120407826732844e-05, -6.690643931506202e-05, -6.260879308683798e-05, -5.8311150496592745e-05, -5.401350790634751e-05, -4.9715861678123474e-05, -4.541821908787824e-05, -4.112057649763301e-05, -3.682293390738778e-05, -3.2525291317142546e-05, -2.8227645088918507e-05, -2.3930002498673275e-05, -1.9632359908428043e-05, -1.5334715499193408e-05, -1.1037071089958772e-05, -6.7394430516287684e-06, -2.4417995518888347e-06, 1.855843947851099e-06, 6.153487447591033e-06, 1.0451130947330967e-05, 1.4748773537576199e-05, 1.9046417946810834e-05, 2.334406235604547e-05, 2.76417049462907e-05, 3.1939347536535934e-05, 3.6236990126781166e-05, 4.0534636355005205e-05, 4.483227894525044e-05, 4.912992153549567e-05, 5.342756776371971e-05, 5.772521035396494e-05, 6.202285294421017e-05, 6.632049917243421e-05, 7.061813812470064e-05, 7.491578435292467e-05, 7.92134233051911e-05, 8.351106953341514e-05, 8.780871576163918e-05, 9.210636198986322e-05, 9.640400094212964e-05, 0.00010070164717035368, 0.0001049992861226201, 0.00010929693235084414, 0.00011359457857906818, 0.00011789221753133461, 0.00012218985648360103, 0.00012648750271182507, 0.0001307851489400491]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 6.0, 9.0, 9.0, 10.0, 9.0, 9.0, 14.0, 20.0, 19.0, 19.0, 21.0, 21.0, 37.0, 31.0, 28.0, 30.0, 34.0, 32.0, 31.0, 36.0, 28.0, 40.0, 40.0, 30.0, 33.0, 27.0, 21.0, 27.0, 38.0, 27.0, 31.0, 21.0, 28.0, 24.0, 22.0, 20.0, 13.0, 16.0, 20.0, 14.0, 6.0, 12.0, 5.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0], "bins": [-6.0833768657175824e-05, -5.893787238164805e-05, -5.7041972468141466e-05, -5.514607619261369e-05, -5.3250179917085916e-05, -5.135428364155814e-05, -4.945838372805156e-05, -4.756248745252378e-05, -4.56665875390172e-05, -4.3770691263489425e-05, -4.187479134998284e-05, -3.997889507445507e-05, -3.808299879892729e-05, -3.618709888542071e-05, -3.4291202609892935e-05, -3.239530633436516e-05, -3.0499410058837384e-05, -2.8603511964320205e-05, -2.670761568879243e-05, -2.481171759427525e-05, -2.2915821318747476e-05, -2.1019923224230297e-05, -1.9124025129713118e-05, -1.7228128854185343e-05, -1.5332230759668164e-05, -1.3436333574645687e-05, -1.154043638962321e-05, -9.644538295106031e-06, -7.748641110083554e-06, -5.852743925061077e-06, -3.956845830543898e-06, -2.060948645521421e-06, -1.6504782252013683e-07, 1.7308495898760157e-06, 3.626747002272168e-06, 5.522644642041996e-06, 7.418541827064473e-06, 9.31443901208695e-06, 1.1210337106604129e-05, 1.3106234291626606e-05, 1.5002131476649083e-05, 1.6898029571166262e-05, 1.8793925846694037e-05, 2.0689823941211216e-05, 2.2585722035728395e-05, 2.448161831125617e-05, 2.637751640577335e-05, 2.8273414500290528e-05, 3.0169310775818303e-05, 3.206520705134608e-05, 3.396110696485266e-05, 3.5857003240380436e-05, 3.775289951590821e-05, 3.964879579143599e-05, 4.154469570494257e-05, 4.3440591980470344e-05, 4.533649189397693e-05, 4.72323881695047e-05, 4.9128288083011284e-05, 5.102418435853906e-05, 5.2920080634066835e-05, 5.481598054757342e-05, 5.671187682310119e-05, 5.860777309862897e-05, 6.050366937415674e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 13.0, 18.0, 10.0, 17.0, 33.0, 56.0, 76.0, 127.0, 206.0, 353.0, 609.0, 1114.0, 2052.0, 3923.0, 7904.0, 17208.0, 40106.0, 103986.0, 332216.0, 353668.0, 108220.0, 41569.0, 17838.0, 8380.0, 4013.0, 2070.0, 1185.0, 628.0, 343.0, 206.0, 138.0, 93.0, 60.0, 37.0, 21.0, 13.0, 10.0, 9.0, 9.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002880096435546875, -0.00027694180607795715, -0.0002658739686012268, -0.00025480613112449646, -0.0002437382936477661, -0.00023267045617103577, -0.00022160261869430542, -0.00021053478121757507, -0.00019946694374084473, -0.00018839910626411438, -0.00017733126878738403, -0.0001662634313106537, -0.00015519559383392334, -0.000144127756357193, -0.00013305991888046265, -0.0001219920814037323, -0.00011092424392700195, -9.98564064502716e-05, -8.878856897354126e-05, -7.772073149681091e-05, -6.665289402008057e-05, -5.558505654335022e-05, -4.451721906661987e-05, -3.3449381589889526e-05, -2.238154411315918e-05, -1.1313706636428833e-05, -2.4586915969848633e-07, 1.082196831703186e-05, 2.1889805793762207e-05, 3.2957643270492554e-05, 4.40254807472229e-05, 5.509331822395325e-05, 6.61611557006836e-05, 7.722899317741394e-05, 8.829683065414429e-05, 9.936466813087463e-05, 0.00011043250560760498, 0.00012150034308433533, 0.00013256818056106567, 0.00014363601803779602, 0.00015470385551452637, 0.00016577169299125671, 0.00017683953046798706, 0.0001879073679447174, 0.00019897520542144775, 0.0002100430428981781, 0.00022111088037490845, 0.0002321787178516388, 0.00024324655532836914, 0.0002543143928050995, 0.00026538223028182983, 0.0002764500677585602, 0.00028751790523529053, 0.0002985857427120209, 0.0003096535801887512, 0.00032072141766548157, 0.0003317892551422119, 0.00034285709261894226, 0.0003539249300956726, 0.00036499276757240295, 0.0003760606050491333, 0.00038712844252586365, 0.000398196280002594, 0.00040926411747932434, 0.0004203319549560547]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 14.0, 14.0, 23.0, 17.0, 47.0, 45.0, 34.0, 42.0, 49.0, 48.0, 41.0, 54.0, 49.0, 63.0, 42.0, 36.0, 37.0, 50.0, 45.0, 45.0, 31.0, 28.0, 17.0, 20.0, 20.0, 14.0, 17.0, 7.0, 6.0, 5.0, 2.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.458427429199219e-05, -4.2865052819252014e-05, -4.114583134651184e-05, -3.942660987377167e-05, -3.7707388401031494e-05, -3.598816692829132e-05, -3.426894545555115e-05, -3.2549723982810974e-05, -3.08305025100708e-05, -2.9111281037330627e-05, -2.7392059564590454e-05, -2.567283809185028e-05, -2.3953616619110107e-05, -2.2234395146369934e-05, -2.051517367362976e-05, -1.8795952200889587e-05, -1.7076730728149414e-05, -1.535750925540924e-05, -1.3638287782669067e-05, -1.1919066309928894e-05, -1.019984483718872e-05, -8.480623364448547e-06, -6.761401891708374e-06, -5.042180418968201e-06, -3.3229589462280273e-06, -1.603737473487854e-06, 1.1548399925231934e-07, 1.8347054719924927e-06, 3.553926944732666e-06, 5.273148417472839e-06, 6.992369890213013e-06, 8.711591362953186e-06, 1.043081283569336e-05, 1.2150034308433533e-05, 1.3869255781173706e-05, 1.558847725391388e-05, 1.7307698726654053e-05, 1.9026920199394226e-05, 2.07461416721344e-05, 2.2465363144874573e-05, 2.4184584617614746e-05, 2.590380609035492e-05, 2.7623027563095093e-05, 2.9342249035835266e-05, 3.106147050857544e-05, 3.278069198131561e-05, 3.4499913454055786e-05, 3.621913492679596e-05, 3.793835639953613e-05, 3.9657577872276306e-05, 4.137679934501648e-05, 4.309602081775665e-05, 4.4815242290496826e-05, 4.6534463763237e-05, 4.825368523597717e-05, 4.9972906708717346e-05, 5.169212818145752e-05, 5.341134965419769e-05, 5.5130571126937866e-05, 5.684979259967804e-05, 5.856901407241821e-05, 6.0288235545158386e-05, 6.200745701789856e-05, 6.372667849063873e-05, 6.54458999633789e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 10.0, 17.0, 22.0, 33.0, 57.0, 63.0, 95.0, 120.0, 203.0, 291.0, 419.0, 618.0, 846.0, 1354.0, 2038.0, 2972.0, 4798.0, 7137.0, 10985.0, 17337.0, 26995.0, 44231.0, 74370.0, 144448.0, 322854.0, 171807.0, 84480.0, 47505.0, 29900.0, 18271.0, 11717.0, 7796.0, 4964.0, 3284.0, 2136.0, 1322.0, 1019.0, 659.0, 432.0, 305.0, 219.0, 127.0, 96.0, 59.0, 42.0, 30.0, 22.0, 12.0, 11.0, 8.0, 8.0, 3.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.00011152029037475586, -0.00010809861123561859, -0.00010467693209648132, -0.00010125525295734406, -9.783357381820679e-05, -9.441189467906952e-05, -9.099021553993225e-05, -8.756853640079498e-05, -8.414685726165771e-05, -8.072517812252045e-05, -7.730349898338318e-05, -7.388181984424591e-05, -7.046014070510864e-05, -6.703846156597137e-05, -6.36167824268341e-05, -6.019510328769684e-05, -5.677342414855957e-05, -5.33517450094223e-05, -4.9930065870285034e-05, -4.6508386731147766e-05, -4.30867075920105e-05, -3.966502845287323e-05, -3.624334931373596e-05, -3.2821670174598694e-05, -2.9399991035461426e-05, -2.5978311896324158e-05, -2.255663275718689e-05, -1.913495361804962e-05, -1.5713274478912354e-05, -1.2291595339775085e-05, -8.869916200637817e-06, -5.448237061500549e-06, -2.0265579223632812e-06, 1.3951212167739868e-06, 4.816800355911255e-06, 8.238479495048523e-06, 1.1660158634185791e-05, 1.5081837773323059e-05, 1.8503516912460327e-05, 2.1925196051597595e-05, 2.5346875190734863e-05, 2.876855432987213e-05, 3.21902334690094e-05, 3.561191260814667e-05, 3.9033591747283936e-05, 4.2455270886421204e-05, 4.587695002555847e-05, 4.929862916469574e-05, 5.272030830383301e-05, 5.6141987442970276e-05, 5.9563666582107544e-05, 6.298534572124481e-05, 6.640702486038208e-05, 6.982870399951935e-05, 7.325038313865662e-05, 7.667206227779388e-05, 8.009374141693115e-05, 8.351542055606842e-05, 8.693709969520569e-05, 9.035877883434296e-05, 9.378045797348022e-05, 9.720213711261749e-05, 0.00010062381625175476, 0.00010404549539089203, 0.0001074671745300293]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 7.0, 4.0, 8.0, 16.0, 6.0, 25.0, 18.0, 21.0, 16.0, 24.0, 26.0, 34.0, 34.0, 22.0, 37.0, 32.0, 38.0, 50.0, 44.0, 34.0, 52.0, 40.0, 45.0, 43.0, 35.0, 37.0, 31.0, 28.0, 22.0, 27.0, 24.0, 20.0, 20.0, 11.0, 14.0, 13.0, 13.0, 3.0, 8.0, 5.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.325939178466797e-05, -3.21120023727417e-05, -3.096461296081543e-05, -2.981722354888916e-05, -2.866983413696289e-05, -2.752244472503662e-05, -2.637505531311035e-05, -2.5227665901184082e-05, -2.4080276489257812e-05, -2.2932887077331543e-05, -2.1785497665405273e-05, -2.0638108253479004e-05, -1.9490718841552734e-05, -1.8343329429626465e-05, -1.7195940017700195e-05, -1.6048550605773926e-05, -1.4901161193847656e-05, -1.3753771781921387e-05, -1.2606382369995117e-05, -1.1458992958068848e-05, -1.0311603546142578e-05, -9.164214134216309e-06, -8.016824722290039e-06, -6.8694353103637695e-06, -5.7220458984375e-06, -4.5746564865112305e-06, -3.427267074584961e-06, -2.2798776626586914e-06, -1.1324882507324219e-06, 1.4901161193847656e-08, 1.1622905731201172e-06, 2.3096799850463867e-06, 3.4570693969726562e-06, 4.604458808898926e-06, 5.751848220825195e-06, 6.899237632751465e-06, 8.046627044677734e-06, 9.194016456604004e-06, 1.0341405868530273e-05, 1.1488795280456543e-05, 1.2636184692382812e-05, 1.3783574104309082e-05, 1.4930963516235352e-05, 1.607835292816162e-05, 1.722574234008789e-05, 1.837313175201416e-05, 1.952052116394043e-05, 2.06679105758667e-05, 2.181529998779297e-05, 2.2962689399719238e-05, 2.4110078811645508e-05, 2.5257468223571777e-05, 2.6404857635498047e-05, 2.7552247047424316e-05, 2.8699636459350586e-05, 2.9847025871276855e-05, 3.0994415283203125e-05, 3.2141804695129395e-05, 3.3289194107055664e-05, 3.4436583518981934e-05, 3.55839729309082e-05, 3.673136234283447e-05, 3.787875175476074e-05, 3.902614116668701e-05, 4.017353057861328e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 8.0, 11.0, 10.0, 7.0, 10.0, 25.0, 18.0, 39.0, 38.0, 48.0, 106.0, 87.0, 133.0, 368.0, 432.0, 1274.0, 1743.0, 3607.0, 15044.0, 36132.0, 735752.0, 194227.0, 36106.0, 15409.0, 3434.0, 2316.0, 698.0, 487.0, 388.0, 157.0, 151.0, 70.0, 55.0, 41.0, 33.0, 26.0, 23.0, 8.0, 8.0, 6.0, 4.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.410743713378906e-06, -4.268251359462738e-06, -4.12575900554657e-06, -3.983266651630402e-06, -3.840774297714233e-06, -3.698281943798065e-06, -3.555789589881897e-06, -3.4132972359657288e-06, -3.2708048820495605e-06, -3.1283125281333923e-06, -2.985820174217224e-06, -2.843327820301056e-06, -2.7008354663848877e-06, -2.5583431124687195e-06, -2.4158507585525513e-06, -2.273358404636383e-06, -2.130866050720215e-06, -1.9883736968040466e-06, -1.8458813428878784e-06, -1.7033889889717102e-06, -1.560896635055542e-06, -1.4184042811393738e-06, -1.2759119272232056e-06, -1.1334195733070374e-06, -9.909272193908691e-07, -8.484348654747009e-07, -7.059425115585327e-07, -5.634501576423645e-07, -4.209578037261963e-07, -2.784654498100281e-07, -1.3597309589385986e-07, 6.51925802230835e-09, 1.4901161193847656e-07, 2.915039658546448e-07, 4.33996319770813e-07, 5.764886736869812e-07, 7.189810276031494e-07, 8.614733815193176e-07, 1.0039657354354858e-06, 1.146458089351654e-06, 1.2889504432678223e-06, 1.4314427971839905e-06, 1.5739351511001587e-06, 1.716427505016327e-06, 1.8589198589324951e-06, 2.0014122128486633e-06, 2.1439045667648315e-06, 2.2863969206809998e-06, 2.428889274597168e-06, 2.571381628513336e-06, 2.7138739824295044e-06, 2.8563663363456726e-06, 2.998858690261841e-06, 3.141351044178009e-06, 3.2838433980941772e-06, 3.4263357520103455e-06, 3.5688281059265137e-06, 3.711320459842682e-06, 3.85381281375885e-06, 3.996305167675018e-06, 4.1387975215911865e-06, 4.281289875507355e-06, 4.423782229423523e-06, 4.566274583339691e-06, 4.708766937255859e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 0.0, 5.0, 0.0, 31.0, 0.0, 55.0, 0.0, 134.0, 0.0, 550.0, 0.0, 131.0, 0.0, 55.0, 0.0, 29.0, 0.0, 12.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07, 9.238719940185547e-07, 9.5367431640625e-07, 9.834766387939453e-07, 1.0132789611816406e-06, 1.043081283569336e-06, 1.0728836059570312e-06, 1.1026859283447266e-06, 1.1324882507324219e-06, 1.1622905731201172e-06, 1.1920928955078125e-06, 1.2218952178955078e-06, 1.2516975402832031e-06, 1.2814998626708984e-06, 1.3113021850585938e-06, 1.341104507446289e-06, 1.3709068298339844e-06, 1.4007091522216797e-06, 1.430511474609375e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 6.0, 12.0, 9.0, 25.0, 21.0, 27.0, 41.0, 67.0, 90.0, 126.0, 218.0, 792.0, 1334.0, 3238.0, 9441.0, 35358.0, 746388.0, 200570.0, 35153.0, 9510.0, 4093.0, 904.0, 449.0, 220.0, 171.0, 70.0, 40.0, 36.0, 39.0, 24.0, 11.0, 13.0, 9.0, 9.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.649162292480469e-06, -4.515983164310455e-06, -4.382804036140442e-06, -4.2496249079704285e-06, -4.116445779800415e-06, -3.983266651630402e-06, -3.850087523460388e-06, -3.7169083952903748e-06, -3.5837292671203613e-06, -3.450550138950348e-06, -3.3173710107803345e-06, -3.184191882610321e-06, -3.0510127544403076e-06, -2.917833626270294e-06, -2.7846544981002808e-06, -2.6514753699302673e-06, -2.518296241760254e-06, -2.3851171135902405e-06, -2.251937985420227e-06, -2.1187588572502136e-06, -1.9855797290802e-06, -1.8524006009101868e-06, -1.7192214727401733e-06, -1.58604234457016e-06, -1.4528632164001465e-06, -1.319684088230133e-06, -1.1865049600601196e-06, -1.0533258318901062e-06, -9.201467037200928e-07, -7.869675755500793e-07, -6.537884473800659e-07, -5.206093192100525e-07, -3.8743019104003906e-07, -2.5425106287002563e-07, -1.210719347000122e-07, 1.210719347000122e-08, 1.4528632164001465e-07, 2.784654498100281e-07, 4.116445779800415e-07, 5.448237061500549e-07, 6.780028343200684e-07, 8.111819624900818e-07, 9.443610906600952e-07, 1.0775402188301086e-06, 1.210719347000122e-06, 1.3438984751701355e-06, 1.477077603340149e-06, 1.6102567315101624e-06, 1.7434358596801758e-06, 1.8766149878501892e-06, 2.0097941160202026e-06, 2.142973244190216e-06, 2.2761523723602295e-06, 2.409331500530243e-06, 2.5425106287002563e-06, 2.6756897568702698e-06, 2.808868885040283e-06, 2.9420480132102966e-06, 3.07522714138031e-06, 3.2084062695503235e-06, 3.341585397720337e-06, 3.4747645258903503e-06, 3.6079436540603638e-06, 3.741122782230377e-06, 3.874301910400391e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 11.0, 0.0, 20.0, 0.0, 40.0, 106.0, 0.0, 197.0, 0.0, 295.0, 0.0, 165.0, 0.0, 92.0, 45.0, 0.0, 26.0, 0.0, 9.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4565885066986084e-06, -1.4230608940124512e-06, -1.389533281326294e-06, -1.3560056686401367e-06, -1.3224780559539795e-06, -1.2889504432678223e-06, -1.255422830581665e-06, -1.2218952178955078e-06, -1.1883676052093506e-06, -1.1548399925231934e-06, -1.1213123798370361e-06, -1.087784767150879e-06, -1.0542571544647217e-06, -1.0207295417785645e-06, -9.872019290924072e-07, -9.5367431640625e-07, -9.201467037200928e-07, -8.866190910339355e-07, -8.530914783477783e-07, -8.195638656616211e-07, -7.860362529754639e-07, -7.525086402893066e-07, -7.189810276031494e-07, -6.854534149169922e-07, -6.51925802230835e-07, -6.183981895446777e-07, -5.848705768585205e-07, -5.513429641723633e-07, -5.178153514862061e-07, -4.842877388000488e-07, -4.507601261138916e-07, -4.172325134277344e-07, -3.8370490074157715e-07, -3.501772880554199e-07, -3.166496753692627e-07, -2.8312206268310547e-07, -2.4959444999694824e-07, -2.1606683731079102e-07, -1.825392246246338e-07, -1.4901161193847656e-07, -1.1548399925231934e-07, -8.195638656616211e-08, -4.842877388000488e-08, -1.4901161193847656e-08, 1.862645149230957e-08, 5.21540641784668e-08, 8.568167686462402e-08, 1.1920928955078125e-07, 1.5273690223693848e-07, 1.862645149230957e-07, 2.1979212760925293e-07, 2.5331974029541016e-07, 2.868473529815674e-07, 3.203749656677246e-07, 3.5390257835388184e-07, 3.8743019104003906e-07, 4.209578037261963e-07, 4.544854164123535e-07, 4.880130290985107e-07, 5.21540641784668e-07, 5.550682544708252e-07, 5.885958671569824e-07, 6.221234798431396e-07, 6.556510925292969e-07]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 8.0, 5.0, 15.0, 15.0, 19.0, 39.0, 48.0, 62.0, 75.0, 123.0, 195.0, 108.0, 68.0, 51.0, 38.0, 28.0, 24.0, 15.0, 19.0, 5.0, 6.0, 10.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.883457096293569e-05, -9.6247109468095e-05, -9.365964069729671e-05, -9.107217192649841e-05, -8.848471043165773e-05, -8.589724893681705e-05, -8.330978016601875e-05, -8.072231139522046e-05, -7.813484990037978e-05, -7.55473884055391e-05, -7.29599196347408e-05, -7.03724508639425e-05, -6.778498936910182e-05, -6.519752787426114e-05, -6.261005910346285e-05, -6.0022593970643356e-05, -5.743512883782387e-05, -5.484766370500438e-05, -5.226019857218489e-05, -4.96727334393654e-05, -4.708526830654591e-05, -4.4497803173726425e-05, -4.1910338040906936e-05, -3.932287290808745e-05, -3.673540777526796e-05, -3.414794264244847e-05, -3.156047750962898e-05, -2.8973012376809493e-05, -2.6385547243990004e-05, -2.3798082111170515e-05, -2.1210616978351027e-05, -1.8623151845531538e-05, -1.6035679436754435e-05, -1.3448214303934947e-05, -1.0860749171115458e-05, -8.27328403829597e-06, -5.685818905476481e-06, -3.098353772656992e-06, -5.108886398375034e-07, 2.076576492981985e-06, 4.664041625801474e-06, 7.2515067586209625e-06, 9.838971891440451e-06, 1.242643702425994e-05, 1.5013902157079428e-05, 1.7601367289898917e-05, 2.0188832422718406e-05, 2.2776297555537894e-05, 2.5363762688357383e-05, 2.795122782117687e-05, 3.053869295399636e-05, 3.312615808681585e-05, 3.571362321963534e-05, 3.8301088352454826e-05, 4.0888553485274315e-05, 4.3476018618093804e-05, 4.606348375091329e-05, 4.865094888373278e-05, 5.123841401655227e-05, 5.382587914937176e-05, 5.641334428219125e-05, 5.9000809415010735e-05, 6.158827454783022e-05, 6.41757360426709e-05, 6.67632048134692e-05]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 8.0, 3.0, 7.0, 8.0, 12.0, 21.0, 12.0, 17.0, 24.0, 28.0, 23.0, 29.0, 22.0, 26.0, 45.0, 41.0, 39.0, 41.0, 39.0, 40.0, 35.0, 46.0, 39.0, 47.0, 40.0, 43.0, 37.0, 34.0, 25.0, 30.0, 18.0, 29.0, 18.0, 16.0, 8.0, 9.0, 14.0, 8.0, 5.0, 4.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.094462201464921e-05, -3.948577796109021e-05, -3.80269339075312e-05, -3.6568089853972197e-05, -3.5109242162434384e-05, -3.365039810887538e-05, -3.2191554055316374e-05, -3.073271000175737e-05, -2.9273865948198363e-05, -2.7815021894639358e-05, -2.635617602209095e-05, -2.4897331968531944e-05, -2.343848791497294e-05, -2.197964204242453e-05, -2.0520797988865525e-05, -1.906195393530652e-05, -1.760310806275811e-05, -1.6144264009199105e-05, -1.4685419046145398e-05, -1.3226574083091691e-05, -1.1767730029532686e-05, -1.0308885066478979e-05, -8.850040103425272e-06, -7.3911960498662665e-06, -5.9323510868125595e-06, -4.473506578506203e-06, -3.0146618428261718e-06, -1.5558171071461402e-06, -9.697259883978404e-08, 1.3618719094665721e-06, 2.820716872520279e-06, 4.279560926079284e-06, 5.7384058891329914e-06, 7.197250397439348e-06, 8.656094905745704e-06, 1.011493986879941e-05, 1.1573783922358416e-05, 1.3032628885412123e-05, 1.449147384846583e-05, 1.5950317902024835e-05, 1.740916195558384e-05, 1.8868006009142846e-05, 2.0326851881691255e-05, 2.178569593525026e-05, 2.3244539988809265e-05, 2.4703385861357674e-05, 2.616222991491668e-05, 2.7621073968475685e-05, 2.9079919841024093e-05, 3.05387657135725e-05, 3.199760976713151e-05, 3.345645382069051e-05, 3.491529787424952e-05, 3.637414192780852e-05, 3.783298598136753e-05, 3.9291830034926534e-05, 4.0750677726464346e-05, 4.220952178002335e-05, 4.3668365833582357e-05, 4.512721352512017e-05, 4.6586057578679174e-05, 4.804490163223818e-05, 4.9503745685797185e-05, 5.096258973935619e-05, 5.2421433792915195e-05]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 10.0, 5.0, 16.0, 16.0, 34.0, 46.0, 77.0, 104.0, 176.0, 272.0, 399.0, 611.0, 951.0, 1500.0, 2397.0, 3888.0, 6413.0, 11039.0, 18645.0, 32706.0, 62971.0, 124893.0, 292693.0, 3027272.0, 332064.0, 129861.0, 63878.0, 33361.0, 19062.0, 11202.0, 6626.0, 3988.0, 2476.0, 1574.0, 991.0, 670.0, 451.0, 295.0, 197.0, 138.0, 102.0, 57.0, 53.0, 25.0, 26.0, 21.0, 12.0, 9.0, 6.0, 6.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.888938903808594e-05, -5.67510724067688e-05, -5.461275577545166e-05, -5.247443914413452e-05, -5.033612251281738e-05, -4.8197805881500244e-05, -4.6059489250183105e-05, -4.392117261886597e-05, -4.178285598754883e-05, -3.964453935623169e-05, -3.750622272491455e-05, -3.536790609359741e-05, -3.3229589462280273e-05, -3.1091272830963135e-05, -2.8952956199645996e-05, -2.6814639568328857e-05, -2.467632293701172e-05, -2.253800630569458e-05, -2.039968967437744e-05, -1.8261373043060303e-05, -1.6123056411743164e-05, -1.3984739780426025e-05, -1.1846423149108887e-05, -9.708106517791748e-06, -7.569789886474609e-06, -5.431473255157471e-06, -3.293156623840332e-06, -1.1548399925231934e-06, 9.834766387939453e-07, 3.121793270111084e-06, 5.260109901428223e-06, 7.398426532745361e-06, 9.5367431640625e-06, 1.1675059795379639e-05, 1.3813376426696777e-05, 1.5951693058013916e-05, 1.8090009689331055e-05, 2.0228326320648193e-05, 2.2366642951965332e-05, 2.450495958328247e-05, 2.664327621459961e-05, 2.8781592845916748e-05, 3.091990947723389e-05, 3.3058226108551025e-05, 3.5196542739868164e-05, 3.73348593711853e-05, 3.947317600250244e-05, 4.161149263381958e-05, 4.374980926513672e-05, 4.588812589645386e-05, 4.8026442527770996e-05, 5.0164759159088135e-05, 5.2303075790405273e-05, 5.444139242172241e-05, 5.657970905303955e-05, 5.871802568435669e-05, 6.085634231567383e-05, 6.299465894699097e-05, 6.51329755783081e-05, 6.727129220962524e-05, 6.940960884094238e-05, 7.154792547225952e-05, 7.368624210357666e-05, 7.58245587348938e-05, 7.796287536621094e-05]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 3.0, 5.0, 5.0, 9.0, 11.0, 13.0, 17.0, 15.0, 30.0, 27.0, 29.0, 30.0, 28.0, 50.0, 43.0, 36.0, 32.0, 39.0, 40.0, 47.0, 61.0, 47.0, 38.0, 48.0, 29.0, 41.0, 38.0, 28.0, 22.0, 26.0, 24.0, 28.0, 9.0, 10.0, 11.0, 7.0, 5.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125999450683594e-06, -4.9388036131858826e-06, -4.751607775688171e-06, -4.56441193819046e-06, -4.377216100692749e-06, -4.190020263195038e-06, -4.002824425697327e-06, -3.8156285881996155e-06, -3.6284327507019043e-06, -3.441236913204193e-06, -3.254041075706482e-06, -3.0668452382087708e-06, -2.8796494007110596e-06, -2.6924535632133484e-06, -2.505257725715637e-06, -2.318061888217926e-06, -2.130866050720215e-06, -1.9436702132225037e-06, -1.7564743757247925e-06, -1.5692785382270813e-06, -1.3820827007293701e-06, -1.194886863231659e-06, -1.0076910257339478e-06, -8.204951882362366e-07, -6.332993507385254e-07, -4.461035132408142e-07, -2.5890767574310303e-07, -7.171183824539185e-08, 1.1548399925231934e-07, 3.026798367500305e-07, 4.898756742477417e-07, 6.770715117454529e-07, 8.642673492431641e-07, 1.0514631867408752e-06, 1.2386590242385864e-06, 1.4258548617362976e-06, 1.6130506992340088e-06, 1.80024653673172e-06, 1.987442374229431e-06, 2.1746382117271423e-06, 2.3618340492248535e-06, 2.5490298867225647e-06, 2.736225724220276e-06, 2.923421561717987e-06, 3.1106173992156982e-06, 3.2978132367134094e-06, 3.4850090742111206e-06, 3.6722049117088318e-06, 3.859400749206543e-06, 4.046596586704254e-06, 4.233792424201965e-06, 4.4209882616996765e-06, 4.608184099197388e-06, 4.795379936695099e-06, 4.98257577419281e-06, 5.169771611690521e-06, 5.356967449188232e-06, 5.544163286685944e-06, 5.731359124183655e-06, 5.918554961681366e-06, 6.105750799179077e-06, 6.292946636676788e-06, 6.4801424741744995e-06, 6.667338311672211e-06, 6.854534149169922e-06]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 9.0, 6.0, 12.0, 12.0, 27.0, 28.0, 34.0, 53.0, 68.0, 114.0, 194.0, 253.0, 407.0, 724.0, 1273.0, 3144.0, 8944.0, 34737.0, 176669.0, 3351597.0, 516999.0, 72781.0, 16363.0, 5174.0, 2047.0, 1014.0, 573.0, 340.0, 244.0, 135.0, 104.0, 74.0, 42.0, 33.0, 18.0, 13.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.00010311603546142578, -0.00010052137076854706, -9.792670607566833e-05, -9.533204138278961e-05, -9.273737668991089e-05, -9.014271199703217e-05, -8.754804730415344e-05, -8.495338261127472e-05, -8.2358717918396e-05, -7.976405322551727e-05, -7.716938853263855e-05, -7.457472383975983e-05, -7.19800591468811e-05, -6.938539445400238e-05, -6.679072976112366e-05, -6.419606506824493e-05, -6.160140037536621e-05, -5.900673568248749e-05, -5.6412070989608765e-05, -5.381740629673004e-05, -5.122274160385132e-05, -4.8628076910972595e-05, -4.603341221809387e-05, -4.343874752521515e-05, -4.0844082832336426e-05, -3.82494181394577e-05, -3.565475344657898e-05, -3.3060088753700256e-05, -3.0465424060821533e-05, -2.787075936794281e-05, -2.5276094675064087e-05, -2.2681429982185364e-05, -2.008676528930664e-05, -1.7492100596427917e-05, -1.4897435903549194e-05, -1.2302771210670471e-05, -9.708106517791748e-06, -7.113441824913025e-06, -4.518777132034302e-06, -1.9241124391555786e-06, 6.705522537231445e-07, 3.2652169466018677e-06, 5.859881639480591e-06, 8.454546332359314e-06, 1.1049211025238037e-05, 1.364387571811676e-05, 1.6238540410995483e-05, 1.8833205103874207e-05, 2.142786979675293e-05, 2.4022534489631653e-05, 2.6617199182510376e-05, 2.92118638753891e-05, 3.180652856826782e-05, 3.4401193261146545e-05, 3.699585795402527e-05, 3.959052264690399e-05, 4.2185187339782715e-05, 4.477985203266144e-05, 4.737451672554016e-05, 4.9969181418418884e-05, 5.256384611129761e-05, 5.515851080417633e-05, 5.7753175497055054e-05, 6.034784018993378e-05, 6.29425048828125e-05]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 9.0, 10.0, 18.0, 28.0, 40.0, 75.0, 65.0, 108.0, 123.0, 131.0, 212.0, 270.0, 1227.0, 762.0, 291.0, 159.0, 164.0, 83.0, 77.0, 53.0, 48.0, 28.0, 23.0, 12.0, 12.0, 8.0, 8.0, 8.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.271766662597656e-06, -6.888061761856079e-06, -6.504356861114502e-06, -6.120651960372925e-06, -5.736947059631348e-06, -5.3532421588897705e-06, -4.969537258148193e-06, -4.585832357406616e-06, -4.202127456665039e-06, -3.818422555923462e-06, -3.4347176551818848e-06, -3.0510127544403076e-06, -2.6673078536987305e-06, -2.2836029529571533e-06, -1.8998980522155762e-06, -1.516193151473999e-06, -1.1324882507324219e-06, -7.487833499908447e-07, -3.650784492492676e-07, 1.862645149230957e-08, 4.023313522338867e-07, 7.860362529754639e-07, 1.169741153717041e-06, 1.5534460544586182e-06, 1.9371509552001953e-06, 2.3208558559417725e-06, 2.7045607566833496e-06, 3.0882656574249268e-06, 3.471970558166504e-06, 3.855675458908081e-06, 4.239380359649658e-06, 4.623085260391235e-06, 5.0067901611328125e-06, 5.39049506187439e-06, 5.774199962615967e-06, 6.157904863357544e-06, 6.541609764099121e-06, 6.925314664840698e-06, 7.309019565582275e-06, 7.692724466323853e-06, 8.07642936706543e-06, 8.460134267807007e-06, 8.843839168548584e-06, 9.227544069290161e-06, 9.611248970031738e-06, 9.994953870773315e-06, 1.0378658771514893e-05, 1.076236367225647e-05, 1.1146068572998047e-05, 1.1529773473739624e-05, 1.1913478374481201e-05, 1.2297183275222778e-05, 1.2680888175964355e-05, 1.3064593076705933e-05, 1.344829797744751e-05, 1.3832002878189087e-05, 1.4215707778930664e-05, 1.4599412679672241e-05, 1.4983117580413818e-05, 1.5366822481155396e-05, 1.5750527381896973e-05, 1.613423228263855e-05, 1.6517937183380127e-05, 1.6901642084121704e-05, 1.728534698486328e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 9.0, 6.0, 17.0, 14.0, 17.0, 21.0, 33.0, 50.0, 66.0, 76.0, 99.0, 130.0, 105.0, 77.0, 58.0, 40.0, 32.0, 27.0, 23.0, 16.0, 12.0, 4.0, 7.0, 13.0, 5.0, 4.0, 1.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.649423186085187e-05, -2.5748700863914564e-05, -2.500316986697726e-05, -2.4257638870039955e-05, -2.351210787310265e-05, -2.2766575057175942e-05, -2.2021044060238637e-05, -2.1275513063301332e-05, -2.0529982066364028e-05, -1.9784451069426723e-05, -1.9038920072489418e-05, -1.8293389075552113e-05, -1.7547856259625405e-05, -1.68023252626881e-05, -1.6056794265750796e-05, -1.531126326881349e-05, -1.4565732271876186e-05, -1.3820201274938881e-05, -1.3074670278001577e-05, -1.232913837156957e-05, -1.1583607374632265e-05, -1.083807637769496e-05, -1.0092544471262954e-05, -9.34701347432565e-06, -8.601482477388345e-06, -7.85595148045104e-06, -7.110420028766384e-06, -6.364888577081729e-06, -5.619357580144424e-06, -4.873826583207119e-06, -4.128295131522464e-06, -3.382763679837808e-06, -2.6372308639110997e-06, -1.8916996396001196e-06, -1.1461684152891394e-06, -4.006371909781592e-07, 3.44894033332821e-07, 1.0904252576438012e-06, 1.8359564819547813e-06, 2.581487933639437e-06, 3.3270189305767417e-06, 4.0725499275140464e-06, 4.818081379198702e-06, 5.563612830883358e-06, 6.309143827820662e-06, 7.054674824757967e-06, 7.800206731189974e-06, 8.545737728127278e-06, 9.291268725064583e-06, 1.0036799722001888e-05, 1.0782330718939193e-05, 1.1527862625371199e-05, 1.2273393622308504e-05, 1.3018924619245809e-05, 1.3764456525677815e-05, 1.450998752261512e-05, 1.5255518519552425e-05, 1.600104951648973e-05, 1.6746580513427034e-05, 1.749211151036434e-05, 1.8237642507301643e-05, 1.8983175323228352e-05, 1.9728706320165657e-05, 2.047423731710296e-05, 2.1219768314040266e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 2.0, 4.0, 8.0, 14.0, 13.0, 12.0, 16.0, 12.0, 23.0, 23.0, 23.0, 27.0, 26.0, 22.0, 35.0, 41.0, 26.0, 38.0, 43.0, 40.0, 35.0, 31.0, 38.0, 40.0, 41.0, 44.0, 37.0, 27.0, 33.0, 25.0, 30.0, 17.0, 26.0, 22.0, 17.0, 18.0, 11.0, 18.0, 14.0, 7.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5760162568767555e-05, -1.528339635115117e-05, -1.4806630133534782e-05, -1.4329863006423693e-05, -1.3853096788807306e-05, -1.337633057119092e-05, -1.2899564353574533e-05, -1.2422797226463445e-05, -1.1946031008847058e-05, -1.1469264791230671e-05, -1.0992498573614284e-05, -1.0515731446503196e-05, -1.003896522888681e-05, -9.562199011270422e-06, -9.085432793654036e-06, -8.608665666542947e-06, -8.13189944892656e-06, -7.655133231310174e-06, -7.178366558946436e-06, -6.7016003413300496e-06, -6.224833668966312e-06, -5.748067451349925e-06, -5.2713012337335385e-06, -4.794534561369801e-06, -4.317768798500765e-06, -3.841002580884378e-06, -3.364235908520641e-06, -2.887469690904254e-06, -2.4107030185405165e-06, -1.9339368009241298e-06, -1.4571703559340676e-06, -9.804039109440055e-07, -5.036372385802679e-07, -2.6870822011915152e-08, 4.4989559455643757e-07, 9.266619827030809e-07, 1.403428427693143e-06, 1.8801947589963675e-06, 2.3569612039864296e-06, 2.8337276489764918e-06, 3.310494093966554e-06, 3.787260538956616e-06, 4.264026756573003e-06, 4.74079342893674e-06, 5.217559646553127e-06, 5.694326318916865e-06, 6.171092536533251e-06, 6.647858754149638e-06, 7.124625426513376e-06, 7.6013916441297624e-06, 8.0781583164935e-06, 8.554924534109887e-06, 9.031690751726273e-06, 9.508457878837362e-06, 9.985224096453749e-06, 1.0461990314070135e-05, 1.0938756531686522e-05, 1.1415522749302909e-05, 1.1892288966919295e-05, 1.2369056094030384e-05, 1.284582231164677e-05, 1.3322588529263157e-05, 1.3799354746879544e-05, 1.4276121873990633e-05, 1.475288809160702e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 2.0, 9.0, 8.0, 13.0, 18.0, 30.0, 30.0, 51.0, 88.0, 153.0, 200.0, 366.0, 625.0, 943.0, 1593.0, 2731.0, 4318.0, 8663.0, 17997.0, 40907.0, 108109.0, 316608.0, 325886.0, 128989.0, 47973.0, 20233.0, 9713.0, 5036.0, 2873.0, 1658.0, 1034.0, 655.0, 384.0, 242.0, 139.0, 89.0, 72.0, 33.0, 27.0, 15.0, 12.0, 10.0, 7.0, 0.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.193450927734375e-05, -2.1228566765785217e-05, -2.0522624254226685e-05, -1.9816681742668152e-05, -1.911073923110962e-05, -1.8404796719551086e-05, -1.7698854207992554e-05, -1.699291169643402e-05, -1.6286969184875488e-05, -1.5581026673316956e-05, -1.4875084161758423e-05, -1.416914165019989e-05, -1.3463199138641357e-05, -1.2757256627082825e-05, -1.2051314115524292e-05, -1.134537160396576e-05, -1.0639429092407227e-05, -9.933486580848694e-06, -9.227544069290161e-06, -8.521601557731628e-06, -7.815659046173096e-06, -7.109716534614563e-06, -6.40377402305603e-06, -5.6978315114974976e-06, -4.991888999938965e-06, -4.285946488380432e-06, -3.5800039768218994e-06, -2.8740614652633667e-06, -2.168118953704834e-06, -1.4621764421463013e-06, -7.562339305877686e-07, -5.029141902923584e-08, 6.556510925292969e-07, 1.3615936040878296e-06, 2.0675361156463623e-06, 2.773478627204895e-06, 3.4794211387634277e-06, 4.1853636503219604e-06, 4.891306161880493e-06, 5.597248673439026e-06, 6.303191184997559e-06, 7.009133696556091e-06, 7.715076208114624e-06, 8.421018719673157e-06, 9.12696123123169e-06, 9.832903742790222e-06, 1.0538846254348755e-05, 1.1244788765907288e-05, 1.195073127746582e-05, 1.2656673789024353e-05, 1.3362616300582886e-05, 1.4068558812141418e-05, 1.4774501323699951e-05, 1.5480443835258484e-05, 1.6186386346817017e-05, 1.689232885837555e-05, 1.7598271369934082e-05, 1.8304213881492615e-05, 1.9010156393051147e-05, 1.971609890460968e-05, 2.0422041416168213e-05, 2.1127983927726746e-05, 2.183392643928528e-05, 2.253986895084381e-05, 2.3245811462402344e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 6.0, 4.0, 15.0, 14.0, 12.0, 18.0, 21.0, 25.0, 21.0, 26.0, 31.0, 31.0, 42.0, 33.0, 39.0, 44.0, 49.0, 34.0, 48.0, 49.0, 44.0, 43.0, 37.0, 43.0, 37.0, 30.0, 15.0, 31.0, 24.0, 18.0, 19.0, 16.0, 13.0, 12.0, 11.0, 14.0, 6.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7642974853515625e-05, -1.7095357179641724e-05, -1.6547739505767822e-05, -1.600012183189392e-05, -1.545250415802002e-05, -1.4904886484146118e-05, -1.4357268810272217e-05, -1.3809651136398315e-05, -1.3262033462524414e-05, -1.2714415788650513e-05, -1.2166798114776611e-05, -1.161918044090271e-05, -1.1071562767028809e-05, -1.0523945093154907e-05, -9.976327419281006e-06, -9.428709745407104e-06, -8.881092071533203e-06, -8.333474397659302e-06, -7.7858567237854e-06, -7.238239049911499e-06, -6.690621376037598e-06, -6.143003702163696e-06, -5.595386028289795e-06, -5.0477683544158936e-06, -4.500150680541992e-06, -3.952533006668091e-06, -3.4049153327941895e-06, -2.857297658920288e-06, -2.3096799850463867e-06, -1.7620623111724854e-06, -1.214444637298584e-06, -6.668269634246826e-07, -1.1920928955078125e-07, 4.284083843231201e-07, 9.760260581970215e-07, 1.5236437320709229e-06, 2.0712614059448242e-06, 2.6188790798187256e-06, 3.166496753692627e-06, 3.7141144275665283e-06, 4.26173210144043e-06, 4.809349775314331e-06, 5.356967449188232e-06, 5.904585123062134e-06, 6.452202796936035e-06, 6.9998204708099365e-06, 7.547438144683838e-06, 8.09505581855774e-06, 8.64267349243164e-06, 9.190291166305542e-06, 9.737908840179443e-06, 1.0285526514053345e-05, 1.0833144187927246e-05, 1.1380761861801147e-05, 1.1928379535675049e-05, 1.247599720954895e-05, 1.3023614883422852e-05, 1.3571232557296753e-05, 1.4118850231170654e-05, 1.4666467905044556e-05, 1.5214085578918457e-05, 1.576170325279236e-05, 1.630932092666626e-05, 1.685693860054016e-05, 1.7404556274414062e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 5.0, 13.0, 12.0, 16.0, 15.0, 24.0, 40.0, 60.0, 82.0, 125.0, 204.0, 288.0, 594.0, 952.0, 1912.0, 4249.0, 10557.0, 32932.0, 177820.0, 724422.0, 64692.0, 17310.0, 6249.0, 2752.0, 1332.0, 742.0, 418.0, 236.0, 158.0, 104.0, 78.0, 45.0, 24.0, 23.0, 18.0, 17.0, 9.0, 4.0, 12.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.272294998168945e-05, -3.170780837535858e-05, -3.069266676902771e-05, -2.967752516269684e-05, -2.8662383556365967e-05, -2.7647241950035095e-05, -2.6632100343704224e-05, -2.5616958737373352e-05, -2.460181713104248e-05, -2.358667552471161e-05, -2.2571533918380737e-05, -2.1556392312049866e-05, -2.0541250705718994e-05, -1.9526109099388123e-05, -1.851096749305725e-05, -1.749582588672638e-05, -1.6480684280395508e-05, -1.5465542674064636e-05, -1.4450401067733765e-05, -1.3435259461402893e-05, -1.2420117855072021e-05, -1.140497624874115e-05, -1.0389834642410278e-05, -9.374693036079407e-06, -8.359551429748535e-06, -7.3444098234176636e-06, -6.329268217086792e-06, -5.31412661075592e-06, -4.298985004425049e-06, -3.2838433980941772e-06, -2.2687017917633057e-06, -1.253560185432434e-06, -2.384185791015625e-07, 7.767230272293091e-07, 1.7918646335601807e-06, 2.8070062398910522e-06, 3.822147846221924e-06, 4.837289452552795e-06, 5.852431058883667e-06, 6.8675726652145386e-06, 7.88271427154541e-06, 8.897855877876282e-06, 9.912997484207153e-06, 1.0928139090538025e-05, 1.1943280696868896e-05, 1.2958422303199768e-05, 1.397356390953064e-05, 1.4988705515861511e-05, 1.6003847122192383e-05, 1.7018988728523254e-05, 1.8034130334854126e-05, 1.9049271941184998e-05, 2.006441354751587e-05, 2.107955515384674e-05, 2.2094696760177612e-05, 2.3109838366508484e-05, 2.4124979972839355e-05, 2.5140121579170227e-05, 2.61552631855011e-05, 2.717040479183197e-05, 2.8185546398162842e-05, 2.9200688004493713e-05, 3.0215829610824585e-05, 3.1230971217155457e-05, 3.224611282348633e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 5.0, 8.0, 10.0, 7.0, 7.0, 12.0, 13.0, 20.0, 11.0, 17.0, 14.0, 30.0, 28.0, 40.0, 33.0, 36.0, 50.0, 46.0, 65.0, 151.0, 36.0, 34.0, 45.0, 33.0, 30.0, 35.0, 28.0, 20.0, 23.0, 16.0, 19.0, 20.0, 11.0, 8.0, 12.0, 6.0, 7.0, 1.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.463859558105469e-06, -8.172355592250824e-06, -7.88085162639618e-06, -7.5893476605415344e-06, -7.29784369468689e-06, -7.006339728832245e-06, -6.7148357629776e-06, -6.423331797122955e-06, -6.1318278312683105e-06, -5.840323865413666e-06, -5.548819899559021e-06, -5.257315933704376e-06, -4.9658119678497314e-06, -4.674308001995087e-06, -4.382804036140442e-06, -4.091300070285797e-06, -3.7997961044311523e-06, -3.5082921385765076e-06, -3.216788172721863e-06, -2.925284206867218e-06, -2.6337802410125732e-06, -2.3422762751579285e-06, -2.0507723093032837e-06, -1.759268343448639e-06, -1.4677643775939941e-06, -1.1762604117393494e-06, -8.847564458847046e-07, -5.932524800300598e-07, -3.0174851417541504e-07, -1.0244548320770264e-08, 2.812594175338745e-07, 5.727633833885193e-07, 8.642673492431641e-07, 1.1557713150978088e-06, 1.4472752809524536e-06, 1.7387792468070984e-06, 2.030283212661743e-06, 2.321787178516388e-06, 2.6132911443710327e-06, 2.9047951102256775e-06, 3.1962990760803223e-06, 3.487803041934967e-06, 3.779307007789612e-06, 4.070810973644257e-06, 4.362314939498901e-06, 4.653818905353546e-06, 4.945322871208191e-06, 5.236826837062836e-06, 5.5283308029174805e-06, 5.819834768772125e-06, 6.11133873462677e-06, 6.402842700481415e-06, 6.6943466663360596e-06, 6.985850632190704e-06, 7.277354598045349e-06, 7.568858563899994e-06, 7.860362529754639e-06, 8.151866495609283e-06, 8.443370461463928e-06, 8.734874427318573e-06, 9.026378393173218e-06, 9.317882359027863e-06, 9.609386324882507e-06, 9.900890290737152e-06, 1.0192394256591797e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 3.0, 4.0, 2.0, 3.0, 9.0, 6.0, 14.0, 13.0, 19.0, 24.0, 34.0, 55.0, 57.0, 84.0, 109.0, 195.0, 294.0, 435.0, 673.0, 1011.0, 1926.0, 3238.0, 6516.0, 16061.0, 63108.0, 905836.0, 28322.0, 9891.0, 4517.0, 2326.0, 1237.0, 814.0, 526.0, 315.0, 267.0, 159.0, 107.0, 77.0, 64.0, 51.0, 46.0, 27.0, 21.0, 18.0, 10.0, 7.0, 4.0, 8.0, 3.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.6954879760742188e-06, -3.577210009098053e-06, -3.458932042121887e-06, -3.3406540751457214e-06, -3.2223761081695557e-06, -3.10409814119339e-06, -2.985820174217224e-06, -2.8675422072410583e-06, -2.7492642402648926e-06, -2.630986273288727e-06, -2.512708306312561e-06, -2.3944303393363953e-06, -2.2761523723602295e-06, -2.1578744053840637e-06, -2.039596438407898e-06, -1.921318471431732e-06, -1.8030405044555664e-06, -1.6847625374794006e-06, -1.5664845705032349e-06, -1.448206603527069e-06, -1.3299286365509033e-06, -1.2116506695747375e-06, -1.0933727025985718e-06, -9.75094735622406e-07, -8.568167686462402e-07, -7.385388016700745e-07, -6.202608346939087e-07, -5.019828677177429e-07, -3.8370490074157715e-07, -2.654269337654114e-07, -1.471489667892456e-07, -2.8870999813079834e-08, 8.940696716308594e-08, 2.076849341392517e-07, 3.259629011154175e-07, 4.4424086809158325e-07, 5.62518835067749e-07, 6.807968020439148e-07, 7.990747690200806e-07, 9.173527359962463e-07, 1.0356307029724121e-06, 1.1539086699485779e-06, 1.2721866369247437e-06, 1.3904646039009094e-06, 1.5087425708770752e-06, 1.627020537853241e-06, 1.7452985048294067e-06, 1.8635764718055725e-06, 1.9818544387817383e-06, 2.100132405757904e-06, 2.21841037273407e-06, 2.3366883397102356e-06, 2.4549663066864014e-06, 2.573244273662567e-06, 2.691522240638733e-06, 2.8098002076148987e-06, 2.9280781745910645e-06, 3.0463561415672302e-06, 3.164634108543396e-06, 3.2829120755195618e-06, 3.4011900424957275e-06, 3.5194680094718933e-06, 3.637745976448059e-06, 3.756023943424225e-06, 3.874301910400391e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 0.0, 9.0, 2.0, 0.0, 10.0, 0.0, 37.0, 0.0, 16.0, 0.0, 22.0, 0.0, 46.0, 0.0, 3.0, 0.0, 718.0, 0.0, 5.0, 48.0, 0.0, 30.0, 0.0, 17.0, 0.0, 23.0, 0.0, 5.0, 0.0, 4.0, 0.0, 7.0, 0.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.220093488693237e-07, -8.903443813323975e-07, -8.586794137954712e-07, -8.270144462585449e-07, -7.953494787216187e-07, -7.636845111846924e-07, -7.320195436477661e-07, -7.003545761108398e-07, -6.686896085739136e-07, -6.370246410369873e-07, -6.05359673500061e-07, -5.736947059631348e-07, -5.420297384262085e-07, -5.103647708892822e-07, -4.78699803352356e-07, -4.470348358154297e-07, -4.153698682785034e-07, -3.8370490074157715e-07, -3.520399332046509e-07, -3.203749656677246e-07, -2.8870999813079834e-07, -2.5704503059387207e-07, -2.253800630569458e-07, -1.9371509552001953e-07, -1.6205012798309326e-07, -1.30385160446167e-07, -9.872019290924072e-08, -6.705522537231445e-08, -3.5390257835388184e-08, -3.725290298461914e-09, 2.7939677238464355e-08, 5.960464477539063e-08, 9.12696123123169e-08, 1.2293457984924316e-07, 1.5459954738616943e-07, 1.862645149230957e-07, 2.1792948246002197e-07, 2.4959444999694824e-07, 2.812594175338745e-07, 3.129243850708008e-07, 3.4458935260772705e-07, 3.762543201446533e-07, 4.079192876815796e-07, 4.3958425521850586e-07, 4.7124922275543213e-07, 5.029141902923584e-07, 5.345791578292847e-07, 5.662441253662109e-07, 5.979090929031372e-07, 6.295740604400635e-07, 6.612390279769897e-07, 6.92903995513916e-07, 7.245689630508423e-07, 7.562339305877686e-07, 7.878988981246948e-07, 8.195638656616211e-07, 8.512288331985474e-07, 8.828938007354736e-07, 9.145587682723999e-07, 9.462237358093262e-07, 9.778887033462524e-07, 1.0095536708831787e-06, 1.041218638420105e-06, 1.0728836059570312e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 13.0, 3.0, 4.0, 17.0, 29.0, 50.0, 84.0, 170.0, 407.0, 777.0, 1847.0, 4826.0, 16142.0, 103661.0, 881933.0, 27115.0, 6990.0, 2465.0, 1039.0, 464.0, 221.0, 107.0, 80.0, 35.0, 17.0, 23.0, 3.0, 6.0, 11.0, 0.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.4373016357421875e-06, -6.259419023990631e-06, -6.081536412239075e-06, -5.903653800487518e-06, -5.725771188735962e-06, -5.5478885769844055e-06, -5.370005965232849e-06, -5.192123353481293e-06, -5.014240741729736e-06, -4.83635812997818e-06, -4.6584755182266235e-06, -4.480592906475067e-06, -4.302710294723511e-06, -4.124827682971954e-06, -3.946945071220398e-06, -3.7690624594688416e-06, -3.591179847717285e-06, -3.4132972359657288e-06, -3.2354146242141724e-06, -3.057532012462616e-06, -2.8796494007110596e-06, -2.701766788959503e-06, -2.5238841772079468e-06, -2.3460015654563904e-06, -2.168118953704834e-06, -1.9902363419532776e-06, -1.8123537302017212e-06, -1.6344711184501648e-06, -1.4565885066986084e-06, -1.278705894947052e-06, -1.1008232831954956e-06, -9.229406714439392e-07, -7.450580596923828e-07, -5.671754479408264e-07, -3.8929283618927e-07, -2.1141022443771362e-07, -3.3527612686157227e-08, 1.4435499906539917e-07, 3.2223761081695557e-07, 5.00120222568512e-07, 6.780028343200684e-07, 8.558854460716248e-07, 1.0337680578231812e-06, 1.2116506695747375e-06, 1.389533281326294e-06, 1.5674158930778503e-06, 1.7452985048294067e-06, 1.923181116580963e-06, 2.1010637283325195e-06, 2.278946340084076e-06, 2.4568289518356323e-06, 2.6347115635871887e-06, 2.812594175338745e-06, 2.9904767870903015e-06, 3.168359398841858e-06, 3.3462420105934143e-06, 3.5241246223449707e-06, 3.702007234096527e-06, 3.8798898458480835e-06, 4.05777245759964e-06, 4.235655069351196e-06, 4.413537681102753e-06, 4.591420292854309e-06, 4.7693029046058655e-06, 4.947185516357422e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 14.0, 0.0, 0.0, 10.0, 0.0, 0.0, 28.0, 0.0, 0.0, 47.0, 0.0, 0.0, 81.0, 0.0, 682.0, 0.0, 0.0, 58.0, 0.0, 0.0, 47.0, 0.0, 0.0, 20.0, 0.0, 9.0, 0.0, 0.0, 9.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.746260285377502e-07, -5.532056093215942e-07, -5.317851901054382e-07, -5.103647708892822e-07, -4.889443516731262e-07, -4.675239324569702e-07, -4.461035132408142e-07, -4.246830940246582e-07, -4.032626748085022e-07, -3.818422555923462e-07, -3.604218363761902e-07, -3.390014171600342e-07, -3.175809979438782e-07, -2.9616057872772217e-07, -2.7474015951156616e-07, -2.5331974029541016e-07, -2.3189932107925415e-07, -2.1047890186309814e-07, -1.8905848264694214e-07, -1.6763806343078613e-07, -1.4621764421463013e-07, -1.2479722499847412e-07, -1.0337680578231812e-07, -8.195638656616211e-08, -6.05359673500061e-08, -3.91155481338501e-08, -1.7695128917694092e-08, 3.725290298461914e-09, 2.514570951461792e-08, 4.6566128730773926e-08, 6.798654794692993e-08, 8.940696716308594e-08, 1.1082738637924194e-07, 1.3224780559539795e-07, 1.5366822481155396e-07, 1.7508864402770996e-07, 1.9650906324386597e-07, 2.1792948246002197e-07, 2.39349901676178e-07, 2.60770320892334e-07, 2.8219074010849e-07, 3.03611159324646e-07, 3.25031578540802e-07, 3.46451997756958e-07, 3.67872416973114e-07, 3.8929283618927e-07, 4.10713255405426e-07, 4.3213367462158203e-07, 4.5355409383773804e-07, 4.7497451305389404e-07, 4.9639493227005e-07, 5.178153514862061e-07, 5.392357707023621e-07, 5.606561899185181e-07, 5.820766091346741e-07, 6.034970283508301e-07, 6.249174475669861e-07, 6.463378667831421e-07, 6.677582859992981e-07, 6.891787052154541e-07, 7.105991244316101e-07, 7.320195436477661e-07, 7.534399628639221e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 16.0, 10.0, 17.0, 20.0, 27.0, 32.0, 63.0, 72.0, 120.0, 159.0, 130.0, 81.0, 53.0, 50.0, 33.0, 19.0, 16.0, 13.0, 8.0, 12.0, 6.0, 6.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.385479067219421e-05, -3.29536669596564e-05, -3.20525468850974e-05, -3.115142317255959e-05, -3.0250301279011182e-05, -2.9349177566473372e-05, -2.8448055672924966e-05, -2.7546931960387155e-05, -2.664581006683875e-05, -2.5744688173290342e-05, -2.4843564460752532e-05, -2.3942442567204125e-05, -2.304132067365572e-05, -2.214019696111791e-05, -2.1239075067569502e-05, -2.0337953174021095e-05, -1.9436829461483285e-05, -1.8535707567934878e-05, -1.7634583855397068e-05, -1.673346196184866e-05, -1.5832340068300255e-05, -1.4931216355762444e-05, -1.4030094462214038e-05, -1.312897165917093e-05, -1.2227850675117224e-05, -1.1326727872074116e-05, -1.042560597852571e-05, -9.524483175482601e-06, -8.623360372439492e-06, -7.722237569396384e-06, -6.821115675847977e-06, -5.919992872804869e-06, -5.0188700697617605e-06, -4.117747721466003e-06, -3.2166249184228946e-06, -2.315502570127137e-06, -1.414379994457704e-06, -5.13257418788271e-07, 3.878649295074865e-07, 1.288987732550595e-06, 2.1901100808463525e-06, 3.0912326565157855e-06, 3.9923552321852185e-06, 4.893477580480976e-06, 5.794599928776734e-06, 6.695722731819842e-06, 7.5968450801155996e-06, 8.497967428411357e-06, 9.399090231454466e-06, 1.0300213034497574e-05, 1.120133492804598e-05, 1.2102457731089089e-05, 1.3003580534132197e-05, 1.3904702427680604e-05, 1.4805825230723713e-05, 1.570694803376682e-05, 1.6608069927315228e-05, 1.7509191820863634e-05, 1.8410315533401445e-05, 1.931143742694985e-05, 2.0212559320498258e-05, 2.1113683033036068e-05, 2.2014804926584475e-05, 2.291592682013288e-05, 2.381705053267069e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 1.0, 4.0, 7.0, 10.0, 14.0, 14.0, 13.0, 13.0, 21.0, 23.0, 23.0, 25.0, 23.0, 27.0, 28.0, 37.0, 34.0, 32.0, 40.0, 44.0, 39.0, 35.0, 36.0, 41.0, 31.0, 42.0, 43.0, 30.0, 27.0, 36.0, 23.0, 26.0, 18.0, 25.0, 23.0, 16.0, 10.0, 18.0, 16.0, 10.0, 4.0, 6.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.5805895600351505e-05, -1.533443901280407e-05, -1.486298151576193e-05, -1.4391524018719792e-05, -1.3920067431172356e-05, -1.3448609934130218e-05, -1.297715243708808e-05, -1.2505695849540643e-05, -1.2034238352498505e-05, -1.1562780855456367e-05, -1.109132426790893e-05, -1.0619866770866793e-05, -1.0148410183319356e-05, -9.676952686277218e-06, -9.205496098729782e-06, -8.734038601687644e-06, -8.262581104645506e-06, -7.791123607603367e-06, -7.319667020055931e-06, -6.848209523013793e-06, -6.376752480719006e-06, -5.9052954384242184e-06, -5.433838396129431e-06, -4.962381353834644e-06, -4.490924766287208e-06, -4.01946772399242e-06, -3.5480104543239577e-06, -3.0765534120291704e-06, -2.6050961423607077e-06, -2.1336391000659205e-06, -1.6621820577711333e-06, -1.1907247881026706e-06, -7.192675184342079e-07, -2.4781039087429235e-07, 2.2364673668562318e-07, 6.951038358238293e-07, 1.1665609918054543e-06, 1.6380181477870792e-06, 2.1094751900818665e-06, 2.580932459750329e-06, 3.0523895020451164e-06, 3.5238465443399036e-06, 3.995303814008366e-06, 4.4667608563031536e-06, 4.938217898597941e-06, 5.409675395640079e-06, 5.881131983187515e-06, 6.352589480229653e-06, 6.824046522524441e-06, 7.295503564819228e-06, 7.766961061861366e-06, 8.238417649408802e-06, 8.70987514645094e-06, 9.181332643493079e-06, 9.652789231040515e-06, 1.0124246728082653e-05, 1.059570331563009e-05, 1.1067160812672228e-05, 1.1538617400219664e-05, 1.2010074897261802e-05, 1.2481531484809238e-05, 1.2952988981851377e-05, 1.3424445569398813e-05, 1.3895903066440951e-05, 1.436736056348309e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 3.0, 1.0, 4.0, 8.0, 8.0, 21.0, 27.0, 35.0, 67.0, 99.0, 135.0, 175.0, 289.0, 495.0, 753.0, 1253.0, 1999.0, 3123.0, 5565.0, 9202.0, 16938.0, 30878.0, 58084.0, 137596.0, 368058.0, 234002.0, 86603.0, 40462.0, 22389.0, 12294.0, 7224.0, 4240.0, 2371.0, 1592.0, 928.0, 591.0, 376.0, 209.0, 149.0, 125.0, 65.0, 46.0, 21.0, 19.0, 14.0, 5.0, 2.0, 7.0, 3.0, 0.0, 3.0, 2.0, 3.0], "bins": [-6.520748138427734e-05, -6.338302046060562e-05, -6.15585595369339e-05, -5.9734098613262177e-05, -5.7909637689590454e-05, -5.608517676591873e-05, -5.426071584224701e-05, -5.243625491857529e-05, -5.0611793994903564e-05, -4.878733307123184e-05, -4.696287214756012e-05, -4.51384112238884e-05, -4.3313950300216675e-05, -4.148948937654495e-05, -3.966502845287323e-05, -3.784056752920151e-05, -3.6016106605529785e-05, -3.419164568185806e-05, -3.236718475818634e-05, -3.054272383451462e-05, -2.8718262910842896e-05, -2.6893801987171173e-05, -2.506934106349945e-05, -2.3244880139827728e-05, -2.1420419216156006e-05, -1.9595958292484283e-05, -1.777149736881256e-05, -1.594703644514084e-05, -1.4122575521469116e-05, -1.2298114597797394e-05, -1.0473653674125671e-05, -8.649192750453949e-06, -6.8247318267822266e-06, -5.000270903110504e-06, -3.1758099794387817e-06, -1.3513490557670593e-06, 4.731118679046631e-07, 2.2975727915763855e-06, 4.122033715248108e-06, 5.94649463891983e-06, 7.770955562591553e-06, 9.595416486263275e-06, 1.1419877409934998e-05, 1.324433833360672e-05, 1.5068799257278442e-05, 1.6893260180950165e-05, 1.8717721104621887e-05, 2.054218202829361e-05, 2.2366642951965332e-05, 2.4191103875637054e-05, 2.6015564799308777e-05, 2.78400257229805e-05, 2.966448664665222e-05, 3.1488947570323944e-05, 3.3313408493995667e-05, 3.513786941766739e-05, 3.696233034133911e-05, 3.8786791265010834e-05, 4.0611252188682556e-05, 4.243571311235428e-05, 4.4260174036026e-05, 4.6084634959697723e-05, 4.7909095883369446e-05, 4.973355680704117e-05, 5.155801773071289e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 2.0, 0.0, 4.0, 5.0, 6.0, 8.0, 13.0, 9.0, 13.0, 21.0, 10.0, 14.0, 19.0, 27.0, 18.0, 29.0, 32.0, 28.0, 31.0, 28.0, 39.0, 40.0, 47.0, 36.0, 33.0, 40.0, 38.0, 29.0, 35.0, 51.0, 36.0, 32.0, 24.0, 28.0, 23.0, 22.0, 24.0, 18.0, 14.0, 21.0, 15.0, 13.0, 3.0, 7.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0], "bins": [-8.761882781982422e-06, -8.516013622283936e-06, -8.27014446258545e-06, -8.024275302886963e-06, -7.778406143188477e-06, -7.53253698348999e-06, -7.286667823791504e-06, -7.040798664093018e-06, -6.794929504394531e-06, -6.549060344696045e-06, -6.303191184997559e-06, -6.057322025299072e-06, -5.811452865600586e-06, -5.5655837059021e-06, -5.319714546203613e-06, -5.073845386505127e-06, -4.827976226806641e-06, -4.582107067108154e-06, -4.336237907409668e-06, -4.090368747711182e-06, -3.844499588012695e-06, -3.598630428314209e-06, -3.3527612686157227e-06, -3.1068921089172363e-06, -2.86102294921875e-06, -2.6151537895202637e-06, -2.3692846298217773e-06, -2.123415470123291e-06, -1.8775463104248047e-06, -1.6316771507263184e-06, -1.385807991027832e-06, -1.1399388313293457e-06, -8.940696716308594e-07, -6.48200511932373e-07, -4.023313522338867e-07, -1.564621925354004e-07, 8.940696716308594e-08, 3.3527612686157227e-07, 5.811452865600586e-07, 8.270144462585449e-07, 1.0728836059570312e-06, 1.3187527656555176e-06, 1.564621925354004e-06, 1.8104910850524902e-06, 2.0563602447509766e-06, 2.302229404449463e-06, 2.5480985641479492e-06, 2.7939677238464355e-06, 3.039836883544922e-06, 3.285706043243408e-06, 3.5315752029418945e-06, 3.777444362640381e-06, 4.023313522338867e-06, 4.2691826820373535e-06, 4.51505184173584e-06, 4.760921001434326e-06, 5.0067901611328125e-06, 5.252659320831299e-06, 5.498528480529785e-06, 5.7443976402282715e-06, 5.990266799926758e-06, 6.236135959625244e-06, 6.4820051193237305e-06, 6.727874279022217e-06, 6.973743438720703e-06]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 7.0, 7.0, 15.0, 16.0, 44.0, 48.0, 63.0, 90.0, 158.0, 233.0, 359.0, 539.0, 906.0, 1480.0, 2280.0, 3854.0, 6613.0, 10928.0, 19394.0, 38261.0, 76181.0, 188182.0, 430415.0, 137447.0, 60042.0, 31468.0, 15934.0, 9298.0, 5723.0, 3245.0, 1946.0, 1273.0, 722.0, 506.0, 321.0, 194.0, 121.0, 86.0, 49.0, 37.0, 27.0, 18.0, 11.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6776065826416016e-05, -3.556441515684128e-05, -3.435276448726654e-05, -3.31411138176918e-05, -3.1929463148117065e-05, -3.071781247854233e-05, -2.950616180896759e-05, -2.8294511139392853e-05, -2.7082860469818115e-05, -2.5871209800243378e-05, -2.465955913066864e-05, -2.3447908461093903e-05, -2.2236257791519165e-05, -2.1024607121944427e-05, -1.981295645236969e-05, -1.8601305782794952e-05, -1.7389655113220215e-05, -1.6178004443645477e-05, -1.496635377407074e-05, -1.3754703104496002e-05, -1.2543052434921265e-05, -1.1331401765346527e-05, -1.011975109577179e-05, -8.908100426197052e-06, -7.696449756622314e-06, -6.484799087047577e-06, -5.273148417472839e-06, -4.061497747898102e-06, -2.8498470783233643e-06, -1.6381964087486267e-06, -4.2654573917388916e-07, 7.851049304008484e-07, 1.996755599975586e-06, 3.2084062695503235e-06, 4.420056939125061e-06, 5.631707608699799e-06, 6.843358278274536e-06, 8.055008947849274e-06, 9.266659617424011e-06, 1.0478310286998749e-05, 1.1689960956573486e-05, 1.2901611626148224e-05, 1.4113262295722961e-05, 1.53249129652977e-05, 1.6536563634872437e-05, 1.7748214304447174e-05, 1.895986497402191e-05, 2.017151564359665e-05, 2.1383166313171387e-05, 2.2594816982746124e-05, 2.3806467652320862e-05, 2.50181183218956e-05, 2.6229768991470337e-05, 2.7441419661045074e-05, 2.8653070330619812e-05, 2.986472100019455e-05, 3.107637166976929e-05, 3.2288022339344025e-05, 3.349967300891876e-05, 3.47113236784935e-05, 3.592297434806824e-05, 3.7134625017642975e-05, 3.834627568721771e-05, 3.955792635679245e-05, 4.076957702636719e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 8.0, 5.0, 7.0, 10.0, 9.0, 13.0, 13.0, 17.0, 17.0, 33.0, 23.0, 31.0, 29.0, 55.0, 49.0, 52.0, 54.0, 49.0, 60.0, 41.0, 66.0, 40.0, 40.0, 39.0, 43.0, 22.0, 36.0, 16.0, 14.0, 27.0, 15.0, 19.0, 14.0, 8.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1622905731201172e-05, -1.1292286217212677e-05, -1.0961666703224182e-05, -1.0631047189235687e-05, -1.0300427675247192e-05, -9.969808161258698e-06, -9.639188647270203e-06, -9.308569133281708e-06, -8.977949619293213e-06, -8.647330105304718e-06, -8.316710591316223e-06, -7.986091077327728e-06, -7.655471563339233e-06, -7.3248520493507385e-06, -6.994232535362244e-06, -6.663613021373749e-06, -6.332993507385254e-06, -6.002373993396759e-06, -5.671754479408264e-06, -5.341134965419769e-06, -5.010515451431274e-06, -4.6798959374427795e-06, -4.349276423454285e-06, -4.01865690946579e-06, -3.688037395477295e-06, -3.3574178814888e-06, -3.026798367500305e-06, -2.6961788535118103e-06, -2.3655593395233154e-06, -2.0349398255348206e-06, -1.7043203115463257e-06, -1.3737007975578308e-06, -1.043081283569336e-06, -7.124617695808411e-07, -3.818422555923462e-07, -5.122274160385132e-08, 2.7939677238464355e-07, 6.100162863731384e-07, 9.406358003616333e-07, 1.2712553143501282e-06, 1.601874828338623e-06, 1.932494342327118e-06, 2.263113856315613e-06, 2.5937333703041077e-06, 2.9243528842926025e-06, 3.2549723982810974e-06, 3.5855919122695923e-06, 3.916211426258087e-06, 4.246830940246582e-06, 4.577450454235077e-06, 4.908069968223572e-06, 5.238689482212067e-06, 5.5693089962005615e-06, 5.899928510189056e-06, 6.230548024177551e-06, 6.561167538166046e-06, 6.891787052154541e-06, 7.222406566143036e-06, 7.553026080131531e-06, 7.883645594120026e-06, 8.21426510810852e-06, 8.544884622097015e-06, 8.87550413608551e-06, 9.206123650074005e-06, 9.5367431640625e-06]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 9.0, 0.0, 19.0, 0.0, 0.0, 50.0, 0.0, 55.0, 0.0, 171.0, 0.0, 0.0, 214.0, 0.0, 684.0, 0.0, 1137.0, 0.0, 3216.0, 0.0, 0.0, 11571.0, 0.0, 1014381.0, 0.0, 11482.0, 0.0, 0.0, 3175.0, 0.0, 1172.0, 0.0, 720.0, 0.0, 224.0, 0.0, 0.0, 151.0, 0.0, 58.0, 0.0, 48.0, 0.0, 0.0, 23.0, 0.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.152557373046875e-07, -6.891787052154541e-07, -6.631016731262207e-07, -6.370246410369873e-07, -6.109476089477539e-07, -5.848705768585205e-07, -5.587935447692871e-07, -5.327165126800537e-07, -5.066394805908203e-07, -4.805624485015869e-07, -4.544854164123535e-07, -4.284083843231201e-07, -4.023313522338867e-07, -3.762543201446533e-07, -3.501772880554199e-07, -3.241002559661865e-07, -2.980232238769531e-07, -2.7194619178771973e-07, -2.4586915969848633e-07, -2.1979212760925293e-07, -1.9371509552001953e-07, -1.6763806343078613e-07, -1.4156103134155273e-07, -1.1548399925231934e-07, -8.940696716308594e-08, -6.332993507385254e-08, -3.725290298461914e-08, -1.1175870895385742e-08, 1.4901161193847656e-08, 4.0978193283081055e-08, 6.705522537231445e-08, 9.313225746154785e-08, 1.1920928955078125e-07, 1.4528632164001465e-07, 1.7136335372924805e-07, 1.9744038581848145e-07, 2.2351741790771484e-07, 2.4959444999694824e-07, 2.7567148208618164e-07, 3.0174851417541504e-07, 3.2782554626464844e-07, 3.5390257835388184e-07, 3.7997961044311523e-07, 4.0605664253234863e-07, 4.3213367462158203e-07, 4.5821070671081543e-07, 4.842877388000488e-07, 5.103647708892822e-07, 5.364418029785156e-07, 5.62518835067749e-07, 5.885958671569824e-07, 6.146728992462158e-07, 6.407499313354492e-07, 6.668269634246826e-07, 6.92903995513916e-07, 7.189810276031494e-07, 7.450580596923828e-07, 7.711350917816162e-07, 7.972121238708496e-07, 8.23289155960083e-07, 8.493661880493164e-07, 8.754432201385498e-07, 9.015202522277832e-07, 9.275972843170166e-07, 9.5367431640625e-07]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 63.0, 0.0, 0.0, 0.0, 0.0, 469.0, 0.0, 0.0, 0.0, 3907.0, 0.0, 0.0, 0.0, 0.0, 17223.0, 0.0, 0.0, 0.0, 0.0, 1005159.0, 0.0, 0.0, 0.0, 17199.0, 0.0, 0.0, 0.0, 0.0, 3959.0, 0.0, 0.0, 0.0, 509.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 945.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 5.0, 9.0, 6.0, 15.0, 11.0, 9.0, 19.0, 19.0, 35.0, 45.0, 60.0, 77.0, 111.0, 146.0, 107.0, 79.0, 52.0, 35.0, 33.0, 27.0, 24.0, 12.0, 12.0, 7.0, 8.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0], "bins": [-1.6626181604806334e-05, -1.6203868653974496e-05, -1.5781555703142658e-05, -1.535924275231082e-05, -1.4936929801478982e-05, -1.4514616850647144e-05, -1.4092303899815306e-05, -1.3669990948983468e-05, -1.324767799815163e-05, -1.2825365047319792e-05, -1.2403052096487954e-05, -1.1980739145656116e-05, -1.1558426194824278e-05, -1.113611324399244e-05, -1.0713800293160602e-05, -1.0291487342328764e-05, -9.869175300991628e-06, -9.44686235015979e-06, -9.024549399327952e-06, -8.602236448496114e-06, -8.179923497664277e-06, -7.757610546832439e-06, -7.3352980507479515e-06, -6.9129850999161135e-06, -6.490672149084276e-06, -6.068359198252438e-06, -5.6460462474206e-06, -5.223733751336113e-06, -4.801420800504275e-06, -4.379107849672437e-06, -3.956794898840599e-06, -3.534481948008761e-06, -3.1121699066716246e-06, -2.6898569558397867e-06, -2.2675440050079487e-06, -1.8452312815497862e-06, -1.4229183307179483e-06, -1.0006053798861103e-06, -5.782926564279478e-07, -1.5597970559610985e-07, 2.663332452357281e-07, 6.886461392241472e-07, 1.1109590332125663e-06, 1.5332718703575665e-06, 1.9555848211894045e-06, 2.3778977720212424e-06, 2.800210495479405e-06, 3.222523446311243e-06, 3.644836397143081e-06, 4.067149347974919e-06, 4.489462298806757e-06, 4.911775249638595e-06, 5.334088200470433e-06, 5.756401151302271e-06, 6.178713647386758e-06, 6.601026598218596e-06, 7.0233395490504336e-06, 7.4456524998822715e-06, 7.867964995966759e-06, 8.290277946798597e-06, 8.712590897630434e-06, 9.134903848462272e-06, 9.55721679929411e-06, 9.979529750125948e-06, 1.0401842700957786e-05]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 4.0, 9.0, 5.0, 10.0, 13.0, 15.0, 9.0, 15.0, 18.0, 18.0, 24.0, 18.0, 14.0, 23.0, 32.0, 39.0, 29.0, 34.0, 31.0, 32.0, 33.0, 36.0, 27.0, 30.0, 33.0, 35.0, 31.0, 34.0, 30.0, 30.0, 30.0, 30.0, 25.0, 25.0, 21.0, 22.0, 21.0, 20.0, 17.0, 11.0, 11.0, 7.0, 7.0, 7.0, 8.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.278578323166585e-06, -7.040957370918477e-06, -6.80333687341772e-06, -6.5657159211696126e-06, -6.328094968921505e-06, -6.090474016673397e-06, -5.85285306442529e-06, -5.615232566924533e-06, -5.377611614676425e-06, -5.139990662428318e-06, -4.902370164927561e-06, -4.664749212679453e-06, -4.4271282604313456e-06, -4.189507308183238e-06, -3.95188635593513e-06, -3.7142658584343735e-06, -3.476644906186266e-06, -3.2390239539381582e-06, -3.001403229063726e-06, -2.763782504189294e-06, -2.526161551941186e-06, -2.2885405996930785e-06, -2.0509198748186463e-06, -1.8132990362573764e-06, -1.5756781976961065e-06, -1.3380573591348366e-06, -1.1004365205735667e-06, -8.628156820122967e-07, -6.251948434510268e-07, -3.875740048897569e-07, -1.4995316632848699e-07, 8.766767223278293e-08, 3.2528896554140374e-07, 5.629098041026737e-07, 8.005306426639436e-07, 1.0381514812252135e-06, 1.2757723197864834e-06, 1.5133931583477533e-06, 1.7510139969090233e-06, 1.9886347217834555e-06, 2.226255674031563e-06, 2.4638766262796707e-06, 2.701497351154103e-06, 2.939118076028535e-06, 3.1767390282766428e-06, 3.4143599805247504e-06, 3.6519807053991826e-06, 3.889601430273615e-06, 4.1272223825217225e-06, 4.36484333476983e-06, 4.602464287017938e-06, 4.8400847845186945e-06, 5.077705736766802e-06, 5.31532668901491e-06, 5.5529471865156665e-06, 5.790568138763774e-06, 6.028189091011882e-06, 6.2658100432599895e-06, 6.503430995508097e-06, 6.741051493008854e-06, 6.9786724452569615e-06, 7.216293397505069e-06, 7.453913895005826e-06, 7.691534847253934e-06, 7.929155799502041e-06]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 6.0, 11.0, 11.0, 15.0, 39.0, 35.0, 86.0, 157.0, 282.0, 352.0, 370.0, 872.0, 1300.0, 1803.0, 3064.0, 4547.0, 6580.0, 5996.0, 13631.0, 19875.0, 30241.0, 47865.0, 71610.0, 113267.0, 106221.0, 247821.0, 410310.0, 1430094.0, 712211.0, 374277.0, 214192.0, 91942.0, 98986.0, 62061.0, 41416.0, 26923.0, 18107.0, 12185.0, 5789.0, 6554.0, 4210.0, 2987.0, 1910.0, 1432.0, 932.0, 407.0, 428.0, 321.0, 208.0, 135.0, 82.0, 64.0, 30.0, 15.0, 15.0, 13.0, 3.0, 2.0, 0.0, 2.0], "bins": [-5.424022674560547e-06, -5.253590643405914e-06, -5.083158612251282e-06, -4.912726581096649e-06, -4.742294549942017e-06, -4.571862518787384e-06, -4.4014304876327515e-06, -4.230998456478119e-06, -4.060566425323486e-06, -3.890134394168854e-06, -3.719702363014221e-06, -3.5492703318595886e-06, -3.378838300704956e-06, -3.2084062695503235e-06, -3.037974238395691e-06, -2.8675422072410583e-06, -2.6971101760864258e-06, -2.5266781449317932e-06, -2.3562461137771606e-06, -2.185814082622528e-06, -2.0153820514678955e-06, -1.844950020313263e-06, -1.6745179891586304e-06, -1.5040859580039978e-06, -1.3336539268493652e-06, -1.1632218956947327e-06, -9.927898645401e-07, -8.223578333854675e-07, -6.51925802230835e-07, -4.814937710762024e-07, -3.110617399215698e-07, -1.4062970876693726e-07, 2.9802322387695312e-08, 2.0023435354232788e-07, 3.7066638469696045e-07, 5.41098415851593e-07, 7.115304470062256e-07, 8.819624781608582e-07, 1.0523945093154907e-06, 1.2228265404701233e-06, 1.3932585716247559e-06, 1.5636906027793884e-06, 1.734122633934021e-06, 1.9045546650886536e-06, 2.074986696243286e-06, 2.2454187273979187e-06, 2.4158507585525513e-06, 2.586282789707184e-06, 2.7567148208618164e-06, 2.927146852016449e-06, 3.0975788831710815e-06, 3.268010914325714e-06, 3.4384429454803467e-06, 3.6088749766349792e-06, 3.779307007789612e-06, 3.949739038944244e-06, 4.120171070098877e-06, 4.2906031012535095e-06, 4.461035132408142e-06, 4.631467163562775e-06, 4.801899194717407e-06, 4.97233122587204e-06, 5.142763257026672e-06, 5.313195288181305e-06, 5.4836273193359375e-06]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 45.0, 0.0, 0.0, 0.0, 83.0, 0.0, 0.0, 0.0, 112.0, 0.0, 0.0, 0.0, 138.0, 0.0, 0.0, 0.0, 162.0, 0.0, 0.0, 0.0, 158.0, 0.0, 0.0, 0.0, 120.0, 0.0, 0.0, 0.0, 78.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 0.0, 29.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 2.0], "bins": [-4.76837158203125e-07, -4.6193599700927734e-07, -4.470348358154297e-07, -4.3213367462158203e-07, -4.172325134277344e-07, -4.023313522338867e-07, -3.8743019104003906e-07, -3.725290298461914e-07, -3.5762786865234375e-07, -3.427267074584961e-07, -3.2782554626464844e-07, -3.129243850708008e-07, -2.980232238769531e-07, -2.8312206268310547e-07, -2.682209014892578e-07, -2.5331974029541016e-07, -2.384185791015625e-07, -2.2351741790771484e-07, -2.086162567138672e-07, -1.9371509552001953e-07, -1.7881393432617188e-07, -1.6391277313232422e-07, -1.4901161193847656e-07, -1.341104507446289e-07, -1.1920928955078125e-07, -1.043081283569336e-07, -8.940696716308594e-08, -7.450580596923828e-08, -5.960464477539063e-08, -4.470348358154297e-08, -2.9802322387695312e-08, -1.4901161193847656e-08, 0.0, 1.4901161193847656e-08, 2.9802322387695312e-08, 4.470348358154297e-08, 5.960464477539063e-08, 7.450580596923828e-08, 8.940696716308594e-08, 1.043081283569336e-07, 1.1920928955078125e-07, 1.341104507446289e-07, 1.4901161193847656e-07, 1.6391277313232422e-07, 1.7881393432617188e-07, 1.9371509552001953e-07, 2.086162567138672e-07, 2.2351741790771484e-07, 2.384185791015625e-07, 2.5331974029541016e-07, 2.682209014892578e-07, 2.8312206268310547e-07, 2.980232238769531e-07, 3.129243850708008e-07, 3.2782554626464844e-07, 3.427267074584961e-07, 3.5762786865234375e-07, 3.725290298461914e-07, 3.8743019104003906e-07, 4.023313522338867e-07, 4.172325134277344e-07, 4.3213367462158203e-07, 4.470348358154297e-07, 4.6193599700927734e-07, 4.76837158203125e-07]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 7.0, 15.0, 21.0, 18.0, 35.0, 44.0, 59.0, 78.0, 121.0, 198.0, 235.0, 473.0, 598.0, 1633.0, 4561.0, 17600.0, 86209.0, 724983.0, 3016264.0, 281225.0, 44642.0, 9472.0, 3165.0, 1105.0, 544.0, 288.0, 211.0, 148.0, 124.0, 73.0, 52.0, 34.0, 19.0, 11.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1026859283447266e-05, -1.0730698704719543e-05, -1.0434538125991821e-05, -1.0138377547264099e-05, -9.842216968536377e-06, -9.546056389808655e-06, -9.249895811080933e-06, -8.95373523235321e-06, -8.657574653625488e-06, -8.361414074897766e-06, -8.065253496170044e-06, -7.769092917442322e-06, -7.4729323387146e-06, -7.1767717599868774e-06, -6.880611181259155e-06, -6.584450602531433e-06, -6.288290023803711e-06, -5.992129445075989e-06, -5.695968866348267e-06, -5.3998082876205444e-06, -5.103647708892822e-06, -4.8074871301651e-06, -4.511326551437378e-06, -4.215165972709656e-06, -3.919005393981934e-06, -3.6228448152542114e-06, -3.3266842365264893e-06, -3.030523657798767e-06, -2.734363079071045e-06, -2.4382025003433228e-06, -2.1420419216156006e-06, -1.8458813428878784e-06, -1.5497207641601562e-06, -1.253560185432434e-06, -9.57399606704712e-07, -6.612390279769897e-07, -3.650784492492676e-07, -6.891787052154541e-08, 2.2724270820617676e-07, 5.234032869338989e-07, 8.195638656616211e-07, 1.1157244443893433e-06, 1.4118850231170654e-06, 1.7080456018447876e-06, 2.0042061805725098e-06, 2.300366759300232e-06, 2.596527338027954e-06, 2.8926879167556763e-06, 3.1888484954833984e-06, 3.4850090742111206e-06, 3.7811696529388428e-06, 4.077330231666565e-06, 4.373490810394287e-06, 4.669651389122009e-06, 4.9658119678497314e-06, 5.261972546577454e-06, 5.558133125305176e-06, 5.854293704032898e-06, 6.15045428276062e-06, 6.446614861488342e-06, 6.7427754402160645e-06, 7.038936018943787e-06, 7.335096597671509e-06, 7.631257176399231e-06, 7.927417755126953e-06]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 0.0, 13.0, 23.0, 0.0, 58.0, 0.0, 106.0, 0.0, 130.0, 0.0, 199.0, 0.0, 298.0, 420.0, 0.0, 482.0, 0.0, 751.0, 0.0, 500.0, 0.0, 346.0, 0.0, 271.0, 187.0, 0.0, 116.0, 0.0, 62.0, 0.0, 48.0, 0.0, 27.0, 0.0, 22.0, 8.0, 0.0, 9.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.01868736743927e-07, -7.692724466323853e-07, -7.366761565208435e-07, -7.040798664093018e-07, -6.7148357629776e-07, -6.388872861862183e-07, -6.062909960746765e-07, -5.736947059631348e-07, -5.41098415851593e-07, -5.085021257400513e-07, -4.759058356285095e-07, -4.4330954551696777e-07, -4.10713255405426e-07, -3.781169652938843e-07, -3.4552067518234253e-07, -3.129243850708008e-07, -2.8032809495925903e-07, -2.477318048477173e-07, -2.1513551473617554e-07, -1.825392246246338e-07, -1.4994293451309204e-07, -1.1734664440155029e-07, -8.475035429000854e-08, -5.21540641784668e-08, -1.955777406692505e-08, 1.30385160446167e-08, 4.563480615615845e-08, 7.82310962677002e-08, 1.1082738637924194e-07, 1.434236764907837e-07, 1.7601996660232544e-07, 2.086162567138672e-07, 2.4121254682540894e-07, 2.738088369369507e-07, 3.0640512704849243e-07, 3.390014171600342e-07, 3.7159770727157593e-07, 4.041939973831177e-07, 4.367902874946594e-07, 4.6938657760620117e-07, 5.019828677177429e-07, 5.345791578292847e-07, 5.671754479408264e-07, 5.997717380523682e-07, 6.323680281639099e-07, 6.649643182754517e-07, 6.975606083869934e-07, 7.301568984985352e-07, 7.627531886100769e-07, 7.953494787216187e-07, 8.279457688331604e-07, 8.605420589447021e-07, 8.931383490562439e-07, 9.257346391677856e-07, 9.583309292793274e-07, 9.909272193908691e-07, 1.0235235095024109e-06, 1.0561197996139526e-06, 1.0887160897254944e-06, 1.1213123798370361e-06, 1.1539086699485779e-06, 1.1865049600601196e-06, 1.2191012501716614e-06, 1.2516975402832031e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 4.0, 8.0, 8.0, 6.0, 16.0, 22.0, 36.0, 61.0, 77.0, 130.0, 195.0, 156.0, 86.0, 62.0, 40.0, 29.0, 16.0, 13.0, 13.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.0824422689620405e-06, -5.921195224800613e-06, -5.759948180639185e-06, -5.598701136477757e-06, -5.437453637568979e-06, -5.276206593407551e-06, -5.114959549246123e-06, -4.953712505084695e-06, -4.792465006175917e-06, -4.631217962014489e-06, -4.469970917853061e-06, -4.308723873691633e-06, -4.147476374782855e-06, -3.986229330621427e-06, -3.824982286459999e-06, -3.6637352422985714e-06, -3.5024881981371436e-06, -3.341241153975716e-06, -3.1799938824406127e-06, -3.018746838279185e-06, -2.8574995667440817e-06, -2.696252522582654e-06, -2.535005478421226e-06, -2.3737584342597984e-06, -2.212511162724695e-06, -2.0512641185632674e-06, -1.8900168470281642e-06, -1.7287698028667364e-06, -1.567522645018471e-06, -1.4062754871702055e-06, -1.2450284430087777e-06, -1.0837812851605122e-06, -9.225336725648958e-07, -7.612865147166303e-07, -6.000394137117837e-07, -4.387923127069371e-07, -2.775451548586716e-07, -1.1629799701040611e-07, 4.494904715102166e-08, 2.0619620499928715e-07, 3.6744336284755263e-07, 5.286905206958181e-07, 6.899376217006647e-07, 8.511847227055114e-07, 1.0124318805537769e-06, 1.1736790384020424e-06, 1.3349260825634701e-06, 1.4961732404117356e-06, 1.657420398260001e-06, 1.8186675561082666e-06, 1.979914713956532e-06, 2.14116175811796e-06, 2.302409029653063e-06, 2.463656073814491e-06, 2.6249031179759186e-06, 2.7861501621373463e-06, 2.9473974336724496e-06, 3.1086444778338773e-06, 3.2698917493689805e-06, 3.4311387935304083e-06, 3.592385837691836e-06, 3.7536331092269393e-06, 3.914879926014692e-06, 4.07612742492347e-06, 4.237374469084898e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 6.0, 6.0, 5.0, 9.0, 9.0, 9.0, 6.0, 8.0, 20.0, 13.0, 15.0, 15.0, 28.0, 28.0, 24.0, 29.0, 42.0, 34.0, 26.0, 35.0, 32.0, 52.0, 40.0, 40.0, 40.0, 49.0, 38.0, 37.0, 22.0, 24.0, 29.0, 37.0, 26.0, 26.0, 18.0, 20.0, 11.0, 17.0, 12.0, 19.0, 8.0, 10.0, 11.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9435362901276676e-06, -1.8799637473421171e-06, -1.8163912045565667e-06, -1.7528185480841785e-06, -1.689246005298628e-06, -1.6256734625130775e-06, -1.5621008060406893e-06, -1.4985282632551389e-06, -1.4349557204695884e-06, -1.371383177684038e-06, -1.3078106348984875e-06, -1.2442379784260993e-06, -1.1806654356405488e-06, -1.1170928928549984e-06, -1.0535202363826102e-06, -9.899476935970597e-07, -9.263751508115092e-07, -8.628026080259588e-07, -7.992300083969894e-07, -7.356574087680201e-07, -6.720848659824696e-07, -6.085123231969192e-07, -5.449397235679498e-07, -4.813671239389805e-07, -4.1779458115343004e-07, -3.5422200994617015e-07, -2.9064943873891025e-07, -2.2707686753165035e-07, -1.6350429632439045e-07, -9.993172511713055e-08, -3.6359153909870656e-08, 2.7213417297389242e-08, 9.078598850464914e-08, 1.5435855971190904e-07, 2.1793113091916894e-07, 2.8150370212642883e-07, 3.4507627333368873e-07, 4.0864884454094863e-07, 4.7222141574820853e-07, 5.357940153771779e-07, 5.993665581627283e-07, 6.629391009482788e-07, 7.265117005772481e-07, 7.900843002062174e-07, 8.536568429917679e-07, 9.172293857773184e-07, 9.808020422497066e-07, 1.044374585035257e-06, 1.1079471278208075e-06, 1.171519670606358e-06, 1.2350922133919084e-06, 1.2986648698642966e-06, 1.362237412649847e-06, 1.4258099554353976e-06, 1.4893826119077858e-06, 1.5529551546933362e-06, 1.6165276974788867e-06, 1.6801002402644372e-06, 1.7436727830499876e-06, 1.8072454395223758e-06, 1.8708179823079263e-06, 1.9343906387803145e-06, 1.997963181565865e-06, 2.0615357243514154e-06, 2.125108267136966e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 5.0, 8.0, 16.0, 10.0, 27.0, 21.0, 20.0, 95.0, 67.0, 194.0, 144.0, 447.0, 375.0, 1321.0, 1193.0, 4055.0, 3824.0, 5963.0, 25799.0, 27899.0, 137048.0, 172467.0, 459306.0, 88560.0, 76072.0, 16204.0, 15705.0, 3773.0, 2396.0, 2663.0, 746.0, 943.0, 303.0, 385.0, 125.0, 161.0, 49.0, 79.0, 23.0, 15.0, 15.0, 6.0, 17.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0], "bins": [-3.2186508178710938e-06, -3.1320378184318542e-06, -3.0454248189926147e-06, -2.9588118195533752e-06, -2.8721988201141357e-06, -2.7855858206748962e-06, -2.6989728212356567e-06, -2.6123598217964172e-06, -2.5257468223571777e-06, -2.4391338229179382e-06, -2.3525208234786987e-06, -2.2659078240394592e-06, -2.1792948246002197e-06, -2.0926818251609802e-06, -2.0060688257217407e-06, -1.9194558262825012e-06, -1.8328428268432617e-06, -1.7462298274040222e-06, -1.6596168279647827e-06, -1.5730038285255432e-06, -1.4863908290863037e-06, -1.3997778296470642e-06, -1.3131648302078247e-06, -1.2265518307685852e-06, -1.1399388313293457e-06, -1.0533258318901062e-06, -9.667128324508667e-07, -8.800998330116272e-07, -7.934868335723877e-07, -7.068738341331482e-07, -6.202608346939087e-07, -5.336478352546692e-07, -4.470348358154297e-07, -3.604218363761902e-07, -2.738088369369507e-07, -1.8719583749771118e-07, -1.0058283805847168e-07, -1.3969838619232178e-08, 7.264316082000732e-08, 1.5925616025924683e-07, 2.4586915969848633e-07, 3.3248215913772583e-07, 4.1909515857696533e-07, 5.057081580162048e-07, 5.923211574554443e-07, 6.789341568946838e-07, 7.655471563339233e-07, 8.521601557731628e-07, 9.387731552124023e-07, 1.0253861546516418e-06, 1.1119991540908813e-06, 1.1986121535301208e-06, 1.2852251529693604e-06, 1.3718381524085999e-06, 1.4584511518478394e-06, 1.5450641512870789e-06, 1.6316771507263184e-06, 1.7182901501655579e-06, 1.8049031496047974e-06, 1.8915161490440369e-06, 1.9781291484832764e-06, 2.064742147922516e-06, 2.1513551473617554e-06, 2.237968146800995e-06, 2.3245811462402344e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 6.0, 1.0, 6.0, 1.0, 12.0, 8.0, 16.0, 10.0, 23.0, 13.0, 28.0, 28.0, 42.0, 21.0, 30.0, 63.0, 31.0, 72.0, 39.0, 84.0, 35.0, 72.0, 38.0, 52.0, 21.0, 61.0, 19.0, 35.0, 15.0, 33.0, 12.0, 13.0, 23.0, 8.0, 12.0, 4.0, 11.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.2186508178710938e-06, -3.1311064958572388e-06, -3.043562173843384e-06, -2.956017851829529e-06, -2.868473529815674e-06, -2.780929207801819e-06, -2.693384885787964e-06, -2.605840563774109e-06, -2.518296241760254e-06, -2.430751919746399e-06, -2.343207597732544e-06, -2.255663275718689e-06, -2.168118953704834e-06, -2.080574631690979e-06, -1.993030309677124e-06, -1.905485987663269e-06, -1.817941665649414e-06, -1.730397343635559e-06, -1.642853021621704e-06, -1.5553086996078491e-06, -1.4677643775939941e-06, -1.3802200555801392e-06, -1.2926757335662842e-06, -1.2051314115524292e-06, -1.1175870895385742e-06, -1.0300427675247192e-06, -9.424984455108643e-07, -8.549541234970093e-07, -7.674098014831543e-07, -6.798654794692993e-07, -5.923211574554443e-07, -5.047768354415894e-07, -4.172325134277344e-07, -3.296881914138794e-07, -2.421438694000244e-07, -1.5459954738616943e-07, -6.705522537231445e-08, 2.0489096641540527e-08, 1.0803341865539551e-07, 1.955777406692505e-07, 2.8312206268310547e-07, 3.7066638469696045e-07, 4.5821070671081543e-07, 5.457550287246704e-07, 6.332993507385254e-07, 7.208436727523804e-07, 8.083879947662354e-07, 8.959323167800903e-07, 9.834766387939453e-07, 1.0710209608078003e-06, 1.1585652828216553e-06, 1.2461096048355103e-06, 1.3336539268493652e-06, 1.4211982488632202e-06, 1.5087425708770752e-06, 1.5962868928909302e-06, 1.6838312149047852e-06, 1.7713755369186401e-06, 1.8589198589324951e-06, 1.94646418094635e-06, 2.034008502960205e-06, 2.12155282497406e-06, 2.209097146987915e-06, 2.29664146900177e-06, 2.384185791015625e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [5.0, 2.0, 3.0, 10.0, 4.0, 7.0, 18.0, 20.0, 25.0, 28.0, 26.0, 31.0, 59.0, 76.0, 90.0, 98.0, 326.0, 264.0, 303.0, 456.0, 663.0, 785.0, 1238.0, 1789.0, 2677.0, 4109.0, 7221.0, 13815.0, 35827.0, 908895.0, 35753.0, 13635.0, 11415.0, 2610.0, 1840.0, 1150.0, 765.0, 649.0, 438.0, 336.0, 266.0, 203.0, 155.0, 106.0, 93.0, 73.0, 38.0, 36.0, 63.0, 22.0, 10.0, 6.0, 7.0, 9.0, 5.0, 3.0, 7.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-1.8477439880371094e-06, -1.7844140529632568e-06, -1.7210841178894043e-06, -1.6577541828155518e-06, -1.5944242477416992e-06, -1.5310943126678467e-06, -1.4677643775939941e-06, -1.4044344425201416e-06, -1.341104507446289e-06, -1.2777745723724365e-06, -1.214444637298584e-06, -1.1511147022247314e-06, -1.087784767150879e-06, -1.0244548320770264e-06, -9.611248970031738e-07, -8.977949619293213e-07, -8.344650268554688e-07, -7.711350917816162e-07, -7.078051567077637e-07, -6.444752216339111e-07, -5.811452865600586e-07, -5.178153514862061e-07, -4.544854164123535e-07, -3.91155481338501e-07, -3.2782554626464844e-07, -2.644956111907959e-07, -2.0116567611694336e-07, -1.3783574104309082e-07, -7.450580596923828e-08, -1.1175870895385742e-08, 5.21540641784668e-08, 1.1548399925231934e-07, 1.7881393432617188e-07, 2.421438694000244e-07, 3.0547380447387695e-07, 3.688037395477295e-07, 4.3213367462158203e-07, 4.954636096954346e-07, 5.587935447692871e-07, 6.221234798431396e-07, 6.854534149169922e-07, 7.487833499908447e-07, 8.121132850646973e-07, 8.754432201385498e-07, 9.387731552124023e-07, 1.0021030902862549e-06, 1.0654330253601074e-06, 1.12876296043396e-06, 1.1920928955078125e-06, 1.255422830581665e-06, 1.3187527656555176e-06, 1.3820827007293701e-06, 1.4454126358032227e-06, 1.5087425708770752e-06, 1.5720725059509277e-06, 1.6354024410247803e-06, 1.6987323760986328e-06, 1.7620623111724854e-06, 1.8253922462463379e-06, 1.8887221813201904e-06, 1.952052116394043e-06, 2.0153820514678955e-06, 2.078711986541748e-06, 2.1420419216156006e-06, 2.205371856689453e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 0.0, 5.0, 0.0, 5.0, 0.0, 5.0, 0.0, 6.0, 0.0, 16.0, 0.0, 14.0, 0.0, 17.0, 0.0, 20.0, 0.0, 25.0, 0.0, 786.0, 0.0, 19.0, 0.0, 0.0, 16.0, 0.0, 18.0, 0.0, 12.0, 0.0, 20.0, 0.0, 3.0, 0.0, 7.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.055940270423889e-07, -7.767230272293091e-07, -7.478520274162292e-07, -7.189810276031494e-07, -6.901100277900696e-07, -6.612390279769897e-07, -6.323680281639099e-07, -6.034970283508301e-07, -5.746260285377502e-07, -5.457550287246704e-07, -5.168840289115906e-07, -4.880130290985107e-07, -4.591420292854309e-07, -4.302710294723511e-07, -4.0140002965927124e-07, -3.725290298461914e-07, -3.4365803003311157e-07, -3.1478703022003174e-07, -2.859160304069519e-07, -2.5704503059387207e-07, -2.2817403078079224e-07, -1.993030309677124e-07, -1.7043203115463257e-07, -1.4156103134155273e-07, -1.126900315284729e-07, -8.381903171539307e-08, -5.494803190231323e-08, -2.60770320892334e-08, 2.7939677238464355e-09, 3.166496753692627e-08, 6.05359673500061e-08, 8.940696716308594e-08, 1.1827796697616577e-07, 1.471489667892456e-07, 1.7601996660232544e-07, 2.0489096641540527e-07, 2.337619662284851e-07, 2.6263296604156494e-07, 2.915039658546448e-07, 3.203749656677246e-07, 3.4924596548080444e-07, 3.781169652938843e-07, 4.069879651069641e-07, 4.3585896492004395e-07, 4.647299647331238e-07, 4.936009645462036e-07, 5.224719643592834e-07, 5.513429641723633e-07, 5.802139639854431e-07, 6.09084963798523e-07, 6.379559636116028e-07, 6.668269634246826e-07, 6.956979632377625e-07, 7.245689630508423e-07, 7.534399628639221e-07, 7.82310962677002e-07, 8.111819624900818e-07, 8.400529623031616e-07, 8.689239621162415e-07, 8.977949619293213e-07, 9.266659617424011e-07, 9.55536961555481e-07, 9.844079613685608e-07, 1.0132789611816406e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 1.0, 8.0, 6.0, 4.0, 14.0, 13.0, 18.0, 31.0, 39.0, 68.0, 86.0, 152.0, 187.0, 108.0, 84.0, 47.0, 41.0, 23.0, 17.0, 9.0, 13.0, 11.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.360045750217978e-06, -4.2162605495832395e-06, -4.072475348948501e-06, -3.9286906030611135e-06, -3.784905402426375e-06, -3.6411202017916366e-06, -3.4973352285305737e-06, -3.3535502552695107e-06, -3.2097650546347722e-06, -3.065979854000034e-06, -2.922194880738971e-06, -2.778409907477908e-06, -2.6346247068431694e-06, -2.490839506208431e-06, -2.347054532947368e-06, -2.203269559686305e-06, -2.0594843590515666e-06, -1.915699158416828e-06, -1.7719141851557652e-06, -1.6281290982078644e-06, -1.4843440112599637e-06, -1.340558924312063e-06, -1.1967738373641623e-06, -1.0529887504162616e-06, -9.092036634683609e-07, -7.654185765204602e-07, -6.216334895725595e-07, -4.778484026246588e-07, -3.3406331567675807e-07, -1.9027822872885736e-07, -4.649314178095665e-08, 9.729194516694406e-08, 2.4107703211484477e-07, 3.848621190627455e-07, 5.286472060106462e-07, 6.724322929585469e-07, 8.162173799064476e-07, 9.600024668543483e-07, 1.103787553802249e-06, 1.2475726407501497e-06, 1.3913577276980504e-06, 1.5351428146459511e-06, 1.6789279015938519e-06, 1.8227129885417526e-06, 1.9664980754896533e-06, 2.1102832761243917e-06, 2.2540682493854547e-06, 2.3978532226465177e-06, 2.541638423281256e-06, 2.6854236239159945e-06, 2.8292085971770575e-06, 2.9729935704381205e-06, 3.116778771072859e-06, 3.2605639717075974e-06, 3.4043489449686604e-06, 3.5481339182297233e-06, 3.6919191188644618e-06, 3.8357043194992e-06, 3.979489520133939e-06, 4.123274266021326e-06, 4.267059466656065e-06, 4.410844667290803e-06, 4.554629413178191e-06, 4.698414613812929e-06, 4.8421998144476674e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 4.0, 5.0, 15.0, 10.0, 8.0, 6.0, 12.0, 15.0, 16.0, 16.0, 15.0, 31.0, 27.0, 26.0, 33.0, 38.0, 28.0, 41.0, 24.0, 41.0, 44.0, 49.0, 38.0, 43.0, 48.0, 36.0, 33.0, 15.0, 32.0, 39.0, 23.0, 30.0, 19.0, 22.0, 13.0, 17.0, 14.0, 16.0, 12.0, 10.0, 12.0, 7.0, 2.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.911345862026792e-06, -1.8497253222449217e-06, -1.788104896149889e-06, -1.7264843563680188e-06, -1.6648639302729862e-06, -1.6032433904911159e-06, -1.5416228507092455e-06, -1.480002424614213e-06, -1.4183819985191803e-06, -1.35676145873731e-06, -1.2951410326422774e-06, -1.233520492860407e-06, -1.1719000667653745e-06, -1.1102795269835042e-06, -1.0486589872016339e-06, -9.870385611066013e-07, -9.254180213247309e-07, -8.637975383862795e-07, -8.02177055447828e-07, -7.405565156659577e-07, -6.789360895709251e-07, -6.173155497890548e-07, -5.556950668506033e-07, -4.940745839121519e-07, -4.324541009737004e-07, -3.7083361803524895e-07, -3.092131350967975e-07, -2.475926237366366e-07, -1.8597214079818514e-07, -1.2435165785973368e-07, -6.273114649957279e-08, -1.1106635611213278e-09, 6.050981937733013e-08, 1.221303023157816e-07, 1.8375079946508777e-07, 2.4537129661439394e-07, 3.069917795528454e-07, 3.6861226249129686e-07, 4.3023277385145775e-07, 4.918532567899092e-07, 5.534737397283607e-07, 6.150942226668121e-07, 6.767147056052636e-07, 7.38335188543715e-07, 7.999557283255854e-07, 8.61576154420618e-07, 9.231966942024883e-07, 9.848172339843586e-07, 1.0464376600793912e-06, 1.1080581998612615e-06, 1.1696786259562941e-06, 1.2312991657381644e-06, 1.292919591833197e-06, 1.3545401316150674e-06, 1.4161605577101e-06, 1.4777810974919703e-06, 1.5394016372738406e-06, 1.601022177055711e-06, 1.6626426031507435e-06, 1.7242631429326138e-06, 1.7858835690276464e-06, 1.8475041088095168e-06, 1.909124648591387e-06, 1.970744960999582e-06, 2.0323655007814523e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 13.0, 8.0, 21.0, 12.0, 37.0, 26.0, 45.0, 60.0, 66.0, 116.0, 140.0, 203.0, 265.0, 436.0, 385.0, 837.0, 1245.0, 1998.0, 3227.0, 5558.0, 10149.0, 19555.0, 39427.0, 90209.0, 173199.0, 430947.0, 151476.0, 58408.0, 27413.0, 13935.0, 7622.0, 4165.0, 2589.0, 1542.0, 958.0, 543.0, 453.0, 340.0, 272.0, 146.0, 149.0, 88.0, 78.0, 52.0, 38.0, 29.0, 16.0, 17.0, 9.0, 9.0, 6.0, 10.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-7.510185241699219e-06, -7.277354598045349e-06, -7.0445239543914795e-06, -6.81169331073761e-06, -6.57886266708374e-06, -6.346032023429871e-06, -6.113201379776001e-06, -5.880370736122131e-06, -5.647540092468262e-06, -5.414709448814392e-06, -5.1818788051605225e-06, -4.949048161506653e-06, -4.716217517852783e-06, -4.4833868741989136e-06, -4.250556230545044e-06, -4.017725586891174e-06, -3.7848949432373047e-06, -3.552064299583435e-06, -3.3192336559295654e-06, -3.086403012275696e-06, -2.853572368621826e-06, -2.6207417249679565e-06, -2.387911081314087e-06, -2.1550804376602173e-06, -1.9222497940063477e-06, -1.689419150352478e-06, -1.4565885066986084e-06, -1.2237578630447388e-06, -9.909272193908691e-07, -7.580965757369995e-07, -5.252659320831299e-07, -2.9243528842926025e-07, -5.960464477539063e-08, 1.73225998878479e-07, 4.0605664253234863e-07, 6.388872861862183e-07, 8.717179298400879e-07, 1.1045485734939575e-06, 1.3373792171478271e-06, 1.5702098608016968e-06, 1.8030405044555664e-06, 2.035871148109436e-06, 2.2687017917633057e-06, 2.5015324354171753e-06, 2.734363079071045e-06, 2.9671937227249146e-06, 3.200024366378784e-06, 3.432855010032654e-06, 3.6656856536865234e-06, 3.898516297340393e-06, 4.131346940994263e-06, 4.364177584648132e-06, 4.597008228302002e-06, 4.829838871955872e-06, 5.062669515609741e-06, 5.295500159263611e-06, 5.5283308029174805e-06, 5.76116144657135e-06, 5.99399209022522e-06, 6.226822733879089e-06, 6.459653377532959e-06, 6.692484021186829e-06, 6.925314664840698e-06, 7.158145308494568e-06, 7.3909759521484375e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 5.0, 0.0, 6.0, 0.0, 11.0, 0.0, 12.0, 0.0, 19.0, 0.0, 20.0, 0.0, 31.0, 0.0, 38.0, 0.0, 58.0, 0.0, 53.0, 0.0, 48.0, 0.0, 81.0, 0.0, 79.0, 0.0, 97.0, 0.0, 91.0, 0.0, 76.0, 0.0, 59.0, 0.0, 56.0, 0.0, 39.0, 0.0, 32.0, 0.0, 31.0, 0.0, 29.0, 0.0, 17.0, 0.0, 12.0, 0.0, 6.0, 0.0, 6.0, 0.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07, 9.238719940185547e-07, 9.5367431640625e-07, 9.834766387939453e-07, 1.0132789611816406e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 11.0, 10.0, 26.0, 22.0, 50.0, 40.0, 88.0, 77.0, 89.0, 223.0, 191.0, 422.0, 396.0, 947.0, 990.0, 2211.0, 2395.0, 6028.0, 6935.0, 18019.0, 21581.0, 63958.0, 89712.0, 208254.0, 411345.0, 89441.0, 64211.0, 21740.0, 18152.0, 6746.0, 5980.0, 2400.0, 2297.0, 948.0, 970.0, 416.0, 411.0, 195.0, 210.0, 88.0, 70.0, 77.0, 37.0, 41.0, 28.0, 28.0, 9.0, 10.0, 6.0, 6.0, 3.0, 6.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.708766937255859e-06, -4.561617970466614e-06, -4.414469003677368e-06, -4.2673200368881226e-06, -4.120171070098877e-06, -3.973022103309631e-06, -3.825873136520386e-06, -3.67872416973114e-06, -3.5315752029418945e-06, -3.384426236152649e-06, -3.2372772693634033e-06, -3.0901283025741577e-06, -2.942979335784912e-06, -2.7958303689956665e-06, -2.648681402206421e-06, -2.5015324354171753e-06, -2.3543834686279297e-06, -2.207234501838684e-06, -2.0600855350494385e-06, -1.912936568260193e-06, -1.7657876014709473e-06, -1.6186386346817017e-06, -1.471489667892456e-06, -1.3243407011032104e-06, -1.1771917343139648e-06, -1.0300427675247192e-06, -8.828938007354736e-07, -7.35744833946228e-07, -5.885958671569824e-07, -4.414469003677368e-07, -2.942979335784912e-07, -1.471489667892456e-07, 0.0, 1.471489667892456e-07, 2.942979335784912e-07, 4.414469003677368e-07, 5.885958671569824e-07, 7.35744833946228e-07, 8.828938007354736e-07, 1.0300427675247192e-06, 1.1771917343139648e-06, 1.3243407011032104e-06, 1.471489667892456e-06, 1.6186386346817017e-06, 1.7657876014709473e-06, 1.912936568260193e-06, 2.0600855350494385e-06, 2.207234501838684e-06, 2.3543834686279297e-06, 2.5015324354171753e-06, 2.648681402206421e-06, 2.7958303689956665e-06, 2.942979335784912e-06, 3.0901283025741577e-06, 3.2372772693634033e-06, 3.384426236152649e-06, 3.5315752029418945e-06, 3.67872416973114e-06, 3.825873136520386e-06, 3.973022103309631e-06, 4.120171070098877e-06, 4.2673200368881226e-06, 4.414469003677368e-06, 4.561617970466614e-06, 4.708766937255859e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 0.0, 13.0, 17.0, 25.0, 0.0, 29.0, 43.0, 47.0, 0.0, 54.0, 61.0, 86.0, 0.0, 86.0, 97.0, 77.0, 61.0, 0.0, 53.0, 64.0, 54.0, 0.0, 26.0, 31.0, 15.0, 0.0, 17.0, 12.0, 7.0, 0.0, 6.0, 8.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.430511474609375e-06, -1.3848766684532166e-06, -1.339241862297058e-06, -1.2936070561408997e-06, -1.2479722499847412e-06, -1.2023374438285828e-06, -1.1567026376724243e-06, -1.1110678315162659e-06, -1.0654330253601074e-06, -1.019798219203949e-06, -9.741634130477905e-07, -9.285286068916321e-07, -8.828938007354736e-07, -8.372589945793152e-07, -7.916241884231567e-07, -7.459893822669983e-07, -7.003545761108398e-07, -6.547197699546814e-07, -6.09084963798523e-07, -5.634501576423645e-07, -5.178153514862061e-07, -4.721805453300476e-07, -4.2654573917388916e-07, -3.809109330177307e-07, -3.3527612686157227e-07, -2.896413207054138e-07, -2.4400651454925537e-07, -1.9837170839309692e-07, -1.5273690223693848e-07, -1.0710209608078003e-07, -6.146728992462158e-08, -1.5832483768463135e-08, 2.9802322387695312e-08, 7.543712854385376e-08, 1.210719347000122e-07, 1.6670674085617065e-07, 2.123415470123291e-07, 2.5797635316848755e-07, 3.03611159324646e-07, 3.4924596548080444e-07, 3.948807716369629e-07, 4.4051557779312134e-07, 4.861503839492798e-07, 5.317851901054382e-07, 5.774199962615967e-07, 6.230548024177551e-07, 6.686896085739136e-07, 7.14324414730072e-07, 7.599592208862305e-07, 8.055940270423889e-07, 8.512288331985474e-07, 8.968636393547058e-07, 9.424984455108643e-07, 9.881332516670227e-07, 1.0337680578231812e-06, 1.0794028639793396e-06, 1.125037670135498e-06, 1.1706724762916565e-06, 1.216307282447815e-06, 1.2619420886039734e-06, 1.3075768947601318e-06, 1.3532117009162903e-06, 1.3988465070724487e-06, 1.4444813132286072e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 9.0, 10.0, 12.0, 9.0, 15.0, 14.0, 15.0, 18.0, 41.0, 28.0, 39.0, 64.0, 98.0, 126.0, 132.0, 85.0, 58.0, 43.0, 24.0, 31.0, 14.0, 15.0, 21.0, 8.0, 9.0, 9.0, 9.0, 5.0, 5.0, 3.0, 6.0, 7.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7726252963257139e-06, -1.715277448965935e-06, -1.6579294879193185e-06, -1.6005816405595397e-06, -1.5432336795129231e-06, -1.4858858321531443e-06, -1.4285378711065277e-06, -1.371190023746749e-06, -1.31384217638697e-06, -1.2564943290271913e-06, -1.1991463679805747e-06, -1.141798520620796e-06, -1.0844505595741794e-06, -1.0271027122144005e-06, -9.697548648546217e-07, -9.124069038080052e-07, -8.550589427613886e-07, -7.977110385581909e-07, -7.403631343549932e-07, -6.830152869952144e-07, -6.256673259485979e-07, -5.68319478588819e-07, -5.109715743856214e-07, -4.5362367018242367e-07, -3.96275765979226e-07, -3.389278617760283e-07, -2.815799575728306e-07, -2.2423208179134235e-07, -1.6688417758814467e-07, -1.0953627338494698e-07, -5.2188397603458725e-08, 5.159506599738961e-09, 6.250741080293665e-08, 1.1985531500613433e-07, 1.772032049984773e-07, 2.3455109499082027e-07, 2.9189899919401796e-07, 3.4924690339721565e-07, 4.065947791787039e-07, 4.639426833819016e-07, 5.212905875850993e-07, 5.78638491788297e-07, 6.359863959914946e-07, 6.933343001946923e-07, 7.506821475544712e-07, 8.080301086010877e-07, 8.653779559608665e-07, 9.227258601640642e-07, 9.80073764367262e-07, 1.0374216117270407e-06, 1.0947695727736573e-06, 1.152117420133436e-06, 1.2094653811800526e-06, 1.2668132285398315e-06, 1.3241610758996103e-06, 1.3815090369462268e-06, 1.4388569979928434e-06, 1.4962048453526222e-06, 1.5535528063992388e-06, 1.6109006537590176e-06, 1.6682486148056341e-06, 1.725596462165413e-06, 1.7829443095251918e-06, 1.8402922705718083e-06, 1.8976401179315872e-06]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 8.0, 8.0, 12.0, 12.0, 14.0, 17.0, 25.0, 22.0, 20.0, 18.0, 16.0, 31.0, 23.0, 33.0, 36.0, 42.0, 50.0, 52.0, 47.0, 49.0, 34.0, 50.0, 42.0, 38.0, 35.0, 27.0, 27.0, 31.0, 28.0, 13.0, 22.0, 14.0, 22.0, 18.0, 12.0, 16.0, 11.0, 5.0, 7.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0782442814161186e-06, -1.036101593854255e-06, -9.939587926055538e-07, -9.518161050436902e-07, -9.096733606384078e-07, -8.675306162331253e-07, -8.253879286712618e-07, -7.832451842659793e-07, -7.411024398606969e-07, -6.989596954554145e-07, -6.568170078935509e-07, -6.146742634882685e-07, -5.72531519082986e-07, -5.303887746777036e-07, -4.882460871158401e-07, -4.4610334271055763e-07, -4.0396065514869406e-07, -3.6181793916512106e-07, -3.1967519475983863e-07, -2.7753247877626563e-07, -2.3538974858183792e-07, -1.932470183874102e-07, -1.511043024038372e-07, -1.0896155799855478e-07, -6.681884201498178e-08, -2.467611537326775e-08, 1.7466611268446286e-08, 5.960933435744664e-08, 1.0175206455187435e-07, 1.4389479474630207e-07, 1.8603751072987507e-07, 2.281802551351575e-07, 2.703229711187305e-07, 3.124656871023035e-07, 3.546084315075859e-07, 3.967511474911589e-07, 4.3889389189644135e-07, 4.810366363017238e-07, 5.231793238635873e-07, 5.653220682688698e-07, 6.074648126741522e-07, 6.496075570794346e-07, 6.917502446412982e-07, 7.338929890465806e-07, 7.76035733451863e-07, 8.181784778571455e-07, 8.60321165419009e-07, 9.024639098242915e-07, 9.44606597386155e-07, 9.867493417914375e-07, 1.028892029353301e-06, 1.0710348306020023e-06, 1.113177518163866e-06, 1.1553202057257295e-06, 1.1974630069744308e-06, 1.2396056945362943e-06, 1.2817483820981579e-06, 1.3238910696600215e-06, 1.3660338709087227e-06, 1.4081765584705863e-06, 1.4503192460324499e-06, 1.4924620472811512e-06, 1.5346047348430147e-06, 1.576747536091716e-06, 1.6188902236535796e-06]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 10.0, 0.0, 28.0, 0.0, 80.0, 0.0, 196.0, 0.0, 286.0, 0.0, 554.0, 0.0, 1000.0, 0.0, 2910.0, 0.0, 13878.0, 0.0, 43544.0, 0.0, 95609.0, 0.0, 129598.0, 0.0, 120257.0, 0.0, 119194.0, 0.0, 3077338.0, 126549.0, 0.0, 135932.0, 0.0, 147274.0, 0.0, 107473.0, 0.0, 49581.0, 0.0, 16064.0, 0.0, 3580.0, 0.0, 1450.0, 0.0, 881.0, 0.0, 477.0, 0.0, 329.0, 0.0, 139.0, 0.0, 56.0, 0.0, 21.0, 0.0, 0.0, 0.0, 8.0, 2.0], "bins": [-9.5367431640625e-07, -9.229406714439392e-07, -8.922070264816284e-07, -8.614733815193176e-07, -8.307397365570068e-07, -8.00006091594696e-07, -7.692724466323853e-07, -7.385388016700745e-07, -7.078051567077637e-07, -6.770715117454529e-07, -6.463378667831421e-07, -6.156042218208313e-07, -5.848705768585205e-07, -5.541369318962097e-07, -5.234032869338989e-07, -4.926696419715881e-07, -4.6193599700927734e-07, -4.3120235204696655e-07, -4.0046870708465576e-07, -3.6973506212234497e-07, -3.390014171600342e-07, -3.082677721977234e-07, -2.775341272354126e-07, -2.468004822731018e-07, -2.1606683731079102e-07, -1.8533319234848022e-07, -1.5459954738616943e-07, -1.2386590242385864e-07, -9.313225746154785e-08, -6.239861249923706e-08, -3.166496753692627e-08, -9.313225746154785e-10, 2.9802322387695312e-08, 6.05359673500061e-08, 9.12696123123169e-08, 1.2200325727462769e-07, 1.5273690223693848e-07, 1.8347054719924927e-07, 2.1420419216156006e-07, 2.4493783712387085e-07, 2.7567148208618164e-07, 3.0640512704849243e-07, 3.371387720108032e-07, 3.67872416973114e-07, 3.986060619354248e-07, 4.293397068977356e-07, 4.600733518600464e-07, 4.908069968223572e-07, 5.21540641784668e-07, 5.522742867469788e-07, 5.830079317092896e-07, 6.137415766716003e-07, 6.444752216339111e-07, 6.752088665962219e-07, 7.059425115585327e-07, 7.366761565208435e-07, 7.674098014831543e-07, 7.981434464454651e-07, 8.288770914077759e-07, 8.596107363700867e-07, 8.903443813323975e-07, 9.210780262947083e-07, 9.51811671257019e-07, 9.825453162193298e-07, 1.0132789611816406e-06]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 125.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 753.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 141.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 99.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 898.0, 0.0, 4.0, 7.0, 279.0, 2317.0, 22289.0, 558611.0, 3584535.0, 21713.0, 2247.0, 217.0, 94.0, 13.0, 0.0, 16.0, 811.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 115.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7550926208496094e-06, -3.6209821701049805e-06, -3.4868717193603516e-06, -3.3527612686157227e-06, -3.2186508178710938e-06, -3.084540367126465e-06, -2.950429916381836e-06, -2.816319465637207e-06, -2.682209014892578e-06, -2.5480985641479492e-06, -2.4139881134033203e-06, -2.2798776626586914e-06, -2.1457672119140625e-06, -2.0116567611694336e-06, -1.8775463104248047e-06, -1.7434358596801758e-06, -1.6093254089355469e-06, -1.475214958190918e-06, -1.341104507446289e-06, -1.2069940567016602e-06, -1.0728836059570312e-06, -9.387731552124023e-07, -8.046627044677734e-07, -6.705522537231445e-07, -5.364418029785156e-07, -4.023313522338867e-07, -2.682209014892578e-07, -1.341104507446289e-07, 0.0, 1.341104507446289e-07, 2.682209014892578e-07, 4.023313522338867e-07, 5.364418029785156e-07, 6.705522537231445e-07, 8.046627044677734e-07, 9.387731552124023e-07, 1.0728836059570312e-06, 1.2069940567016602e-06, 1.341104507446289e-06, 1.475214958190918e-06, 1.6093254089355469e-06, 1.7434358596801758e-06, 1.8775463104248047e-06, 2.0116567611694336e-06, 2.1457672119140625e-06, 2.2798776626586914e-06, 2.4139881134033203e-06, 2.5480985641479492e-06, 2.682209014892578e-06, 2.816319465637207e-06, 2.950429916381836e-06, 3.084540367126465e-06, 3.2186508178710938e-06, 3.3527612686157227e-06, 3.4868717193603516e-06, 3.6209821701049805e-06, 3.7550926208496094e-06, 3.889203071594238e-06, 4.023313522338867e-06, 4.157423973083496e-06, 4.291534423828125e-06, 4.425644874572754e-06, 4.559755325317383e-06, 4.693865776062012e-06, 4.827976226806641e-06]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 119.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 827.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2119.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 906.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 104.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-2.384185791015625e-07, -2.3189932107925415e-07, -2.253800630569458e-07, -2.1886080503463745e-07, -2.123415470123291e-07, -2.0582228899002075e-07, -1.993030309677124e-07, -1.9278377294540405e-07, -1.862645149230957e-07, -1.7974525690078735e-07, -1.73225998878479e-07, -1.6670674085617065e-07, -1.601874828338623e-07, -1.5366822481155396e-07, -1.471489667892456e-07, -1.4062970876693726e-07, -1.341104507446289e-07, -1.2759119272232056e-07, -1.210719347000122e-07, -1.1455267667770386e-07, -1.0803341865539551e-07, -1.0151416063308716e-07, -9.499490261077881e-08, -8.847564458847046e-08, -8.195638656616211e-08, -7.543712854385376e-08, -6.891787052154541e-08, -6.239861249923706e-08, -5.587935447692871e-08, -4.936009645462036e-08, -4.284083843231201e-08, -3.632158041000366e-08, -2.9802322387695312e-08, -2.3283064365386963e-08, -1.6763806343078613e-08, -1.0244548320770264e-08, -3.725290298461914e-09, 2.7939677238464355e-09, 9.313225746154785e-09, 1.5832483768463135e-08, 2.2351741790771484e-08, 2.8870999813079834e-08, 3.5390257835388184e-08, 4.190951585769653e-08, 4.842877388000488e-08, 5.494803190231323e-08, 6.146728992462158e-08, 6.798654794692993e-08, 7.450580596923828e-08, 8.102506399154663e-08, 8.754432201385498e-08, 9.406358003616333e-08, 1.0058283805847168e-07, 1.0710209608078003e-07, 1.1362135410308838e-07, 1.2014061212539673e-07, 1.2665987014770508e-07, 1.3317912817001343e-07, 1.3969838619232178e-07, 1.4621764421463013e-07, 1.5273690223693848e-07, 1.5925616025924683e-07, 1.6577541828155518e-07, 1.7229467630386353e-07, 1.7881393432617188e-07]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 11.0, 9.0, 12.0, 21.0, 20.0, 45.0, 66.0, 115.0, 190.0, 177.0, 105.0, 68.0, 51.0, 30.0, 13.0, 9.0, 11.0, 9.0, 5.0, 11.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0547637430136092e-06, -1.0218321904176264e-06, -9.889005241348059e-07, -9.55968971538823e-07, -9.230373052560026e-07, -8.901057526600198e-07, -8.571741432206181e-07, -8.242425337812165e-07, -7.913109243418148e-07, -7.583793149024132e-07, -7.254477054630115e-07, -6.925160960236099e-07, -6.595845434276271e-07, -6.266528771448066e-07, -5.937213245488238e-07, -5.607897151094221e-07, -5.278581056700204e-07, -4.949264962306188e-07, -4.6199488679121714e-07, -4.290633057735249e-07, -3.9613169633412326e-07, -3.632000868947216e-07, -3.302685058770294e-07, -2.9733689643762773e-07, -2.644052869982261e-07, -2.3147367755882442e-07, -1.9854208233027748e-07, -1.6561048710173054e-07, -1.326788776623289e-07, -9.974726822292723e-08, -6.681567299438029e-08, -3.3884077765833354e-08, -9.52468326431699e-10, 3.19791340075426e-08, 6.49107363415169e-08, 9.784233867549119e-08, 1.307739410094655e-07, 1.6370555044886714e-07, 1.9663714567741408e-07, 2.2956874090596102e-07, 2.625003503453627e-07, 2.9543195978476433e-07, 3.28363569224166e-07, 3.612951502418582e-07, 3.9422675968125986e-07, 4.271583691206615e-07, 4.6008995013835374e-07, 4.930215595777554e-07, 5.25953169017157e-07, 5.588847784565587e-07, 5.918163878959604e-07, 6.24747997335362e-07, 6.576796067747637e-07, 6.906111593707465e-07, 7.235427688101481e-07, 7.564743782495498e-07, 7.894059876889514e-07, 8.223375971283531e-07, 8.552692065677547e-07, 8.882008160071564e-07, 9.211323686031392e-07, 9.540640348859597e-07, 9.869955874819425e-07, 1.0199271400779253e-06, 1.0528588063607458e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 8.0, 10.0, 11.0, 5.0, 13.0, 15.0, 18.0, 18.0, 25.0, 19.0, 24.0, 26.0, 36.0, 31.0, 36.0, 33.0, 51.0, 36.0, 33.0, 49.0, 42.0, 35.0, 51.0, 42.0, 37.0, 34.0, 44.0, 24.0, 12.0, 22.0, 25.0, 23.0, 13.0, 13.0, 13.0, 17.0, 10.0, 7.0, 7.0, 1.0, 6.0, 6.0, 7.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.137451353220968e-07, -4.975277647645271e-07, -4.813103373635386e-07, -4.6509293838425947e-07, -4.4887553940498037e-07, -4.326581404257013e-07, -4.164407414464222e-07, -4.002233708888525e-07, -3.84005943487864e-07, -3.677885445085849e-07, -3.515711455293058e-07, -3.353537465500267e-07, -3.191363475707476e-07, -3.029189485914685e-07, -2.867015496121894e-07, -2.7048417905461974e-07, -2.5426678007534065e-07, -2.3804938109606155e-07, -2.2183198211678246e-07, -2.0561458313750336e-07, -1.8939718415822426e-07, -1.7317978517894517e-07, -1.5696240041052079e-07, -1.407450014312417e-07, -1.245276024519626e-07, -1.083102034726835e-07, -9.20928044934044e-08, -7.587541261955266e-08, -5.965801364027357e-08, -4.344061466099447e-08, -2.722322278714273e-08, -1.1005823807863635e-08, 5.211575171415461e-09, 2.1428972374337718e-08, 3.7646369577259975e-08, 5.386376500382539e-08, 7.008116398310449e-08, 8.629856296238358e-08, 1.0251595483623532e-07, 1.1873335381551442e-07, 1.3495075279479352e-07, 1.511681517740726e-07, 1.673855507533517e-07, 1.836029355217761e-07, 1.9982033450105519e-07, 2.1603773348033428e-07, 2.3225513245961338e-07, 2.484725314388925e-07, 2.6468993041817157e-07, 2.8090732939745067e-07, 2.9712472837672976e-07, 3.1334212735600886e-07, 3.2955952633528796e-07, 3.4577692531456705e-07, 3.619942958721367e-07, 3.7821172327312524e-07, 3.944290938306949e-07, 4.10646492809974e-07, 4.268638917892531e-07, 4.430812907685322e-07, 4.592986897478113e-07, 4.755160887270904e-07, 4.917334877063695e-07, 5.079508582639392e-07, 5.241682856649277e-07]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 0.0, 2.0, 0.0, 18.0, 8.0, 0.0, 22.0, 21.0, 0.0, 55.0, 109.0, 0.0, 203.0, 297.0, 0.0, 560.0, 0.0, 1415.0, 4015.0, 0.0, 14843.0, 99625.0, 0.0, 806369.0, 99462.0, 0.0, 14801.0, 0.0, 3962.0, 1458.0, 0.0, 561.0, 311.0, 0.0, 210.0, 102.0, 0.0, 56.0, 35.0, 0.0, 9.0, 0.0, 9.0, 14.0, 0.0, 3.0, 6.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3113021850585938e-06, -1.2731179594993591e-06, -1.2349337339401245e-06, -1.1967495083808899e-06, -1.1585652828216553e-06, -1.1203810572624207e-06, -1.082196831703186e-06, -1.0440126061439514e-06, -1.0058283805847168e-06, -9.676441550254822e-07, -9.294599294662476e-07, -8.912757039070129e-07, -8.530914783477783e-07, -8.149072527885437e-07, -7.767230272293091e-07, -7.385388016700745e-07, -7.003545761108398e-07, -6.621703505516052e-07, -6.239861249923706e-07, -5.85801899433136e-07, -5.476176738739014e-07, -5.094334483146667e-07, -4.7124922275543213e-07, -4.330649971961975e-07, -3.948807716369629e-07, -3.5669654607772827e-07, -3.1851232051849365e-07, -2.8032809495925903e-07, -2.421438694000244e-07, -2.039596438407898e-07, -1.6577541828155518e-07, -1.2759119272232056e-07, -8.940696716308594e-08, -5.122274160385132e-08, -1.30385160446167e-08, 2.514570951461792e-08, 6.332993507385254e-08, 1.0151416063308716e-07, 1.3969838619232178e-07, 1.778826117515564e-07, 2.1606683731079102e-07, 2.5425106287002563e-07, 2.9243528842926025e-07, 3.3061951398849487e-07, 3.688037395477295e-07, 4.069879651069641e-07, 4.4517219066619873e-07, 4.833564162254333e-07, 5.21540641784668e-07, 5.597248673439026e-07, 5.979090929031372e-07, 6.360933184623718e-07, 6.742775440216064e-07, 7.124617695808411e-07, 7.506459951400757e-07, 7.888302206993103e-07, 8.270144462585449e-07, 8.651986718177795e-07, 9.033828973770142e-07, 9.415671229362488e-07, 9.797513484954834e-07, 1.017935574054718e-06, 1.0561197996139526e-06, 1.0943040251731873e-06, 1.1324882507324219e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 76.0, 0.0, 0.0, 0.0, 119.0, 0.0, 0.0, 165.0, 0.0, 0.0, 0.0, 168.0, 0.0, 0.0, 0.0, 160.0, 0.0, 0.0, 114.0, 0.0, 0.0, 0.0, 67.0, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.600733518600464e-07, -4.4330954551696777e-07, -4.2654573917388916e-07, -4.0978193283081055e-07, -3.9301812648773193e-07, -3.762543201446533e-07, -3.594905138015747e-07, -3.427267074584961e-07, -3.259629011154175e-07, -3.0919909477233887e-07, -2.9243528842926025e-07, -2.7567148208618164e-07, -2.5890767574310303e-07, -2.421438694000244e-07, -2.253800630569458e-07, -2.086162567138672e-07, -1.9185245037078857e-07, -1.7508864402770996e-07, -1.5832483768463135e-07, -1.4156103134155273e-07, -1.2479722499847412e-07, -1.0803341865539551e-07, -9.12696123123169e-08, -7.450580596923828e-08, -5.774199962615967e-08, -4.0978193283081055e-08, -2.421438694000244e-08, -7.450580596923828e-09, 9.313225746154785e-09, 2.60770320892334e-08, 4.284083843231201e-08, 5.960464477539063e-08, 7.636845111846924e-08, 9.313225746154785e-08, 1.0989606380462646e-07, 1.2665987014770508e-07, 1.434236764907837e-07, 1.601874828338623e-07, 1.7695128917694092e-07, 1.9371509552001953e-07, 2.1047890186309814e-07, 2.2724270820617676e-07, 2.4400651454925537e-07, 2.60770320892334e-07, 2.775341272354126e-07, 2.942979335784912e-07, 3.110617399215698e-07, 3.2782554626464844e-07, 3.4458935260772705e-07, 3.6135315895080566e-07, 3.781169652938843e-07, 3.948807716369629e-07, 4.116445779800415e-07, 4.284083843231201e-07, 4.4517219066619873e-07, 4.6193599700927734e-07, 4.78699803352356e-07, 4.954636096954346e-07, 5.122274160385132e-07, 5.289912223815918e-07, 5.457550287246704e-07, 5.62518835067749e-07, 5.792826414108276e-07, 5.960464477539062e-07]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 12.0, 0.0, 21.0, 0.0, 0.0, 45.0, 0.0, 0.0, 27.0, 0.0, 0.0, 120.0, 0.0, 0.0, 144.0, 0.0, 381.0, 0.0, 0.0, 1047064.0, 0.0, 0.0, 369.0, 0.0, 0.0, 138.0, 0.0, 90.0, 0.0, 0.0, 54.0, 0.0, 0.0, 36.0, 0.0, 0.0, 21.0, 0.0, 0.0, 15.0, 0.0, 3.0, 0.0, 0.0, 15.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.556510925292969e-07, -6.342306733131409e-07, -6.128102540969849e-07, -5.913898348808289e-07, -5.699694156646729e-07, -5.485489964485168e-07, -5.271285772323608e-07, -5.057081580162048e-07, -4.842877388000488e-07, -4.628673195838928e-07, -4.414469003677368e-07, -4.200264811515808e-07, -3.986060619354248e-07, -3.771856427192688e-07, -3.557652235031128e-07, -3.343448042869568e-07, -3.129243850708008e-07, -2.915039658546448e-07, -2.7008354663848877e-07, -2.4866312742233276e-07, -2.2724270820617676e-07, -2.0582228899002075e-07, -1.8440186977386475e-07, -1.6298145055770874e-07, -1.4156103134155273e-07, -1.2014061212539673e-07, -9.872019290924072e-08, -7.729977369308472e-08, -5.587935447692871e-08, -3.4458935260772705e-08, -1.30385160446167e-08, 8.381903171539307e-09, 2.9802322387695312e-08, 5.122274160385132e-08, 7.264316082000732e-08, 9.406358003616333e-08, 1.1548399925231934e-07, 1.3690441846847534e-07, 1.5832483768463135e-07, 1.7974525690078735e-07, 2.0116567611694336e-07, 2.2258609533309937e-07, 2.4400651454925537e-07, 2.654269337654114e-07, 2.868473529815674e-07, 3.082677721977234e-07, 3.296881914138794e-07, 3.511086106300354e-07, 3.725290298461914e-07, 3.939494490623474e-07, 4.153698682785034e-07, 4.367902874946594e-07, 4.5821070671081543e-07, 4.796311259269714e-07, 5.010515451431274e-07, 5.224719643592834e-07, 5.438923835754395e-07, 5.653128027915955e-07, 5.867332220077515e-07, 6.081536412239075e-07, 6.295740604400635e-07, 6.509944796562195e-07, 6.724148988723755e-07, 6.938353180885315e-07, 7.152557373046875e-07]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1021.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08, 6.146728992462158e-08, 6.332993507385254e-08, 6.51925802230835e-08, 6.705522537231445e-08, 6.891787052154541e-08, 7.078051567077637e-08, 7.264316082000732e-08, 7.450580596923828e-08, 7.636845111846924e-08, 7.82310962677002e-08, 8.009374141693115e-08, 8.195638656616211e-08, 8.381903171539307e-08, 8.568167686462402e-08, 8.754432201385498e-08, 8.940696716308594e-08, 9.12696123123169e-08, 9.313225746154785e-08, 9.499490261077881e-08, 9.685754776000977e-08, 9.872019290924072e-08, 1.0058283805847168e-07, 1.0244548320770264e-07, 1.043081283569336e-07, 1.0617077350616455e-07, 1.0803341865539551e-07, 1.0989606380462646e-07, 1.1175870895385742e-07, 1.1362135410308838e-07, 1.1548399925231934e-07, 1.1734664440155029e-07, 1.1920928955078125e-07]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 6.0, 9.0, 13.0, 12.0, 25.0, 29.0, 49.0, 64.0, 120.0, 188.0, 163.0, 96.0, 58.0, 38.0, 27.0, 25.0, 17.0, 10.0, 7.0, 5.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.86342342912394e-07, -9.572577255312353e-07, -9.281732218369143e-07, -8.990886044557556e-07, -8.700040439180157e-07, -8.409194833802758e-07, -8.118349228425359e-07, -7.82750362304796e-07, -7.536657449236372e-07, -7.245811843858974e-07, -6.954966238481575e-07, -6.664120064669987e-07, -6.373274459292588e-07, -6.082428853915189e-07, -5.79158324853779e-07, -5.500737643160392e-07, -5.209892037782993e-07, -4.919046432405594e-07, -4.6282005428111006e-07, -4.3373549374337017e-07, -4.0465090478392085e-07, -3.7556634424618096e-07, -3.4648178370844107e-07, -3.173972231707012e-07, -2.8831263421125186e-07, -2.5922807367351197e-07, -2.3014348471406265e-07, -2.0105892417632276e-07, -1.7197434942772816e-07, -1.4288977467913355e-07, -1.1380521414139366e-07, -8.472063939279906e-08, -5.563600780078559e-08, -2.6551436604904666e-08, 2.5331345909762604e-09, 3.161770223414351e-08, 6.070227698273811e-08, 8.978685173133272e-08, 1.1887141226907261e-07, 1.479559870176672e-07, 1.7704056176626182e-07, 2.0612513651485642e-07, 2.3520971126345103e-07, 2.642942718011909e-07, 2.933788323389308e-07, 3.224634212983801e-07, 3.5154798183612e-07, 3.8063257079556934e-07, 4.097171313333092e-07, 4.388016918710491e-07, 4.6788628083049844e-07, 4.969708697899478e-07, 5.260554303276876e-07, 5.551399908654275e-07, 5.842245514031674e-07, 6.133091119409073e-07, 6.423937293220661e-07, 6.71478289859806e-07, 7.005628503975458e-07, 7.296474677787046e-07, 7.587320283164445e-07, 7.878165888541844e-07, 8.169011493919243e-07, 8.459857099296642e-07, 8.75070270467404e-07]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 8.0, 6.0, 13.0, 8.0, 15.0, 14.0, 15.0, 21.0, 20.0, 22.0, 25.0, 26.0, 35.0, 31.0, 32.0, 36.0, 47.0, 38.0, 33.0, 51.0, 35.0, 46.0, 51.0, 37.0, 40.0, 36.0, 40.0, 22.0, 16.0, 22.0, 29.0, 20.0, 12.0, 14.0, 14.0, 14.0, 13.0, 5.0, 7.0, 1.0, 6.0, 4.0, 9.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.5338416043705365e-07, -4.3917910375057545e-07, -4.2497404706409725e-07, -4.1076899037761905e-07, -3.965639621128503e-07, -3.823589054263721e-07, -3.681538487398939e-07, -3.5394879205341567e-07, -3.3974373536693747e-07, -3.2553867868045927e-07, -3.1133362199398107e-07, -2.9712856530750287e-07, -2.8292350862102467e-07, -2.6871845193454647e-07, -2.545134236697777e-07, -2.403083669832995e-07, -2.261033102968213e-07, -2.118982536103431e-07, -1.976931969238649e-07, -1.834881544482414e-07, -1.692830977617632e-07, -1.55078041075285e-07, -1.4087299859966151e-07, -1.266679419131833e-07, -1.1246288522670511e-07, -9.825782854022691e-08, -8.405277895917607e-08, -6.984772937812522e-08, -5.564267269164702e-08, -4.143761600516882e-08, -2.7232566424117977e-08, -1.3027516843067133e-08, 1.177511421701638e-09, 1.538256455546616e-08, 2.9587617689230683e-08, 4.3792670822995206e-08, 5.799772395675973e-08, 7.220278064323793e-08, 8.640783022428877e-08, 1.0061287980533962e-07, 1.1481793649181782e-07, 1.2902299317829602e-07, 1.4322804986477422e-07, 1.574330923403977e-07, 1.716381490268759e-07, 1.858432057133541e-07, 2.000482481889776e-07, 2.142533048754558e-07, 2.28458361561934e-07, 2.426634182484122e-07, 2.568684749348904e-07, 2.710735316213686e-07, 2.852785883078468e-07, 2.99483644994325e-07, 3.136886732590938e-07, 3.27893729945572e-07, 3.420987866320502e-07, 3.563038433185284e-07, 3.705089000050066e-07, 3.847139566914848e-07, 3.9891898495625355e-07, 4.1312404164273175e-07, 4.2732909832920996e-07, 4.4153415501568816e-07, 4.5573921170216636e-07]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 10.0, 8.0, 3.0, 8.0, 6.0, 11.0, 82.0, 79.0, 78.0, 142.0, 227.0, 352.0, 809.0, 3794.0, 5734.0, 9981.0, 22185.0, 63491.0, 170439.0, 493767.0, 233658.0, 22479.0, 9923.0, 5723.0, 2207.0, 1593.0, 781.0, 562.0, 128.0, 86.0, 77.0, 53.0, 29.0, 7.0, 17.0, 3.0, 11.0, 12.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8477439880371094e-06, -1.7797574400901794e-06, -1.7117708921432495e-06, -1.6437843441963196e-06, -1.5757977962493896e-06, -1.5078112483024597e-06, -1.4398247003555298e-06, -1.3718381524085999e-06, -1.30385160446167e-06, -1.23586505651474e-06, -1.16787850856781e-06, -1.0998919606208801e-06, -1.0319054126739502e-06, -9.639188647270203e-07, -8.959323167800903e-07, -8.279457688331604e-07, -7.599592208862305e-07, -6.919726729393005e-07, -6.239861249923706e-07, -5.559995770454407e-07, -4.880130290985107e-07, -4.200264811515808e-07, -3.520399332046509e-07, -2.8405338525772095e-07, -2.1606683731079102e-07, -1.4808028936386108e-07, -8.009374141693115e-08, -1.210719347000122e-08, 5.587935447692871e-08, 1.2386590242385864e-07, 1.9185245037078857e-07, 2.598389983177185e-07, 3.2782554626464844e-07, 3.9581209421157837e-07, 4.637986421585083e-07, 5.317851901054382e-07, 5.997717380523682e-07, 6.677582859992981e-07, 7.35744833946228e-07, 8.03731381893158e-07, 8.717179298400879e-07, 9.397044777870178e-07, 1.0076910257339478e-06, 1.0756775736808777e-06, 1.1436641216278076e-06, 1.2116506695747375e-06, 1.2796372175216675e-06, 1.3476237654685974e-06, 1.4156103134155273e-06, 1.4835968613624573e-06, 1.5515834093093872e-06, 1.6195699572563171e-06, 1.687556505203247e-06, 1.755543053150177e-06, 1.823529601097107e-06, 1.8915161490440369e-06, 1.959502696990967e-06, 2.0274892449378967e-06, 2.0954757928848267e-06, 2.1634623408317566e-06, 2.2314488887786865e-06, 2.2994354367256165e-06, 2.3674219846725464e-06, 2.4354085326194763e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 0.0, 0.0, 101.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 226.0, 0.0, 0.0, 0.0, 0.0, 0.0, 327.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 216.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.2910535335540771e-07, -2.1979212760925293e-07, -2.1047890186309814e-07, -2.0116567611694336e-07, -1.9185245037078857e-07, -1.825392246246338e-07, -1.73225998878479e-07, -1.6391277313232422e-07, -1.5459954738616943e-07, -1.4528632164001465e-07, -1.3597309589385986e-07, -1.2665987014770508e-07, -1.1734664440155029e-07, -1.0803341865539551e-07, -9.872019290924072e-08, -8.940696716308594e-08, -8.009374141693115e-08, -7.078051567077637e-08, -6.146728992462158e-08, -5.21540641784668e-08, -4.284083843231201e-08, -3.3527612686157227e-08, -2.421438694000244e-08, -1.4901161193847656e-08, -5.587935447692871e-09, 3.725290298461914e-09, 1.30385160446167e-08, 2.2351741790771484e-08, 3.166496753692627e-08, 4.0978193283081055e-08, 5.029141902923584e-08, 5.960464477539063e-08, 6.891787052154541e-08, 7.82310962677002e-08, 8.754432201385498e-08, 9.685754776000977e-08, 1.0617077350616455e-07, 1.1548399925231934e-07, 1.2479722499847412e-07, 1.341104507446289e-07, 1.434236764907837e-07, 1.5273690223693848e-07, 1.6205012798309326e-07, 1.7136335372924805e-07, 1.8067657947540283e-07, 1.8998980522155762e-07, 1.993030309677124e-07, 2.086162567138672e-07, 2.1792948246002197e-07, 2.2724270820617676e-07, 2.3655593395233154e-07, 2.4586915969848633e-07, 2.551823854446411e-07, 2.644956111907959e-07, 2.738088369369507e-07, 2.8312206268310547e-07, 2.9243528842926025e-07, 3.0174851417541504e-07, 3.110617399215698e-07, 3.203749656677246e-07, 3.296881914138794e-07, 3.390014171600342e-07, 3.4831464290618896e-07, 3.5762786865234375e-07]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 11.0, 3.0, 8.0, 16.0, 13.0, 10.0, 25.0, 33.0, 75.0, 184.0, 195.0, 349.0, 440.0, 829.0, 1477.0, 2657.0, 6040.0, 12145.0, 95064.0, 177099.0, 455666.0, 177194.0, 67482.0, 27220.0, 12134.0, 6059.0, 2542.0, 2323.0, 436.0, 310.0, 147.0, 124.0, 75.0, 52.0, 42.0, 24.0, 30.0, 9.0, 4.0, 6.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9669532775878906e-06, -1.9008293747901917e-06, -1.8347054719924927e-06, -1.7685815691947937e-06, -1.7024576663970947e-06, -1.6363337635993958e-06, -1.5702098608016968e-06, -1.5040859580039978e-06, -1.4379620552062988e-06, -1.3718381524085999e-06, -1.3057142496109009e-06, -1.239590346813202e-06, -1.173466444015503e-06, -1.107342541217804e-06, -1.041218638420105e-06, -9.75094735622406e-07, -9.08970832824707e-07, -8.428469300270081e-07, -7.767230272293091e-07, -7.105991244316101e-07, -6.444752216339111e-07, -5.783513188362122e-07, -5.122274160385132e-07, -4.461035132408142e-07, -3.7997961044311523e-07, -3.1385570764541626e-07, -2.477318048477173e-07, -1.816079020500183e-07, -1.1548399925231934e-07, -4.936009645462036e-08, 1.6763806343078613e-08, 8.288770914077759e-08, 1.4901161193847656e-07, 2.1513551473617554e-07, 2.812594175338745e-07, 3.473833203315735e-07, 4.1350722312927246e-07, 4.796311259269714e-07, 5.457550287246704e-07, 6.118789315223694e-07, 6.780028343200684e-07, 7.441267371177673e-07, 8.102506399154663e-07, 8.763745427131653e-07, 9.424984455108643e-07, 1.0086223483085632e-06, 1.0747462511062622e-06, 1.1408701539039612e-06, 1.2069940567016602e-06, 1.2731179594993591e-06, 1.339241862297058e-06, 1.405365765094757e-06, 1.471489667892456e-06, 1.537613570690155e-06, 1.603737473487854e-06, 1.669861376285553e-06, 1.735985279083252e-06, 1.802109181880951e-06, 1.86823308467865e-06, 1.934356987476349e-06, 2.000480890274048e-06, 2.066604793071747e-06, 2.132728695869446e-06, 2.1988525986671448e-06, 2.2649765014648438e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 19.0, 0.0, 0.0, 0.0, 47.0, 0.0, 0.0, 0.0, 131.0, 0.0, 0.0, 0.0, 213.0, 0.0, 0.0, 244.0, 0.0, 0.0, 0.0, 183.0, 0.0, 0.0, 0.0, 114.0, 0.0, 0.0, 0.0, 41.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.364418029785156e-07, -5.206093192100525e-07, -5.047768354415894e-07, -4.889443516731262e-07, -4.731118679046631e-07, -4.5727938413619995e-07, -4.414469003677368e-07, -4.256144165992737e-07, -4.0978193283081055e-07, -3.939494490623474e-07, -3.781169652938843e-07, -3.6228448152542114e-07, -3.46451997756958e-07, -3.3061951398849487e-07, -3.1478703022003174e-07, -2.989545464515686e-07, -2.8312206268310547e-07, -2.6728957891464233e-07, -2.514570951461792e-07, -2.3562461137771606e-07, -2.1979212760925293e-07, -2.039596438407898e-07, -1.8812716007232666e-07, -1.7229467630386353e-07, -1.564621925354004e-07, -1.4062970876693726e-07, -1.2479722499847412e-07, -1.0896474123001099e-07, -9.313225746154785e-08, -7.729977369308472e-08, -6.146728992462158e-08, -4.563480615615845e-08, -2.9802322387695312e-08, -1.3969838619232178e-08, 1.862645149230957e-09, 1.7695128917694092e-08, 3.3527612686157227e-08, 4.936009645462036e-08, 6.51925802230835e-08, 8.102506399154663e-08, 9.685754776000977e-08, 1.126900315284729e-07, 1.2852251529693604e-07, 1.4435499906539917e-07, 1.601874828338623e-07, 1.7601996660232544e-07, 1.9185245037078857e-07, 2.076849341392517e-07, 2.2351741790771484e-07, 2.39349901676178e-07, 2.551823854446411e-07, 2.7101486921310425e-07, 2.868473529815674e-07, 3.026798367500305e-07, 3.1851232051849365e-07, 3.343448042869568e-07, 3.501772880554199e-07, 3.6600977182388306e-07, 3.818422555923462e-07, 3.976747393608093e-07, 4.1350722312927246e-07, 4.293397068977356e-07, 4.4517219066619873e-07, 4.6100467443466187e-07, 4.76837158203125e-07]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 3.0, 10.0, 13.0, 13.0, 20.0, 18.0, 37.0, 55.0, 56.0, 99.0, 196.0, 156.0, 85.0, 71.0, 42.0, 25.0, 18.0, 19.0, 16.0, 5.0, 7.0, 7.0, 4.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.565080863969342e-07, -7.34124796508695e-07, -7.117415634638746e-07, -6.893582735756354e-07, -6.66975040530815e-07, -6.445917506425758e-07, -6.222085175977554e-07, -5.998252277095162e-07, -5.77441937821277e-07, -5.550586479330377e-07, -5.326754148882173e-07, -5.102921249999781e-07, -4.879088919551577e-07, -4.655256020669185e-07, -4.431423406003887e-07, -4.207590791338589e-07, -3.983758176673291e-07, -3.759925562007993e-07, -3.536092947342695e-07, -3.312260332677397e-07, -3.0884274337950046e-07, -2.8645948191297066e-07, -2.6407622044644086e-07, -2.416929305582016e-07, -2.1930968330252654e-07, -1.9692642183599673e-07, -1.7454314615861222e-07, -1.5215988469208241e-07, -1.297766232255526e-07, -1.073933475481681e-07, -8.501008608163829e-08, -6.262681040425377e-08, -4.024354893772397e-08, -1.786028214212365e-08, 4.522984653476669e-09, 2.690624967272015e-08, 4.928951824467731e-08, 7.167278681663447e-08, 9.405604828316427e-08, 1.1643932396054879e-07, 1.388225854270786e-07, 1.612058468936084e-07, 1.835891225709929e-07, 2.0597238403752272e-07, 2.2835564550405252e-07, 2.5073893539229175e-07, 2.731221684371121e-07, 2.9550545832535136e-07, 3.1788871979188116e-07, 3.4027198125841096e-07, 3.6265524272494076e-07, 3.8503850419147057e-07, 4.074217940797098e-07, 4.298050555462396e-07, 4.521883170127694e-07, 4.7457160690100864e-07, 4.96954839945829e-07, 5.193381298340682e-07, 5.417213628788886e-07, 5.641046527671278e-07, 5.864878858119482e-07, 6.088711757001875e-07, 6.312544655884267e-07, 6.536376986332471e-07, 6.760209885214863e-07]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 6.0, 11.0, 5.0, 12.0, 13.0, 12.0, 22.0, 19.0, 30.0, 27.0, 37.0, 39.0, 41.0, 41.0, 42.0, 31.0, 37.0, 52.0, 49.0, 58.0, 40.0, 43.0, 29.0, 33.0, 28.0, 43.0, 32.0, 25.0, 24.0, 13.0, 16.0, 12.0, 20.0, 10.0, 15.0, 6.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.320403436646302e-07, -3.2032986041485856e-07, -3.0861940558679635e-07, -2.969089223370247e-07, -2.8519843908725306e-07, -2.734879558374814e-07, -2.617775010094192e-07, -2.5006701775964757e-07, -2.3835654872073064e-07, -2.2664607968181372e-07, -2.1493559643204208e-07, -2.0322512739312515e-07, -1.9151465835420822e-07, -1.7980417510443658e-07, -1.6809370606551965e-07, -1.5638323702660273e-07, -1.4467275377683109e-07, -1.3296228473791416e-07, -1.2125180148814252e-07, -1.0954133244922559e-07, -9.783085630488131e-08, -8.612038016053702e-08, -7.44099111216201e-08, -6.269943497727581e-08, -5.098895883293153e-08, -3.9278482688587246e-08, -2.756801009695664e-08, -1.5857537505326036e-08, -4.147061360981752e-09, 7.563414783362532e-09, 1.927388382227946e-08, 3.098435996662374e-08, 4.2694807689258596e-08, 5.440528383360288e-08, 6.611575997794716e-08, 7.782622901686409e-08, 8.953670516120837e-08, 1.0124718130555266e-07, 1.1295765034446958e-07, 1.2466813359424123e-07, 1.3637860263315815e-07, 1.4808907167207508e-07, 1.5979955492184672e-07, 1.7151002396076365e-07, 1.8322049299968057e-07, 1.9493097624945221e-07, 2.0664144528836914e-07, 2.1835191432728607e-07, 2.300623975770577e-07, 2.4177288082682935e-07, 2.5348333565489156e-07, 2.651938189046632e-07, 2.7690430215443484e-07, 2.886147854042065e-07, 3.003252402322687e-07, 3.1203572348204034e-07, 3.2374617831010255e-07, 3.354566615598742e-07, 3.471671163879364e-07, 3.5887759963770804e-07, 3.705880828874797e-07, 3.822985377155419e-07, 3.9400902096531354e-07, 4.057195042150852e-07, 4.174299874648568e-07]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 0.0, 6.0, 8.0, 0.0, 14.0, 1.0, 16.0, 38.0, 1.0, 55.0, 11.0, 41.0, 176.0, 79.0, 301.0, 1024.0, 1277.0, 9414.0, 32887.0, 4101303.0, 41602.0, 2730.0, 1315.0, 1140.0, 338.0, 240.0, 50.0, 39.0, 32.0, 39.0, 4.0, 33.0, 28.0, 1.0, 14.0, 0.0, 13.0, 11.0, 0.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3245811462402344e-06, -2.2426247596740723e-06, -2.16066837310791e-06, -2.078711986541748e-06, -1.996755599975586e-06, -1.914799213409424e-06, -1.8328428268432617e-06, -1.7508864402770996e-06, -1.6689300537109375e-06, -1.5869736671447754e-06, -1.5050172805786133e-06, -1.4230608940124512e-06, -1.341104507446289e-06, -1.259148120880127e-06, -1.1771917343139648e-06, -1.0952353477478027e-06, -1.0132789611816406e-06, -9.313225746154785e-07, -8.493661880493164e-07, -7.674098014831543e-07, -6.854534149169922e-07, -6.034970283508301e-07, -5.21540641784668e-07, -4.3958425521850586e-07, -3.5762786865234375e-07, -2.7567148208618164e-07, -1.9371509552001953e-07, -1.1175870895385742e-07, -2.9802322387695312e-08, 5.21540641784668e-08, 1.341104507446289e-07, 2.1606683731079102e-07, 2.980232238769531e-07, 3.7997961044311523e-07, 4.6193599700927734e-07, 5.438923835754395e-07, 6.258487701416016e-07, 7.078051567077637e-07, 7.897615432739258e-07, 8.717179298400879e-07, 9.5367431640625e-07, 1.0356307029724121e-06, 1.1175870895385742e-06, 1.1995434761047363e-06, 1.2814998626708984e-06, 1.3634562492370605e-06, 1.4454126358032227e-06, 1.5273690223693848e-06, 1.6093254089355469e-06, 1.691281795501709e-06, 1.773238182067871e-06, 1.8551945686340332e-06, 1.9371509552001953e-06, 2.0191073417663574e-06, 2.1010637283325195e-06, 2.1830201148986816e-06, 2.2649765014648438e-06, 2.346932888031006e-06, 2.428889274597168e-06, 2.51084566116333e-06, 2.592802047729492e-06, 2.6747584342956543e-06, 2.7567148208618164e-06, 2.8386712074279785e-06, 2.9206275939941406e-06]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.0, 0.0, 0.0, 0.0, 0.0, 0.0, 230.0, 0.0, 0.0, 0.0, 0.0, 0.0, 315.0, 0.0, 0.0, 0.0, 0.0, 189.0, 0.0, 0.0, 0.0, 0.0, 0.0, 108.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.980232238769531e-07, -2.8777867555618286e-07, -2.775341272354126e-07, -2.6728957891464233e-07, -2.5704503059387207e-07, -2.468004822731018e-07, -2.3655593395233154e-07, -2.2631138563156128e-07, -2.1606683731079102e-07, -2.0582228899002075e-07, -1.955777406692505e-07, -1.8533319234848022e-07, -1.7508864402770996e-07, -1.648440957069397e-07, -1.5459954738616943e-07, -1.4435499906539917e-07, -1.341104507446289e-07, -1.2386590242385864e-07, -1.1362135410308838e-07, -1.0337680578231812e-07, -9.313225746154785e-08, -8.288770914077759e-08, -7.264316082000732e-08, -6.239861249923706e-08, -5.21540641784668e-08, -4.190951585769653e-08, -3.166496753692627e-08, -2.1420419216156006e-08, -1.1175870895385742e-08, -9.313225746154785e-10, 9.313225746154785e-09, 1.955777406692505e-08, 2.9802322387695312e-08, 4.0046870708465576e-08, 5.029141902923584e-08, 6.05359673500061e-08, 7.078051567077637e-08, 8.102506399154663e-08, 9.12696123123169e-08, 1.0151416063308716e-07, 1.1175870895385742e-07, 1.2200325727462769e-07, 1.3224780559539795e-07, 1.424923539161682e-07, 1.5273690223693848e-07, 1.6298145055770874e-07, 1.73225998878479e-07, 1.8347054719924927e-07, 1.9371509552001953e-07, 2.039596438407898e-07, 2.1420419216156006e-07, 2.2444874048233032e-07, 2.3469328880310059e-07, 2.4493783712387085e-07, 2.551823854446411e-07, 2.654269337654114e-07, 2.7567148208618164e-07, 2.859160304069519e-07, 2.9616057872772217e-07, 3.0640512704849243e-07, 3.166496753692627e-07, 3.2689422369003296e-07, 3.371387720108032e-07, 3.473833203315735e-07, 3.5762786865234375e-07]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 4.0, 1.0, 1.0, 59.0, 47.0, 62.0, 718.0, 83977.0, 4108485.0, 682.0, 54.0, 50.0, 89.0, 6.0, 2.0, 3.0, 15.0, 5.0, 0.0, 2.0, 1.0, 5.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.238719940185547e-06, -8.920207619667053e-06, -8.60169529914856e-06, -8.283182978630066e-06, -7.964670658111572e-06, -7.646158337593079e-06, -7.327646017074585e-06, -7.009133696556091e-06, -6.690621376037598e-06, -6.372109055519104e-06, -6.05359673500061e-06, -5.735084414482117e-06, -5.416572093963623e-06, -5.098059773445129e-06, -4.779547452926636e-06, -4.461035132408142e-06, -4.1425228118896484e-06, -3.824010491371155e-06, -3.505498170852661e-06, -3.1869858503341675e-06, -2.868473529815674e-06, -2.54996120929718e-06, -2.2314488887786865e-06, -1.912936568260193e-06, -1.5944242477416992e-06, -1.2759119272232056e-06, -9.57399606704712e-07, -6.388872861862183e-07, -3.203749656677246e-07, -1.862645149230957e-09, 3.166496753692627e-07, 6.351619958877563e-07, 9.5367431640625e-07, 1.2721866369247437e-06, 1.5906989574432373e-06, 1.909211277961731e-06, 2.2277235984802246e-06, 2.5462359189987183e-06, 2.864748239517212e-06, 3.1832605600357056e-06, 3.5017728805541992e-06, 3.820285201072693e-06, 4.1387975215911865e-06, 4.45730984210968e-06, 4.775822162628174e-06, 5.0943344831466675e-06, 5.412846803665161e-06, 5.731359124183655e-06, 6.0498714447021484e-06, 6.368383765220642e-06, 6.686896085739136e-06, 7.005408406257629e-06, 7.323920726776123e-06, 7.642433047294617e-06, 7.96094536781311e-06, 8.279457688331604e-06, 8.597970008850098e-06, 8.916482329368591e-06, 9.234994649887085e-06, 9.553506970405579e-06, 9.872019290924072e-06, 1.0190531611442566e-05, 1.050904393196106e-05, 1.0827556252479553e-05, 1.1146068572998047e-05]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 108.0, 0.0, 0.0, 0.0, 3774.0, 0.0, 0.0, 0.0, 0.0, 143.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.032626748085022e-07, -3.8929283618927e-07, -3.7532299757003784e-07, -3.6135315895080566e-07, -3.473833203315735e-07, -3.334134817123413e-07, -3.1944364309310913e-07, -3.0547380447387695e-07, -2.915039658546448e-07, -2.775341272354126e-07, -2.635642886161804e-07, -2.4959444999694824e-07, -2.3562461137771606e-07, -2.2165477275848389e-07, -2.076849341392517e-07, -1.9371509552001953e-07, -1.7974525690078735e-07, -1.6577541828155518e-07, -1.51805579662323e-07, -1.3783574104309082e-07, -1.2386590242385864e-07, -1.0989606380462646e-07, -9.592622518539429e-08, -8.195638656616211e-08, -6.798654794692993e-08, -5.4016709327697754e-08, -4.0046870708465576e-08, -2.60770320892334e-08, -1.210719347000122e-08, 1.862645149230957e-09, 1.5832483768463135e-08, 2.9802322387695312e-08, 4.377216100692749e-08, 5.774199962615967e-08, 7.171183824539185e-08, 8.568167686462402e-08, 9.96515154838562e-08, 1.1362135410308838e-07, 1.2759119272232056e-07, 1.4156103134155273e-07, 1.555308699607849e-07, 1.695007085800171e-07, 1.8347054719924927e-07, 1.9744038581848145e-07, 2.1141022443771362e-07, 2.253800630569458e-07, 2.39349901676178e-07, 2.5331974029541016e-07, 2.6728957891464233e-07, 2.812594175338745e-07, 2.952292561531067e-07, 3.0919909477233887e-07, 3.2316893339157104e-07, 3.371387720108032e-07, 3.511086106300354e-07, 3.650784492492676e-07, 3.7904828786849976e-07, 3.9301812648773193e-07, 4.069879651069641e-07, 4.209578037261963e-07, 4.3492764234542847e-07, 4.4889748096466064e-07, 4.628673195838928e-07, 4.76837158203125e-07]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 2.0, 8.0, 10.0, 16.0, 16.0, 25.0, 53.0, 84.0, 143.0, 266.0, 142.0, 88.0, 56.0, 32.0, 28.0, 13.0, 8.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0], "bins": [-1.1732416851373273e-06, -1.1495633316371823e-06, -1.1258849781370373e-06, -1.1022066246368922e-06, -1.0785282711367472e-06, -1.0548499176366022e-06, -1.0311715641364572e-06, -1.0074932106363121e-06, -9.838148571361671e-07, -9.60136503636022e-07, -9.364581501358771e-07, -9.127797966357321e-07, -8.89101443135587e-07, -8.65423089635442e-07, -8.41744736135297e-07, -8.180663257917331e-07, -7.943879154481692e-07, -7.707095619480242e-07, -7.470312084478792e-07, -7.233528549477342e-07, -6.996745014475891e-07, -6.759961479474441e-07, -6.523177944472991e-07, -6.286393841037352e-07, -6.04961087447009e-07, -5.81282733946864e-07, -5.57604380446719e-07, -5.33926026946574e-07, -5.10247673446429e-07, -4.865693199462839e-07, -4.628909380244295e-07, -4.3921255610257504e-07, -4.155341741807206e-07, -3.9185582068057556e-07, -3.6817746718043054e-07, -3.444990852585761e-07, -3.2082073175843107e-07, -2.9714237825828604e-07, -2.73464024758141e-07, -2.49785671257996e-07, -2.2610730354699626e-07, -2.0242895004685124e-07, -1.787505823358515e-07, -1.5507222883570648e-07, -1.3139387533556146e-07, -1.0771550762456172e-07, -8.40371541244167e-08, -6.035878641341696e-08, -3.668043291327194e-08, -1.3002074084056403e-08, 1.0676284745159137e-08, 3.435464179801784e-08, 5.803300240359022e-08, 8.17113630091626e-08, 1.0538971650930762e-07, 1.2906808422030736e-07, 1.5274643772045238e-07, 1.764247912205974e-07, 2.0010315893159714e-07, 2.2378151243174216e-07, 2.474598659318872e-07, 2.711382194320322e-07, 2.948165729321772e-07, 3.184949548540317e-07, 3.421733083541767e-07]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 3.0, 9.0, 16.0, 12.0, 17.0, 24.0, 25.0, 17.0, 17.0, 30.0, 22.0, 30.0, 25.0, 37.0, 46.0, 30.0, 34.0, 47.0, 42.0, 35.0, 48.0, 35.0, 37.0, 40.0, 32.0, 47.0, 22.0, 31.0, 23.0, 23.0, 12.0, 15.0, 12.0, 15.0, 16.0, 10.0, 14.0, 5.0, 6.0, 8.0, 4.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.52870529241045e-07, -3.4143982929890626e-07, -3.3000915777847695e-07, -3.185784578363382e-07, -3.071477863159089e-07, -2.9571708637377014e-07, -2.842863864316314e-07, -2.728557149112021e-07, -2.6142504339077277e-07, -2.4999434344863403e-07, -2.385636719282047e-07, -2.2713297198606597e-07, -2.1570230046563665e-07, -2.042716005234979e-07, -1.9284091479221388e-07, -1.8141022906092985e-07, -1.699795291187911e-07, -1.5854884338750708e-07, -1.4711815765622305e-07, -1.356874577140843e-07, -1.24256786193655e-07, -1.128260933569436e-07, -1.0139540052023222e-07, -8.996471478894819e-08, -7.853402905766416e-08, -6.710334332638013e-08, -5.567265404238242e-08, -4.424196475838471e-08, -3.281127902710068e-08, -2.1380593295816652e-08, -9.949900459105265e-09, 1.480785272178764e-09, 1.2911442581753363e-08, 2.434213008939423e-08, 3.57728175970351e-08, 4.720350688103281e-08, 5.863419261231684e-08, 7.006487834360087e-08, 8.149557118031225e-08, 9.292625691159628e-08, 1.0435694264288031e-07, 1.1578762837416434e-07, 1.2721831410544837e-07, 1.386489998367324e-07, 1.5007969977887115e-07, 1.6151037129930046e-07, 1.729410712414392e-07, 1.8437175697272323e-07, 1.9580244270400726e-07, 2.072331284352913e-07, 2.1866381416657532e-07, 2.3009451410871407e-07, 2.415251856291434e-07, 2.529558855712821e-07, 2.6438658551342087e-07, 2.758172570338502e-07, 2.872479285542795e-07, 2.9867862849641824e-07, 3.1010930001684756e-07, 3.215399999589863e-07, 3.329706714794156e-07, 3.4440137142155436e-07, 3.558320713636931e-07, 3.672627428841224e-07, 3.7869344282626116e-07]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1913.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47331.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 949871.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47370.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1887.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 103.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 241.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 340.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 211.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 10.0, 14.0, 14.0, 23.0, 29.0, 45.0, 93.0, 89.0, 205.0, 175.0, 81.0, 62.0, 47.0, 27.0, 24.0, 16.0, 10.0, 12.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.826181445125258e-07, -7.651247528883687e-07, -7.476314181076305e-07, -7.301380264834734e-07, -7.126446917027351e-07, -6.951513000785781e-07, -6.776579652978398e-07, -6.601645736736828e-07, -6.426712388929445e-07, -6.251778472687874e-07, -6.076845124880492e-07, -5.901911208638921e-07, -5.726977860831539e-07, -5.552043944589968e-07, -5.377110596782586e-07, -5.202176680541015e-07, -5.027243332733633e-07, -4.852309416492062e-07, -4.67737606868468e-07, -4.5024424366602034e-07, -4.327508804635727e-07, -4.1525751726112503e-07, -3.977641540586774e-07, -3.802707624345203e-07, -3.627773708103632e-07, -3.4528400760791556e-07, -3.277906444054679e-07, -3.1029728120302025e-07, -2.928039180005726e-07, -2.7531055479812494e-07, -2.578171915956773e-07, -2.403237999715202e-07, -2.228304936124914e-07, -2.0533713041004376e-07, -1.878437672075961e-07, -1.7035040400514845e-07, -1.528570408027008e-07, -1.3536367760025314e-07, -1.1787030018695077e-07, -1.0037693698450312e-07, -8.288357378205546e-08, -6.539021057960781e-08, -4.789684382444648e-08, -3.0403477069285145e-08, -1.2910113866837492e-08, 4.583249335610162e-09, 2.2076619643485174e-08, 3.956998284593283e-08, 5.706334604838048e-08, 7.455670925082813e-08, 9.205007245327579e-08, 1.095434427611508e-07, 1.270367988581711e-07, 1.4453016206061875e-07, 1.6202353947392112e-07, 1.7951690267636877e-07, 1.9701026587881643e-07, 2.1450362908126408e-07, 2.3199699228371173e-07, 2.494903696970141e-07, 2.6698373289946176e-07, 2.844770961019094e-07, 3.0197045930435706e-07, 3.194638225068047e-07, 3.3695718570925237e-07]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 4.0, 13.0, 13.0, 17.0, 21.0, 21.0, 23.0, 18.0, 27.0, 19.0, 26.0, 37.0, 30.0, 33.0, 34.0, 38.0, 39.0, 47.0, 59.0, 44.0, 35.0, 39.0, 30.0, 44.0, 35.0, 28.0, 26.0, 27.0, 20.0, 17.0, 20.0, 15.0, 12.0, 10.0, 15.0, 9.0, 9.0, 7.0, 6.0, 3.0, 3.0, 3.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4509645868420193e-07, -2.3727000098006101e-07, -2.294435574867748e-07, -2.2161709978263389e-07, -2.1379065628934768e-07, -2.0596419858520676e-07, -1.9813774088106584e-07, -1.9031129738777963e-07, -1.8248485389449343e-07, -1.746583961903525e-07, -1.668319526970663e-07, -1.5900549499292538e-07, -1.5117905149963917e-07, -1.4335259379549825e-07, -1.3552613609135733e-07, -1.2769969259807112e-07, -1.198732348939302e-07, -1.1204678429521664e-07, -1.0422033369650308e-07, -9.639387599236215e-08, -8.856743249907595e-08, -8.074097479493503e-08, -7.291452419622146e-08, -6.50880735975079e-08, -5.726162299879434e-08, -4.9435172400080774e-08, -4.160872180136721e-08, -3.378226764993997e-08, -2.5955817051226404e-08, -1.812936645251284e-08, -1.0302912301085598e-08, -2.4764617023720348e-09, 5.349988896341529e-09, 1.3176440383233512e-08, 2.1002891870125495e-08, 2.8829344245195898e-08, 3.665579484390946e-08, 4.4482245442623025e-08, 5.230869959405027e-08, 6.013515019276383e-08, 6.79616007914774e-08, 7.578805139019096e-08, 8.361450198890452e-08, 9.144095258761809e-08, 9.9267410291759e-08, 1.0709385378504521e-07, 1.1492031148918613e-07, 1.2274676919332705e-07, 1.3057321268661326e-07, 1.3839967039075418e-07, 1.462261138840404e-07, 1.540525715881813e-07, 1.6187901508146751e-07, 1.6970547278560844e-07, 1.7753191627889464e-07, 1.8535837398303556e-07, 1.9318483168717648e-07, 2.010112893913174e-07, 2.088377328846036e-07, 2.1666419058874453e-07, 2.2449063408203074e-07, 2.3231709178617166e-07, 2.401435494903126e-07, 2.4796997877274407e-07, 2.55796436476885e-07]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 7.0, 0.0, 16.0, 0.0, 35.0, 0.0, 51.0, 0.0, 102.0, 0.0, 189.0, 0.0, 400.0, 0.0, 742.0, 0.0, 1408.0, 0.0, 4970.0, 0.0, 11931.0, 0.0, 39972.0, 0.0, 0.0, 159515.0, 0.0, 610127.0, 0.0, 159111.0, 0.0, 40055.0, 0.0, 12047.0, 0.0, 5000.0, 0.0, 1343.0, 0.0, 746.0, 0.0, 389.0, 0.0, 193.0, 0.0, 101.0, 0.0, 47.0, 0.0, 33.0, 0.0, 22.0, 0.0, 9.0, 0.0, 8.0], "bins": [-1.0132789611816406e-06, -9.844079613685608e-07, -9.55536961555481e-07, -9.266659617424011e-07, -8.977949619293213e-07, -8.689239621162415e-07, -8.400529623031616e-07, -8.111819624900818e-07, -7.82310962677002e-07, -7.534399628639221e-07, -7.245689630508423e-07, -6.956979632377625e-07, -6.668269634246826e-07, -6.379559636116028e-07, -6.09084963798523e-07, -5.802139639854431e-07, -5.513429641723633e-07, -5.224719643592834e-07, -4.936009645462036e-07, -4.647299647331238e-07, -4.3585896492004395e-07, -4.069879651069641e-07, -3.781169652938843e-07, -3.4924596548080444e-07, -3.203749656677246e-07, -2.915039658546448e-07, -2.6263296604156494e-07, -2.337619662284851e-07, -2.0489096641540527e-07, -1.7601996660232544e-07, -1.471489667892456e-07, -1.1827796697616577e-07, -8.940696716308594e-08, -6.05359673500061e-08, -3.166496753692627e-08, -2.7939677238464355e-09, 2.60770320892334e-08, 5.494803190231323e-08, 8.381903171539307e-08, 1.126900315284729e-07, 1.4156103134155273e-07, 1.7043203115463257e-07, 1.993030309677124e-07, 2.2817403078079224e-07, 2.5704503059387207e-07, 2.859160304069519e-07, 3.1478703022003174e-07, 3.4365803003311157e-07, 3.725290298461914e-07, 4.0140002965927124e-07, 4.302710294723511e-07, 4.591420292854309e-07, 4.880130290985107e-07, 5.168840289115906e-07, 5.457550287246704e-07, 5.746260285377502e-07, 6.034970283508301e-07, 6.323680281639099e-07, 6.612390279769897e-07, 6.901100277900696e-07, 7.189810276031494e-07, 7.478520274162292e-07, 7.767230272293091e-07, 8.055940270423889e-07, 8.344650268554688e-07]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 245.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 389.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 233.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0], "bins": [-2.384185791015625e-07, -2.3189932107925415e-07, -2.253800630569458e-07, -2.1886080503463745e-07, -2.123415470123291e-07, -2.0582228899002075e-07, -1.993030309677124e-07, -1.9278377294540405e-07, -1.862645149230957e-07, -1.7974525690078735e-07, -1.73225998878479e-07, -1.6670674085617065e-07, -1.601874828338623e-07, -1.5366822481155396e-07, -1.471489667892456e-07, -1.4062970876693726e-07, -1.341104507446289e-07, -1.2759119272232056e-07, -1.210719347000122e-07, -1.1455267667770386e-07, -1.0803341865539551e-07, -1.0151416063308716e-07, -9.499490261077881e-08, -8.847564458847046e-08, -8.195638656616211e-08, -7.543712854385376e-08, -6.891787052154541e-08, -6.239861249923706e-08, -5.587935447692871e-08, -4.936009645462036e-08, -4.284083843231201e-08, -3.632158041000366e-08, -2.9802322387695312e-08, -2.3283064365386963e-08, -1.6763806343078613e-08, -1.0244548320770264e-08, -3.725290298461914e-09, 2.7939677238464355e-09, 9.313225746154785e-09, 1.5832483768463135e-08, 2.2351741790771484e-08, 2.8870999813079834e-08, 3.5390257835388184e-08, 4.190951585769653e-08, 4.842877388000488e-08, 5.494803190231323e-08, 6.146728992462158e-08, 6.798654794692993e-08, 7.450580596923828e-08, 8.102506399154663e-08, 8.754432201385498e-08, 9.406358003616333e-08, 1.0058283805847168e-07, 1.0710209608078003e-07, 1.1362135410308838e-07, 1.2014061212539673e-07, 1.2665987014770508e-07, 1.3317912817001343e-07, 1.3969838619232178e-07, 1.4621764421463013e-07, 1.5273690223693848e-07, 1.5925616025924683e-07, 1.6577541828155518e-07, 1.7229467630386353e-07, 1.7881393432617188e-07]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 2.0, 21.0, 0.0, 1.0, 39.0, 9.0, 3.0, 3.0, 20.0, 17.0, 154.0, 52.0, 344.0, 750.0, 2047.0, 6256.0, 26942.0, 138475.0, 698896.0, 137996.0, 26963.0, 6175.0, 2017.0, 981.0, 112.0, 43.0, 138.0, 19.0, 13.0, 7.0, 3.0, 10.0, 30.0, 0.0, 1.0, 17.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-06, -1.7229467630386353e-06, -1.6577541828155518e-06, -1.5925616025924683e-06, -1.5273690223693848e-06, -1.4621764421463013e-06, -1.3969838619232178e-06, -1.3317912817001343e-06, -1.2665987014770508e-06, -1.2014061212539673e-06, -1.1362135410308838e-06, -1.0710209608078003e-06, -1.0058283805847168e-06, -9.406358003616333e-07, -8.754432201385498e-07, -8.102506399154663e-07, -7.450580596923828e-07, -6.798654794692993e-07, -6.146728992462158e-07, -5.494803190231323e-07, -4.842877388000488e-07, -4.1909515857696533e-07, -3.5390257835388184e-07, -2.8870999813079834e-07, -2.2351741790771484e-07, -1.5832483768463135e-07, -9.313225746154785e-08, -2.7939677238464355e-08, 3.725290298461914e-08, 1.0244548320770264e-07, 1.6763806343078613e-07, 2.3283064365386963e-07, 2.980232238769531e-07, 3.632158041000366e-07, 4.284083843231201e-07, 4.936009645462036e-07, 5.587935447692871e-07, 6.239861249923706e-07, 6.891787052154541e-07, 7.543712854385376e-07, 8.195638656616211e-07, 8.847564458847046e-07, 9.499490261077881e-07, 1.0151416063308716e-06, 1.080334186553955e-06, 1.1455267667770386e-06, 1.210719347000122e-06, 1.2759119272232056e-06, 1.341104507446289e-06, 1.4062970876693726e-06, 1.471489667892456e-06, 1.5366822481155396e-06, 1.601874828338623e-06, 1.6670674085617065e-06, 1.73225998878479e-06, 1.7974525690078735e-06, 1.862645149230957e-06, 1.9278377294540405e-06, 1.993030309677124e-06, 2.0582228899002075e-06, 2.123415470123291e-06, 2.1886080503463745e-06, 2.253800630569458e-06, 2.3189932107925415e-06, 2.384185791015625e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 244.0, 0.0, 0.0, 0.0, 0.0, 0.0, 421.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 206.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.2910535335540771e-07, -2.1979212760925293e-07, -2.1047890186309814e-07, -2.0116567611694336e-07, -1.9185245037078857e-07, -1.825392246246338e-07, -1.73225998878479e-07, -1.6391277313232422e-07, -1.5459954738616943e-07, -1.4528632164001465e-07, -1.3597309589385986e-07, -1.2665987014770508e-07, -1.1734664440155029e-07, -1.0803341865539551e-07, -9.872019290924072e-08, -8.940696716308594e-08, -8.009374141693115e-08, -7.078051567077637e-08, -6.146728992462158e-08, -5.21540641784668e-08, -4.284083843231201e-08, -3.3527612686157227e-08, -2.421438694000244e-08, -1.4901161193847656e-08, -5.587935447692871e-09, 3.725290298461914e-09, 1.30385160446167e-08, 2.2351741790771484e-08, 3.166496753692627e-08, 4.0978193283081055e-08, 5.029141902923584e-08, 5.960464477539063e-08, 6.891787052154541e-08, 7.82310962677002e-08, 8.754432201385498e-08, 9.685754776000977e-08, 1.0617077350616455e-07, 1.1548399925231934e-07, 1.2479722499847412e-07, 1.341104507446289e-07, 1.434236764907837e-07, 1.5273690223693848e-07, 1.6205012798309326e-07, 1.7136335372924805e-07, 1.8067657947540283e-07, 1.8998980522155762e-07, 1.993030309677124e-07, 2.086162567138672e-07, 2.1792948246002197e-07, 2.2724270820617676e-07, 2.3655593395233154e-07, 2.4586915969848633e-07, 2.551823854446411e-07, 2.644956111907959e-07, 2.738088369369507e-07, 2.8312206268310547e-07, 2.9243528842926025e-07, 3.0174851417541504e-07, 3.110617399215698e-07, 3.203749656677246e-07, 3.296881914138794e-07, 3.390014171600342e-07, 3.4831464290618896e-07, 3.5762786865234375e-07]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 12.0, 15.0, 50.0, 72.0, 212.0, 366.0, 140.0, 61.0, 41.0, 21.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5975082305885735e-06, -1.565150341775734e-06, -1.5327924529628945e-06, -1.500434564150055e-06, -1.4680766753372154e-06, -1.435718786524376e-06, -1.4033608977115364e-06, -1.3710030088986969e-06, -1.338645233772695e-06, -1.3062873449598555e-06, -1.273929456147016e-06, -1.2415715673341765e-06, -1.209213678521337e-06, -1.1768557897084975e-06, -1.144497900895658e-06, -1.1121401257696562e-06, -1.079782123269979e-06, -1.0474242344571394e-06, -1.0150663456442999e-06, -9.827084568314604e-07, -9.503505680186208e-07, -9.179926792057813e-07, -8.856348472363607e-07, -8.532769584235211e-07, -8.209190696106816e-07, -7.885611807978421e-07, -7.562032919850026e-07, -7.238454031721631e-07, -6.914875712027424e-07, -6.591296823899029e-07, -6.267717935770634e-07, -5.944139047642238e-07, -5.62056129638222e-07, -5.296982408253825e-07, -4.97340352012543e-07, -4.649824916214129e-07, -4.326246028085734e-07, -4.002667139957339e-07, -3.679088536046038e-07, -3.3555096479176427e-07, -3.031930475572153e-07, -2.708351587443758e-07, -2.384772983532457e-07, -2.061194095404062e-07, -1.7376152072756668e-07, -1.4140363191472716e-07, -1.0904575731274235e-07, -7.668788271075755e-08, -4.432999389791803e-08, -1.1972112190505868e-08, 2.0385769516906294e-08, 5.2743651224318455e-08, 8.510153293173062e-08, 1.1745942174457014e-07, 1.4981729634655494e-07, 1.8217517094853974e-07, 2.1453305976137926e-07, 2.468909485742188e-07, 2.7924880896534887e-07, 3.116066977781884e-07, 3.439645865910279e-07, 3.7632247540386743e-07, 4.0868036421670695e-07, 4.4103822460783704e-07, 4.7339611342067656e-07]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 5.0, 8.0, 12.0, 7.0, 6.0, 17.0, 21.0, 27.0, 26.0, 22.0, 27.0, 34.0, 26.0, 33.0, 35.0, 42.0, 42.0, 33.0, 39.0, 42.0, 44.0, 34.0, 37.0, 38.0, 42.0, 37.0, 40.0, 25.0, 19.0, 15.0, 17.0, 27.0, 19.0, 14.0, 9.0, 11.0, 11.0, 6.0, 7.0, 12.0, 6.0, 4.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.606881537303707e-07, -2.525656555008027e-07, -2.4444315727123467e-07, -2.3632064483081194e-07, -2.2819814660124393e-07, -2.2007564837167592e-07, -2.119531359312532e-07, -2.038306377016852e-07, -1.9570813947211718e-07, -1.8758564124254917e-07, -1.7946314301298116e-07, -1.7134063057255844e-07, -1.6321813234299043e-07, -1.5509563411342242e-07, -1.469731216729997e-07, -1.3885062344343169e-07, -1.3072812521386368e-07, -1.2260562698429567e-07, -1.144831216493003e-07, -1.0636061631430493e-07, -9.823811808473693e-08, -9.011561985516892e-08, -8.199311452017355e-08, -7.387060918517818e-08, -6.574811095561017e-08, -5.7625609173328485e-08, -4.95031073910468e-08, -4.138060560876511e-08, -3.325810382648342e-08, -2.5135602044201732e-08, -1.7013100261920044e-08, -8.890598479638356e-09, -7.680966973566683e-10, 7.35440508492502e-09, 1.5476906867206708e-08, 2.3599408649488396e-08, 3.1721910431770084e-08, 3.984441221405177e-08, 4.796691399633346e-08, 5.608941577861515e-08, 6.421191756089684e-08, 7.233441579046485e-08, 8.045692112546021e-08, 8.857942646045558e-08, 9.670192469002359e-08, 1.048244229195916e-07, 1.1294692825458696e-07, 1.2106943358958233e-07, 1.2919193181915034e-07, 1.3731443004871835e-07, 1.4543692827828636e-07, 1.5355944071870908e-07, 1.616819389482771e-07, 1.698044371778451e-07, 1.7792694961826783e-07, 1.8604944784783584e-07, 1.9417194607740385e-07, 2.0229444430697185e-07, 2.1041694253653986e-07, 2.185394549769626e-07, 2.266619532065306e-07, 2.347844514360986e-07, 2.4290696387652133e-07, 2.5102946210608934e-07, 2.5915196033565735e-07]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 162.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2052.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9912.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4153844.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23128.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4788.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 378.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1004.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 493.0, 0.0, 4193279.0, 502.0, 8.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7285346984863281e-06, -1.6745179891586304e-06, -1.6205012798309326e-06, -1.5664845705032349e-06, -1.5124678611755371e-06, -1.4584511518478394e-06, -1.4044344425201416e-06, -1.3504177331924438e-06, -1.296401023864746e-06, -1.2423843145370483e-06, -1.1883676052093506e-06, -1.1343508958816528e-06, -1.080334186553955e-06, -1.0263174772262573e-06, -9.723007678985596e-07, -9.182840585708618e-07, -8.642673492431641e-07, -8.102506399154663e-07, -7.562339305877686e-07, -7.022172212600708e-07, -6.48200511932373e-07, -5.941838026046753e-07, -5.401670932769775e-07, -4.861503839492798e-07, -4.3213367462158203e-07, -3.781169652938843e-07, -3.241002559661865e-07, -2.7008354663848877e-07, -2.1606683731079102e-07, -1.6205012798309326e-07, -1.0803341865539551e-07, -5.4016709327697754e-08, 0.0, 5.4016709327697754e-08, 1.0803341865539551e-07, 1.6205012798309326e-07, 2.1606683731079102e-07, 2.7008354663848877e-07, 3.241002559661865e-07, 3.781169652938843e-07, 4.3213367462158203e-07, 4.861503839492798e-07, 5.401670932769775e-07, 5.941838026046753e-07, 6.48200511932373e-07, 7.022172212600708e-07, 7.562339305877686e-07, 8.102506399154663e-07, 8.642673492431641e-07, 9.182840585708618e-07, 9.723007678985596e-07, 1.0263174772262573e-06, 1.080334186553955e-06, 1.1343508958816528e-06, 1.1883676052093506e-06, 1.2423843145370483e-06, 1.296401023864746e-06, 1.3504177331924438e-06, 1.4044344425201416e-06, 1.4584511518478394e-06, 1.5124678611755371e-06, 1.5664845705032349e-06, 1.6205012798309326e-06, 1.6745179891586304e-06, 1.7285346984863281e-06]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4091.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 17.0, 22.0, 29.0, 37.0, 62.0, 109.0, 208.0, 225.0, 113.0, 63.0, 44.0, 18.0, 12.0, 10.0, 12.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.104441917566874e-08, -7.896938569729173e-08, -7.689435221891472e-08, -7.481932584596507e-08, -7.274429236758806e-08, -7.066925888921105e-08, -6.859422541083404e-08, -6.651919193245703e-08, -6.444416555950738e-08, -6.236913208113037e-08, -6.029409860275337e-08, -5.8219068677090036e-08, -5.6144038751426706e-08, -5.40690052730497e-08, -5.199397179467269e-08, -4.991894186900936e-08, -4.784390839063235e-08, -4.576887491225534e-08, -4.369384498659201e-08, -4.1618811508215003e-08, -3.9543781582551674e-08, -3.7468748104174665e-08, -3.5393718178511335e-08, -3.331868470013433e-08, -3.124365122175732e-08, -2.916861951973715e-08, -2.709358781771698e-08, -2.501855433933997e-08, -2.294352441367664e-08, -2.0868490935299633e-08, -1.8793459233279464e-08, -1.6718427531259294e-08, -1.4643401158309644e-08, -1.2568369456289474e-08, -1.0493337754269305e-08, -8.418305164070716e-09, -6.343273462050547e-09, -4.268241760030378e-09, -2.193209169831789e-09, -1.1817746781161986e-10, 1.9568542342085493e-09, 4.0318859362287185e-09, 6.1069180823380975e-09, 8.181950228447477e-09, 1.0256981930467646e-08, 1.2332013632487815e-08, 1.4407046222686404e-08, 1.6482077924706573e-08, 1.8557109626726742e-08, 2.063214132874691e-08, 2.270717303076708e-08, 2.478220650914409e-08, 2.685723643480742e-08, 2.8932269913184427e-08, 3.1007303391561436e-08, 3.3082333317224766e-08, 3.5157363242888096e-08, 3.7232396721265104e-08, 3.9307426646928434e-08, 4.138246012530544e-08, 4.345749005096877e-08, 4.553252352934578e-08, 4.760755700772279e-08, 4.968258693338612e-08, 5.175762041176313e-08]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 9.0, 5.0, 7.0, 9.0, 8.0, 7.0, 13.0, 13.0, 12.0, 22.0, 31.0, 25.0, 24.0, 15.0, 24.0, 31.0, 39.0, 40.0, 37.0, 44.0, 27.0, 41.0, 22.0, 40.0, 40.0, 32.0, 40.0, 39.0, 37.0, 44.0, 22.0, 24.0, 28.0, 14.0, 21.0, 15.0, 20.0, 9.0, 12.0, 5.0, 8.0, 10.0, 3.0, 9.0, 6.0, 4.0, 2.0, 8.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 4.0], "bins": [-4.106736284370527e-08, -3.977901386065241e-08, -3.8490668430313235e-08, -3.720231944726038e-08, -3.59139740169212e-08, -3.4625625033868346e-08, -3.333727960352917e-08, -3.204893062047631e-08, -3.0760581637423456e-08, -2.947223443072744e-08, -2.8183887224031423e-08, -2.6895538240978567e-08, -2.560719281063939e-08, -2.4318843827586534e-08, -2.3030496620890517e-08, -2.17421494141945e-08, -2.0453803983855323e-08, -1.9165456777159307e-08, -1.787710957046329e-08, -1.6588760587410434e-08, -1.5300415157071257e-08, -1.401206706219682e-08, -1.2723718967322384e-08, -1.1435371760626367e-08, -1.014702455393035e-08, -8.858677347234334e-09, -7.570330140538317e-09, -6.281982045663881e-09, -4.993634838967864e-09, -3.7052876322718475e-09, -2.416939537397411e-09, -1.1285923307013945e-09, 1.5975842870830093e-10, 1.4481058574489225e-09, 2.736453286189544e-09, 4.024800936974771e-09, 5.313148143670787e-09, 6.601495350366804e-09, 7.88984344524124e-09, 9.178190651937257e-09, 1.0466537858633274e-08, 1.175488506532929e-08, 1.3043232272025307e-08, 1.4331580366899743e-08, 1.561992846177418e-08, 1.6908273892113357e-08, 1.8196622875166213e-08, 1.948497008186223e-08, 2.0773317288558246e-08, 2.2061664495254263e-08, 2.335001170195028e-08, 2.4638360685003136e-08, 2.5926706115342313e-08, 2.721505509839517e-08, 2.8503402305091186e-08, 2.9791749511787202e-08, 3.108009849484006e-08, 3.2368447477892914e-08, 3.365679290823209e-08, 3.494514189128495e-08, 3.6233487321624125e-08, 3.752183630467698e-08, 3.881018528772984e-08, 4.0098530718069014e-08, 4.138687614840819e-08]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 8.0, 9.0, 12.0, 13.0, 28.0, 29.0, 47.0, 81.0, 120.0, 232.0, 154.0, 78.0, 58.0, 36.0, 12.0, 27.0, 13.0, 8.0, 9.0, 6.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6762681787649854e-08, -3.520313285321208e-08, -3.364358036606063e-08, -3.208403143162286e-08, -3.052448249718509e-08, -2.896493001003364e-08, -2.740538107559587e-08, -2.584583036480126e-08, -2.4286279654006648e-08, -2.2726728943212038e-08, -2.1167178232417427e-08, -1.9607629297979656e-08, -1.8048078587185046e-08, -1.6488527876390435e-08, -1.4928978941952664e-08, -1.3369428231158054e-08, -1.1809877520363443e-08, -1.0250326809568833e-08, -8.690776986952642e-09, -7.131226720247241e-09, -5.571676453541841e-09, -4.01212574274723e-09, -2.4525759201310393e-09, -8.930260975148485e-10, 6.66524613279762e-10, 2.2260748799851626e-09, 3.785625146690563e-09, 5.345175413395964e-09, 6.9047256801013646e-09, 8.464276390895975e-09, 1.0023826213512166e-08, 1.1583376036128357e-08, 1.3142923194209288e-08, 1.4702473905003899e-08, 1.626202461579851e-08, 1.782157355023628e-08, 1.938112426103089e-08, 2.09406749718255e-08, 2.2500223906263273e-08, 2.4059774617057883e-08, 2.5619325327852494e-08, 2.7178876038647104e-08, 2.8738426749441714e-08, 3.0297975683879486e-08, 3.1857524618317257e-08, 3.3417077105468707e-08, 3.497662603990648e-08, 3.653617852705793e-08, 3.80957274614957e-08, 3.965527639593347e-08, 4.121482888308492e-08, 4.277437781752269e-08, 4.433393030467414e-08, 4.589347923911191e-08, 4.745302817354968e-08, 4.9012577107987454e-08, 5.0572129595138904e-08, 5.2131678529576675e-08, 5.3691231016728125e-08, 5.5250779951165896e-08, 5.681032888560367e-08, 5.836988137275512e-08, 5.992943385990657e-08, 6.148898279434434e-08, 6.304853172878211e-08]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 7.0, 8.0, 4.0, 14.0, 13.0, 15.0, 8.0, 23.0, 17.0, 30.0, 28.0, 28.0, 26.0, 27.0, 46.0, 35.0, 39.0, 30.0, 35.0, 43.0, 48.0, 38.0, 45.0, 34.0, 41.0, 46.0, 31.0, 31.0, 32.0, 29.0, 15.0, 16.0, 16.0, 20.0, 16.0, 10.0, 7.0, 6.0, 9.0, 9.0, 9.0, 6.0, 4.0, 3.0, 1.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.635405138562419e-08, -2.5521670110606465e-08, -2.468929061194558e-08, -2.3856909336927856e-08, -2.3024528061910132e-08, -2.2192146786892408e-08, -2.1359767288231524e-08, -2.05273860132138e-08, -1.9695004738196076e-08, -1.8862623463178352e-08, -1.8030243964517467e-08, -1.7197862689499743e-08, -1.636548141448202e-08, -1.5533100139464295e-08, -1.470072064080341e-08, -1.3868339365785687e-08, -1.3035959867124802e-08, -1.2203579480285498e-08, -1.1371198205267774e-08, -1.053881781842847e-08, -9.706436543410746e-09, -8.874056156571442e-09, -8.041675769732137e-09, -7.209294938803623e-09, -6.376914107875109e-09, -5.544533276946595e-09, -4.712152446018081e-09, -3.8797720591787765e-09, -3.0473912282502624e-09, -2.2150103973217483e-09, -1.382630010482444e-09, -5.502491795539299e-10, 2.821316513745842e-10, 1.1145123712807958e-09, 1.9468930911870075e-09, 2.7792737000709167e-09, 3.6116545309994308e-09, 4.444035361927945e-09, 5.276415748767249e-09, 6.108796579695763e-09, 6.941177410624277e-09, 7.773557797463582e-09, 8.605939072481306e-09, 9.43831945932061e-09, 1.0270699846159914e-08, 1.1103081121177638e-08, 1.1935461508016942e-08, 1.2767841894856247e-08, 1.360022316987397e-08, 1.4432603556713275e-08, 1.526498394355258e-08, 1.6097365218570303e-08, 1.6929746493588027e-08, 1.776212599224891e-08, 1.8594507267266636e-08, 1.942688854228436e-08, 2.0259268040945244e-08, 2.1091649315962968e-08, 2.1924028814623853e-08, 2.2756410089641577e-08, 2.35887913646593e-08, 2.4421172639677025e-08, 2.525355213833791e-08, 2.6085933413355633e-08, 2.6918314688373357e-08]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 3.0, 7.0, 7.0, 10.0, 15.0, 18.0, 38.0, 42.0, 80.0, 174.0, 262.0, 121.0, 73.0, 44.0, 37.0, 14.0, 9.0, 12.0, 8.0, 5.0, 1.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6490660332001426e-08, -2.5183718221910567e-08, -2.387677611181971e-08, -2.256983577808569e-08, -2.126289189163799e-08, -1.9955951557903973e-08, -1.8649009447813114e-08, -1.7342067337722256e-08, -1.6035125227631397e-08, -1.4728183117540539e-08, -1.342124100744968e-08, -1.2114299785537241e-08, -1.0807357675446383e-08, -9.500415565355524e-09, -8.193474343443086e-09, -6.886532233352227e-09, -5.579590123261369e-09, -4.27264801317051e-09, -2.9657063471688616e-09, -1.658764681167213e-09, -3.518225710763545e-10, 9.55119539014504e-10, 2.2620607609269427e-09, 3.5690028710178012e-09, 4.87594498110866e-09, 6.182887091199518e-09, 7.489829201290377e-09, 8.796770423202815e-09, 1.0103712533293674e-08, 1.1410654643384532e-08, 1.2717595865296971e-08, 1.402453797538783e-08, 1.533147653276501e-08, 1.6638418642855868e-08, 1.7945360752946726e-08, 1.9252301086680745e-08, 2.0559244973128443e-08, 2.1866185306862462e-08, 2.317312741695332e-08, 2.448006952704418e-08, 2.5787011637135038e-08, 2.7093953747225896e-08, 2.8400895857316755e-08, 2.9707837967407613e-08, 3.101477830114163e-08, 3.232172218758933e-08, 3.362866252132335e-08, 3.493560285505737e-08, 3.6242546741505066e-08, 3.7549487075239085e-08, 3.885643096168678e-08, 4.01633712954208e-08, 4.14703151818685e-08, 4.277725551560252e-08, 4.408419584933654e-08, 4.5391139735784236e-08, 4.6698083622231934e-08, 4.800502395596595e-08, 4.931196784241365e-08, 5.061890817614767e-08, 5.192585206259537e-08, 5.323279239632939e-08, 5.4539732730063406e-08, 5.5846676616511104e-08, 5.715361695024512e-08]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 11.0, 8.0, 9.0, 7.0, 12.0, 16.0, 32.0, 23.0, 23.0, 28.0, 27.0, 31.0, 34.0, 29.0, 37.0, 44.0, 33.0, 48.0, 39.0, 46.0, 39.0, 39.0, 43.0, 33.0, 48.0, 30.0, 28.0, 25.0, 17.0, 19.0, 25.0, 17.0, 18.0, 9.0, 10.0, 7.0, 9.0, 9.0, 8.0, 7.0, 8.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2.0418555735091104e-08, -1.9784550886470242e-08, -1.915054781420622e-08, -1.851654296558536e-08, -1.7882538116964497e-08, -1.7248535044700475e-08, -1.6614530196079613e-08, -1.598052534745875e-08, -1.534652227519473e-08, -1.4712518314752288e-08, -1.4078513466131426e-08, -1.3444509505688984e-08, -1.2810505545246542e-08, -1.21765015848041e-08, -1.1542496736183239e-08, -1.0908492775740797e-08, -1.0274487927119935e-08, -9.640483966677493e-09, -9.006479118056632e-09, -8.37247515761419e-09, -7.738471197171748e-09, -7.104466792640096e-09, -6.4704623881084444e-09, -5.8364584276660025e-09, -5.202454023134351e-09, -4.568449618602699e-09, -3.934445658160257e-09, -3.3004412536286054e-09, -2.6664370711415586e-09, -2.0324328886545118e-09, -1.39842848412286e-09, -7.644245236804181e-10, -1.304201191487664e-10, 5.035841188494317e-10, 1.1375883568476297e-09, 1.771592650356979e-09, 2.405596832844026e-09, 3.0396010153310726e-09, 3.6736054198627244e-09, 4.307609380305166e-09, 4.941613784836818e-09, 5.57561818936847e-09, 6.209622149810912e-09, 6.843626554342563e-09, 7.477630958874215e-09, 8.111634919316657e-09, 8.745638879759099e-09, 9.37964372837996e-09, 1.0013647688822402e-08, 1.0647651649264844e-08, 1.1281656497885706e-08, 1.1915660458328148e-08, 1.254966441877059e-08, 1.3183669267391451e-08, 1.3817673227833893e-08, 1.4451677188276335e-08, 1.5085682036897197e-08, 1.5719686885518058e-08, 1.635368995778208e-08, 1.6987694806402942e-08, 1.7621699655023804e-08, 1.8255702727287826e-08, 1.8889707575908687e-08, 1.952371064817271e-08, 2.015771549679357e-08]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4096.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 12.0, 10.0, 21.0, 33.0, 73.0, 197.0, 282.0, 195.0, 79.0, 45.0, 25.0, 15.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.237740907659827e-09, -5.129732194575354e-09, -5.0217239255800905e-09, -4.913715212495617e-09, -4.805706943500354e-09, -4.697698230415881e-09, -4.589689961420618e-09, -4.4816812483361446e-09, -4.373672979340881e-09, -4.265664266256408e-09, -4.157655997261145e-09, -4.049647284176672e-09, -3.9416390151814085e-09, -3.833630302096935e-09, -3.725622033101672e-09, -3.617613320017199e-09, -3.5096048289773307e-09, -3.4015963379374625e-09, -3.2935878468975943e-09, -3.185579355857726e-09, -3.077570864817858e-09, -2.9695623737779897e-09, -2.8615536606935166e-09, -2.7535453916982533e-09, -2.64553667861378e-09, -2.537528187573912e-09, -2.4295196965340438e-09, -2.3215112054941756e-09, -2.2135027144543074e-09, -2.105494223414439e-09, -1.997485732374571e-09, -1.889477019290098e-09, -1.781468639272532e-09, -1.6734601482326639e-09, -1.5654516571927957e-09, -1.457443055130625e-09, -1.3494345640907568e-09, -1.2414260730508886e-09, -1.1334175820110204e-09, -1.0254090909711522e-09, -9.17400599931284e-10, -8.093921088914158e-10, -7.013836178515476e-10, -5.933750713005281e-10, -4.853665802606599e-10, -3.7735808922079173e-10, -2.693495426697723e-10, -1.6134105162990409e-10, -5.333256059003588e-11, 5.467594432762013e-11, 1.6268444924527614e-10, 2.7069296804071996e-10, 3.7870145908058817e-10, 4.867099501204564e-10, 5.947184966714758e-10, 7.02726987711344e-10, 8.107354787512122e-10, 9.187439697910804e-10, 1.0267524608309486e-09, 1.1347609518708168e-09, 1.242769442910685e-09, 1.3507779339505532e-09, 1.458786536012724e-09, 1.5667950270525921e-09, 1.6748035180924603e-09]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 7.0, 8.0, 6.0, 10.0, 12.0, 15.0, 16.0, 19.0, 29.0, 21.0, 27.0, 24.0, 23.0, 41.0, 32.0, 38.0, 29.0, 48.0, 50.0, 43.0, 46.0, 49.0, 33.0, 27.0, 36.0, 44.0, 27.0, 33.0, 29.0, 19.0, 26.0, 13.0, 19.0, 17.0, 13.0, 8.0, 11.0, 7.0, 6.0, 9.0, 7.0, 10.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.4582792751127727e-09, -1.4115654201063421e-09, -1.3648515650999116e-09, -1.318137710093481e-09, -1.2714238550870505e-09, -1.2247098890583175e-09, -1.177996034051887e-09, -1.1312821790454564e-09, -1.0845683240390258e-09, -1.0378544690325953e-09, -9.911406140261647e-10, -9.444267590197342e-10, -8.977128485021524e-10, -8.509989934957218e-10, -8.042850829781401e-10, -7.575712279717095e-10, -7.10857372965279e-10, -6.641435179588484e-10, -6.174296629524179e-10, -5.707157524348361e-10, -5.240018974284055e-10, -4.77288042421975e-10, -4.305741596599688e-10, -3.8386027689796265e-10, -3.371464218915321e-10, -2.9043256688510155e-10, -2.437186841230954e-10, -1.9700481523887703e-10, -1.5029094635465867e-10, -1.0357709134822812e-10, -5.686320858622196e-11, -1.0149325824215794e-11, 3.656464020451722e-11, 8.327850908873558e-11, 1.2999237797295393e-10, 1.767062468571723e-10, 2.2342011574139065e-10, 2.701339707478212e-10, 3.1684785350982736e-10, 3.635617362718335e-10, 4.1027559127826407e-10, 4.569894462846946e-10, 5.037033012911252e-10, 5.50417211808707e-10, 5.971310668151375e-10, 6.43844921821568e-10, 6.905588323391498e-10, 7.372726873455804e-10, 7.839865423520109e-10, 8.307003973584415e-10, 8.77414252364872e-10, 9.241281628824538e-10, 9.708420734000356e-10, 1.0175558173841637e-09, 1.0642697834128967e-09, 1.1109836384193272e-09, 1.1576974934257578e-09, 1.2044113484321883e-09, 1.2511252034386189e-09, 1.2978390584450494e-09, 1.34455291345148e-09, 1.391266879480213e-09, 1.4379807344866435e-09, 1.484694589493074e-09, 1.5314084444995046e-09]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 7.0, 2.0, 10.0, 13.0, 21.0, 27.0, 26.0, 50.0, 72.0, 123.0, 152.0, 143.0, 97.0, 70.0, 52.0, 26.0, 19.0, 20.0, 17.0, 10.0, 10.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3352978722735998e-09, -1.2871537169445446e-09, -1.2390095616154895e-09, -1.1908652952641319e-09, -1.1427211399350767e-09, -1.0945769846060216e-09, -1.046432718254664e-09, -9.982885629256089e-10, -9.501444075965537e-10, -9.020002522674986e-10, -8.538560414272922e-10, -8.057118305870858e-10, -7.575676752580307e-10, -7.094235199289756e-10, -6.612793090887692e-10, -6.131350982485628e-10, -5.649909429195077e-10, -5.168467875904525e-10, -4.687025767502462e-10, -4.2055839366561543e-10, -3.7241421058098467e-10, -3.242700274963539e-10, -2.7612584441172316e-10, -2.279816613270924e-10, -1.7983747824246166e-10, -1.316932951578309e-10, -8.354911207320015e-11, -3.5404928988569395e-11, 1.2739254096061359e-11, 6.088343718069211e-11, 1.0902762026532287e-10, 1.5717180334995362e-10, 2.0531609745688684e-10, 2.534602805415176e-10, 3.0160446362614834e-10, 3.497486467107791e-10, 3.9789282979540985e-10, 4.460370128800406e-10, 4.941811959646714e-10, 5.423254068048777e-10, 5.904695621339329e-10, 6.38613717462988e-10, 6.867579283031944e-10, 7.349021391434007e-10, 7.830462944724559e-10, 8.31190449801511e-10, 8.793346606417174e-10, 9.274788714819238e-10, 9.75623026810979e-10, 1.023767182140034e-09, 1.0719114484913916e-09, 1.1200556038204468e-09, 1.168199759149502e-09, 1.216343914478557e-09, 1.2644880698076122e-09, 1.3126323361589698e-09, 1.360776491488025e-09, 1.40892064681708e-09, 1.4570649131684377e-09, 1.5052090684974928e-09, 1.553353223826548e-09, 1.601497379155603e-09, 1.6496415344846582e-09, 1.6977858008360158e-09, 1.745929956165071e-09]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 11.0, 3.0, 6.0, 8.0, 13.0, 24.0, 23.0, 24.0, 27.0, 26.0, 27.0, 26.0, 29.0, 40.0, 44.0, 40.0, 39.0, 58.0, 51.0, 37.0, 48.0, 24.0, 34.0, 33.0, 33.0, 42.0, 29.0, 26.0, 22.0, 15.0, 19.0, 20.0, 16.0, 7.0, 15.0, 5.0, 8.0, 12.0, 8.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.17931342048206e-10, -8.881635427115953e-10, -8.583956878638332e-10, -8.286278885272225e-10, -7.988600891906117e-10, -7.690922343428497e-10, -7.393244350062389e-10, -7.095566356696281e-10, -6.797887808218661e-10, -6.500209814852553e-10, -6.202531266374933e-10, -5.904853273008825e-10, -5.607174724531205e-10, -5.309496731165098e-10, -5.01181873779899e-10, -4.71414018932137e-10, -4.416462195955262e-10, -4.118783925033398e-10, -3.821105654111534e-10, -3.523427660745426e-10, -3.2257493898235623e-10, -2.9280711189016984e-10, -2.6303931255355906e-10, -2.3327148546137266e-10, -2.0350365836918627e-10, -1.7373583127699987e-10, -1.439680180626013e-10, -1.142001979093088e-10, -8.443237775601631e-11, -5.4664550663829914e-11, -2.4896737449431328e-11, 4.871075764967259e-12, 3.463884734600242e-11, 6.440666749929491e-11, 9.41744876525874e-11, 1.23942300866986e-10, 1.5371012795917238e-10, 1.8347795505135878e-10, 2.1324576826575736e-10, 2.4301358148015595e-10, 2.7278140857234234e-10, 3.0254923566452874e-10, 3.3231706275671513e-10, 3.620848620933259e-10, 3.918526891855123e-10, 4.216205162776987e-10, 4.513883156143095e-10, 4.811561149509203e-10, 5.109239697986823e-10, 5.40691769135293e-10, 5.704596239830551e-10, 6.002274233196658e-10, 6.299952781674278e-10, 6.597630775040386e-10, 6.895308768406494e-10, 7.192987316884114e-10, 7.490665310250222e-10, 7.78834330361633e-10, 8.08602185209395e-10, 8.383699845460058e-10, 8.681377838826165e-10, 8.979056387303785e-10, 9.276734380669893e-10, 9.574412374036e-10, 9.872090922513621e-10]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 11.0, 46.0, 475.0, 421.0, 39.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0464839661494807e-08, -1.0215508439159748e-08, -9.96617632864627e-09, -9.716845106311212e-09, -9.467513883976153e-09, -9.218181773462675e-09, -8.968850551127616e-09, -8.719519328792558e-09, -8.470188106457499e-09, -8.22085688412244e-09, -7.971524773608962e-09, -7.722193551273904e-09, -7.472862328938845e-09, -7.223530662514577e-09, -6.974198996090308e-09, -6.72486777375525e-09, -6.4755356632417715e-09, -6.226203996817503e-09, -5.9768727744824446e-09, -5.727541108058176e-09, -5.478209885723118e-09, -5.228878219298849e-09, -4.979546552874581e-09, -4.730215330539522e-09, -4.480883664115254e-09, -4.2315519976909854e-09, -3.982220775355927e-09, -3.7328891089316585e-09, -3.483557664551995e-09, -3.2342262201723315e-09, -2.984894553748063e-09, -2.7355631093683996e-09, -2.4862312208995263e-09, -2.236899776519863e-09, -1.9875683321401993e-09, -1.738236665715931e-09, -1.4889052213362675e-09, -1.239573776956604e-09, -9.90242221554638e-10, -7.409106661526721e-10, -4.915792217730086e-10, -2.422477218821939e-10, 7.083778008620811e-12, 2.564152778994355e-10, 5.057467777902502e-10, 7.550782221699137e-10, 1.0044097775718797e-09, 1.2537413329738456e-09, 1.503072777353509e-09, 1.7524042217331726e-09, 2.001735666112836e-09, 2.2510673325371044e-09, 2.500398776916768e-09, 2.7497302212964314e-09, 2.9990618877207e-09, 3.2483933321003633e-09, 3.4977247764800268e-09, 3.747056442904295e-09, 3.996387665239354e-09, 4.245719331663622e-09, 4.495050553998681e-09, 4.744382220422949e-09, 4.9937138868472175e-09, 5.243045109182276e-09, 5.4923767756065445e-09]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 7.0, 10.0, 14.0, 13.0, 19.0, 20.0, 23.0, 23.0, 26.0, 24.0, 23.0, 32.0, 32.0, 44.0, 54.0, 39.0, 55.0, 49.0, 47.0, 45.0, 40.0, 33.0, 38.0, 38.0, 39.0, 25.0, 25.0, 21.0, 22.0, 18.0, 18.0, 12.0, 5.0, 8.0, 10.0, 4.0, 12.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.6528668151115653e-09, -2.5692743488292535e-09, -2.4856818825469418e-09, -2.402089194220025e-09, -2.3184967279377133e-09, -2.2349042616554016e-09, -2.15131179537309e-09, -2.067719329090778e-09, -1.9841266407638614e-09, -1.9005341744815496e-09, -1.8169415971769354e-09, -1.7333491308946236e-09, -1.6497565535900094e-09, -1.5661640873076976e-09, -1.4825716210253859e-09, -1.3989791547430741e-09, -1.3153866884607623e-09, -1.2317942221784506e-09, -1.1482016448738364e-09, -1.0646091785915246e-09, -9.810166012869104e-10, -8.974241350045986e-10, -8.138316687222868e-10, -7.302391469288239e-10, -6.466466251353609e-10, -5.630541033418979e-10, -4.794615815484349e-10, -3.958691152661231e-10, -3.122765934726601e-10, -2.2868407167919713e-10, -1.4509160539688537e-10, -6.149908360342238e-11, 2.209366023464554e-11, 1.0568616815032073e-10, 1.892786760659959e-10, 2.728711701038833e-10, 3.564636918973463e-10, 4.4005621369080927e-10, 5.23648679973121e-10, 6.07241201766584e-10, 6.90833723560047e-10, 7.7442624535351e-10, 8.58018767146973e-10, 9.416112334292848e-10, 1.0252036997115965e-09, 1.1087962770162108e-09, 1.1923887432985225e-09, 1.2759813206031367e-09, 1.3595737868854485e-09, 1.4431662531677603e-09, 1.5267588304723745e-09, 1.6103512967546862e-09, 1.6939438740593005e-09, 1.7775363403416122e-09, 1.861128806623924e-09, 1.9447212729062358e-09, 2.0283139612331524e-09, 2.111906427515464e-09, 2.195498893797776e-09, 2.2790915821246926e-09, 2.3626840484070044e-09, 2.446276514689316e-09, 2.529868980971628e-09, 2.6134614472539397e-09, 2.6970539135362515e-09]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 5.0, 7.0, 8.0, 11.0, 15.0, 22.0, 22.0, 17.0, 23.0, 25.0, 25.0, 23.0, 35.0, 39.0, 59.0, 95.0, 170.0, 544.0, 508410.0, 13583.0, 524.0, 168.0, 77.0, 65.0, 54.0, 34.0, 30.0, 21.0, 24.0, 18.0, 20.0, 11.0, 14.0, 6.0, 10.0, 10.0, 6.0, 4.0, 6.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.5971146183346718e-08, -1.5455729140967378e-08, -1.4940313874944877e-08, -1.4424897720743957e-08, -1.3909481566543036e-08, -1.3394065412342115e-08, -1.2878649258141195e-08, -1.2363233103940274e-08, -1.1847816949739354e-08, -1.1332400795538433e-08, -1.0816984641337513e-08, -1.0301568487136592e-08, -9.786152332935671e-09, -9.270736178734751e-09, -8.75532002453383e-09, -8.23990387033291e-09, -7.724487716131989e-09, -7.2090715619310686e-09, -6.693655407730148e-09, -6.1782392535292274e-09, -5.662823099328307e-09, -5.147406945127386e-09, -4.631990790926466e-09, -4.116574636725545e-09, -3.6011584825246246e-09, -3.085742328323704e-09, -2.5703261741227834e-09, -2.054910019921863e-09, -1.5394938657209423e-09, -1.0240777115200217e-09, -5.086615573191011e-10, 6.754596881819452e-12, 5.221725274395794e-10, 1.0375886816405e-09, 1.5530048358414206e-09, 2.068420990042341e-09, 2.5838371442432617e-09, 3.0992532984441823e-09, 3.614669452645103e-09, 4.1300856068460234e-09, 4.645501761046944e-09, 5.1609179152478646e-09, 5.676334069448785e-09, 6.191750223649706e-09, 6.707166377850626e-09, 7.222582532051547e-09, 7.737998686252467e-09, 8.253414840453388e-09, 8.768830994654309e-09, 9.284247148855229e-09, 9.79966330305615e-09, 1.031507945725707e-08, 1.0830495611457991e-08, 1.1345911765658911e-08, 1.1861327919859832e-08, 1.2376744074060753e-08, 1.2892160228261673e-08, 1.3407576382462594e-08, 1.3922992536663514e-08, 1.4438408690864435e-08, 1.4953824845065355e-08, 1.5469240111087856e-08, 1.5984657153467197e-08, 1.6500074195846537e-08, 1.7015489461869038e-08]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 6.0, 9.0, 9.0, 10.0, 16.0, 20.0, 20.0, 20.0, 20.0, 37.0, 24.0, 26.0, 34.0, 46.0, 36.0, 37.0, 58.0, 75.0, 1077.0, 42.0, 48.0, 38.0, 39.0, 41.0, 40.0, 21.0, 20.0, 21.0, 14.0, 18.0, 25.0, 8.0, 8.0, 10.0, 7.0, 9.0, 11.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0], "bins": [-1.9262818895526834e-08, -1.8698623094337563e-08, -1.8134427293148292e-08, -1.757022971560218e-08, -1.700603391441291e-08, -1.644183811322364e-08, -1.5877642312034368e-08, -1.5313446510845097e-08, -1.4749248933298986e-08, -1.4185053132109715e-08, -1.3620856442742024e-08, -1.3056660641552753e-08, -1.2492463952185062e-08, -1.1928268150995791e-08, -1.136407234980652e-08, -1.0799875660438829e-08, -1.0235679859249558e-08, -9.671484058060287e-09, -9.107287368692596e-09, -8.543091567503325e-09, -7.978894878135634e-09, -7.414699076946363e-09, -6.850502831667882e-09, -6.286306586389401e-09, -5.72211034111092e-09, -5.157914095832439e-09, -4.593717850553958e-09, -4.029521605275477e-09, -3.4653255820416007e-09, -2.9011293367631197e-09, -2.3369333135292436e-09, -1.7727370682507626e-09, -1.2085408229722816e-09, -6.443446332049518e-10, -8.014844343762206e-11, 4.840476908185565e-10, 1.0482439360970375e-09, 1.6124401813755185e-09, 2.1766362046093946e-09, 2.7408324498878756e-09, 3.3050286951663566e-09, 3.8692249404448376e-09, 4.4334211857233186e-09, 4.9976174310017996e-09, 5.561813232191071e-09, 6.1260099215587616e-09, 6.690205722748033e-09, 7.254401968026514e-09, 7.818598213304995e-09, 8.382794014494266e-09, 8.946990703861957e-09, 9.511186505051228e-09, 1.0075383194418919e-08, 1.063957899560819e-08, 1.120377568497588e-08, 1.1767971486165152e-08, 1.2332167287354423e-08, 1.2896363088543694e-08, 1.3460559777911385e-08, 1.4024755579100656e-08, 1.4588952268468347e-08, 1.5153148069657618e-08, 1.571734387084689e-08, 1.628153967203616e-08, 1.684573724958227e-08]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 13.0, 8.0, 21.0, 33.0, 50.0, 71.0, 106.0, 182.0, 293.0, 503.0, 864.0, 1454.0, 3139.0, 8441.0, 26030.0, 87766.0, 31066648.0, 39099.0, 13621.0, 2891.0, 1327.0, 680.0, 446.0, 288.0, 194.0, 131.0, 79.0, 52.0, 33.0, 11.0, 8.0, 9.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-245.75, -238.5625, -231.375, -224.1875, -217.0, -209.8125, -202.625, -195.4375, -188.25, -181.0625, -173.875, -166.6875, -159.5, -152.3125, -145.125, -137.9375, -130.75, -123.5625, -116.375, -109.1875, -102.0, -94.8125, -87.625, -80.4375, -73.25, -66.0625, -58.875, -51.6875, -44.5, -37.3125, -30.125, -22.9375, -15.75, -8.5625, -1.375, 5.8125, 13.0, 20.1875, 27.375, 34.5625, 41.75, 48.9375, 56.125, 63.3125, 70.5, 77.6875, 84.875, 92.0625, 99.25, 106.4375, 113.625, 120.8125, 128.0, 135.1875, 142.375, 149.5625, 156.75, 163.9375, 171.125, 178.3125, 185.5, 192.6875, 199.875, 207.0625, 214.25]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 11.0, 13.0, 20.0, 26.0, 45.0, 101.0, 147.0, 212.0, 287.0, 425.0, 648.0, 862.0, 1474.0, 2331.0, 3562.0, 5786.0, 9778.0, 17239.0, 30881.0, 58778.0, 118366.0, 274996.0, 900551.0, 3776804.0, 648144.0, 224415.0, 100541.0, 50625.0, 26505.0, 15142.0, 8693.0, 5192.0, 3217.0, 1929.0, 1272.0, 826.0, 563.0, 352.0, 223.0, 155.0, 91.0, 49.0, 53.0, 41.0, 25.0, 10.0, 6.0, 11.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.578125, -5.40045166015625, -5.2227783203125, -5.04510498046875, -4.867431640625, -4.68975830078125, -4.5120849609375, -4.33441162109375, -4.15673828125, -3.97906494140625, -3.8013916015625, -3.62371826171875, -3.446044921875, -3.26837158203125, -3.0906982421875, -2.91302490234375, -2.7353515625, -2.55767822265625, -2.3800048828125, -2.20233154296875, -2.024658203125, -1.84698486328125, -1.6693115234375, -1.49163818359375, -1.31396484375, -1.13629150390625, -0.9586181640625, -0.78094482421875, -0.603271484375, -0.42559814453125, -0.2479248046875, -0.07025146484375, 0.107421875, 0.28509521484375, 0.4627685546875, 0.64044189453125, 0.818115234375, 0.99578857421875, 1.1734619140625, 1.35113525390625, 1.52880859375, 1.70648193359375, 1.8841552734375, 2.06182861328125, 2.239501953125, 2.41717529296875, 2.5948486328125, 2.77252197265625, 2.9501953125, 3.12786865234375, 3.3055419921875, 3.48321533203125, 3.660888671875, 3.83856201171875, 4.0162353515625, 4.19390869140625, 4.37158203125, 4.54925537109375, 4.7269287109375, 4.90460205078125, 5.082275390625, 5.25994873046875, 5.4376220703125, 5.61529541015625, 5.79296875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 4.0, 9.0, 12.0, 20.0, 16.0, 17.0, 36.0, 41.0, 59.0, 90.0, 139.0, 234.0, 507.0, 326.0, 144.0, 76.0, 62.0, 46.0, 40.0, 23.0, 21.0, 16.0, 14.0, 9.0, 12.0, 8.0, 7.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.8077392578125, -7.537353515625, -7.2669677734375, -6.99658203125, -6.7261962890625, -6.455810546875, -6.1854248046875, -5.9150390625, -5.6446533203125, -5.374267578125, -5.1038818359375, -4.83349609375, -4.5631103515625, -4.292724609375, -4.0223388671875, -3.751953125, -3.4815673828125, -3.211181640625, -2.9407958984375, -2.67041015625, -2.4000244140625, -2.129638671875, -1.8592529296875, -1.5888671875, -1.3184814453125, -1.048095703125, -0.7777099609375, -0.50732421875, -0.2369384765625, 0.033447265625, 0.3038330078125, 0.57421875, 0.8446044921875, 1.114990234375, 1.3853759765625, 1.65576171875, 1.9261474609375, 2.196533203125, 2.4669189453125, 2.7373046875, 3.0076904296875, 3.278076171875, 3.5484619140625, 3.81884765625, 4.0892333984375, 4.359619140625, 4.6300048828125, 4.900390625, 5.1707763671875, 5.441162109375, 5.7115478515625, 5.98193359375, 6.2523193359375, 6.522705078125, 6.7930908203125, 7.0634765625, 7.3338623046875, 7.604248046875, 7.8746337890625, 8.14501953125, 8.4154052734375, 8.685791015625, 8.9561767578125, 9.2265625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 8.0, 7.0, 7.0, 3.0, 17.0, 11.0, 32.0, 25.0, 63.0, 69.0, 55.0, 84.0, 112.0, 151.0, 204.0, 277.0, 447.0, 657.0, 808.0, 1091.0, 1644.0, 2446.0, 3805.0, 5744.0, 9217.0, 15795.0, 28035.0, 53250.0, 117769.0, 368037.0, 4450950.0, 875402.0, 188023.0, 76030.0, 36841.0, 20341.0, 11770.0, 7406.0, 4702.0, 3114.0, 2100.0, 1554.0, 948.0, 633.0, 484.0, 303.0, 233.0, 187.0, 149.0, 126.0, 69.0, 62.0, 35.0, 40.0, 16.0, 14.0, 13.0, 7.0, 3.0, 11.0, 6.0, 8.0, 3.0], "bins": [-8.3359375, -8.0732421875, -7.810546875, -7.5478515625, -7.28515625, -7.0224609375, -6.759765625, -6.4970703125, -6.234375, -5.9716796875, -5.708984375, -5.4462890625, -5.18359375, -4.9208984375, -4.658203125, -4.3955078125, -4.1328125, -3.8701171875, -3.607421875, -3.3447265625, -3.08203125, -2.8193359375, -2.556640625, -2.2939453125, -2.03125, -1.7685546875, -1.505859375, -1.2431640625, -0.98046875, -0.7177734375, -0.455078125, -0.1923828125, 0.0703125, 0.3330078125, 0.595703125, 0.8583984375, 1.12109375, 1.3837890625, 1.646484375, 1.9091796875, 2.171875, 2.4345703125, 2.697265625, 2.9599609375, 3.22265625, 3.4853515625, 3.748046875, 4.0107421875, 4.2734375, 4.5361328125, 4.798828125, 5.0615234375, 5.32421875, 5.5869140625, 5.849609375, 6.1123046875, 6.375, 6.6376953125, 6.900390625, 7.1630859375, 7.42578125, 7.6884765625, 7.951171875, 8.2138671875, 8.4765625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 3.0, 5.0, 4.0, 4.0, 6.0, 10.0, 12.0, 10.0, 10.0, 8.0, 21.0, 27.0, 25.0, 37.0, 49.0, 58.0, 79.0, 111.0, 230.0, 587.0, 258.0, 132.0, 68.0, 36.0, 42.0, 32.0, 24.0, 19.0, 18.0, 19.0, 20.0, 12.0, 10.0, 5.0, 11.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.0703125, -12.682861328125, -12.29541015625, -11.907958984375, -11.5205078125, -11.133056640625, -10.74560546875, -10.358154296875, -9.970703125, -9.583251953125, -9.19580078125, -8.808349609375, -8.4208984375, -8.033447265625, -7.64599609375, -7.258544921875, -6.87109375, -6.483642578125, -6.09619140625, -5.708740234375, -5.3212890625, -4.933837890625, -4.54638671875, -4.158935546875, -3.771484375, -3.384033203125, -2.99658203125, -2.609130859375, -2.2216796875, -1.834228515625, -1.44677734375, -1.059326171875, -0.671875, -0.284423828125, 0.10302734375, 0.490478515625, 0.8779296875, 1.265380859375, 1.65283203125, 2.040283203125, 2.427734375, 2.815185546875, 3.20263671875, 3.590087890625, 3.9775390625, 4.364990234375, 4.75244140625, 5.139892578125, 5.52734375, 5.914794921875, 6.30224609375, 6.689697265625, 7.0771484375, 7.464599609375, 7.85205078125, 8.239501953125, 8.626953125, 9.014404296875, 9.40185546875, 9.789306640625, 10.1767578125, 10.564208984375, 10.95166015625, 11.339111328125, 11.7265625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 0.0, 0.0, 2.0, 7.0, 18.0, 3.0, 13.0, 21.0, 5.0, 19.0, 36.0, 44.0, 66.0, 106.0, 86.0, 184.0, 214.0, 248.0, 391.0, 501.0, 882.0, 1261.0, 1944.0, 3410.0, 6323.0, 13664.0, 42827.0, 5903419.0, 257182.0, 32826.0, 11886.0, 5379.0, 2887.0, 1792.0, 1124.0, 747.0, 520.0, 383.0, 246.0, 166.0, 155.0, 141.0, 54.0, 80.0, 41.0, 26.0, 29.0, 24.0, 26.0, 6.0, 0.0, 9.0, 6.0, 0.0, 8.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-63.59375, -61.53564453125, -59.4775390625, -57.41943359375, -55.361328125, -53.30322265625, -51.2451171875, -49.18701171875, -47.12890625, -45.07080078125, -43.0126953125, -40.95458984375, -38.896484375, -36.83837890625, -34.7802734375, -32.72216796875, -30.6640625, -28.60595703125, -26.5478515625, -24.48974609375, -22.431640625, -20.37353515625, -18.3154296875, -16.25732421875, -14.19921875, -12.14111328125, -10.0830078125, -8.02490234375, -5.966796875, -3.90869140625, -1.8505859375, 0.20751953125, 2.265625, 4.32373046875, 6.3818359375, 8.43994140625, 10.498046875, 12.55615234375, 14.6142578125, 16.67236328125, 18.73046875, 20.78857421875, 22.8466796875, 24.90478515625, 26.962890625, 29.02099609375, 31.0791015625, 33.13720703125, 35.1953125, 37.25341796875, 39.3115234375, 41.36962890625, 43.427734375, 45.48583984375, 47.5439453125, 49.60205078125, 51.66015625, 53.71826171875, 55.7763671875, 57.83447265625, 59.892578125, 61.95068359375, 64.0087890625, 66.06689453125, 68.125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 7.0, 5.0, 8.0, 11.0, 8.0, 16.0, 16.0, 21.0, 18.0, 15.0, 22.0, 25.0, 29.0, 43.0, 53.0, 81.0, 165.0, 682.0, 354.0, 105.0, 45.0, 52.0, 36.0, 34.0, 32.0, 29.0, 21.0, 14.0, 13.0, 9.0, 12.0, 8.0, 11.0, 6.0, 7.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.421875, -20.72705078125, -20.0322265625, -19.33740234375, -18.642578125, -17.94775390625, -17.2529296875, -16.55810546875, -15.86328125, -15.16845703125, -14.4736328125, -13.77880859375, -13.083984375, -12.38916015625, -11.6943359375, -10.99951171875, -10.3046875, -9.60986328125, -8.9150390625, -8.22021484375, -7.525390625, -6.83056640625, -6.1357421875, -5.44091796875, -4.74609375, -4.05126953125, -3.3564453125, -2.66162109375, -1.966796875, -1.27197265625, -0.5771484375, 0.11767578125, 0.8125, 1.50732421875, 2.2021484375, 2.89697265625, 3.591796875, 4.28662109375, 4.9814453125, 5.67626953125, 6.37109375, 7.06591796875, 7.7607421875, 8.45556640625, 9.150390625, 9.84521484375, 10.5400390625, 11.23486328125, 11.9296875, 12.62451171875, 13.3193359375, 14.01416015625, 14.708984375, 15.40380859375, 16.0986328125, 16.79345703125, 17.48828125, 18.18310546875, 18.8779296875, 19.57275390625, 20.267578125, 20.96240234375, 21.6572265625, 22.35205078125, 23.046875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 16.0, 83.0, 845.0, 34.0, 11.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-406.57421875, -390.4063415527344, -374.23846435546875, -358.0705871582031, -341.9027099609375, -325.73486328125, -309.5669860839844, -293.39910888671875, -277.2312316894531, -261.0633544921875, -244.89547729492188, -228.7276153564453, -212.5597381591797, -196.39186096191406, -180.2239990234375, -164.05612182617188, -147.88824462890625, -131.72036743164062, -115.55249786376953, -99.38462829589844, -83.21675109863281, -67.04887390136719, -50.881004333496094, -34.713134765625, -18.545257568359375, -2.3773841857910156, 13.790489196777344, 29.958362579345703, 46.12623596191406, 62.29411315917969, 78.46198272705078, 94.62985229492188, 110.7977294921875, 126.96560668945312, 143.13348388671875, 159.3013458251953, 175.46922302246094, 191.63710021972656, 207.80496215820312, 223.97283935546875, 240.14071655273438, 256.30859375, 272.4764709472656, 288.64434814453125, 304.81219482421875, 320.9801025390625, 337.14794921875, 353.3158264160156, 369.48370361328125, 385.6515808105469, 401.8194580078125, 417.9873352050781, 434.15521240234375, 450.32305908203125, 466.4909362792969, 482.6588134765625, 498.8266906738281, 514.9945678710938, 531.1624145507812, 547.330322265625, 563.4981689453125, 579.6660766601562, 595.8339233398438, 612.0018310546875, 628.169677734375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 27.0, 34.0, 794.0, 84.0, 34.0, 6.0, 13.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-670.26220703125, -653.452392578125, -636.6426391601562, -619.8328247070312, -603.0230712890625, -586.2132568359375, -569.4034423828125, -552.5936889648438, -535.7838745117188, -518.9740600585938, -502.164306640625, -485.3544921875, -468.5447082519531, -451.73492431640625, -434.92510986328125, -418.1153259277344, -401.3055419921875, -384.4957580566406, -367.68597412109375, -350.87615966796875, -334.0663757324219, -317.256591796875, -300.44677734375, -283.6369934082031, -266.82720947265625, -250.01742553710938, -233.20762634277344, -216.3978271484375, -199.58804321289062, -182.77825927734375, -165.9684600830078, -149.15866088867188, -132.348876953125, -115.5390853881836, -98.72929382324219, -81.91950225830078, -65.10971069335938, -48.29991912841797, -31.490127563476562, -14.680335998535156, 2.12945556640625, 18.939247131347656, 35.74903869628906, 52.55883026123047, 69.36862182617188, 86.17841339111328, 102.98820495605469, 119.7979965209961, 136.6077880859375, 153.41757202148438, 170.2273712158203, 187.03717041015625, 203.84695434570312, 220.65673828125, 237.46653747558594, 254.27633666992188, 271.08612060546875, 287.8959045410156, 304.7056884765625, 321.5155029296875, 338.3252868652344, 355.13507080078125, 371.94488525390625, 388.7546691894531, 405.564453125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 6.0, 7.0, 7.0, 7.0, 6.0, 29.0, 22.0, 39.0, 50.0, 75.0, 118.0, 223.0, 375.0, 818.0, 1651.0, 3918.0, 15868.0, 4043574.0, 112531.0, 10016.0, 2728.0, 956.0, 453.0, 285.0, 163.0, 109.0, 75.0, 45.0, 25.0, 29.0, 21.0, 11.0, 13.0, 6.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0], "bins": [-0.66259765625, -0.6467552185058594, -0.6309127807617188, -0.6150703430175781, -0.5992279052734375, -0.5833854675292969, -0.5675430297851562, -0.5517005920410156, -0.535858154296875, -0.5200157165527344, -0.5041732788085938, -0.4883308410644531, -0.4724884033203125, -0.4566459655761719, -0.44080352783203125, -0.4249610900878906, -0.40911865234375, -0.3932762145996094, -0.37743377685546875, -0.3615913391113281, -0.3457489013671875, -0.3299064636230469, -0.31406402587890625, -0.2982215881347656, -0.282379150390625, -0.2665367126464844, -0.25069427490234375, -0.23485183715820312, -0.2190093994140625, -0.20316696166992188, -0.18732452392578125, -0.17148208618164062, -0.1556396484375, -0.13979721069335938, -0.12395477294921875, -0.10811233520507812, -0.0922698974609375, -0.07642745971679688, -0.06058502197265625, -0.044742584228515625, -0.028900146484375, -0.013057708740234375, 0.00278472900390625, 0.018627166748046875, 0.0344696044921875, 0.050312042236328125, 0.06615447998046875, 0.08199691772460938, 0.09783935546875, 0.11368179321289062, 0.12952423095703125, 0.14536666870117188, 0.1612091064453125, 0.17705154418945312, 0.19289398193359375, 0.20873641967773438, 0.224578857421875, 0.24042129516601562, 0.25626373291015625, 0.2721061706542969, 0.2879486083984375, 0.3037910461425781, 0.31963348388671875, 0.3354759216308594, 0.351318359375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 4.0, 6.0, 8.0, 12.0, 15.0, 49.0, 57.0, 88.0, 110.0, 134.0, 124.0, 122.0, 87.0, 61.0, 43.0, 28.0, 9.0, 9.0, 4.0, 7.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00785064697265625, -0.007663130760192871, -0.007475614547729492, -0.007288098335266113, -0.007100582122802734, -0.0069130659103393555, -0.0067255496978759766, -0.006538033485412598, -0.006350517272949219, -0.00616300106048584, -0.005975484848022461, -0.005787968635559082, -0.005600452423095703, -0.005412936210632324, -0.005225419998168945, -0.005037903785705566, -0.0048503875732421875, -0.004662871360778809, -0.00447535514831543, -0.004287838935852051, -0.004100322723388672, -0.003912806510925293, -0.003725290298461914, -0.003537774085998535, -0.0033502578735351562, -0.0031627416610717773, -0.0029752254486083984, -0.0027877092361450195, -0.0026001930236816406, -0.0024126768112182617, -0.002225160598754883, -0.002037644386291504, -0.001850128173828125, -0.001662611961364746, -0.0014750957489013672, -0.0012875795364379883, -0.0011000633239746094, -0.0009125471115112305, -0.0007250308990478516, -0.0005375146865844727, -0.00034999847412109375, -0.00016248226165771484, 2.5033950805664062e-05, 0.00021255016326904297, 0.0004000663757324219, 0.0005875825881958008, 0.0007750988006591797, 0.0009626150131225586, 0.0011501312255859375, 0.0013376474380493164, 0.0015251636505126953, 0.0017126798629760742, 0.0019001960754394531, 0.002087712287902832, 0.002275228500366211, 0.00246274471282959, 0.0026502609252929688, 0.0028377771377563477, 0.0030252933502197266, 0.0032128095626831055, 0.0034003257751464844, 0.0035878419876098633, 0.003775358200073242, 0.003962874412536621, 0.004150390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 0.0, 4.0, 2.0, 4.0, 10.0, 11.0, 15.0, 19.0, 36.0, 40.0, 55.0, 70.0, 117.0, 168.0, 285.0, 506.0, 1014.0, 2574.0, 9929.0, 83611.0, 3894636.0, 179510.0, 15007.0, 3556.0, 1322.0, 678.0, 386.0, 224.0, 160.0, 108.0, 59.0, 39.0, 44.0, 23.0, 17.0, 8.0, 11.0, 6.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.355712890625, -0.3432884216308594, -0.33086395263671875, -0.3184394836425781, -0.3060150146484375, -0.2935905456542969, -0.28116607666015625, -0.2687416076660156, -0.256317138671875, -0.24389266967773438, -0.23146820068359375, -0.21904373168945312, -0.2066192626953125, -0.19419479370117188, -0.18177032470703125, -0.16934585571289062, -0.15692138671875, -0.14449691772460938, -0.13207244873046875, -0.11964797973632812, -0.1072235107421875, -0.09479904174804688, -0.08237457275390625, -0.06995010375976562, -0.057525634765625, -0.045101165771484375, -0.03267669677734375, -0.020252227783203125, -0.0078277587890625, 0.004596710205078125, 0.01702117919921875, 0.029445648193359375, 0.0418701171875, 0.054294586181640625, 0.06671905517578125, 0.07914352416992188, 0.0915679931640625, 0.10399246215820312, 0.11641693115234375, 0.12884140014648438, 0.141265869140625, 0.15369033813476562, 0.16611480712890625, 0.17853927612304688, 0.1909637451171875, 0.20338821411132812, 0.21581268310546875, 0.22823715209960938, 0.24066162109375, 0.2530860900878906, 0.26551055908203125, 0.2779350280761719, 0.2903594970703125, 0.3027839660644531, 0.31520843505859375, 0.3276329040527344, 0.340057373046875, 0.3524818420410156, 0.36490631103515625, 0.3773307800292969, 0.3897552490234375, 0.4021797180175781, 0.41460418701171875, 0.4270286560058594, 0.439453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 7.0, 8.0, 17.0, 13.0, 24.0, 29.0, 33.0, 29.0, 45.0, 55.0, 74.0, 77.0, 78.0, 95.0, 122.0, 194.0, 329.0, 1442.0, 502.0, 216.0, 189.0, 88.0, 88.0, 78.0, 52.0, 40.0, 27.0, 24.0, 11.0, 9.0, 17.0, 7.0, 7.0, 4.0, 7.0, 6.0, 1.0, 2.0, 6.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0302276611328125, -0.02927088737487793, -0.02831411361694336, -0.02735733985900879, -0.02640056610107422, -0.02544379234313965, -0.024487018585205078, -0.023530244827270508, -0.022573471069335938, -0.021616697311401367, -0.020659923553466797, -0.019703149795532227, -0.018746376037597656, -0.017789602279663086, -0.016832828521728516, -0.015876054763793945, -0.014919281005859375, -0.013962507247924805, -0.013005733489990234, -0.012048959732055664, -0.011092185974121094, -0.010135412216186523, -0.009178638458251953, -0.008221864700317383, -0.0072650909423828125, -0.006308317184448242, -0.005351543426513672, -0.0043947696685791016, -0.0034379959106445312, -0.002481222152709961, -0.0015244483947753906, -0.0005676746368408203, 0.00038909912109375, 0.0013458728790283203, 0.0023026466369628906, 0.003259420394897461, 0.004216194152832031, 0.0051729679107666016, 0.006129741668701172, 0.007086515426635742, 0.008043289184570312, 0.009000062942504883, 0.009956836700439453, 0.010913610458374023, 0.011870384216308594, 0.012827157974243164, 0.013783931732177734, 0.014740705490112305, 0.015697479248046875, 0.016654253005981445, 0.017611026763916016, 0.018567800521850586, 0.019524574279785156, 0.020481348037719727, 0.021438121795654297, 0.022394895553588867, 0.023351669311523438, 0.024308443069458008, 0.025265216827392578, 0.02622199058532715, 0.02717876434326172, 0.02813553810119629, 0.02909231185913086, 0.03004908561706543, 0.031005859375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 11.0, 29.0, 80.0, 233.0, 532.0, 98.0, 12.0, 11.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8034946918487549, -1.7494028806686401, -1.6953109502792358, -1.641219139099121, -1.5871273279190063, -1.5330355167388916, -1.4789435863494873, -1.4248517751693726, -1.3707599639892578, -1.316668152809143, -1.2625762224197388, -1.208484411239624, -1.1543926000595093, -1.1003007888793945, -1.0462088584899902, -0.9921170473098755, -0.9380251169204712, -0.8839332461357117, -0.8298414349555969, -0.7757495641708374, -0.7216577529907227, -0.6675658822059631, -0.6134740114212036, -0.5593822002410889, -0.5052903294563293, -0.4511984884738922, -0.3971066474914551, -0.34301477670669556, -0.2889229357242584, -0.2348310947418213, -0.18073922395706177, -0.12664738297462463, -0.07255566120147705, -0.01846381276845932, 0.03562803566455841, 0.08971989154815674, 0.14381173253059387, 0.197903573513031, 0.2519954442977905, 0.30608728528022766, 0.3601791262626648, 0.41427096724510193, 0.46836280822753906, 0.5224546790122986, 0.5765465497970581, 0.6306383609771729, 0.6847302317619324, 0.7388221025466919, 0.7929139137268066, 0.8470057845115662, 0.9010975956916809, 0.9551894664764404, 1.0092812776565552, 1.06337308883667, 1.1174650192260742, 1.171556830406189, 1.2256486415863037, 1.2797404527664185, 1.3338323831558228, 1.3879241943359375, 1.4420160055160522, 1.496107816696167, 1.5501997470855713, 1.604291558265686, 1.6583834886550903]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 11.0, 17.0, 24.0, 33.0, 51.0, 80.0, 85.0, 85.0, 95.0, 108.0, 93.0, 80.0, 67.0, 71.0, 33.0, 35.0, 14.0, 10.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.714702308177948, -0.6984243988990784, -0.682146430015564, -0.6658685207366943, -0.6495906114578247, -0.6333127021789551, -0.6170347332954407, -0.600756824016571, -0.5844788551330566, -0.568200945854187, -0.5519229769706726, -0.535645067691803, -0.5193671584129333, -0.503089189529419, -0.4868112802505493, -0.4705333709716797, -0.45425546169281006, -0.43797752261161804, -0.4216996133327484, -0.4054216742515564, -0.38914376497268677, -0.37286582589149475, -0.35658788681030273, -0.3403099775314331, -0.3240320384502411, -0.3077540993690491, -0.29147619009017944, -0.2751982510089874, -0.2589203119277954, -0.24264240264892578, -0.22636446356773376, -0.21008653938770294, -0.1938086748123169, -0.17753075063228607, -0.16125282645225525, -0.14497488737106323, -0.1286969631910324, -0.11241903901100159, -0.09614110738039017, -0.07986317574977875, -0.06358525156974792, -0.047307323664426804, -0.031029395759105682, -0.014751467853784561, 0.00152646005153656, 0.017804384231567383, 0.0340823158621788, 0.05036024749279022, 0.06663817167282104, 0.08291609585285187, 0.09919402748346329, 0.11547195911407471, 0.13174988329410553, 0.14802780747413635, 0.16430574655532837, 0.1805836707353592, 0.19686159491539001, 0.21313951909542084, 0.22941744327545166, 0.24569538235664368, 0.2619733214378357, 0.2782512307167053, 0.29452916979789734, 0.31080710887908936, 0.327085018157959]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 9.0, 9.0, 15.0, 17.0, 22.0, 19.0, 57.0, 80.0, 109.0, 185.0, 292.0, 538.0, 1102.0, 2525.0, 7140.0, 36980.0, 947840.0, 39297.0, 7349.0, 2478.0, 1100.0, 546.0, 294.0, 189.0, 110.0, 64.0, 59.0, 40.0, 18.0, 20.0, 11.0, 13.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.399658203125, -0.3880767822265625, -0.376495361328125, -0.3649139404296875, -0.35333251953125, -0.3417510986328125, -0.330169677734375, -0.3185882568359375, -0.3070068359375, -0.2954254150390625, -0.283843994140625, -0.2722625732421875, -0.26068115234375, -0.2490997314453125, -0.237518310546875, -0.2259368896484375, -0.21435546875, -0.2027740478515625, -0.191192626953125, -0.1796112060546875, -0.16802978515625, -0.1564483642578125, -0.144866943359375, -0.1332855224609375, -0.1217041015625, -0.1101226806640625, -0.098541259765625, -0.0869598388671875, -0.07537841796875, -0.0637969970703125, -0.052215576171875, -0.0406341552734375, -0.029052734375, -0.0174713134765625, -0.005889892578125, 0.0056915283203125, 0.01727294921875, 0.0288543701171875, 0.040435791015625, 0.0520172119140625, 0.0635986328125, 0.0751800537109375, 0.086761474609375, 0.0983428955078125, 0.10992431640625, 0.1215057373046875, 0.133087158203125, 0.1446685791015625, 0.15625, 0.1678314208984375, 0.179412841796875, 0.1909942626953125, 0.20257568359375, 0.2141571044921875, 0.225738525390625, 0.2373199462890625, 0.2489013671875, 0.2604827880859375, 0.272064208984375, 0.2836456298828125, 0.29522705078125, 0.3068084716796875, 0.318389892578125, 0.3299713134765625, 0.341552734375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 8.0, 18.0, 37.0, 73.0, 124.0, 166.0, 174.0, 156.0, 120.0, 65.0, 35.0, 14.0, 12.0, 4.0, 1.0, 2.0], "bins": [-0.02398681640625, -0.02354520559310913, -0.02310359477996826, -0.022661983966827393, -0.022220373153686523, -0.021778762340545654, -0.021337151527404785, -0.020895540714263916, -0.020453929901123047, -0.020012319087982178, -0.01957070827484131, -0.01912909746170044, -0.01868748664855957, -0.0182458758354187, -0.017804265022277832, -0.017362654209136963, -0.016921043395996094, -0.016479432582855225, -0.016037821769714355, -0.015596210956573486, -0.015154600143432617, -0.014712989330291748, -0.014271378517150879, -0.01382976770401001, -0.01338815689086914, -0.012946546077728271, -0.012504935264587402, -0.012063324451446533, -0.011621713638305664, -0.011180102825164795, -0.010738492012023926, -0.010296881198883057, -0.009855270385742188, -0.009413659572601318, -0.00897204875946045, -0.00853043794631958, -0.008088827133178711, -0.007647216320037842, -0.007205605506896973, -0.0067639946937561035, -0.006322383880615234, -0.005880773067474365, -0.005439162254333496, -0.004997551441192627, -0.004555940628051758, -0.004114329814910889, -0.0036727190017700195, -0.0032311081886291504, -0.0027894973754882812, -0.002347886562347412, -0.001906275749206543, -0.0014646649360656738, -0.0010230541229248047, -0.0005814433097839355, -0.0001398324966430664, 0.00030177831649780273, 0.0007433891296386719, 0.001184999942779541, 0.0016266107559204102, 0.0020682215690612793, 0.0025098323822021484, 0.0029514431953430176, 0.0033930540084838867, 0.003834664821624756, 0.004276275634765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 9.0, 6.0, 18.0, 21.0, 32.0, 38.0, 60.0, 91.0, 120.0, 212.0, 327.0, 663.0, 1323.0, 3118.0, 10348.0, 92414.0, 890244.0, 37875.0, 6776.0, 2373.0, 1052.0, 547.0, 320.0, 204.0, 119.0, 72.0, 42.0, 37.0, 30.0, 17.0, 12.0, 14.0, 3.0, 8.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.445068359375, -0.4317207336425781, -0.41837310791015625, -0.4050254821777344, -0.3916778564453125, -0.3783302307128906, -0.36498260498046875, -0.3516349792480469, -0.338287353515625, -0.3249397277832031, -0.31159210205078125, -0.2982444763183594, -0.2848968505859375, -0.2715492248535156, -0.25820159912109375, -0.24485397338867188, -0.23150634765625, -0.21815872192382812, -0.20481109619140625, -0.19146347045898438, -0.1781158447265625, -0.16476821899414062, -0.15142059326171875, -0.13807296752929688, -0.124725341796875, -0.11137771606445312, -0.09803009033203125, -0.08468246459960938, -0.0713348388671875, -0.057987213134765625, -0.04463958740234375, -0.031291961669921875, -0.0179443359375, -0.004596710205078125, 0.00875091552734375, 0.022098541259765625, 0.0354461669921875, 0.048793792724609375, 0.06214141845703125, 0.07548904418945312, 0.088836669921875, 0.10218429565429688, 0.11553192138671875, 0.12887954711914062, 0.1422271728515625, 0.15557479858398438, 0.16892242431640625, 0.18227005004882812, 0.19561767578125, 0.20896530151367188, 0.22231292724609375, 0.23566055297851562, 0.2490081787109375, 0.2623558044433594, 0.27570343017578125, 0.2890510559082031, 0.302398681640625, 0.3157463073730469, 0.32909393310546875, 0.3424415588378906, 0.3557891845703125, 0.3691368103027344, 0.38248443603515625, 0.3958320617675781, 0.4091796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 11.0, 11.0, 13.0, 11.0, 21.0, 29.0, 28.0, 29.0, 35.0, 38.0, 35.0, 40.0, 47.0, 60.0, 47.0, 52.0, 51.0, 46.0, 52.0, 52.0, 41.0, 42.0, 31.0, 17.0, 33.0, 21.0, 22.0, 17.0, 17.0, 18.0, 6.0, 7.0, 7.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.041900634765625, -0.0406651496887207, -0.039429664611816406, -0.03819417953491211, -0.03695869445800781, -0.035723209381103516, -0.03448772430419922, -0.03325223922729492, -0.032016754150390625, -0.030781269073486328, -0.02954578399658203, -0.028310298919677734, -0.027074813842773438, -0.02583932876586914, -0.024603843688964844, -0.023368358612060547, -0.02213287353515625, -0.020897388458251953, -0.019661903381347656, -0.01842641830444336, -0.017190933227539062, -0.015955448150634766, -0.014719963073730469, -0.013484477996826172, -0.012248992919921875, -0.011013507843017578, -0.009778022766113281, -0.008542537689208984, -0.0073070526123046875, -0.006071567535400391, -0.004836082458496094, -0.003600597381591797, -0.0023651123046875, -0.0011296272277832031, 0.00010585784912109375, 0.0013413429260253906, 0.0025768280029296875, 0.0038123130798339844, 0.005047798156738281, 0.006283283233642578, 0.007518768310546875, 0.008754253387451172, 0.009989738464355469, 0.011225223541259766, 0.012460708618164062, 0.01369619369506836, 0.014931678771972656, 0.016167163848876953, 0.01740264892578125, 0.018638134002685547, 0.019873619079589844, 0.02110910415649414, 0.022344589233398438, 0.023580074310302734, 0.02481555938720703, 0.026051044464111328, 0.027286529541015625, 0.028522014617919922, 0.02975749969482422, 0.030992984771728516, 0.03222846984863281, 0.03346395492553711, 0.034699440002441406, 0.0359349250793457, 0.03717041015625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 10.0, 1.0, 10.0, 21.0, 60.0, 127.0, 407.0, 3094.0, 1032438.0, 11288.0, 813.0, 164.0, 64.0, 26.0, 12.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8828125, -1.8233642578125, -1.763916015625, -1.7044677734375, -1.64501953125, -1.5855712890625, -1.526123046875, -1.4666748046875, -1.4072265625, -1.3477783203125, -1.288330078125, -1.2288818359375, -1.16943359375, -1.1099853515625, -1.050537109375, -0.9910888671875, -0.931640625, -0.8721923828125, -0.812744140625, -0.7532958984375, -0.69384765625, -0.6343994140625, -0.574951171875, -0.5155029296875, -0.4560546875, -0.3966064453125, -0.337158203125, -0.2777099609375, -0.21826171875, -0.1588134765625, -0.099365234375, -0.0399169921875, 0.01953125, 0.0789794921875, 0.138427734375, 0.1978759765625, 0.25732421875, 0.3167724609375, 0.376220703125, 0.4356689453125, 0.4951171875, 0.5545654296875, 0.614013671875, 0.6734619140625, 0.73291015625, 0.7923583984375, 0.851806640625, 0.9112548828125, 0.970703125, 1.0301513671875, 1.089599609375, 1.1490478515625, 1.20849609375, 1.2679443359375, 1.327392578125, 1.3868408203125, 1.4462890625, 1.5057373046875, 1.565185546875, 1.6246337890625, 1.68408203125, 1.7435302734375, 1.802978515625, 1.8624267578125, 1.921875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 8.0, 9.0, 6.0, 13.0, 17.0, 19.0, 17.0, 20.0, 24.0, 38.0, 45.0, 46.0, 55.0, 61.0, 103.0, 101.0, 59.0, 59.0, 41.0, 38.0, 34.0, 33.0, 18.0, 19.0, 16.0, 25.0, 9.0, 11.0, 6.0, 8.0, 7.0, 4.0, 5.0, 0.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0014219284057617188, -0.0013772696256637573, -0.001332610845565796, -0.0012879520654678345, -0.001243293285369873, -0.0011986345052719116, -0.0011539757251739502, -0.0011093169450759888, -0.0010646581649780273, -0.001019999384880066, -0.0009753406047821045, -0.0009306818246841431, -0.0008860230445861816, -0.0008413642644882202, -0.0007967054843902588, -0.0007520467042922974, -0.0007073879241943359, -0.0006627291440963745, -0.0006180703639984131, -0.0005734115839004517, -0.0005287528038024902, -0.0004840940237045288, -0.0004394352436065674, -0.00039477646350860596, -0.00035011768341064453, -0.0003054589033126831, -0.0002608001232147217, -0.00021614134311676025, -0.00017148256301879883, -0.0001268237829208374, -8.216500282287598e-05, -3.750622272491455e-05, 7.152557373046875e-06, 5.18113374710083e-05, 9.647011756896973e-05, 0.00014112889766693115, 0.00018578767776489258, 0.000230446457862854, 0.00027510523796081543, 0.00031976401805877686, 0.0003644227981567383, 0.0004090815782546997, 0.00045374035835266113, 0.0004983991384506226, 0.000543057918548584, 0.0005877166986465454, 0.0006323754787445068, 0.0006770342588424683, 0.0007216930389404297, 0.0007663518190383911, 0.0008110105991363525, 0.000855669379234314, 0.0009003281593322754, 0.0009449869394302368, 0.0009896457195281982, 0.0010343044996261597, 0.001078963279724121, 0.0011236220598220825, 0.001168280839920044, 0.0012129396200180054, 0.0012575984001159668, 0.0013022571802139282, 0.0013469159603118896, 0.001391574740409851, 0.0014362335205078125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 3.0, 5.0, 4.0, 10.0, 7.0, 15.0, 8.0, 19.0, 34.0, 42.0, 58.0, 125.0, 146.0, 288.0, 728.0, 2994.0, 915179.0, 125104.0, 2402.0, 639.0, 280.0, 156.0, 81.0, 60.0, 45.0, 35.0, 20.0, 14.0, 14.0, 12.0, 5.0, 4.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9111328125, -1.8513031005859375, -1.791473388671875, -1.7316436767578125, -1.67181396484375, -1.6119842529296875, -1.552154541015625, -1.4923248291015625, -1.4324951171875, -1.3726654052734375, -1.312835693359375, -1.2530059814453125, -1.19317626953125, -1.1333465576171875, -1.073516845703125, -1.0136871337890625, -0.953857421875, -0.8940277099609375, -0.834197998046875, -0.7743682861328125, -0.71453857421875, -0.6547088623046875, -0.594879150390625, -0.5350494384765625, -0.4752197265625, -0.4153900146484375, -0.355560302734375, -0.2957305908203125, -0.23590087890625, -0.1760711669921875, -0.116241455078125, -0.0564117431640625, 0.00341796875, 0.0632476806640625, 0.123077392578125, 0.1829071044921875, 0.24273681640625, 0.3025665283203125, 0.362396240234375, 0.4222259521484375, 0.4820556640625, 0.5418853759765625, 0.601715087890625, 0.6615447998046875, 0.72137451171875, 0.7812042236328125, 0.841033935546875, 0.9008636474609375, 0.960693359375, 1.0205230712890625, 1.080352783203125, 1.1401824951171875, 1.20001220703125, 1.2598419189453125, 1.319671630859375, 1.3795013427734375, 1.4393310546875, 1.4991607666015625, 1.558990478515625, 1.6188201904296875, 1.67864990234375, 1.7384796142578125, 1.798309326171875, 1.8581390380859375, 1.91796875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 18.0, 35.0, 180.0, 455.0, 197.0, 56.0, 18.0, 11.0, 3.0, 4.0, 0.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.407470703125, -0.3949432373046875, -0.382415771484375, -0.3698883056640625, -0.35736083984375, -0.3448333740234375, -0.332305908203125, -0.3197784423828125, -0.3072509765625, -0.2947235107421875, -0.282196044921875, -0.2696685791015625, -0.25714111328125, -0.2446136474609375, -0.232086181640625, -0.2195587158203125, -0.20703125, -0.1945037841796875, -0.181976318359375, -0.1694488525390625, -0.15692138671875, -0.1443939208984375, -0.131866455078125, -0.1193389892578125, -0.1068115234375, -0.0942840576171875, -0.081756591796875, -0.0692291259765625, -0.05670166015625, -0.0441741943359375, -0.031646728515625, -0.0191192626953125, -0.006591796875, 0.0059356689453125, 0.018463134765625, 0.0309906005859375, 0.04351806640625, 0.0560455322265625, 0.068572998046875, 0.0811004638671875, 0.0936279296875, 0.1061553955078125, 0.118682861328125, 0.1312103271484375, 0.14373779296875, 0.1562652587890625, 0.168792724609375, 0.1813201904296875, 0.19384765625, 0.2063751220703125, 0.218902587890625, 0.2314300537109375, 0.24395751953125, 0.2564849853515625, 0.269012451171875, 0.2815399169921875, 0.2940673828125, 0.3065948486328125, 0.319122314453125, 0.3316497802734375, 0.34417724609375, 0.3567047119140625, 0.369232177734375, 0.3817596435546875, 0.394287109375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 8.0, 6.0, 35.0, 100.0, 329.0, 426.0, 57.0, 18.0, 16.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.675384044647217, -4.542251110076904, -4.40911865234375, -4.2759857177734375, -4.142852783203125, -4.0097198486328125, -3.876587152481079, -3.7434544563293457, -3.610321521759033, -3.4771885871887207, -3.3440558910369873, -3.210923194885254, -3.0777902603149414, -2.944657325744629, -2.8115246295928955, -2.678391933441162, -2.5452589988708496, -2.412126064300537, -2.2789933681488037, -2.1458606719970703, -2.012727737426758, -1.8795949220657349, -1.746462106704712, -1.613329291343689, -1.480196475982666, -1.347063660621643, -1.2139308452606201, -1.0807980298995972, -0.9476652145385742, -0.8145323991775513, -0.6813995838165283, -0.5482667684555054, -0.4151344299316406, -0.2820016145706177, -0.14886879920959473, -0.015735983848571777, 0.11739683151245117, 0.2505296468734741, 0.38366246223449707, 0.51679527759552, 0.649928092956543, 0.7830609083175659, 0.9161937236785889, 1.0493265390396118, 1.1824593544006348, 1.3155921697616577, 1.4487249851226807, 1.5818578004837036, 1.7149906158447266, 1.8481234312057495, 1.9812562465667725, 2.114388942718506, 2.2475218772888184, 2.380654811859131, 2.5137875080108643, 2.6469202041625977, 2.78005313873291, 2.9131860733032227, 3.046318769454956, 3.1794514656066895, 3.312584400177002, 3.4457173347473145, 3.578850030899048, 3.7119827270507812, 3.8451156616210938]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 9.0, 6.0, 11.0, 23.0, 32.0, 47.0, 82.0, 89.0, 125.0, 132.0, 120.0, 106.0, 77.0, 60.0, 36.0, 25.0, 13.0, 12.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7798275351524353, -0.7470832467079163, -0.7143389582633972, -0.6815946698188782, -0.6488503217697144, -0.6161060333251953, -0.5833617448806763, -0.5506174564361572, -0.5178731679916382, -0.48512887954711914, -0.4523845911026001, -0.41964027285575867, -0.3868959844112396, -0.3541516959667206, -0.32140737771987915, -0.2886630892753601, -0.25591880083084106, -0.22317451238632202, -0.19043020904064178, -0.15768590569496155, -0.1249416172504425, -0.09219732880592346, -0.059453025460243225, -0.02670872211456299, 0.006035566329956055, 0.038779862225055695, 0.07152415812015533, 0.10426845401525497, 0.13701274991035461, 0.16975703835487366, 0.2025013417005539, 0.23524564504623413, 0.2679898738861084, 0.30073416233062744, 0.3334784507751465, 0.3662227690219879, 0.39896705746650696, 0.431711345911026, 0.46445566415786743, 0.4971999526023865, 0.5299442410469055, 0.5626885294914246, 0.5954328179359436, 0.6281771063804626, 0.6609214544296265, 0.6936657428741455, 0.7264100313186646, 0.7591543197631836, 0.7918986082077026, 0.8246428966522217, 0.8573871850967407, 0.8901314735412598, 0.9228757619857788, 0.9556200504302979, 0.9883643984794617, 1.021108627319336, 1.0538530349731445, 1.0865973234176636, 1.1193416118621826, 1.1520859003067017, 1.1848301887512207, 1.2175744771957397, 1.2503187656402588, 1.2830631732940674, 1.3158073425292969]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 5.0, 6.0, 12.0, 22.0, 24.0, 42.0, 136.0, 821.0, 4161429.0, 31351.0, 293.0, 65.0, 25.0, 14.0, 12.0, 6.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-66.25, -64.66796875, -63.0859375, -61.50390625, -59.921875, -58.33984375, -56.7578125, -55.17578125, -53.59375, -52.01171875, -50.4296875, -48.84765625, -47.265625, -45.68359375, -44.1015625, -42.51953125, -40.9375, -39.35546875, -37.7734375, -36.19140625, -34.609375, -33.02734375, -31.4453125, -29.86328125, -28.28125, -26.69921875, -25.1171875, -23.53515625, -21.953125, -20.37109375, -18.7890625, -17.20703125, -15.625, -14.04296875, -12.4609375, -10.87890625, -9.296875, -7.71484375, -6.1328125, -4.55078125, -2.96875, -1.38671875, 0.1953125, 1.77734375, 3.359375, 4.94140625, 6.5234375, 8.10546875, 9.6875, 11.26953125, 12.8515625, 14.43359375, 16.015625, 17.59765625, 19.1796875, 20.76171875, 22.34375, 23.92578125, 25.5078125, 27.08984375, 28.671875, 30.25390625, 31.8359375, 33.41796875, 35.0]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 9.0, 14.0, 15.0, 36.0, 75.0, 117.0, 147.0, 150.0, 142.0, 118.0, 70.0, 42.0, 23.0, 8.0, 12.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01739501953125, -0.01692986488342285, -0.016464710235595703, -0.015999555587768555, -0.015534400939941406, -0.015069246292114258, -0.01460409164428711, -0.014138936996459961, -0.013673782348632812, -0.013208627700805664, -0.012743473052978516, -0.012278318405151367, -0.011813163757324219, -0.01134800910949707, -0.010882854461669922, -0.010417699813842773, -0.009952545166015625, -0.009487390518188477, -0.009022235870361328, -0.00855708122253418, -0.008091926574707031, -0.007626771926879883, -0.007161617279052734, -0.006696462631225586, -0.0062313079833984375, -0.005766153335571289, -0.005300998687744141, -0.004835844039916992, -0.004370689392089844, -0.0039055347442626953, -0.003440380096435547, -0.0029752254486083984, -0.00251007080078125, -0.0020449161529541016, -0.0015797615051269531, -0.0011146068572998047, -0.0006494522094726562, -0.0001842975616455078, 0.0002808570861816406, 0.0007460117340087891, 0.0012111663818359375, 0.001676321029663086, 0.0021414756774902344, 0.002606630325317383, 0.0030717849731445312, 0.0035369396209716797, 0.004002094268798828, 0.0044672489166259766, 0.004932403564453125, 0.0053975582122802734, 0.005862712860107422, 0.00632786750793457, 0.006793022155761719, 0.007258176803588867, 0.007723331451416016, 0.008188486099243164, 0.008653640747070312, 0.009118795394897461, 0.00958395004272461, 0.010049104690551758, 0.010514259338378906, 0.010979413986206055, 0.011444568634033203, 0.011909723281860352, 0.0123748779296875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 8.0, 14.0, 24.0, 37.0, 70.0, 117.0, 373.0, 13486.0, 4174137.0, 4340.0, 552.0, 243.0, 198.0, 137.0, 120.0, 82.0, 74.0, 48.0, 46.0, 35.0, 34.0, 21.0, 10.0, 12.0, 12.0, 12.0, 5.0, 7.0, 6.0, 4.0, 5.0, 3.0, 6.0, 3.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -3.87725830078125, -3.5865478515625, -3.29583740234375, -3.005126953125, -2.71441650390625, -2.4237060546875, -2.13299560546875, -1.84228515625, -1.55157470703125, -1.2608642578125, -0.97015380859375, -0.679443359375, -0.38873291015625, -0.0980224609375, 0.19268798828125, 0.4833984375, 0.77410888671875, 1.0648193359375, 1.35552978515625, 1.646240234375, 1.93695068359375, 2.2276611328125, 2.51837158203125, 2.80908203125, 3.09979248046875, 3.3905029296875, 3.68121337890625, 3.971923828125, 4.26263427734375, 4.5533447265625, 4.84405517578125, 5.134765625, 5.42547607421875, 5.7161865234375, 6.00689697265625, 6.297607421875, 6.58831787109375, 6.8790283203125, 7.16973876953125, 7.46044921875, 7.75115966796875, 8.0418701171875, 8.33258056640625, 8.623291015625, 8.91400146484375, 9.2047119140625, 9.49542236328125, 9.7861328125, 10.07684326171875, 10.3675537109375, 10.65826416015625, 10.948974609375, 11.23968505859375, 11.5303955078125, 11.82110595703125, 12.11181640625, 12.40252685546875, 12.6932373046875, 12.98394775390625, 13.274658203125, 13.56536865234375, 13.8560791015625, 14.14678955078125, 14.4375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 13.0, 11.0, 18.0, 29.0, 60.0, 112.0, 175.0, 340.0, 1348.0, 462.0, 360.0, 269.0, 204.0, 163.0, 126.0, 88.0, 81.0, 53.0, 33.0, 39.0, 20.0, 19.0, 7.0, 10.0, 6.0, 8.0, 10.0, 3.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0360107421875, -0.03354644775390625, -0.0310821533203125, -0.02861785888671875, -0.026153564453125, -0.02368927001953125, -0.0212249755859375, -0.01876068115234375, -0.01629638671875, -0.01383209228515625, -0.0113677978515625, -0.00890350341796875, -0.006439208984375, -0.00397491455078125, -0.0015106201171875, 0.00095367431640625, 0.00341796875, 0.00588226318359375, 0.0083465576171875, 0.01081085205078125, 0.013275146484375, 0.01573944091796875, 0.0182037353515625, 0.02066802978515625, 0.02313232421875, 0.02559661865234375, 0.0280609130859375, 0.03052520751953125, 0.032989501953125, 0.03545379638671875, 0.0379180908203125, 0.04038238525390625, 0.0428466796875, 0.04531097412109375, 0.0477752685546875, 0.05023956298828125, 0.052703857421875, 0.05516815185546875, 0.0576324462890625, 0.06009674072265625, 0.06256103515625, 0.06502532958984375, 0.0674896240234375, 0.06995391845703125, 0.072418212890625, 0.07488250732421875, 0.0773468017578125, 0.07981109619140625, 0.082275390625, 0.08473968505859375, 0.0872039794921875, 0.08966827392578125, 0.092132568359375, 0.09459686279296875, 0.0970611572265625, 0.09952545166015625, 0.10198974609375, 0.10445404052734375, 0.1069183349609375, 0.10938262939453125, 0.111846923828125, 0.11431121826171875, 0.1167755126953125, 0.11923980712890625, 0.1217041015625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 9.0, 802.0, 176.0, 23.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.216266632080078, -2.0136044025421143, -0.8109421730041504, 0.3917200565338135, 1.5943822860717773, 2.7970447540283203, 3.999706745147705, 5.20236873626709, 6.405031204223633, 7.607693672180176, 8.810356140136719, 10.013017654418945, 11.215680122375488, 12.418342590332031, 13.621004104614258, 14.8236665725708, 16.026329040527344, 17.22899055480957, 18.43165397644043, 19.634315490722656, 20.836978912353516, 22.039640426635742, 23.24230194091797, 24.444965362548828, 25.647626876831055, 26.85028839111328, 28.05295181274414, 29.255613327026367, 30.458274841308594, 31.660938262939453, 32.86360168457031, 34.066261291503906, 35.2689208984375, 36.47158432006836, 37.67424392700195, 38.87690734863281, 40.07957077026367, 41.28223419189453, 42.484893798828125, 43.687557220458984, 44.890220642089844, 46.0928840637207, 47.2955436706543, 48.498207092285156, 49.700870513916016, 50.903533935546875, 52.10619354248047, 53.30885696411133, 54.51151657104492, 55.71417999267578, 56.916839599609375, 58.119503021240234, 59.322166442871094, 60.52482604980469, 61.72748947143555, 62.930152893066406, 64.1328125, 65.3354721069336, 66.53813934326172, 67.74079895019531, 68.9434585571289, 70.14612579345703, 71.34878540039062, 72.55144500732422, 73.75411224365234]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 7.0, 14.0, 20.0, 22.0, 25.0, 46.0, 62.0, 75.0, 85.0, 101.0, 126.0, 80.0, 102.0, 70.0, 58.0, 34.0, 23.0, 13.0, 9.0, 6.0, 10.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.167879581451416, -3.040595293045044, -2.913311004638672, -2.7860267162323, -2.6587424278259277, -2.5314581394195557, -2.4041738510131836, -2.2768893241882324, -2.1496052742004395, -2.0223209857940674, -1.8950366973876953, -1.7677524089813232, -1.6404681205749512, -1.513183832168579, -1.3858994245529175, -1.2586151361465454, -1.1313307285308838, -1.0040464401245117, -0.8767621517181396, -0.7494778037071228, -0.6221935153007507, -0.49490922689437866, -0.3676248788833618, -0.24034059047698975, -0.11305630207061768, 0.014228001236915588, 0.14151230454444885, 0.2687966227531433, 0.3960809111595154, 0.5233651995658875, 0.6506495475769043, 0.7779338359832764, 0.9052181243896484, 1.0325024127960205, 1.1597867012023926, 1.2870709896087646, 1.4143552780151367, 1.5416395664215088, 1.6689239740371704, 1.7962082624435425, 1.9234925508499146, 2.050776958465576, 2.1780612468719482, 2.3053455352783203, 2.4326298236846924, 2.5599141120910645, 2.6871984004974365, 2.8144826889038086, 2.9417669773101807, 3.0690512657165527, 3.196335554122925, 3.323619842529297, 3.450904130935669, 3.578188419342041, 3.705472946166992, 3.832756996154785, 3.9600415229797363, 4.0873260498046875, 4.2146100997924805, 4.341894626617432, 4.469178676605225, 4.596463203430176, 4.723747253417969, 4.85103178024292, 4.978315830230713]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 10.0, 5.0, 4.0, 9.0, 6.0, 10.0, 14.0, 17.0, 13.0, 24.0, 25.0, 37.0, 55.0, 93.0, 195.0, 602.0, 2160.0, 10818.0, 277073.0, 737433.0, 15719.0, 2879.0, 785.0, 236.0, 101.0, 51.0, 27.0, 21.0, 17.0, 18.0, 22.0, 16.0, 7.0, 7.0, 3.0, 9.0, 4.0, 2.0, 5.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1845703125, -1.1464691162109375, -1.108367919921875, -1.0702667236328125, -1.03216552734375, -0.9940643310546875, -0.955963134765625, -0.9178619384765625, -0.8797607421875, -0.8416595458984375, -0.803558349609375, -0.7654571533203125, -0.72735595703125, -0.6892547607421875, -0.651153564453125, -0.6130523681640625, -0.574951171875, -0.5368499755859375, -0.498748779296875, -0.4606475830078125, -0.42254638671875, -0.3844451904296875, -0.346343994140625, -0.3082427978515625, -0.2701416015625, -0.2320404052734375, -0.193939208984375, -0.1558380126953125, -0.11773681640625, -0.0796356201171875, -0.041534423828125, -0.0034332275390625, 0.03466796875, 0.0727691650390625, 0.110870361328125, 0.1489715576171875, 0.18707275390625, 0.2251739501953125, 0.263275146484375, 0.3013763427734375, 0.3394775390625, 0.3775787353515625, 0.415679931640625, 0.4537811279296875, 0.49188232421875, 0.5299835205078125, 0.568084716796875, 0.6061859130859375, 0.644287109375, 0.6823883056640625, 0.720489501953125, 0.7585906982421875, 0.79669189453125, 0.8347930908203125, 0.872894287109375, 0.9109954833984375, 0.9490966796875, 0.9871978759765625, 1.025299072265625, 1.0634002685546875, 1.10150146484375, 1.1396026611328125, 1.177703857421875, 1.2158050537109375, 1.25390625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 7.0, 8.0, 14.0, 24.0, 79.0, 224.0, 286.0, 229.0, 88.0, 30.0, 12.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0145721435546875, -0.013043642044067383, -0.011515140533447266, -0.009986639022827148, -0.008458137512207031, -0.006929636001586914, -0.005401134490966797, -0.0038726329803466797, -0.0023441314697265625, -0.0008156299591064453, 0.0007128715515136719, 0.002241373062133789, 0.0037698745727539062, 0.0052983760833740234, 0.006826877593994141, 0.008355379104614258, 0.009883880615234375, 0.011412382125854492, 0.01294088363647461, 0.014469385147094727, 0.015997886657714844, 0.01752638816833496, 0.019054889678955078, 0.020583391189575195, 0.022111892700195312, 0.02364039421081543, 0.025168895721435547, 0.026697397232055664, 0.02822589874267578, 0.0297544002532959, 0.031282901763916016, 0.03281140327453613, 0.03433990478515625, 0.03586840629577637, 0.037396907806396484, 0.0389254093170166, 0.04045391082763672, 0.041982412338256836, 0.04351091384887695, 0.04503941535949707, 0.04656791687011719, 0.048096418380737305, 0.04962491989135742, 0.05115342140197754, 0.052681922912597656, 0.05421042442321777, 0.05573892593383789, 0.05726742744445801, 0.058795928955078125, 0.06032443046569824, 0.06185293197631836, 0.06338143348693848, 0.0649099349975586, 0.06643843650817871, 0.06796693801879883, 0.06949543952941895, 0.07102394104003906, 0.07255244255065918, 0.0740809440612793, 0.07560944557189941, 0.07713794708251953, 0.07866644859313965, 0.08019495010375977, 0.08172345161437988, 0.083251953125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 6.0, 2.0, 7.0, 4.0, 6.0, 11.0, 9.0, 9.0, 19.0, 33.0, 10.0, 28.0, 28.0, 41.0, 44.0, 44.0, 65.0, 146.0, 812.0, 8594.0, 965233.0, 70621.0, 2125.0, 304.0, 83.0, 40.0, 33.0, 32.0, 32.0, 23.0, 20.0, 15.0, 18.0, 8.0, 8.0, 4.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.2548828125, -1.2165679931640625, -1.178253173828125, -1.1399383544921875, -1.10162353515625, -1.0633087158203125, -1.024993896484375, -0.9866790771484375, -0.9483642578125, -0.9100494384765625, -0.871734619140625, -0.8334197998046875, -0.79510498046875, -0.7567901611328125, -0.718475341796875, -0.6801605224609375, -0.641845703125, -0.6035308837890625, -0.565216064453125, -0.5269012451171875, -0.48858642578125, -0.4502716064453125, -0.411956787109375, -0.3736419677734375, -0.3353271484375, -0.2970123291015625, -0.258697509765625, -0.2203826904296875, -0.18206787109375, -0.1437530517578125, -0.105438232421875, -0.0671234130859375, -0.02880859375, 0.0095062255859375, 0.047821044921875, 0.0861358642578125, 0.12445068359375, 0.1627655029296875, 0.201080322265625, 0.2393951416015625, 0.2777099609375, 0.3160247802734375, 0.354339599609375, 0.3926544189453125, 0.43096923828125, 0.4692840576171875, 0.507598876953125, 0.5459136962890625, 0.584228515625, 0.6225433349609375, 0.660858154296875, 0.6991729736328125, 0.73748779296875, 0.7758026123046875, 0.814117431640625, 0.8524322509765625, 0.8907470703125, 0.9290618896484375, 0.967376708984375, 1.0056915283203125, 1.04400634765625, 1.0823211669921875, 1.120635986328125, 1.1589508056640625, 1.197265625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 7.0, 4.0, 4.0, 8.0, 7.0, 15.0, 12.0, 17.0, 20.0, 24.0, 20.0, 28.0, 33.0, 34.0, 42.0, 54.0, 46.0, 44.0, 45.0, 42.0, 55.0, 59.0, 43.0, 39.0, 41.0, 39.0, 36.0, 28.0, 29.0, 22.0, 17.0, 15.0, 16.0, 14.0, 7.0, 8.0, 8.0, 4.0, 2.0, 5.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0650634765625, -0.06288623809814453, -0.06070899963378906, -0.058531761169433594, -0.056354522705078125, -0.054177284240722656, -0.05200004577636719, -0.04982280731201172, -0.04764556884765625, -0.04546833038330078, -0.04329109191894531, -0.041113853454589844, -0.038936614990234375, -0.036759376525878906, -0.03458213806152344, -0.03240489959716797, -0.0302276611328125, -0.02805042266845703, -0.025873184204101562, -0.023695945739746094, -0.021518707275390625, -0.019341468811035156, -0.017164230346679688, -0.014986991882324219, -0.01280975341796875, -0.010632514953613281, -0.008455276489257812, -0.006278038024902344, -0.004100799560546875, -0.0019235610961914062, 0.0002536773681640625, 0.0024309158325195312, 0.004608154296875, 0.006785392761230469, 0.008962631225585938, 0.011139869689941406, 0.013317108154296875, 0.015494346618652344, 0.017671585083007812, 0.01984882354736328, 0.02202606201171875, 0.02420330047607422, 0.026380538940429688, 0.028557777404785156, 0.030735015869140625, 0.032912254333496094, 0.03508949279785156, 0.03726673126220703, 0.0394439697265625, 0.04162120819091797, 0.04379844665527344, 0.045975685119628906, 0.048152923583984375, 0.050330162048339844, 0.05250740051269531, 0.05468463897705078, 0.05686187744140625, 0.05903911590576172, 0.06121635437011719, 0.06339359283447266, 0.06557083129882812, 0.0677480697631836, 0.06992530822753906, 0.07210254669189453, 0.07427978515625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 5.0, 5.0, 9.0, 7.0, 9.0, 7.0, 15.0, 19.0, 36.0, 64.0, 225.0, 1051.0, 18215.0, 1016282.0, 11348.0, 886.0, 161.0, 66.0, 42.0, 13.0, 14.0, 13.0, 11.0, 11.0, 2.0, 5.0, 4.0, 4.0, 2.0, 3.0, 7.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97412109375, -0.9386215209960938, -0.9031219482421875, -0.8676223754882812, -0.832122802734375, -0.7966232299804688, -0.7611236572265625, -0.7256240844726562, -0.69012451171875, -0.6546249389648438, -0.6191253662109375, -0.5836257934570312, -0.548126220703125, -0.5126266479492188, -0.4771270751953125, -0.44162750244140625, -0.4061279296875, -0.37062835693359375, -0.3351287841796875, -0.29962921142578125, -0.264129638671875, -0.22863006591796875, -0.1931304931640625, -0.15763092041015625, -0.12213134765625, -0.08663177490234375, -0.0511322021484375, -0.01563262939453125, 0.019866943359375, 0.05536651611328125, 0.0908660888671875, 0.12636566162109375, 0.161865234375, 0.19736480712890625, 0.2328643798828125, 0.26836395263671875, 0.303863525390625, 0.33936309814453125, 0.3748626708984375, 0.41036224365234375, 0.44586181640625, 0.48136138916015625, 0.5168609619140625, 0.5523605346679688, 0.587860107421875, 0.6233596801757812, 0.6588592529296875, 0.6943588256835938, 0.7298583984375, 0.7653579711914062, 0.8008575439453125, 0.8363571166992188, 0.871856689453125, 0.9073562622070312, 0.9428558349609375, 0.9783554077148438, 1.01385498046875, 1.0493545532226562, 1.0848541259765625, 1.1203536987304688, 1.155853271484375, 1.1913528442382812, 1.2268524169921875, 1.2623519897460938, 1.2978515625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 12.0, 9.0, 11.0, 7.0, 18.0, 15.0, 24.0, 29.0, 44.0, 65.0, 70.0, 102.0, 205.0, 110.0, 71.0, 50.0, 39.0, 22.0, 11.0, 11.0, 22.0, 6.0, 12.0, 5.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004734039306640625, -0.004578769207000732, -0.00442349910736084, -0.004268229007720947, -0.004112958908081055, -0.003957688808441162, -0.0038024187088012695, -0.003647148609161377, -0.0034918785095214844, -0.003336608409881592, -0.0031813383102416992, -0.0030260682106018066, -0.002870798110961914, -0.0027155280113220215, -0.002560257911682129, -0.0024049878120422363, -0.0022497177124023438, -0.002094447612762451, -0.0019391775131225586, -0.001783907413482666, -0.0016286373138427734, -0.0014733672142028809, -0.0013180971145629883, -0.0011628270149230957, -0.0010075569152832031, -0.0008522868156433105, -0.000697016716003418, -0.0005417466163635254, -0.0003864765167236328, -0.00023120641708374023, -7.593631744384766e-05, 7.933378219604492e-05, 0.0002346038818359375, 0.0003898739814758301, 0.0005451440811157227, 0.0007004141807556152, 0.0008556842803955078, 0.0010109543800354004, 0.001166224479675293, 0.0013214945793151855, 0.0014767646789550781, 0.0016320347785949707, 0.0017873048782348633, 0.0019425749778747559, 0.0020978450775146484, 0.002253115177154541, 0.0024083852767944336, 0.002563655376434326, 0.0027189254760742188, 0.0028741955757141113, 0.003029465675354004, 0.0031847357749938965, 0.003340005874633789, 0.0034952759742736816, 0.0036505460739135742, 0.003805816173553467, 0.003961086273193359, 0.004116356372833252, 0.0042716264724731445, 0.004426896572113037, 0.00458216667175293, 0.004737436771392822, 0.004892706871032715, 0.005047976970672607, 0.0052032470703125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 4.0, 5.0, 17.0, 28.0, 87.0, 683.0, 94379.0, 952049.0, 1089.0, 121.0, 33.0, 14.0, 9.0, 4.0, 6.0, 5.0, 1.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5234375, -2.4571685791015625, -2.390899658203125, -2.3246307373046875, -2.25836181640625, -2.1920928955078125, -2.125823974609375, -2.0595550537109375, -1.9932861328125, -1.9270172119140625, -1.860748291015625, -1.7944793701171875, -1.72821044921875, -1.6619415283203125, -1.595672607421875, -1.5294036865234375, -1.463134765625, -1.3968658447265625, -1.330596923828125, -1.2643280029296875, -1.19805908203125, -1.1317901611328125, -1.065521240234375, -0.9992523193359375, -0.9329833984375, -0.8667144775390625, -0.800445556640625, -0.7341766357421875, -0.66790771484375, -0.6016387939453125, -0.535369873046875, -0.4691009521484375, -0.40283203125, -0.3365631103515625, -0.270294189453125, -0.2040252685546875, -0.13775634765625, -0.0714874267578125, -0.005218505859375, 0.0610504150390625, 0.1273193359375, 0.1935882568359375, 0.259857177734375, 0.3261260986328125, 0.39239501953125, 0.4586639404296875, 0.524932861328125, 0.5912017822265625, 0.657470703125, 0.7237396240234375, 0.790008544921875, 0.8562774658203125, 0.92254638671875, 0.9888153076171875, 1.055084228515625, 1.1213531494140625, 1.1876220703125, 1.2538909912109375, 1.320159912109375, 1.3864288330078125, 1.45269775390625, 1.5189666748046875, 1.585235595703125, 1.6515045166015625, 1.7177734375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 13.0, 10.0, 19.0, 11.0, 32.0, 39.0, 65.0, 137.0, 355.0, 103.0, 58.0, 39.0, 26.0, 19.0, 13.0, 15.0, 9.0, 6.0, 3.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1580810546875, -0.15373897552490234, -0.1493968963623047, -0.14505481719970703, -0.14071273803710938, -0.13637065887451172, -0.13202857971191406, -0.1276865005493164, -0.12334442138671875, -0.1190023422241211, -0.11466026306152344, -0.11031818389892578, -0.10597610473632812, -0.10163402557373047, -0.09729194641113281, -0.09294986724853516, -0.0886077880859375, -0.08426570892333984, -0.07992362976074219, -0.07558155059814453, -0.07123947143554688, -0.06689739227294922, -0.06255531311035156, -0.058213233947753906, -0.05387115478515625, -0.049529075622558594, -0.04518699645996094, -0.04084491729736328, -0.036502838134765625, -0.03216075897216797, -0.027818679809570312, -0.023476600646972656, -0.019134521484375, -0.014792442321777344, -0.010450363159179688, -0.006108283996582031, -0.001766204833984375, 0.0025758743286132812, 0.0069179534912109375, 0.011260032653808594, 0.01560211181640625, 0.019944190979003906, 0.024286270141601562, 0.02862834930419922, 0.032970428466796875, 0.03731250762939453, 0.04165458679199219, 0.045996665954589844, 0.0503387451171875, 0.054680824279785156, 0.05902290344238281, 0.06336498260498047, 0.06770706176757812, 0.07204914093017578, 0.07639122009277344, 0.0807332992553711, 0.08507537841796875, 0.0894174575805664, 0.09375953674316406, 0.09810161590576172, 0.10244369506835938, 0.10678577423095703, 0.11112785339355469, 0.11546993255615234, 0.11981201171875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 7.0, 11.0, 23.0, 81.0, 249.0, 315.0, 182.0, 66.0, 26.0, 16.0, 11.0, 5.0, 2.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.1726813316345215, -2.114391803741455, -2.0561022758483887, -1.9978127479553223, -1.9395233392715454, -1.881233811378479, -1.8229442834854126, -1.7646547555923462, -1.7063653469085693, -1.648075819015503, -1.5897862911224365, -1.5314967632293701, -1.4732073545455933, -1.4149178266525269, -1.3566282987594604, -1.298338770866394, -1.2400492429733276, -1.1817597150802612, -1.1234701871871948, -1.065180778503418, -1.0068912506103516, -0.9486017227172852, -0.8903121948242188, -0.8320226669311523, -0.7737331986427307, -0.7154436707496643, -0.6571542024612427, -0.5988646745681763, -0.5405751466751099, -0.48228567838668823, -0.4239961504936218, -0.3657066524028778, -0.30741703510284424, -0.24912753701210022, -0.190838024020195, -0.1325485110282898, -0.07425901293754578, -0.015969514846801758, 0.04232001304626465, 0.10060951113700867, 0.15889900922775269, 0.2171885073184967, 0.2754780054092407, 0.33376753330230713, 0.39205703139305115, 0.45034652948379517, 0.5086360573768616, 0.5669255256652832, 0.6252150535583496, 0.683504581451416, 0.7417940497398376, 0.800083577632904, 0.8583730459213257, 0.9166625738143921, 0.9749521017074585, 1.033241629600525, 1.0915310382843018, 1.1498205661773682, 1.2081100940704346, 1.266399621963501, 1.3246890306472778, 1.3829785585403442, 1.4412680864334106, 1.499557614326477, 1.5578471422195435]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 7.0, 2.0, 12.0, 17.0, 23.0, 29.0, 46.0, 54.0, 69.0, 72.0, 99.0, 94.0, 96.0, 86.0, 80.0, 82.0, 37.0, 23.0, 23.0, 19.0, 15.0, 5.0, 6.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0650171041488647, -1.0389881134033203, -1.0129590034484863, -0.9869300127029419, -0.9609009623527527, -0.9348719120025635, -0.908842921257019, -0.8828138709068298, -0.8567848205566406, -0.8307557702064514, -0.8047267198562622, -0.7786977291107178, -0.7526686787605286, -0.7266396284103394, -0.7006106376647949, -0.6745815873146057, -0.6485525369644165, -0.6225234866142273, -0.5964944362640381, -0.5704654455184937, -0.5444363951683044, -0.5184073448181152, -0.4923783242702484, -0.4663493037223816, -0.4403202533721924, -0.4142912030220032, -0.38826218247413635, -0.36223316192626953, -0.3362041115760803, -0.3101750612258911, -0.2841460406780243, -0.25811702013015747, -0.2320879101753235, -0.20605887472629547, -0.18002983927726746, -0.15400080382823944, -0.12797176837921143, -0.10194273293018341, -0.0759136974811554, -0.04988466203212738, -0.023855626583099365, 0.00217340886592865, 0.028202444314956665, 0.05423147976398468, 0.0802605152130127, 0.10628955066204071, 0.13231858611106873, 0.15834762156009674, 0.18437665700912476, 0.21040569245815277, 0.2364347279071808, 0.2624637484550476, 0.2884927988052368, 0.314521849155426, 0.34055086970329285, 0.36657989025115967, 0.3926089406013489, 0.4186379909515381, 0.4446670114994049, 0.47069603204727173, 0.49672508239746094, 0.5227541327476501, 0.5487831830978394, 0.5748121738433838, 0.600841224193573]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 2.0, 6.0, 6.0, 4.0, 10.0, 8.0, 6.0, 6.0, 10.0, 10.0, 24.0, 24.0, 42.0, 62.0, 118.0, 195.0, 332.0, 4191941.0, 853.0, 246.0, 127.0, 72.0, 42.0, 22.0, 18.0, 14.0, 14.0, 8.0, 10.0, 9.0, 9.0, 6.0, 14.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0], "bins": [-12.7890625, -12.3714599609375, -11.953857421875, -11.5362548828125, -11.11865234375, -10.7010498046875, -10.283447265625, -9.8658447265625, -9.4482421875, -9.0306396484375, -8.613037109375, -8.1954345703125, -7.77783203125, -7.3602294921875, -6.942626953125, -6.5250244140625, -6.107421875, -5.6898193359375, -5.272216796875, -4.8546142578125, -4.43701171875, -4.0194091796875, -3.601806640625, -3.1842041015625, -2.7666015625, -2.3489990234375, -1.931396484375, -1.5137939453125, -1.09619140625, -0.6785888671875, -0.260986328125, 0.1566162109375, 0.57421875, 0.9918212890625, 1.409423828125, 1.8270263671875, 2.24462890625, 2.6622314453125, 3.079833984375, 3.4974365234375, 3.9150390625, 4.3326416015625, 4.750244140625, 5.1678466796875, 5.58544921875, 6.0030517578125, 6.420654296875, 6.8382568359375, 7.255859375, 7.6734619140625, 8.091064453125, 8.5086669921875, 8.92626953125, 9.3438720703125, 9.761474609375, 10.1790771484375, 10.5966796875, 11.0142822265625, 11.431884765625, 11.8494873046875, 12.26708984375, 12.6846923828125, 13.102294921875, 13.5198974609375, 13.9375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 4.0, 3.0, 6.0, 5.0, 9.0, 4.0, 15.0, 30.0, 62.0, 110.0, 168.0, 167.0, 170.0, 111.0, 63.0, 36.0, 17.0, 17.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014495849609375, -0.013496875762939453, -0.012497901916503906, -0.01149892807006836, -0.010499954223632812, -0.009500980377197266, -0.008502006530761719, -0.007503032684326172, -0.006504058837890625, -0.005505084991455078, -0.004506111145019531, -0.0035071372985839844, -0.0025081634521484375, -0.0015091896057128906, -0.0005102157592773438, 0.0004887580871582031, 0.00148773193359375, 0.002486705780029297, 0.0034856796264648438, 0.004484653472900391, 0.0054836273193359375, 0.006482601165771484, 0.007481575012207031, 0.008480548858642578, 0.009479522705078125, 0.010478496551513672, 0.011477470397949219, 0.012476444244384766, 0.013475418090820312, 0.01447439193725586, 0.015473365783691406, 0.016472339630126953, 0.0174713134765625, 0.018470287322998047, 0.019469261169433594, 0.02046823501586914, 0.021467208862304688, 0.022466182708740234, 0.02346515655517578, 0.024464130401611328, 0.025463104248046875, 0.026462078094482422, 0.02746105194091797, 0.028460025787353516, 0.029458999633789062, 0.03045797348022461, 0.031456947326660156, 0.0324559211730957, 0.03345489501953125, 0.0344538688659668, 0.035452842712402344, 0.03645181655883789, 0.03745079040527344, 0.038449764251708984, 0.03944873809814453, 0.04044771194458008, 0.041446685791015625, 0.04244565963745117, 0.04344463348388672, 0.044443607330322266, 0.04544258117675781, 0.04644155502319336, 0.047440528869628906, 0.04843950271606445, 0.0494384765625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 42.0, 335.0, 4099352.0, 94415.0, 131.0, 14.0, 4.0], "bins": [-44.90625, -44.15753173828125, -43.4088134765625, -42.66009521484375, -41.911376953125, -41.16265869140625, -40.4139404296875, -39.66522216796875, -38.91650390625, -38.16778564453125, -37.4190673828125, -36.67034912109375, -35.921630859375, -35.17291259765625, -34.4241943359375, -33.67547607421875, -32.9267578125, -32.17803955078125, -31.4293212890625, -30.68060302734375, -29.931884765625, -29.18316650390625, -28.4344482421875, -27.68572998046875, -26.93701171875, -26.18829345703125, -25.4395751953125, -24.69085693359375, -23.942138671875, -23.19342041015625, -22.4447021484375, -21.69598388671875, -20.947265625, -20.19854736328125, -19.4498291015625, -18.70111083984375, -17.952392578125, -17.20367431640625, -16.4549560546875, -15.70623779296875, -14.95751953125, -14.20880126953125, -13.4600830078125, -12.71136474609375, -11.962646484375, -11.21392822265625, -10.4652099609375, -9.71649169921875, -8.9677734375, -8.21905517578125, -7.4703369140625, -6.72161865234375, -5.972900390625, -5.22418212890625, -4.4754638671875, -3.72674560546875, -2.97802734375, -2.22930908203125, -1.4805908203125, -0.73187255859375, 0.016845703125, 0.76556396484375, 1.5142822265625, 2.26300048828125, 3.01171875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 19.0, 50.0, 161.0, 451.0, 2756.0, 482.0, 99.0, 37.0, 20.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.341552734375, -0.3350648880004883, -0.32857704162597656, -0.32208919525146484, -0.3156013488769531, -0.3091135025024414, -0.3026256561279297, -0.29613780975341797, -0.28964996337890625, -0.28316211700439453, -0.2766742706298828, -0.2701864242553711, -0.2636985778808594, -0.25721073150634766, -0.25072288513183594, -0.24423503875732422, -0.2377471923828125, -0.23125934600830078, -0.22477149963378906, -0.21828365325927734, -0.21179580688476562, -0.2053079605102539, -0.1988201141357422, -0.19233226776123047, -0.18584442138671875, -0.17935657501220703, -0.1728687286376953, -0.1663808822631836, -0.15989303588867188, -0.15340518951416016, -0.14691734313964844, -0.14042949676513672, -0.133941650390625, -0.12745380401611328, -0.12096595764160156, -0.11447811126708984, -0.10799026489257812, -0.1015024185180664, -0.09501457214355469, -0.08852672576904297, -0.08203887939453125, -0.07555103302001953, -0.06906318664550781, -0.0625753402709961, -0.056087493896484375, -0.049599647521972656, -0.04311180114746094, -0.03662395477294922, -0.0301361083984375, -0.02364826202392578, -0.017160415649414062, -0.010672569274902344, -0.004184722900390625, 0.0023031234741210938, 0.008790969848632812, 0.015278816223144531, 0.02176666259765625, 0.02825450897216797, 0.03474235534667969, 0.041230201721191406, 0.047718048095703125, 0.054205894470214844, 0.06069374084472656, 0.06718158721923828, 0.07366943359375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 12.0, 1006.0, 2.0], "bins": [-109.62127685546875, -107.8634033203125, -106.10552215576172, -104.34764862060547, -102.58976745605469, -100.83189392089844, -99.07401275634766, -97.3161392211914, -95.55825805664062, -93.80038452148438, -92.0425033569336, -90.28462982177734, -88.52674865722656, -86.76887512207031, -85.01099395751953, -83.25312042236328, -81.49524688720703, -79.73737335205078, -77.9794921875, -76.22161865234375, -74.46373748779297, -72.70586395263672, -70.94798278808594, -69.19010925292969, -67.4322280883789, -65.67435455322266, -63.916473388671875, -62.15859603881836, -60.400718688964844, -58.642845153808594, -56.88496398925781, -55.12709045410156, -53.36921310424805, -51.61133575439453, -49.853458404541016, -48.0955810546875, -46.337703704833984, -44.57982635498047, -42.82195281982422, -41.0640754699707, -39.30619430541992, -37.548316955566406, -35.79043960571289, -34.032562255859375, -32.27468490600586, -30.516809463500977, -28.75893211364746, -27.001056671142578, -25.243179321289062, -23.485301971435547, -21.72742462158203, -19.969547271728516, -18.211671829223633, -16.453794479370117, -14.695917129516602, -12.938040733337402, -11.180164337158203, -9.422286987304688, -7.664410591125488, -5.906533241271973, -4.148656368255615, -2.390779495239258, -0.6329021453857422, 1.124974250793457, 2.882852077484131]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 12.0, 28.0, 53.0, 133.0, 187.0, 229.0, 160.0, 119.0, 55.0, 21.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.178565979003906, -7.032254695892334, -6.8859429359436035, -6.739631652832031, -6.593319892883301, -6.4470086097717285, -6.300697326660156, -6.154385566711426, -6.0080742835998535, -5.861763000488281, -5.715451240539551, -5.5691399574279785, -5.422828197479248, -5.276516914367676, -5.130205154418945, -4.983893871307373, -4.837582588195801, -4.6912713050842285, -4.544959545135498, -4.398648262023926, -4.252336502075195, -4.106025218963623, -3.9597136974334717, -3.8134021759033203, -3.66709041595459, -3.5207788944244385, -3.374467372894287, -3.228156089782715, -3.0818445682525635, -2.935533046722412, -2.7892215251922607, -2.6429100036621094, -2.496598482131958, -2.3502869606018066, -2.2039754390716553, -2.057663917541504, -1.9113526344299316, -1.7650411128997803, -1.618729591369629, -1.472418189048767, -1.3261066675186157, -1.1797951459884644, -1.0334837436676025, -0.8871722221374512, -0.7408607602119446, -0.594549298286438, -0.4482377767562866, -0.3019263744354248, -0.15561485290527344, -0.009303376078605652, 0.13700810074806213, 0.2833195924758911, 0.4296310544013977, 0.5759425163269043, 0.7222540378570557, 0.8685654401779175, 1.0148769617080688, 1.1611884832382202, 1.307499885559082, 1.4538114070892334, 1.6001229286193848, 1.7464343309402466, 1.892745852470398, 2.0390572547912598, 2.185368776321411]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 9.0, 12.0, 13.0, 15.0, 15.0, 22.0, 31.0, 29.0, 40.0, 36.0, 44.0, 61.0, 79.0, 153.0, 462.0, 1027689.0, 19128.0, 220.0, 109.0, 73.0, 49.0, 36.0, 36.0, 27.0, 18.0, 22.0, 16.0, 16.0, 17.0, 15.0, 8.0, 11.0, 11.0, 4.0, 4.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.96240234375, -11.5732421875, -11.18408203125, -10.794921875, -10.40576171875, -10.0166015625, -9.62744140625, -9.23828125, -8.84912109375, -8.4599609375, -8.07080078125, -7.681640625, -7.29248046875, -6.9033203125, -6.51416015625, -6.125, -5.73583984375, -5.3466796875, -4.95751953125, -4.568359375, -4.17919921875, -3.7900390625, -3.40087890625, -3.01171875, -2.62255859375, -2.2333984375, -1.84423828125, -1.455078125, -1.06591796875, -0.6767578125, -0.28759765625, 0.1015625, 0.49072265625, 0.8798828125, 1.26904296875, 1.658203125, 2.04736328125, 2.4365234375, 2.82568359375, 3.21484375, 3.60400390625, 3.9931640625, 4.38232421875, 4.771484375, 5.16064453125, 5.5498046875, 5.93896484375, 6.328125, 6.71728515625, 7.1064453125, 7.49560546875, 7.884765625, 8.27392578125, 8.6630859375, 9.05224609375, 9.44140625, 9.83056640625, 10.2197265625, 10.60888671875, 10.998046875, 11.38720703125, 11.7763671875, 12.16552734375, 12.5546875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 39.0, 181.0, 381.0, 306.0, 94.0, 17.0], "bins": [-1.0869140625, -1.0690064430236816, -1.0510988235473633, -1.033191204071045, -1.0152835845947266, -0.9973759651184082, -0.9794683456420898, -0.9615607261657715, -0.9436531066894531, -0.9257454872131348, -0.9078378677368164, -0.889930248260498, -0.8720226287841797, -0.8541150093078613, -0.836207389831543, -0.8182997703552246, -0.8003921508789062, -0.7824845314025879, -0.7645769119262695, -0.7466692924499512, -0.7287616729736328, -0.7108540534973145, -0.6929464340209961, -0.6750388145446777, -0.6571311950683594, -0.639223575592041, -0.6213159561157227, -0.6034083366394043, -0.5855007171630859, -0.5675930976867676, -0.5496854782104492, -0.5317778587341309, -0.5138702392578125, -0.49596261978149414, -0.4780550003051758, -0.4601473808288574, -0.44223976135253906, -0.4243321418762207, -0.40642452239990234, -0.388516902923584, -0.3706092834472656, -0.35270166397094727, -0.3347940444946289, -0.31688642501831055, -0.2989788055419922, -0.28107118606567383, -0.26316356658935547, -0.2452559471130371, -0.22734832763671875, -0.2094407081604004, -0.19153308868408203, -0.17362546920776367, -0.1557178497314453, -0.13781023025512695, -0.1199026107788086, -0.10199499130249023, -0.08408737182617188, -0.06617975234985352, -0.048272132873535156, -0.030364513397216797, -0.012456893920898438, 0.005450725555419922, 0.02335834503173828, 0.04126596450805664, 0.059173583984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 7.0, 4.0, 6.0, 15.0, 14.0, 23.0, 23.0, 41.0, 55.0, 95.0, 164.0, 388.0, 866.0, 2712.0, 10308.0, 56147.0, 584154.0, 343709.0, 38338.0, 7683.0, 2272.0, 764.0, 324.0, 141.0, 96.0, 61.0, 51.0, 25.0, 8.0, 11.0, 10.0, 14.0, 8.0, 6.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.70703125, -3.5787353515625, -3.450439453125, -3.3221435546875, -3.19384765625, -3.0655517578125, -2.937255859375, -2.8089599609375, -2.6806640625, -2.5523681640625, -2.424072265625, -2.2957763671875, -2.16748046875, -2.0391845703125, -1.910888671875, -1.7825927734375, -1.654296875, -1.5260009765625, -1.397705078125, -1.2694091796875, -1.14111328125, -1.0128173828125, -0.884521484375, -0.7562255859375, -0.6279296875, -0.4996337890625, -0.371337890625, -0.2430419921875, -0.11474609375, 0.0135498046875, 0.141845703125, 0.2701416015625, 0.3984375, 0.5267333984375, 0.655029296875, 0.7833251953125, 0.91162109375, 1.0399169921875, 1.168212890625, 1.2965087890625, 1.4248046875, 1.5531005859375, 1.681396484375, 1.8096923828125, 1.93798828125, 2.0662841796875, 2.194580078125, 2.3228759765625, 2.451171875, 2.5794677734375, 2.707763671875, 2.8360595703125, 2.96435546875, 3.0926513671875, 3.220947265625, 3.3492431640625, 3.4775390625, 3.6058349609375, 3.734130859375, 3.8624267578125, 3.99072265625, 4.1190185546875, 4.247314453125, 4.3756103515625, 4.50390625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 11.0, 7.0, 10.0, 19.0, 17.0, 19.0, 25.0, 29.0, 20.0, 36.0, 35.0, 41.0, 55.0, 47.0, 51.0, 62.0, 52.0, 45.0, 42.0, 50.0, 35.0, 52.0, 45.0, 28.0, 32.0, 29.0, 15.0, 13.0, 14.0, 13.0, 13.0, 11.0, 4.0, 3.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8681640625, -0.8350982666015625, -0.802032470703125, -0.7689666748046875, -0.73590087890625, -0.7028350830078125, -0.669769287109375, -0.6367034912109375, -0.6036376953125, -0.5705718994140625, -0.537506103515625, -0.5044403076171875, -0.47137451171875, -0.4383087158203125, -0.405242919921875, -0.3721771240234375, -0.339111328125, -0.3060455322265625, -0.272979736328125, -0.2399139404296875, -0.20684814453125, -0.1737823486328125, -0.140716552734375, -0.1076507568359375, -0.0745849609375, -0.0415191650390625, -0.008453369140625, 0.0246124267578125, 0.05767822265625, 0.0907440185546875, 0.123809814453125, 0.1568756103515625, 0.18994140625, 0.2230072021484375, 0.256072998046875, 0.2891387939453125, 0.32220458984375, 0.3552703857421875, 0.388336181640625, 0.4214019775390625, 0.4544677734375, 0.4875335693359375, 0.520599365234375, 0.5536651611328125, 0.58673095703125, 0.6197967529296875, 0.652862548828125, 0.6859283447265625, 0.718994140625, 0.7520599365234375, 0.785125732421875, 0.8181915283203125, 0.85125732421875, 0.8843231201171875, 0.917388916015625, 0.9504547119140625, 0.9835205078125, 1.0165863037109375, 1.049652099609375, 1.0827178955078125, 1.11578369140625, 1.1488494873046875, 1.181915283203125, 1.2149810791015625, 1.248046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 10.0, 7.0, 7.0, 21.0, 23.0, 34.0, 66.0, 112.0, 190.0, 454.0, 1012.0, 2854.0, 10570.0, 77706.0, 844869.0, 93586.0, 11817.0, 3113.0, 1127.0, 466.0, 219.0, 112.0, 60.0, 44.0, 30.0, 16.0, 6.0, 5.0, 7.0, 2.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09765625, -2.992767333984375, -2.88787841796875, -2.782989501953125, -2.6781005859375, -2.573211669921875, -2.46832275390625, -2.363433837890625, -2.258544921875, -2.153656005859375, -2.04876708984375, -1.943878173828125, -1.8389892578125, -1.734100341796875, -1.62921142578125, -1.524322509765625, -1.41943359375, -1.314544677734375, -1.20965576171875, -1.104766845703125, -0.9998779296875, -0.894989013671875, -0.79010009765625, -0.685211181640625, -0.580322265625, -0.475433349609375, -0.37054443359375, -0.265655517578125, -0.1607666015625, -0.055877685546875, 0.04901123046875, 0.153900146484375, 0.2587890625, 0.363677978515625, 0.46856689453125, 0.573455810546875, 0.6783447265625, 0.783233642578125, 0.88812255859375, 0.993011474609375, 1.097900390625, 1.202789306640625, 1.30767822265625, 1.412567138671875, 1.5174560546875, 1.622344970703125, 1.72723388671875, 1.832122802734375, 1.93701171875, 2.041900634765625, 2.14678955078125, 2.251678466796875, 2.3565673828125, 2.461456298828125, 2.56634521484375, 2.671234130859375, 2.776123046875, 2.881011962890625, 2.98590087890625, 3.090789794921875, 3.1956787109375, 3.300567626953125, 3.40545654296875, 3.510345458984375, 3.615234375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 3.0, 3.0, 9.0, 7.0, 7.0, 16.0, 18.0, 18.0, 19.0, 41.0, 49.0, 92.0, 129.0, 181.0, 109.0, 87.0, 50.0, 30.0, 26.0, 17.0, 20.0, 4.0, 10.0, 9.0, 8.0, 7.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0008754730224609375, -0.0008520856499671936, -0.0008286982774734497, -0.0008053109049797058, -0.0007819235324859619, -0.000758536159992218, -0.0007351487874984741, -0.0007117614150047302, -0.0006883740425109863, -0.0006649866700172424, -0.0006415992975234985, -0.0006182119250297546, -0.0005948245525360107, -0.0005714371800422668, -0.000548049807548523, -0.000524662435054779, -0.0005012750625610352, -0.00047788769006729126, -0.00045450031757354736, -0.00043111294507980347, -0.00040772557258605957, -0.0003843382000923157, -0.0003609508275985718, -0.0003375634551048279, -0.000314176082611084, -0.0002907887101173401, -0.0002674013376235962, -0.0002440139651298523, -0.0002206265926361084, -0.0001972392201423645, -0.0001738518476486206, -0.0001504644751548767, -0.0001270771026611328, -0.00010368973016738892, -8.030235767364502e-05, -5.691498517990112e-05, -3.3527612686157227e-05, -1.014024019241333e-05, 1.3247132301330566e-05, 3.663450479507446e-05, 6.002187728881836e-05, 8.340924978256226e-05, 0.00010679662227630615, 0.00013018399477005005, 0.00015357136726379395, 0.00017695873975753784, 0.00020034611225128174, 0.00022373348474502563, 0.00024712085723876953, 0.00027050822973251343, 0.0002938956022262573, 0.0003172829747200012, 0.0003406703472137451, 0.000364057719707489, 0.0003874450922012329, 0.0004108324646949768, 0.0004342198371887207, 0.0004576072096824646, 0.0004809945821762085, 0.0005043819546699524, 0.0005277693271636963, 0.0005511566996574402, 0.0005745440721511841, 0.000597931444644928, 0.0006213188171386719]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 8.0, 17.0, 22.0, 38.0, 48.0, 95.0, 161.0, 265.0, 528.0, 1226.0, 3479.0, 13397.0, 114000.0, 834871.0, 66117.0, 9762.0, 2659.0, 962.0, 390.0, 219.0, 103.0, 55.0, 40.0, 30.0, 14.0, 9.0, 5.0, 6.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.248046875, -3.144622802734375, -3.04119873046875, -2.937774658203125, -2.8343505859375, -2.730926513671875, -2.62750244140625, -2.524078369140625, -2.420654296875, -2.317230224609375, -2.21380615234375, -2.110382080078125, -2.0069580078125, -1.903533935546875, -1.80010986328125, -1.696685791015625, -1.59326171875, -1.489837646484375, -1.38641357421875, -1.282989501953125, -1.1795654296875, -1.076141357421875, -0.97271728515625, -0.869293212890625, -0.765869140625, -0.662445068359375, -0.55902099609375, -0.455596923828125, -0.3521728515625, -0.248748779296875, -0.14532470703125, -0.041900634765625, 0.0615234375, 0.164947509765625, 0.26837158203125, 0.371795654296875, 0.4752197265625, 0.578643798828125, 0.68206787109375, 0.785491943359375, 0.888916015625, 0.992340087890625, 1.09576416015625, 1.199188232421875, 1.3026123046875, 1.406036376953125, 1.50946044921875, 1.612884521484375, 1.71630859375, 1.819732666015625, 1.92315673828125, 2.026580810546875, 2.1300048828125, 2.233428955078125, 2.33685302734375, 2.440277099609375, 2.543701171875, 2.647125244140625, 2.75054931640625, 2.853973388671875, 2.9573974609375, 3.060821533203125, 3.16424560546875, 3.267669677734375, 3.37109375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 3.0, 12.0, 9.0, 21.0, 26.0, 38.0, 39.0, 82.0, 114.0, 136.0, 132.0, 120.0, 80.0, 58.0, 35.0, 22.0, 13.0, 8.0, 6.0, 14.0, 6.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5439453125, -1.5088882446289062, -1.4738311767578125, -1.4387741088867188, -1.403717041015625, -1.3686599731445312, -1.3336029052734375, -1.2985458374023438, -1.26348876953125, -1.2284317016601562, -1.1933746337890625, -1.1583175659179688, -1.123260498046875, -1.0882034301757812, -1.0531463623046875, -1.0180892944335938, -0.9830322265625, -0.9479751586914062, -0.9129180908203125, -0.8778610229492188, -0.842803955078125, -0.8077468872070312, -0.7726898193359375, -0.7376327514648438, -0.70257568359375, -0.6675186157226562, -0.6324615478515625, -0.5974044799804688, -0.562347412109375, -0.5272903442382812, -0.4922332763671875, -0.45717620849609375, -0.422119140625, -0.38706207275390625, -0.3520050048828125, -0.31694793701171875, -0.281890869140625, -0.24683380126953125, -0.2117767333984375, -0.17671966552734375, -0.14166259765625, -0.10660552978515625, -0.0715484619140625, -0.03649139404296875, -0.001434326171875, 0.03362274169921875, 0.0686798095703125, 0.10373687744140625, 0.1387939453125, 0.17385101318359375, 0.2089080810546875, 0.24396514892578125, 0.279022216796875, 0.31407928466796875, 0.3491363525390625, 0.38419342041015625, 0.41925048828125, 0.45430755615234375, 0.4893646240234375, 0.5244216918945312, 0.559478759765625, 0.5945358276367188, 0.6295928955078125, 0.6646499633789062, 0.69970703125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 31.0, 584.0, 367.0, 26.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.187950134277344, -21.119478225708008, -18.051006317138672, -14.982534408569336, -11.9140625, -8.845590591430664, -5.777118682861328, -2.708646774291992, 0.35982513427734375, 3.4282970428466797, 6.496768951416016, 9.565240859985352, 12.633712768554688, 15.702184677124023, 18.77065658569336, 21.839128494262695, 24.90760040283203, 27.976072311401367, 31.044544219970703, 34.113014221191406, 37.181488037109375, 40.249961853027344, 43.31843185424805, 46.38690185546875, 49.45537567138672, 52.52384948730469, 55.59231948852539, 58.660789489746094, 61.72926330566406, 64.79773712158203, 67.8662109375, 70.93467712402344, 74.00315856933594, 77.0716323852539, 80.14010620117188, 83.20857238769531, 86.27704620361328, 89.34552001953125, 92.41398620605469, 95.48246002197266, 98.55093383789062, 101.6194076538086, 104.68788146972656, 107.75634765625, 110.82482147216797, 113.89329528808594, 116.96176147460938, 120.03023529052734, 123.09870910644531, 126.16718292236328, 129.23565673828125, 132.3041229248047, 135.37258911132812, 138.44107055664062, 141.50953674316406, 144.57801818847656, 147.646484375, 150.71495056152344, 153.78343200683594, 156.85189819335938, 159.92037963867188, 162.9888458251953, 166.05731201171875, 169.12579345703125, 172.1942596435547]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 9.0, 16.0, 40.0, 38.0, 66.0, 82.0, 108.0, 124.0, 127.0, 109.0, 109.0, 56.0, 47.0, 36.0, 26.0, 5.0, 9.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6742525100708, -15.137526512145996, -14.600801467895508, -14.064075469970703, -13.527349472045898, -12.99062442779541, -12.453898429870605, -11.917173385620117, -11.380447387695312, -10.843721389770508, -10.30699634552002, -9.770270347595215, -9.233545303344727, -8.696819305419922, -8.160093307495117, -7.623367786407471, -7.086642265319824, -6.549916744232178, -6.013191223144531, -5.476465225219727, -4.93973970413208, -4.403014183044434, -3.866288423538208, -3.3295626640319824, -2.792837142944336, -2.2561116218566895, -1.7193858623504639, -1.1826602220535278, -0.6459345817565918, -0.10920906066894531, 0.4275166988372803, 0.9642424583435059, 1.5009689331054688, 2.0376944541931152, 2.574420213699341, 3.1111459732055664, 3.647871494293213, 4.184597015380859, 4.721323013305664, 5.2580485343933105, 5.794774055480957, 6.3314995765686035, 6.86822509765625, 7.404951095581055, 7.941676616668701, 8.478402137756348, 9.015128135681152, 9.55185317993164, 10.088579177856445, 10.62530517578125, 11.162030220031738, 11.698756217956543, 12.235481262207031, 12.772207260131836, 13.30893325805664, 13.845659255981445, 14.382384300231934, 14.919110298156738, 15.455835342407227, 15.992561340332031, 16.529287338256836, 17.06601333618164, 17.602737426757812, 18.139463424682617, 18.676189422607422]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 8.0, 8.0, 17.0, 21.0, 17.0, 43.0, 100.0, 222.0, 895.0, 4081166.0, 110851.0, 625.0, 147.0, 66.0, 35.0, 25.0, 14.0, 10.0, 5.0, 3.0, 3.0, 3.0], "bins": [-40.5625, -39.7813720703125, -39.000244140625, -38.2191162109375, -37.43798828125, -36.6568603515625, -35.875732421875, -35.0946044921875, -34.3134765625, -33.5323486328125, -32.751220703125, -31.9700927734375, -31.18896484375, -30.4078369140625, -29.626708984375, -28.8455810546875, -28.064453125, -27.2833251953125, -26.502197265625, -25.7210693359375, -24.93994140625, -24.1588134765625, -23.377685546875, -22.5965576171875, -21.8154296875, -21.0343017578125, -20.253173828125, -19.4720458984375, -18.69091796875, -17.9097900390625, -17.128662109375, -16.3475341796875, -15.56640625, -14.7852783203125, -14.004150390625, -13.2230224609375, -12.44189453125, -11.6607666015625, -10.879638671875, -10.0985107421875, -9.3173828125, -8.5362548828125, -7.755126953125, -6.9739990234375, -6.19287109375, -5.4117431640625, -4.630615234375, -3.8494873046875, -3.068359375, -2.2872314453125, -1.506103515625, -0.7249755859375, 0.05615234375, 0.8372802734375, 1.618408203125, 2.3995361328125, 3.1806640625, 3.9617919921875, 4.742919921875, 5.5240478515625, 6.30517578125, 7.0863037109375, 7.867431640625, 8.6485595703125, 9.4296875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 37.0, 91.0, 170.0, 250.0, 259.0, 120.0, 46.0, 22.0, 10.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9814453125, -0.9628334045410156, -0.9442214965820312, -0.9256095886230469, -0.9069976806640625, -0.8883857727050781, -0.8697738647460938, -0.8511619567871094, -0.832550048828125, -0.8139381408691406, -0.7953262329101562, -0.7767143249511719, -0.7581024169921875, -0.7394905090332031, -0.7208786010742188, -0.7022666931152344, -0.68365478515625, -0.6650428771972656, -0.6464309692382812, -0.6278190612792969, -0.6092071533203125, -0.5905952453613281, -0.5719833374023438, -0.5533714294433594, -0.534759521484375, -0.5161476135253906, -0.49753570556640625, -0.4789237976074219, -0.4603118896484375, -0.4416999816894531, -0.42308807373046875, -0.4044761657714844, -0.3858642578125, -0.3672523498535156, -0.34864044189453125, -0.3300285339355469, -0.3114166259765625, -0.2928047180175781, -0.27419281005859375, -0.2555809020996094, -0.236968994140625, -0.21835708618164062, -0.19974517822265625, -0.18113327026367188, -0.1625213623046875, -0.14390945434570312, -0.12529754638671875, -0.10668563842773438, -0.08807373046875, -0.06946182250976562, -0.05084991455078125, -0.032238006591796875, -0.0136260986328125, 0.004985809326171875, 0.02359771728515625, 0.042209625244140625, 0.060821533203125, 0.07943344116210938, 0.09804534912109375, 0.11665725708007812, 0.1352691650390625, 0.15388107299804688, 0.17249298095703125, 0.19110488891601562, 0.209716796875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 16.0, 23.0, 53.0, 87.0, 116.0, 144.0, 211.0, 373.0, 84068.0, 4108263.0, 440.0, 200.0, 124.0, 79.0, 33.0, 30.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.65625, -59.14306640625, -57.6298828125, -56.11669921875, -54.603515625, -53.09033203125, -51.5771484375, -50.06396484375, -48.55078125, -47.03759765625, -45.5244140625, -44.01123046875, -42.498046875, -40.98486328125, -39.4716796875, -37.95849609375, -36.4453125, -34.93212890625, -33.4189453125, -31.90576171875, -30.392578125, -28.87939453125, -27.3662109375, -25.85302734375, -24.33984375, -22.82666015625, -21.3134765625, -19.80029296875, -18.287109375, -16.77392578125, -15.2607421875, -13.74755859375, -12.234375, -10.72119140625, -9.2080078125, -7.69482421875, -6.181640625, -4.66845703125, -3.1552734375, -1.64208984375, -0.12890625, 1.38427734375, 2.8974609375, 4.41064453125, 5.923828125, 7.43701171875, 8.9501953125, 10.46337890625, 11.9765625, 13.48974609375, 15.0029296875, 16.51611328125, 18.029296875, 19.54248046875, 21.0556640625, 22.56884765625, 24.08203125, 25.59521484375, 27.1083984375, 28.62158203125, 30.134765625, 31.64794921875, 33.1611328125, 34.67431640625, 36.1875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 12.0, 54.0, 180.0, 3670.0, 150.0, 16.0, 5.0, 4.0], "bins": [-7.6796875, -7.550689697265625, -7.42169189453125, -7.292694091796875, -7.1636962890625, -7.034698486328125, -6.90570068359375, -6.776702880859375, -6.647705078125, -6.518707275390625, -6.38970947265625, -6.260711669921875, -6.1317138671875, -6.002716064453125, -5.87371826171875, -5.744720458984375, -5.61572265625, -5.486724853515625, -5.35772705078125, -5.228729248046875, -5.0997314453125, -4.970733642578125, -4.84173583984375, -4.712738037109375, -4.583740234375, -4.454742431640625, -4.32574462890625, -4.196746826171875, -4.0677490234375, -3.938751220703125, -3.80975341796875, -3.680755615234375, -3.5517578125, -3.422760009765625, -3.29376220703125, -3.164764404296875, -3.0357666015625, -2.906768798828125, -2.77777099609375, -2.648773193359375, -2.519775390625, -2.390777587890625, -2.26177978515625, -2.132781982421875, -2.0037841796875, -1.874786376953125, -1.74578857421875, -1.616790771484375, -1.48779296875, -1.358795166015625, -1.22979736328125, -1.100799560546875, -0.9718017578125, -0.842803955078125, -0.71380615234375, -0.584808349609375, -0.455810546875, -0.326812744140625, -0.19781494140625, -0.068817138671875, 0.0601806640625, 0.189178466796875, 0.31817626953125, 0.447174072265625, 0.576171875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 56.0, 807.0, 134.0, 12.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-140.2589874267578, -137.78521728515625, -135.3114471435547, -132.83767700195312, -130.36390686035156, -127.89014434814453, -125.41637420654297, -122.94261169433594, -120.46884155273438, -117.99507141113281, -115.52130126953125, -113.04753875732422, -110.57376861572266, -108.0999984741211, -105.62622833251953, -103.1524658203125, -100.67869567871094, -98.20492553710938, -95.73115539550781, -93.25739288330078, -90.78362274169922, -88.30985260009766, -85.8360824584961, -83.36231994628906, -80.88854217529297, -78.4147720336914, -75.94100189208984, -73.46723937988281, -70.99346923828125, -68.51969909667969, -66.04592895507812, -63.57216262817383, -61.098392486572266, -58.6246223449707, -56.150856018066406, -53.677085876464844, -51.20331954956055, -48.729549407958984, -46.25578308105469, -43.782012939453125, -41.30824279785156, -38.83447265625, -36.3607063293457, -33.88693618774414, -31.413169860839844, -28.93939971923828, -26.46563148498535, -23.991863250732422, -21.518096923828125, -19.044328689575195, -16.570560455322266, -14.09679126739502, -11.62302303314209, -9.14925479888916, -6.675485610961914, -4.201717376708984, -1.7279491424560547, 0.7458193302154541, 3.219587802886963, 5.693356513977051, 8.16712474822998, 10.64089298248291, 13.114662170410156, 15.588430404663086, 18.062198638916016]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 17.0, 22.0, 59.0, 91.0, 132.0, 161.0, 173.0, 126.0, 103.0, 68.0, 27.0, 13.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.814254760742188, -16.145212173461914, -15.476170539855957, -14.80712890625, -14.138087272644043, -13.469045639038086, -12.800003051757812, -12.130961418151855, -11.461919784545898, -10.792878150939941, -10.123835563659668, -9.454793930053711, -8.785752296447754, -8.116710662841797, -7.447668075561523, -6.778626441955566, -6.109583854675293, -5.440541744232178, -4.771500110626221, -4.1024580001831055, -3.4334161281585693, -2.764374256134033, -2.095332145690918, -1.426290512084961, -0.7572484016418457, -0.0882064700126648, 0.5808354616165161, 1.2498774528503418, 1.918919324874878, 2.587961196899414, 3.2570033073425293, 3.9260449409484863, 4.595087051391602, 5.264129161834717, 5.933170795440674, 6.602212905883789, 7.271254539489746, 7.940296649932861, 8.609338760375977, 9.278380393981934, 9.94742202758789, 10.616463661193848, 11.285506248474121, 11.954547882080078, 12.623589515686035, 13.292631149291992, 13.961673736572266, 14.630715370178223, 15.299757957458496, 15.968799591064453, 16.637842178344727, 17.306884765625, 17.97592544555664, 18.644968032836914, 19.314010620117188, 19.983051300048828, 20.6520938873291, 21.321136474609375, 21.990177154541016, 22.65921974182129, 23.328262329101562, 23.997303009033203, 24.666345596313477, 25.33538818359375, 26.00442886352539]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 4.0, 13.0, 12.0, 12.0, 14.0, 24.0, 36.0, 37.0, 59.0, 117.0, 219.0, 595.0, 2701.0, 49254.0, 959354.0, 32637.0, 2372.0, 568.0, 195.0, 93.0, 64.0, 45.0, 34.0, 20.0, 16.0, 16.0, 14.0, 9.0, 6.0, 2.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.5546875, -15.0753173828125, -14.595947265625, -14.1165771484375, -13.63720703125, -13.1578369140625, -12.678466796875, -12.1990966796875, -11.7197265625, -11.2403564453125, -10.760986328125, -10.2816162109375, -9.80224609375, -9.3228759765625, -8.843505859375, -8.3641357421875, -7.884765625, -7.4053955078125, -6.926025390625, -6.4466552734375, -5.96728515625, -5.4879150390625, -5.008544921875, -4.5291748046875, -4.0498046875, -3.5704345703125, -3.091064453125, -2.6116943359375, -2.13232421875, -1.6529541015625, -1.173583984375, -0.6942138671875, -0.21484375, 0.2645263671875, 0.743896484375, 1.2232666015625, 1.70263671875, 2.1820068359375, 2.661376953125, 3.1407470703125, 3.6201171875, 4.0994873046875, 4.578857421875, 5.0582275390625, 5.53759765625, 6.0169677734375, 6.496337890625, 6.9757080078125, 7.455078125, 7.9344482421875, 8.413818359375, 8.8931884765625, 9.37255859375, 9.8519287109375, 10.331298828125, 10.8106689453125, 11.2900390625, 11.7694091796875, 12.248779296875, 12.7281494140625, 13.20751953125, 13.6868896484375, 14.166259765625, 14.6456298828125, 15.125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 11.0, 27.0, 52.0, 82.0, 100.0, 156.0, 190.0, 142.0, 97.0, 72.0, 40.0, 18.0, 9.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3369140625, -1.3080062866210938, -1.2790985107421875, -1.2501907348632812, -1.221282958984375, -1.1923751831054688, -1.1634674072265625, -1.1345596313476562, -1.10565185546875, -1.0767440795898438, -1.0478363037109375, -1.0189285278320312, -0.990020751953125, -0.9611129760742188, -0.9322052001953125, -0.9032974243164062, -0.8743896484375, -0.8454818725585938, -0.8165740966796875, -0.7876663208007812, -0.758758544921875, -0.7298507690429688, -0.7009429931640625, -0.6720352172851562, -0.64312744140625, -0.6142196655273438, -0.5853118896484375, -0.5564041137695312, -0.527496337890625, -0.49858856201171875, -0.4696807861328125, -0.44077301025390625, -0.411865234375, -0.38295745849609375, -0.3540496826171875, -0.32514190673828125, -0.296234130859375, -0.26732635498046875, -0.2384185791015625, -0.20951080322265625, -0.18060302734375, -0.15169525146484375, -0.1227874755859375, -0.09387969970703125, -0.064971923828125, -0.03606414794921875, -0.0071563720703125, 0.02175140380859375, 0.0506591796875, 0.07956695556640625, 0.1084747314453125, 0.13738250732421875, 0.166290283203125, 0.19519805908203125, 0.2241058349609375, 0.25301361083984375, 0.28192138671875, 0.31082916259765625, 0.3397369384765625, 0.36864471435546875, 0.397552490234375, 0.42646026611328125, 0.4553680419921875, 0.48427581787109375, 0.51318359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 12.0, 11.0, 13.0, 21.0, 34.0, 41.0, 74.0, 104.0, 175.0, 357.0, 774.0, 1979.0, 7204.0, 47429.0, 584461.0, 366611.0, 30941.0, 5345.0, 1600.0, 599.0, 303.0, 172.0, 96.0, 71.0, 44.0, 20.0, 15.0, 13.0, 12.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-6.71484375, -6.542236328125, -6.36962890625, -6.197021484375, -6.0244140625, -5.851806640625, -5.67919921875, -5.506591796875, -5.333984375, -5.161376953125, -4.98876953125, -4.816162109375, -4.6435546875, -4.470947265625, -4.29833984375, -4.125732421875, -3.953125, -3.780517578125, -3.60791015625, -3.435302734375, -3.2626953125, -3.090087890625, -2.91748046875, -2.744873046875, -2.572265625, -2.399658203125, -2.22705078125, -2.054443359375, -1.8818359375, -1.709228515625, -1.53662109375, -1.364013671875, -1.19140625, -1.018798828125, -0.84619140625, -0.673583984375, -0.5009765625, -0.328369140625, -0.15576171875, 0.016845703125, 0.189453125, 0.362060546875, 0.53466796875, 0.707275390625, 0.8798828125, 1.052490234375, 1.22509765625, 1.397705078125, 1.5703125, 1.742919921875, 1.91552734375, 2.088134765625, 2.2607421875, 2.433349609375, 2.60595703125, 2.778564453125, 2.951171875, 3.123779296875, 3.29638671875, 3.468994140625, 3.6416015625, 3.814208984375, 3.98681640625, 4.159423828125, 4.33203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 11.0, 12.0, 18.0, 21.0, 25.0, 32.0, 35.0, 47.0, 34.0, 45.0, 62.0, 63.0, 55.0, 72.0, 58.0, 53.0, 55.0, 44.0, 50.0, 32.0, 33.0, 23.0, 22.0, 28.0, 11.0, 11.0, 7.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0], "bins": [-2.431640625, -2.36859130859375, -2.3055419921875, -2.24249267578125, -2.179443359375, -2.11639404296875, -2.0533447265625, -1.99029541015625, -1.92724609375, -1.86419677734375, -1.8011474609375, -1.73809814453125, -1.675048828125, -1.61199951171875, -1.5489501953125, -1.48590087890625, -1.4228515625, -1.35980224609375, -1.2967529296875, -1.23370361328125, -1.170654296875, -1.10760498046875, -1.0445556640625, -0.98150634765625, -0.91845703125, -0.85540771484375, -0.7923583984375, -0.72930908203125, -0.666259765625, -0.60321044921875, -0.5401611328125, -0.47711181640625, -0.4140625, -0.35101318359375, -0.2879638671875, -0.22491455078125, -0.161865234375, -0.09881591796875, -0.0357666015625, 0.02728271484375, 0.09033203125, 0.15338134765625, 0.2164306640625, 0.27947998046875, 0.342529296875, 0.40557861328125, 0.4686279296875, 0.53167724609375, 0.5947265625, 0.65777587890625, 0.7208251953125, 0.78387451171875, 0.846923828125, 0.90997314453125, 0.9730224609375, 1.03607177734375, 1.09912109375, 1.16217041015625, 1.2252197265625, 1.28826904296875, 1.351318359375, 1.41436767578125, 1.4774169921875, 1.54046630859375, 1.603515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 9.0, 14.0, 20.0, 15.0, 34.0, 41.0, 66.0, 111.0, 209.0, 306.0, 631.0, 1349.0, 3543.0, 11289.0, 59407.0, 663406.0, 268889.0, 27996.0, 6677.0, 2415.0, 986.0, 474.0, 267.0, 133.0, 83.0, 63.0, 31.0, 29.0, 13.0, 12.0, 9.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.662109375, -3.559814453125, -3.45751953125, -3.355224609375, -3.2529296875, -3.150634765625, -3.04833984375, -2.946044921875, -2.84375, -2.741455078125, -2.63916015625, -2.536865234375, -2.4345703125, -2.332275390625, -2.22998046875, -2.127685546875, -2.025390625, -1.923095703125, -1.82080078125, -1.718505859375, -1.6162109375, -1.513916015625, -1.41162109375, -1.309326171875, -1.20703125, -1.104736328125, -1.00244140625, -0.900146484375, -0.7978515625, -0.695556640625, -0.59326171875, -0.490966796875, -0.388671875, -0.286376953125, -0.18408203125, -0.081787109375, 0.0205078125, 0.122802734375, 0.22509765625, 0.327392578125, 0.4296875, 0.531982421875, 0.63427734375, 0.736572265625, 0.8388671875, 0.941162109375, 1.04345703125, 1.145751953125, 1.248046875, 1.350341796875, 1.45263671875, 1.554931640625, 1.6572265625, 1.759521484375, 1.86181640625, 1.964111328125, 2.06640625, 2.168701171875, 2.27099609375, 2.373291015625, 2.4755859375, 2.577880859375, 2.68017578125, 2.782470703125, 2.884765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 6.0, 7.0, 9.0, 14.0, 15.0, 22.0, 21.0, 37.0, 33.0, 54.0, 77.0, 72.0, 92.0, 110.0, 79.0, 82.0, 60.0, 51.0, 43.0, 27.0, 24.0, 12.0, 17.0, 10.0, 6.0, 10.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000545501708984375, -0.0005295723676681519, -0.0005136430263519287, -0.0004977136850357056, -0.0004817843437194824, -0.0004658550024032593, -0.00044992566108703613, -0.000433996319770813, -0.00041806697845458984, -0.0004021376371383667, -0.00038620829582214355, -0.0003702789545059204, -0.00035434961318969727, -0.0003384202718734741, -0.000322490930557251, -0.00030656158924102783, -0.0002906322479248047, -0.00027470290660858154, -0.0002587735652923584, -0.00024284422397613525, -0.0002269148826599121, -0.00021098554134368896, -0.00019505620002746582, -0.00017912685871124268, -0.00016319751739501953, -0.0001472681760787964, -0.00013133883476257324, -0.0001154094934463501, -9.948015213012695e-05, -8.355081081390381e-05, -6.762146949768066e-05, -5.169212818145752e-05, -3.5762786865234375e-05, -1.983344554901123e-05, -3.904104232788086e-06, 1.2025237083435059e-05, 2.7954578399658203e-05, 4.388391971588135e-05, 5.981326103210449e-05, 7.574260234832764e-05, 9.167194366455078e-05, 0.00010760128498077393, 0.00012353062629699707, 0.00013945996761322021, 0.00015538930892944336, 0.0001713186502456665, 0.00018724799156188965, 0.0002031773328781128, 0.00021910667419433594, 0.00023503601551055908, 0.0002509653568267822, 0.00026689469814300537, 0.0002828240394592285, 0.00029875338077545166, 0.0003146827220916748, 0.00033061206340789795, 0.0003465414047241211, 0.00036247074604034424, 0.0003784000873565674, 0.00039432942867279053, 0.00041025876998901367, 0.0004261881113052368, 0.00044211745262145996, 0.0004580467939376831, 0.00047397613525390625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 13.0, 10.0, 25.0, 34.0, 74.0, 136.0, 252.0, 674.0, 2756.0, 27436.0, 854885.0, 153448.0, 6751.0, 1277.0, 400.0, 173.0, 87.0, 57.0, 24.0, 16.0, 11.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.859375, -4.6959228515625, -4.532470703125, -4.3690185546875, -4.20556640625, -4.0421142578125, -3.878662109375, -3.7152099609375, -3.5517578125, -3.3883056640625, -3.224853515625, -3.0614013671875, -2.89794921875, -2.7344970703125, -2.571044921875, -2.4075927734375, -2.244140625, -2.0806884765625, -1.917236328125, -1.7537841796875, -1.59033203125, -1.4268798828125, -1.263427734375, -1.0999755859375, -0.9365234375, -0.7730712890625, -0.609619140625, -0.4461669921875, -0.28271484375, -0.1192626953125, 0.044189453125, 0.2076416015625, 0.37109375, 0.5345458984375, 0.697998046875, 0.8614501953125, 1.02490234375, 1.1883544921875, 1.351806640625, 1.5152587890625, 1.6787109375, 1.8421630859375, 2.005615234375, 2.1690673828125, 2.33251953125, 2.4959716796875, 2.659423828125, 2.8228759765625, 2.986328125, 3.1497802734375, 3.313232421875, 3.4766845703125, 3.64013671875, 3.8035888671875, 3.967041015625, 4.1304931640625, 4.2939453125, 4.4573974609375, 4.620849609375, 4.7843017578125, 4.94775390625, 5.1112060546875, 5.274658203125, 5.4381103515625, 5.6015625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 6.0, 5.0, 7.0, 9.0, 10.0, 18.0, 24.0, 34.0, 26.0, 51.0, 60.0, 74.0, 69.0, 83.0, 99.0, 81.0, 71.0, 60.0, 51.0, 42.0, 25.0, 12.0, 18.0, 9.0, 12.0, 11.0, 7.0, 7.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86376953125, -0.8319778442382812, -0.8001861572265625, -0.7683944702148438, -0.736602783203125, -0.7048110961914062, -0.6730194091796875, -0.6412277221679688, -0.60943603515625, -0.5776443481445312, -0.5458526611328125, -0.5140609741210938, -0.482269287109375, -0.45047760009765625, -0.4186859130859375, -0.38689422607421875, -0.3551025390625, -0.32331085205078125, -0.2915191650390625, -0.25972747802734375, -0.227935791015625, -0.19614410400390625, -0.1643524169921875, -0.13256072998046875, -0.10076904296875, -0.06897735595703125, -0.0371856689453125, -0.00539398193359375, 0.026397705078125, 0.05818939208984375, 0.0899810791015625, 0.12177276611328125, 0.153564453125, 0.18535614013671875, 0.2171478271484375, 0.24893951416015625, 0.280731201171875, 0.31252288818359375, 0.3443145751953125, 0.37610626220703125, 0.40789794921875, 0.43968963623046875, 0.4714813232421875, 0.5032730102539062, 0.535064697265625, 0.5668563842773438, 0.5986480712890625, 0.6304397583007812, 0.6622314453125, 0.6940231323242188, 0.7258148193359375, 0.7576065063476562, 0.789398193359375, 0.8211898803710938, 0.8529815673828125, 0.8847732543945312, 0.91656494140625, 0.9483566284179688, 0.9801483154296875, 1.0119400024414062, 1.043731689453125, 1.0755233764648438, 1.1073150634765625, 1.1391067504882812, 1.1708984375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 17.0, 407.0, 520.0, 61.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.073455810546875, -16.70117950439453, -13.32890510559082, -9.956629753112793, -6.584354400634766, -3.212078094482422, 0.16019630432128906, 3.532470703125, 6.904747009277344, 10.277022361755371, 13.649297714233398, 17.02157211303711, 20.393848419189453, 23.766124725341797, 27.138399124145508, 30.51067352294922, 33.88294982910156, 37.255226135253906, 40.62750244140625, 43.99977493286133, 47.37205123901367, 50.744327545166016, 54.116600036621094, 57.48887634277344, 60.86115264892578, 64.23342895507812, 67.60570526123047, 70.97798156738281, 74.35025024414062, 77.7225341796875, 81.09480285644531, 84.46707916259766, 87.83935546875, 91.21163177490234, 94.58390808105469, 97.95618438720703, 101.32846069335938, 104.70072937011719, 108.07300567626953, 111.44528198242188, 114.81755828857422, 118.18983459472656, 121.5621109008789, 124.93438720703125, 128.30665588378906, 131.67893981933594, 135.05120849609375, 138.42349243164062, 141.79576110839844, 145.16802978515625, 148.54031372070312, 151.91258239746094, 155.2848663330078, 158.65713500976562, 162.0294189453125, 165.4016876220703, 168.77395629882812, 172.14622497558594, 175.5185089111328, 178.89077758789062, 182.2630615234375, 185.6353302001953, 189.0076141357422, 192.3798828125, 195.75216674804688]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 8.0, 6.0, 11.0, 27.0, 26.0, 36.0, 49.0, 64.0, 62.0, 86.0, 110.0, 74.0, 85.0, 92.0, 71.0, 55.0, 38.0, 39.0, 22.0, 16.0, 8.0, 12.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.214298248291016, -20.613985061645508, -20.013671875, -19.413358688354492, -18.813045501708984, -18.212730407714844, -17.61241912841797, -17.012104034423828, -16.41179084777832, -15.811477661132812, -15.211164474487305, -14.610851287841797, -14.010537147521973, -13.410223960876465, -12.809910774230957, -12.209596633911133, -11.609284400939941, -11.008971214294434, -10.408658027648926, -9.808343887329102, -9.208030700683594, -8.607717514038086, -8.007404327392578, -7.407090663909912, -6.806777477264404, -6.2064642906188965, -5.6061506271362305, -5.005837440490723, -4.405524253845215, -3.805210590362549, -3.204897403717041, -2.604583740234375, -2.004270553588867, -1.4039571285247803, -0.8036438226699829, -0.20333051681518555, 0.39698290824890137, 0.9972963333129883, 1.597609519958496, 2.197923183441162, 2.79823637008667, 3.398549795150757, 3.9988632202148438, 4.599176406860352, 5.199489593505859, 5.799803256988525, 6.400116443634033, 7.000430107116699, 7.600743293762207, 8.201056480407715, 8.801369667053223, 9.401683807373047, 10.001996994018555, 10.602310180664062, 11.20262336730957, 11.802936553955078, 12.403249740600586, 13.003562927246094, 13.603876113891602, 14.20418930053711, 14.804503440856934, 15.404816627502441, 16.005130767822266, 16.605443954467773, 17.20575714111328]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 7.0, 18.0, 26.0, 60.0, 131.0, 267.0, 1351.0, 248051.0, 3942685.0, 1349.0, 174.0, 77.0, 37.0, 21.0, 10.0, 8.0, 2.0, 3.0], "bins": [-36.1875, -35.51837158203125, -34.8492431640625, -34.18011474609375, -33.510986328125, -32.84185791015625, -32.1727294921875, -31.50360107421875, -30.83447265625, -30.16534423828125, -29.4962158203125, -28.82708740234375, -28.157958984375, -27.48883056640625, -26.8197021484375, -26.15057373046875, -25.4814453125, -24.81231689453125, -24.1431884765625, -23.47406005859375, -22.804931640625, -22.13580322265625, -21.4666748046875, -20.79754638671875, -20.12841796875, -19.45928955078125, -18.7901611328125, -18.12103271484375, -17.451904296875, -16.78277587890625, -16.1136474609375, -15.44451904296875, -14.775390625, -14.10626220703125, -13.4371337890625, -12.76800537109375, -12.098876953125, -11.42974853515625, -10.7606201171875, -10.09149169921875, -9.42236328125, -8.75323486328125, -8.0841064453125, -7.41497802734375, -6.745849609375, -6.07672119140625, -5.4075927734375, -4.73846435546875, -4.0693359375, -3.40020751953125, -2.7310791015625, -2.06195068359375, -1.392822265625, -0.72369384765625, -0.0545654296875, 0.61456298828125, 1.28369140625, 1.95281982421875, 2.6219482421875, 3.29107666015625, 3.960205078125, 4.62933349609375, 5.2984619140625, 5.96759033203125, 6.63671875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 11.0, 10.0, 24.0, 38.0, 70.0, 86.0, 101.0, 120.0, 136.0, 136.0, 100.0, 71.0, 30.0, 32.0, 15.0, 9.0, 8.0, 4.0, 1.0, 1.0, 3.0], "bins": [-1.26171875, -1.23699951171875, -1.2122802734375, -1.18756103515625, -1.162841796875, -1.13812255859375, -1.1134033203125, -1.08868408203125, -1.06396484375, -1.03924560546875, -1.0145263671875, -0.98980712890625, -0.965087890625, -0.94036865234375, -0.9156494140625, -0.89093017578125, -0.8662109375, -0.84149169921875, -0.8167724609375, -0.79205322265625, -0.767333984375, -0.74261474609375, -0.7178955078125, -0.69317626953125, -0.66845703125, -0.64373779296875, -0.6190185546875, -0.59429931640625, -0.569580078125, -0.54486083984375, -0.5201416015625, -0.49542236328125, -0.470703125, -0.44598388671875, -0.4212646484375, -0.39654541015625, -0.371826171875, -0.34710693359375, -0.3223876953125, -0.29766845703125, -0.27294921875, -0.24822998046875, -0.2235107421875, -0.19879150390625, -0.174072265625, -0.14935302734375, -0.1246337890625, -0.09991455078125, -0.0751953125, -0.05047607421875, -0.0257568359375, -0.00103759765625, 0.023681640625, 0.04840087890625, 0.0731201171875, 0.09783935546875, 0.12255859375, 0.14727783203125, 0.1719970703125, 0.19671630859375, 0.221435546875, 0.24615478515625, 0.2708740234375, 0.29559326171875, 0.3203125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 7.0, 14.0, 44.0, 56.0, 89.0, 139.0, 223.0, 938.0, 4191601.0, 686.0, 232.0, 137.0, 70.0, 28.0, 16.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.375, -94.255859375, -92.13671875, -90.017578125, -87.8984375, -85.779296875, -83.66015625, -81.541015625, -79.421875, -77.302734375, -75.18359375, -73.064453125, -70.9453125, -68.826171875, -66.70703125, -64.587890625, -62.46875, -60.349609375, -58.23046875, -56.111328125, -53.9921875, -51.873046875, -49.75390625, -47.634765625, -45.515625, -43.396484375, -41.27734375, -39.158203125, -37.0390625, -34.919921875, -32.80078125, -30.681640625, -28.5625, -26.443359375, -24.32421875, -22.205078125, -20.0859375, -17.966796875, -15.84765625, -13.728515625, -11.609375, -9.490234375, -7.37109375, -5.251953125, -3.1328125, -1.013671875, 1.10546875, 3.224609375, 5.34375, 7.462890625, 9.58203125, 11.701171875, 13.8203125, 15.939453125, 18.05859375, 20.177734375, 22.296875, 24.416015625, 26.53515625, 28.654296875, 30.7734375, 32.892578125, 35.01171875, 37.130859375, 39.25]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 14.0, 241.0, 3783.0, 46.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4765625, -12.19500732421875, -11.9134521484375, -11.63189697265625, -11.350341796875, -11.06878662109375, -10.7872314453125, -10.50567626953125, -10.22412109375, -9.94256591796875, -9.6610107421875, -9.37945556640625, -9.097900390625, -8.81634521484375, -8.5347900390625, -8.25323486328125, -7.9716796875, -7.69012451171875, -7.4085693359375, -7.12701416015625, -6.845458984375, -6.56390380859375, -6.2823486328125, -6.00079345703125, -5.71923828125, -5.43768310546875, -5.1561279296875, -4.87457275390625, -4.593017578125, -4.31146240234375, -4.0299072265625, -3.74835205078125, -3.466796875, -3.18524169921875, -2.9036865234375, -2.62213134765625, -2.340576171875, -2.05902099609375, -1.7774658203125, -1.49591064453125, -1.21435546875, -0.93280029296875, -0.6512451171875, -0.36968994140625, -0.088134765625, 0.19342041015625, 0.4749755859375, 0.75653076171875, 1.0380859375, 1.31964111328125, 1.6011962890625, 1.88275146484375, 2.164306640625, 2.44586181640625, 2.7274169921875, 3.00897216796875, 3.29052734375, 3.57208251953125, 3.8536376953125, 4.13519287109375, 4.416748046875, 4.69830322265625, 4.9798583984375, 5.26141357421875, 5.54296875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 40.0, 529.0, 411.0, 19.0, 4.0, 3.0, 1.0], "bins": [-146.26087951660156, -143.78219604492188, -141.30352783203125, -138.82484436035156, -136.34616088867188, -133.86749267578125, -131.38880920410156, -128.91012573242188, -126.43145751953125, -123.9527816772461, -121.4740982055664, -118.99542236328125, -116.5167465209961, -114.03807067871094, -111.55938720703125, -109.0807113647461, -106.6020278930664, -104.12335205078125, -101.64466857910156, -99.1659927368164, -96.68731689453125, -94.20863342285156, -91.7299575805664, -89.25128173828125, -86.77259826660156, -84.2939224243164, -81.81523895263672, -79.33656311035156, -76.8578872680664, -74.37921142578125, -71.90052795410156, -69.4218521118164, -66.94317626953125, -64.4645004272461, -61.98582077026367, -59.50714111328125, -57.028465270996094, -54.54978561401367, -52.07110595703125, -49.592430114746094, -47.113746643066406, -44.635066986083984, -42.15639114379883, -39.677711486816406, -37.19903564453125, -34.72035598754883, -32.241676330566406, -29.762998580932617, -27.28432273864746, -24.805644989013672, -22.32696533203125, -19.84828758239746, -17.369609832763672, -14.890932083129883, -12.412253379821777, -9.933574676513672, -7.454896926879883, -4.9762187004089355, -2.4975404739379883, -0.018862247467041016, 2.4598159790039062, 4.938493728637695, 7.417172431945801, 9.895851135253906, 12.374528884887695]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 10.0, 4.0, 11.0, 29.0, 23.0, 48.0, 68.0, 67.0, 78.0, 100.0, 107.0, 88.0, 70.0, 79.0, 59.0, 52.0, 41.0, 25.0, 13.0, 11.0, 8.0, 7.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.27396011352539, -15.76771354675293, -15.261466979980469, -14.755220413208008, -14.248973846435547, -13.742727279663086, -13.236481666564941, -12.73023509979248, -12.22398853302002, -11.717741966247559, -11.211495399475098, -10.705248832702637, -10.199003219604492, -9.692756652832031, -9.18651008605957, -8.68026351928711, -8.174016952514648, -7.6677703857421875, -7.161523818969727, -6.655277729034424, -6.149031162261963, -5.642784595489502, -5.136538505554199, -4.630291938781738, -4.124045372009277, -3.6177988052368164, -3.1115524768829346, -2.6053061485290527, -2.099059581756592, -1.5928130149841309, -1.086566686630249, -0.5803203582763672, -0.07407379150390625, 0.43217265605926514, 0.9384191036224365, 1.444665551185608, 1.9509119987487793, 2.4571585655212402, 2.963404893875122, 3.469651222229004, 3.975897789001465, 4.482144355773926, 4.988390922546387, 5.4946370124816895, 6.00088357925415, 6.507130146026611, 7.013376235961914, 7.519622802734375, 8.025869369506836, 8.532115936279297, 9.038362503051758, 9.544609069824219, 10.05085563659668, 10.55710220336914, 11.063347816467285, 11.569594383239746, 12.075840950012207, 12.582087516784668, 13.088334083557129, 13.59458065032959, 14.100826263427734, 14.607072830200195, 15.113319396972656, 15.619565963745117, 16.125812530517578]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 4.0, 10.0, 11.0, 13.0, 12.0, 19.0, 20.0, 24.0, 40.0, 49.0, 70.0, 114.0, 176.0, 327.0, 732.0, 2356.0, 12645.0, 130048.0, 786680.0, 101110.0, 10477.0, 2129.0, 695.0, 340.0, 149.0, 85.0, 58.0, 41.0, 35.0, 26.0, 18.0, 9.0, 9.0, 4.0, 7.0, 4.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.640625, -9.37615966796875, -9.1116943359375, -8.84722900390625, -8.582763671875, -8.31829833984375, -8.0538330078125, -7.78936767578125, -7.52490234375, -7.26043701171875, -6.9959716796875, -6.73150634765625, -6.467041015625, -6.20257568359375, -5.9381103515625, -5.67364501953125, -5.4091796875, -5.14471435546875, -4.8802490234375, -4.61578369140625, -4.351318359375, -4.08685302734375, -3.8223876953125, -3.55792236328125, -3.29345703125, -3.02899169921875, -2.7645263671875, -2.50006103515625, -2.235595703125, -1.97113037109375, -1.7066650390625, -1.44219970703125, -1.177734375, -0.91326904296875, -0.6488037109375, -0.38433837890625, -0.119873046875, 0.14459228515625, 0.4090576171875, 0.67352294921875, 0.93798828125, 1.20245361328125, 1.4669189453125, 1.73138427734375, 1.995849609375, 2.26031494140625, 2.5247802734375, 2.78924560546875, 3.0537109375, 3.31817626953125, 3.5826416015625, 3.84710693359375, 4.111572265625, 4.37603759765625, 4.6405029296875, 4.90496826171875, 5.16943359375, 5.43389892578125, 5.6983642578125, 5.96282958984375, 6.227294921875, 6.49176025390625, 6.7562255859375, 7.02069091796875, 7.28515625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 8.0, 27.0, 34.0, 44.0, 59.0, 80.0, 84.0, 106.0, 129.0, 114.0, 92.0, 71.0, 51.0, 37.0, 15.0, 26.0, 10.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6455078125, -1.6082534790039062, -1.5709991455078125, -1.5337448120117188, -1.496490478515625, -1.4592361450195312, -1.4219818115234375, -1.3847274780273438, -1.34747314453125, -1.3102188110351562, -1.2729644775390625, -1.2357101440429688, -1.198455810546875, -1.1612014770507812, -1.1239471435546875, -1.0866928100585938, -1.0494384765625, -1.0121841430664062, -0.9749298095703125, -0.9376754760742188, -0.900421142578125, -0.8631668090820312, -0.8259124755859375, -0.7886581420898438, -0.75140380859375, -0.7141494750976562, -0.6768951416015625, -0.6396408081054688, -0.602386474609375, -0.5651321411132812, -0.5278778076171875, -0.49062347412109375, -0.453369140625, -0.41611480712890625, -0.3788604736328125, -0.34160614013671875, -0.304351806640625, -0.26709747314453125, -0.2298431396484375, -0.19258880615234375, -0.15533447265625, -0.11808013916015625, -0.0808258056640625, -0.04357147216796875, -0.006317138671875, 0.03093719482421875, 0.0681915283203125, 0.10544586181640625, 0.1427001953125, 0.17995452880859375, 0.2172088623046875, 0.25446319580078125, 0.291717529296875, 0.32897186279296875, 0.3662261962890625, 0.40348052978515625, 0.44073486328125, 0.47798919677734375, 0.5152435302734375, 0.5524978637695312, 0.589752197265625, 0.6270065307617188, 0.6642608642578125, 0.7015151977539062, 0.73876953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 7.0, 5.0, 13.0, 12.0, 23.0, 23.0, 28.0, 50.0, 69.0, 107.0, 145.0, 224.0, 392.0, 638.0, 1258.0, 2818.0, 7369.0, 24566.0, 117435.0, 547287.0, 276403.0, 48599.0, 12670.0, 4367.0, 1784.0, 873.0, 486.0, 285.0, 166.0, 129.0, 84.0, 55.0, 42.0, 35.0, 29.0, 16.0, 14.0, 9.0, 7.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.76953125, -3.64276123046875, -3.5159912109375, -3.38922119140625, -3.262451171875, -3.13568115234375, -3.0089111328125, -2.88214111328125, -2.75537109375, -2.62860107421875, -2.5018310546875, -2.37506103515625, -2.248291015625, -2.12152099609375, -1.9947509765625, -1.86798095703125, -1.7412109375, -1.61444091796875, -1.4876708984375, -1.36090087890625, -1.234130859375, -1.10736083984375, -0.9805908203125, -0.85382080078125, -0.72705078125, -0.60028076171875, -0.4735107421875, -0.34674072265625, -0.219970703125, -0.09320068359375, 0.0335693359375, 0.16033935546875, 0.287109375, 0.41387939453125, 0.5406494140625, 0.66741943359375, 0.794189453125, 0.92095947265625, 1.0477294921875, 1.17449951171875, 1.30126953125, 1.42803955078125, 1.5548095703125, 1.68157958984375, 1.808349609375, 1.93511962890625, 2.0618896484375, 2.18865966796875, 2.3154296875, 2.44219970703125, 2.5689697265625, 2.69573974609375, 2.822509765625, 2.94927978515625, 3.0760498046875, 3.20281982421875, 3.32958984375, 3.45635986328125, 3.5831298828125, 3.70989990234375, 3.836669921875, 3.96343994140625, 4.0902099609375, 4.21697998046875, 4.34375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 8.0, 3.0, 8.0, 7.0, 13.0, 10.0, 15.0, 20.0, 25.0, 27.0, 27.0, 38.0, 43.0, 42.0, 51.0, 51.0, 54.0, 54.0, 51.0, 52.0, 58.0, 52.0, 48.0, 41.0, 36.0, 37.0, 20.0, 21.0, 11.0, 17.0, 11.0, 11.0, 11.0, 4.0, 6.0, 6.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-3.00390625, -2.9154052734375, -2.826904296875, -2.7384033203125, -2.64990234375, -2.5614013671875, -2.472900390625, -2.3843994140625, -2.2958984375, -2.2073974609375, -2.118896484375, -2.0303955078125, -1.94189453125, -1.8533935546875, -1.764892578125, -1.6763916015625, -1.587890625, -1.4993896484375, -1.410888671875, -1.3223876953125, -1.23388671875, -1.1453857421875, -1.056884765625, -0.9683837890625, -0.8798828125, -0.7913818359375, -0.702880859375, -0.6143798828125, -0.52587890625, -0.4373779296875, -0.348876953125, -0.2603759765625, -0.171875, -0.0833740234375, 0.005126953125, 0.0936279296875, 0.18212890625, 0.2706298828125, 0.359130859375, 0.4476318359375, 0.5361328125, 0.6246337890625, 0.713134765625, 0.8016357421875, 0.89013671875, 0.9786376953125, 1.067138671875, 1.1556396484375, 1.244140625, 1.3326416015625, 1.421142578125, 1.5096435546875, 1.59814453125, 1.6866455078125, 1.775146484375, 1.8636474609375, 1.9521484375, 2.0406494140625, 2.129150390625, 2.2176513671875, 2.30615234375, 2.3946533203125, 2.483154296875, 2.5716552734375, 2.66015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 4.0, 5.0, 8.0, 7.0, 15.0, 18.0, 40.0, 41.0, 81.0, 112.0, 193.0, 261.0, 456.0, 787.0, 1632.0, 3396.0, 8851.0, 27386.0, 151269.0, 677052.0, 136071.0, 25549.0, 8422.0, 3326.0, 1580.0, 824.0, 425.0, 281.0, 159.0, 106.0, 63.0, 37.0, 29.0, 19.0, 10.0, 16.0, 8.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.24609375, -2.169891357421875, -2.09368896484375, -2.017486572265625, -1.9412841796875, -1.865081787109375, -1.78887939453125, -1.712677001953125, -1.636474609375, -1.560272216796875, -1.48406982421875, -1.407867431640625, -1.3316650390625, -1.255462646484375, -1.17926025390625, -1.103057861328125, -1.02685546875, -0.950653076171875, -0.87445068359375, -0.798248291015625, -0.7220458984375, -0.645843505859375, -0.56964111328125, -0.493438720703125, -0.417236328125, -0.341033935546875, -0.26483154296875, -0.188629150390625, -0.1124267578125, -0.036224365234375, 0.03997802734375, 0.116180419921875, 0.1923828125, 0.268585205078125, 0.34478759765625, 0.420989990234375, 0.4971923828125, 0.573394775390625, 0.64959716796875, 0.725799560546875, 0.802001953125, 0.878204345703125, 0.95440673828125, 1.030609130859375, 1.1068115234375, 1.183013916015625, 1.25921630859375, 1.335418701171875, 1.41162109375, 1.487823486328125, 1.56402587890625, 1.640228271484375, 1.7164306640625, 1.792633056640625, 1.86883544921875, 1.945037841796875, 2.021240234375, 2.097442626953125, 2.17364501953125, 2.249847412109375, 2.3260498046875, 2.402252197265625, 2.47845458984375, 2.554656982421875, 2.630859375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 10.0, 12.0, 17.0, 20.0, 18.0, 24.0, 33.0, 36.0, 43.0, 44.0, 61.0, 84.0, 86.0, 84.0, 82.0, 58.0, 52.0, 47.0, 36.0, 36.0, 29.0, 20.0, 18.0, 6.0, 4.0, 9.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000301361083984375, -0.0002925209701061249, -0.00028368085622787476, -0.00027484074234962463, -0.0002660006284713745, -0.0002571605145931244, -0.00024832040071487427, -0.00023948028683662415, -0.00023064017295837402, -0.0002218000590801239, -0.00021295994520187378, -0.00020411983132362366, -0.00019527971744537354, -0.0001864396035671234, -0.0001775994896888733, -0.00016875937581062317, -0.00015991926193237305, -0.00015107914805412292, -0.0001422390341758728, -0.00013339892029762268, -0.00012455880641937256, -0.00011571869254112244, -0.00010687857866287231, -9.803846478462219e-05, -8.919835090637207e-05, -8.035823702812195e-05, -7.151812314987183e-05, -6.26780092716217e-05, -5.383789539337158e-05, -4.499778151512146e-05, -3.615766763687134e-05, -2.7317553758621216e-05, -1.8477439880371094e-05, -9.637326002120972e-06, -7.972121238708496e-07, 8.042901754379272e-06, 1.6883015632629395e-05, 2.5723129510879517e-05, 3.456324338912964e-05, 4.340335726737976e-05, 5.224347114562988e-05, 6.108358502388e-05, 6.992369890213013e-05, 7.876381278038025e-05, 8.760392665863037e-05, 9.644404053688049e-05, 0.00010528415441513062, 0.00011412426829338074, 0.00012296438217163086, 0.00013180449604988098, 0.0001406446099281311, 0.00014948472380638123, 0.00015832483768463135, 0.00016716495156288147, 0.0001760050654411316, 0.00018484517931938171, 0.00019368529319763184, 0.00020252540707588196, 0.00021136552095413208, 0.0002202056348323822, 0.00022904574871063232, 0.00023788586258888245, 0.00024672597646713257, 0.0002555660903453827, 0.0002644062042236328]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 9.0, 20.0, 15.0, 21.0, 33.0, 53.0, 92.0, 145.0, 248.0, 515.0, 1052.0, 2499.0, 7023.0, 34468.0, 771270.0, 207872.0, 15399.0, 4466.0, 1655.0, 781.0, 392.0, 208.0, 107.0, 67.0, 45.0, 25.0, 12.0, 11.0, 12.0, 4.0, 7.0, 7.0, 2.0, 1.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.594482421875, -4.45849609375, -4.322509765625, -4.1865234375, -4.050537109375, -3.91455078125, -3.778564453125, -3.642578125, -3.506591796875, -3.37060546875, -3.234619140625, -3.0986328125, -2.962646484375, -2.82666015625, -2.690673828125, -2.5546875, -2.418701171875, -2.28271484375, -2.146728515625, -2.0107421875, -1.874755859375, -1.73876953125, -1.602783203125, -1.466796875, -1.330810546875, -1.19482421875, -1.058837890625, -0.9228515625, -0.786865234375, -0.65087890625, -0.514892578125, -0.37890625, -0.242919921875, -0.10693359375, 0.029052734375, 0.1650390625, 0.301025390625, 0.43701171875, 0.572998046875, 0.708984375, 0.844970703125, 0.98095703125, 1.116943359375, 1.2529296875, 1.388916015625, 1.52490234375, 1.660888671875, 1.796875, 1.932861328125, 2.06884765625, 2.204833984375, 2.3408203125, 2.476806640625, 2.61279296875, 2.748779296875, 2.884765625, 3.020751953125, 3.15673828125, 3.292724609375, 3.4287109375, 3.564697265625, 3.70068359375, 3.836669921875, 3.97265625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 4.0, 3.0, 11.0, 12.0, 21.0, 21.0, 30.0, 62.0, 127.0, 160.0, 195.0, 127.0, 79.0, 40.0, 19.0, 17.0, 11.0, 9.0, 9.0, 14.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.814453125, -2.734405517578125, -2.65435791015625, -2.574310302734375, -2.4942626953125, -2.414215087890625, -2.33416748046875, -2.254119873046875, -2.174072265625, -2.094024658203125, -2.01397705078125, -1.933929443359375, -1.8538818359375, -1.773834228515625, -1.69378662109375, -1.613739013671875, -1.53369140625, -1.453643798828125, -1.37359619140625, -1.293548583984375, -1.2135009765625, -1.133453369140625, -1.05340576171875, -0.973358154296875, -0.893310546875, -0.813262939453125, -0.73321533203125, -0.653167724609375, -0.5731201171875, -0.493072509765625, -0.41302490234375, -0.332977294921875, -0.2529296875, -0.172882080078125, -0.09283447265625, -0.012786865234375, 0.0672607421875, 0.147308349609375, 0.22735595703125, 0.307403564453125, 0.387451171875, 0.467498779296875, 0.54754638671875, 0.627593994140625, 0.7076416015625, 0.787689208984375, 0.86773681640625, 0.947784423828125, 1.02783203125, 1.107879638671875, 1.18792724609375, 1.267974853515625, 1.3480224609375, 1.428070068359375, 1.50811767578125, 1.588165283203125, 1.668212890625, 1.748260498046875, 1.82830810546875, 1.908355712890625, 1.9884033203125, 2.068450927734375, 2.14849853515625, 2.228546142578125, 2.30859375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 8.0, 12.0, 39.0, 84.0, 167.0, 268.0, 211.0, 113.0, 48.0, 27.0, 14.0, 5.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.89120101928711, -19.774669647216797, -18.658138275146484, -17.54160499572754, -16.425073623657227, -15.308542251586914, -14.192009925842285, -13.075477600097656, -11.958946228027344, -10.842414855957031, -9.725882530212402, -8.609350204467773, -7.492818832397461, -6.37628698348999, -5.2597551345825195, -4.143223285675049, -3.026691436767578, -1.9101595878601074, -0.7936277389526367, 0.322904109954834, 1.4394359588623047, 2.5559678077697754, 3.672499656677246, 4.789031505584717, 5.9055633544921875, 7.022095203399658, 8.138627052307129, 9.255159378051758, 10.37169075012207, 11.488222122192383, 12.604754447937012, 13.72128677368164, 14.837818145751953, 15.954349517822266, 17.070880889892578, 18.187414169311523, 19.303945541381836, 20.42047691345215, 21.537010192871094, 22.653541564941406, 23.77007293701172, 24.88660430908203, 26.003135681152344, 27.11966896057129, 28.2362003326416, 29.352731704711914, 30.46926498413086, 31.585796356201172, 32.702327728271484, 33.8188591003418, 34.93539047241211, 36.05192184448242, 37.16845703125, 38.28498840332031, 39.401519775390625, 40.51805114746094, 41.63458251953125, 42.75111389160156, 43.867645263671875, 44.98417663574219, 46.1007080078125, 47.21724319458008, 48.33377456665039, 49.4503059387207, 50.566837310791016]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 12.0, 8.0, 11.0, 17.0, 15.0, 15.0, 31.0, 24.0, 30.0, 43.0, 34.0, 42.0, 46.0, 44.0, 45.0, 44.0, 45.0, 45.0, 57.0, 35.0, 32.0, 48.0, 46.0, 36.0, 32.0, 24.0, 22.0, 22.0, 21.0, 12.0, 12.0, 8.0, 6.0, 8.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-16.55579948425293, -16.091341018676758, -15.626880645751953, -15.162421226501465, -14.697961807250977, -14.233503341674805, -13.76904296875, -13.304584503173828, -12.84012508392334, -12.375665664672852, -11.911206245422363, -11.446746826171875, -10.982287406921387, -10.517827987670898, -10.053369522094727, -9.588910102844238, -9.12445068359375, -8.659991264343262, -8.195531845092773, -7.731072425842285, -7.266613483428955, -6.802154064178467, -6.3376946449279785, -5.873235702514648, -5.408775329589844, -4.9443159103393555, -4.479856491088867, -4.015397071838379, -3.550938129425049, -3.0864787101745605, -2.6220192909240723, -2.157560110092163, -1.693100929260254, -1.2286416292190552, -0.7641822695732117, -0.29972290992736816, 0.16473639011383057, 0.6291956901550293, 1.0936551094055176, 1.5581142902374268, 2.022573709487915, 2.4870331287384033, 2.9514923095703125, 3.415951728820801, 3.880411148071289, 4.344870567321777, 4.809329986572266, 5.273788928985596, 5.738248348236084, 6.202707767486572, 6.6671671867370605, 7.131626129150391, 7.596085548400879, 8.060544967651367, 8.525004386901855, 8.989463806152344, 9.453923225402832, 9.91838264465332, 10.382842063903809, 10.847301483154297, 11.311760902404785, 11.776220321655273, 12.240678787231445, 12.705138206481934, 13.169597625732422]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 3.0, 6.0, 11.0, 9.0, 12.0, 13.0, 16.0, 30.0, 37.0, 61.0, 125.0, 193.0, 446.0, 957.0, 3049.0, 14967.0, 2951572.0, 1205641.0, 13296.0, 2454.0, 794.0, 305.0, 135.0, 64.0, 30.0, 19.0, 13.0, 7.0, 4.0, 4.0, 1.0, 1.0], "bins": [-13.5234375, -13.247314453125, -12.97119140625, -12.695068359375, -12.4189453125, -12.142822265625, -11.86669921875, -11.590576171875, -11.314453125, -11.038330078125, -10.76220703125, -10.486083984375, -10.2099609375, -9.933837890625, -9.65771484375, -9.381591796875, -9.10546875, -8.829345703125, -8.55322265625, -8.277099609375, -8.0009765625, -7.724853515625, -7.44873046875, -7.172607421875, -6.896484375, -6.620361328125, -6.34423828125, -6.068115234375, -5.7919921875, -5.515869140625, -5.23974609375, -4.963623046875, -4.6875, -4.411376953125, -4.13525390625, -3.859130859375, -3.5830078125, -3.306884765625, -3.03076171875, -2.754638671875, -2.478515625, -2.202392578125, -1.92626953125, -1.650146484375, -1.3740234375, -1.097900390625, -0.82177734375, -0.545654296875, -0.26953125, 0.006591796875, 0.28271484375, 0.558837890625, 0.8349609375, 1.111083984375, 1.38720703125, 1.663330078125, 1.939453125, 2.215576171875, 2.49169921875, 2.767822265625, 3.0439453125, 3.320068359375, 3.59619140625, 3.872314453125, 4.1484375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 10.0, 6.0, 19.0, 22.0, 33.0, 42.0, 64.0, 71.0, 98.0, 87.0, 112.0, 99.0, 84.0, 81.0, 49.0, 38.0, 45.0, 12.0, 15.0, 10.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0], "bins": [-1.61328125, -1.5776519775390625, -1.542022705078125, -1.5063934326171875, -1.47076416015625, -1.4351348876953125, -1.399505615234375, -1.3638763427734375, -1.3282470703125, -1.2926177978515625, -1.256988525390625, -1.2213592529296875, -1.18572998046875, -1.1501007080078125, -1.114471435546875, -1.0788421630859375, -1.043212890625, -1.0075836181640625, -0.971954345703125, -0.9363250732421875, -0.90069580078125, -0.8650665283203125, -0.829437255859375, -0.7938079833984375, -0.7581787109375, -0.7225494384765625, -0.686920166015625, -0.6512908935546875, -0.61566162109375, -0.5800323486328125, -0.544403076171875, -0.5087738037109375, -0.47314453125, -0.4375152587890625, -0.401885986328125, -0.3662567138671875, -0.33062744140625, -0.2949981689453125, -0.259368896484375, -0.2237396240234375, -0.1881103515625, -0.1524810791015625, -0.116851806640625, -0.0812225341796875, -0.04559326171875, -0.0099639892578125, 0.025665283203125, 0.0612945556640625, 0.096923828125, 0.1325531005859375, 0.168182373046875, 0.2038116455078125, 0.23944091796875, 0.2750701904296875, 0.310699462890625, 0.3463287353515625, 0.3819580078125, 0.4175872802734375, 0.453216552734375, 0.4888458251953125, 0.52447509765625, 0.5601043701171875, 0.595733642578125, 0.6313629150390625, 0.6669921875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 18.0, 17.0, 32.0, 31.0, 40.0, 54.0, 102.0, 636.0, 19626.0, 4170908.0, 2240.0, 218.0, 88.0, 70.0, 63.0, 26.0, 27.0, 28.0, 24.0, 14.0, 9.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6484375, -14.7427978515625, -13.837158203125, -12.9315185546875, -12.02587890625, -11.1202392578125, -10.214599609375, -9.3089599609375, -8.4033203125, -7.4976806640625, -6.592041015625, -5.6864013671875, -4.78076171875, -3.8751220703125, -2.969482421875, -2.0638427734375, -1.158203125, -0.2525634765625, 0.653076171875, 1.5587158203125, 2.46435546875, 3.3699951171875, 4.275634765625, 5.1812744140625, 6.0869140625, 6.9925537109375, 7.898193359375, 8.8038330078125, 9.70947265625, 10.6151123046875, 11.520751953125, 12.4263916015625, 13.33203125, 14.2376708984375, 15.143310546875, 16.0489501953125, 16.95458984375, 17.8602294921875, 18.765869140625, 19.6715087890625, 20.5771484375, 21.4827880859375, 22.388427734375, 23.2940673828125, 24.19970703125, 25.1053466796875, 26.010986328125, 26.9166259765625, 27.822265625, 28.7279052734375, 29.633544921875, 30.5391845703125, 31.44482421875, 32.3504638671875, 33.256103515625, 34.1617431640625, 35.0673828125, 35.9730224609375, 36.878662109375, 37.7843017578125, 38.68994140625, 39.5955810546875, 40.501220703125, 41.4068603515625, 42.3125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 13.0, 53.0, 640.0, 3203.0, 128.0, 30.0, 10.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.76953125, -1.61224365234375, -1.4549560546875, -1.29766845703125, -1.140380859375, -0.98309326171875, -0.8258056640625, -0.66851806640625, -0.51123046875, -0.35394287109375, -0.1966552734375, -0.03936767578125, 0.117919921875, 0.27520751953125, 0.4324951171875, 0.58978271484375, 0.7470703125, 0.90435791015625, 1.0616455078125, 1.21893310546875, 1.376220703125, 1.53350830078125, 1.6907958984375, 1.84808349609375, 2.00537109375, 2.16265869140625, 2.3199462890625, 2.47723388671875, 2.634521484375, 2.79180908203125, 2.9490966796875, 3.10638427734375, 3.263671875, 3.42095947265625, 3.5782470703125, 3.73553466796875, 3.892822265625, 4.05010986328125, 4.2073974609375, 4.36468505859375, 4.52197265625, 4.67926025390625, 4.8365478515625, 4.99383544921875, 5.151123046875, 5.30841064453125, 5.4656982421875, 5.62298583984375, 5.7802734375, 5.93756103515625, 6.0948486328125, 6.25213623046875, 6.409423828125, 6.56671142578125, 6.7239990234375, 6.88128662109375, 7.03857421875, 7.19586181640625, 7.3531494140625, 7.51043701171875, 7.667724609375, 7.82501220703125, 7.9822998046875, 8.13958740234375, 8.296875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 54.0, 424.0, 442.0, 64.0, 9.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.703098773956299, -6.742628574371338, -5.782157897949219, -4.821687698364258, -3.861217498779297, -2.900747299194336, -1.9402766227722168, -0.9798064231872559, -0.019336223602294922, 0.9411340951919556, 1.901604413986206, 2.862074851989746, 3.822545051574707, 4.783015251159668, 5.743485927581787, 6.703956127166748, 7.664426326751709, 8.624897003173828, 9.585367202758789, 10.54583740234375, 11.506307601928711, 12.466777801513672, 13.427248001098633, 14.387718200683594, 15.348188400268555, 16.308658599853516, 17.269128799438477, 18.229598999023438, 19.1900691986084, 20.15053939819336, 21.111011505126953, 22.07147979736328, 23.031951904296875, 23.992422103881836, 24.952892303466797, 25.913362503051758, 26.87383270263672, 27.83430290222168, 28.79477310180664, 29.755245208740234, 30.715713500976562, 31.676183700561523, 32.636653900146484, 33.59712600708008, 34.557594299316406, 35.51806640625, 36.47853469848633, 37.43900680541992, 38.39947509765625, 39.359947204589844, 40.32041549682617, 41.280887603759766, 42.241355895996094, 43.20182800292969, 44.162296295166016, 45.12276840209961, 46.0832405090332, 47.0437126159668, 48.004180908203125, 48.96465301513672, 49.92512130737305, 50.88559341430664, 51.84606170654297, 52.80653381347656, 53.76700210571289]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 17.0, 30.0, 54.0, 95.0, 101.0, 134.0, 144.0, 138.0, 108.0, 68.0, 57.0, 35.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.490209579467773, -11.138142585754395, -10.786075592041016, -10.434008598327637, -10.081941604614258, -9.729874610900879, -9.3778076171875, -9.025740623474121, -8.673673629760742, -8.321606636047363, -7.969539642333984, -7.6174726486206055, -7.265405654907227, -6.913338661193848, -6.561271667480469, -6.20920467376709, -5.857137680053711, -5.505070686340332, -5.153003692626953, -4.800936698913574, -4.448869705200195, -4.096802711486816, -3.7447357177734375, -3.3926687240600586, -3.0406017303466797, -2.688534736633301, -2.336467742919922, -1.984400749206543, -1.632333755493164, -1.2802667617797852, -0.9281997680664062, -0.5761327743530273, -0.22406578063964844, 0.12800121307373047, 0.4800682067871094, 0.8321352005004883, 1.1842021942138672, 1.536269187927246, 1.888336181640625, 2.240403175354004, 2.592470169067383, 2.9445371627807617, 3.2966041564941406, 3.6486711502075195, 4.000738143920898, 4.352805137634277, 4.704872131347656, 5.056939125061035, 5.409006118774414, 5.761073112487793, 6.113140106201172, 6.465207099914551, 6.81727409362793, 7.169341087341309, 7.5214080810546875, 7.873475074768066, 8.225542068481445, 8.577609062194824, 8.929676055908203, 9.281743049621582, 9.633810043334961, 9.98587703704834, 10.337944030761719, 10.690011024475098, 11.042078018188477]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 11.0, 11.0, 17.0, 30.0, 30.0, 50.0, 48.0, 112.0, 215.0, 388.0, 1025.0, 3755.0, 19995.0, 171819.0, 689101.0, 139695.0, 17128.0, 3287.0, 948.0, 367.0, 172.0, 85.0, 72.0, 40.0, 25.0, 22.0, 22.0, 23.0, 12.0, 11.0, 5.0, 8.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.54296875, -5.36676025390625, -5.1905517578125, -5.01434326171875, -4.838134765625, -4.66192626953125, -4.4857177734375, -4.30950927734375, -4.13330078125, -3.95709228515625, -3.7808837890625, -3.60467529296875, -3.428466796875, -3.25225830078125, -3.0760498046875, -2.89984130859375, -2.7236328125, -2.54742431640625, -2.3712158203125, -2.19500732421875, -2.018798828125, -1.84259033203125, -1.6663818359375, -1.49017333984375, -1.31396484375, -1.13775634765625, -0.9615478515625, -0.78533935546875, -0.609130859375, -0.43292236328125, -0.2567138671875, -0.08050537109375, 0.095703125, 0.27191162109375, 0.4481201171875, 0.62432861328125, 0.800537109375, 0.97674560546875, 1.1529541015625, 1.32916259765625, 1.50537109375, 1.68157958984375, 1.8577880859375, 2.03399658203125, 2.210205078125, 2.38641357421875, 2.5626220703125, 2.73883056640625, 2.9150390625, 3.09124755859375, 3.2674560546875, 3.44366455078125, 3.619873046875, 3.79608154296875, 3.9722900390625, 4.14849853515625, 4.32470703125, 4.50091552734375, 4.6771240234375, 4.85333251953125, 5.029541015625, 5.20574951171875, 5.3819580078125, 5.55816650390625, 5.734375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 9.0, 6.0, 8.0, 21.0, 30.0, 36.0, 30.0, 59.0, 63.0, 81.0, 96.0, 96.0, 93.0, 72.0, 80.0, 54.0, 50.0, 34.0, 24.0, 21.0, 20.0, 14.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.296875, -1.2664718627929688, -1.2360687255859375, -1.2056655883789062, -1.175262451171875, -1.1448593139648438, -1.1144561767578125, -1.0840530395507812, -1.05364990234375, -1.0232467651367188, -0.9928436279296875, -0.9624404907226562, -0.932037353515625, -0.9016342163085938, -0.8712310791015625, -0.8408279418945312, -0.8104248046875, -0.7800216674804688, -0.7496185302734375, -0.7192153930664062, -0.688812255859375, -0.6584091186523438, -0.6280059814453125, -0.5976028442382812, -0.56719970703125, -0.5367965698242188, -0.5063934326171875, -0.47599029541015625, -0.445587158203125, -0.41518402099609375, -0.3847808837890625, -0.35437774658203125, -0.323974609375, -0.29357147216796875, -0.2631683349609375, -0.23276519775390625, -0.202362060546875, -0.17195892333984375, -0.1415557861328125, -0.11115264892578125, -0.08074951171875, -0.05034637451171875, -0.0199432373046875, 0.01045989990234375, 0.040863037109375, 0.07126617431640625, 0.1016693115234375, 0.13207244873046875, 0.1624755859375, 0.19287872314453125, 0.2232818603515625, 0.25368499755859375, 0.284088134765625, 0.31449127197265625, 0.3448944091796875, 0.37529754638671875, 0.40570068359375, 0.43610382080078125, 0.4665069580078125, 0.49691009521484375, 0.527313232421875, 0.5577163696289062, 0.5881195068359375, 0.6185226440429688, 0.64892578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 10.0, 11.0, 17.0, 25.0, 31.0, 54.0, 68.0, 100.0, 183.0, 325.0, 602.0, 1334.0, 3651.0, 13952.0, 84529.0, 559329.0, 330038.0, 41595.0, 8155.0, 2414.0, 952.0, 467.0, 258.0, 149.0, 99.0, 67.0, 43.0, 25.0, 22.0, 14.0, 16.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.68157958984375, -4.5389404296875, -4.39630126953125, -4.253662109375, -4.11102294921875, -3.9683837890625, -3.82574462890625, -3.68310546875, -3.54046630859375, -3.3978271484375, -3.25518798828125, -3.112548828125, -2.96990966796875, -2.8272705078125, -2.68463134765625, -2.5419921875, -2.39935302734375, -2.2567138671875, -2.11407470703125, -1.971435546875, -1.82879638671875, -1.6861572265625, -1.54351806640625, -1.40087890625, -1.25823974609375, -1.1156005859375, -0.97296142578125, -0.830322265625, -0.68768310546875, -0.5450439453125, -0.40240478515625, -0.259765625, -0.11712646484375, 0.0255126953125, 0.16815185546875, 0.310791015625, 0.45343017578125, 0.5960693359375, 0.73870849609375, 0.88134765625, 1.02398681640625, 1.1666259765625, 1.30926513671875, 1.451904296875, 1.59454345703125, 1.7371826171875, 1.87982177734375, 2.0224609375, 2.16510009765625, 2.3077392578125, 2.45037841796875, 2.593017578125, 2.73565673828125, 2.8782958984375, 3.02093505859375, 3.16357421875, 3.30621337890625, 3.4488525390625, 3.59149169921875, 3.734130859375, 3.87677001953125, 4.0194091796875, 4.16204833984375, 4.3046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 4.0, 10.0, 10.0, 18.0, 11.0, 19.0, 4.0, 28.0, 28.0, 24.0, 35.0, 43.0, 46.0, 57.0, 45.0, 50.0, 52.0, 50.0, 65.0, 46.0, 55.0, 42.0, 45.0, 31.0, 43.0, 17.0, 26.0, 18.0, 16.0, 9.0, 12.0, 8.0, 8.0, 8.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.626953125, -3.53369140625, -3.4404296875, -3.34716796875, -3.25390625, -3.16064453125, -3.0673828125, -2.97412109375, -2.880859375, -2.78759765625, -2.6943359375, -2.60107421875, -2.5078125, -2.41455078125, -2.3212890625, -2.22802734375, -2.134765625, -2.04150390625, -1.9482421875, -1.85498046875, -1.76171875, -1.66845703125, -1.5751953125, -1.48193359375, -1.388671875, -1.29541015625, -1.2021484375, -1.10888671875, -1.015625, -0.92236328125, -0.8291015625, -0.73583984375, -0.642578125, -0.54931640625, -0.4560546875, -0.36279296875, -0.26953125, -0.17626953125, -0.0830078125, 0.01025390625, 0.103515625, 0.19677734375, 0.2900390625, 0.38330078125, 0.4765625, 0.56982421875, 0.6630859375, 0.75634765625, 0.849609375, 0.94287109375, 1.0361328125, 1.12939453125, 1.22265625, 1.31591796875, 1.4091796875, 1.50244140625, 1.595703125, 1.68896484375, 1.7822265625, 1.87548828125, 1.96875, 2.06201171875, 2.1552734375, 2.24853515625, 2.341796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 12.0, 10.0, 15.0, 23.0, 28.0, 53.0, 68.0, 134.0, 206.0, 332.0, 602.0, 1127.0, 2601.0, 6768.0, 22592.0, 109268.0, 567498.0, 272989.0, 44966.0, 11711.0, 3927.0, 1670.0, 830.0, 405.0, 256.0, 144.0, 109.0, 56.0, 35.0, 26.0, 19.0, 17.0, 12.0, 13.0, 3.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7080078125, -1.6485748291015625, -1.589141845703125, -1.5297088623046875, -1.47027587890625, -1.4108428955078125, -1.351409912109375, -1.2919769287109375, -1.2325439453125, -1.1731109619140625, -1.113677978515625, -1.0542449951171875, -0.99481201171875, -0.9353790283203125, -0.875946044921875, -0.8165130615234375, -0.757080078125, -0.6976470947265625, -0.638214111328125, -0.5787811279296875, -0.51934814453125, -0.4599151611328125, -0.400482177734375, -0.3410491943359375, -0.2816162109375, -0.2221832275390625, -0.162750244140625, -0.1033172607421875, -0.04388427734375, 0.0155487060546875, 0.074981689453125, 0.1344146728515625, 0.19384765625, 0.2532806396484375, 0.312713623046875, 0.3721466064453125, 0.43157958984375, 0.4910125732421875, 0.550445556640625, 0.6098785400390625, 0.6693115234375, 0.7287445068359375, 0.788177490234375, 0.8476104736328125, 0.90704345703125, 0.9664764404296875, 1.025909423828125, 1.0853424072265625, 1.144775390625, 1.2042083740234375, 1.263641357421875, 1.3230743408203125, 1.38250732421875, 1.4419403076171875, 1.501373291015625, 1.5608062744140625, 1.6202392578125, 1.6796722412109375, 1.739105224609375, 1.7985382080078125, 1.85797119140625, 1.9174041748046875, 1.976837158203125, 2.0362701416015625, 2.095703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 2.0, 8.0, 10.0, 13.0, 17.0, 17.0, 18.0, 23.0, 27.0, 41.0, 46.0, 42.0, 51.0, 69.0, 63.0, 53.0, 64.0, 56.0, 55.0, 56.0, 36.0, 34.0, 41.0, 27.0, 18.0, 17.0, 19.0, 14.0, 9.0, 7.0, 8.0, 1.0, 6.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.000156402587890625, -0.0001518838107585907, -0.0001473650336265564, -0.0001428462564945221, -0.0001383274793624878, -0.0001338087022304535, -0.0001292899250984192, -0.0001247711479663849, -0.00012025237083435059, -0.00011573359370231628, -0.00011121481657028198, -0.00010669603943824768, -0.00010217726230621338, -9.765848517417908e-05, -9.313970804214478e-05, -8.862093091011047e-05, -8.410215377807617e-05, -7.958337664604187e-05, -7.506459951400757e-05, -7.054582238197327e-05, -6.602704524993896e-05, -6.150826811790466e-05, -5.698949098587036e-05, -5.247071385383606e-05, -4.795193672180176e-05, -4.3433159589767456e-05, -3.8914382457733154e-05, -3.439560532569885e-05, -2.987682819366455e-05, -2.535805106163025e-05, -2.0839273929595947e-05, -1.6320496797561646e-05, -1.1801719665527344e-05, -7.282942533493042e-06, -2.7641654014587402e-06, 1.7546117305755615e-06, 6.273388862609863e-06, 1.0792165994644165e-05, 1.5310943126678467e-05, 1.982972025871277e-05, 2.434849739074707e-05, 2.8867274522781372e-05, 3.3386051654815674e-05, 3.7904828786849976e-05, 4.242360591888428e-05, 4.694238305091858e-05, 5.146116018295288e-05, 5.597993731498718e-05, 6.0498714447021484e-05, 6.501749157905579e-05, 6.953626871109009e-05, 7.405504584312439e-05, 7.857382297515869e-05, 8.309260010719299e-05, 8.76113772392273e-05, 9.21301543712616e-05, 9.66489315032959e-05, 0.0001011677086353302, 0.0001056864857673645, 0.0001102052628993988, 0.0001147240400314331, 0.00011924281716346741, 0.0001237615942955017, 0.000128280371427536, 0.0001327991485595703]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 8.0, 8.0, 8.0, 10.0, 15.0, 25.0, 21.0, 38.0, 47.0, 75.0, 82.0, 144.0, 205.0, 408.0, 684.0, 1429.0, 3199.0, 7666.0, 22898.0, 95252.0, 498110.0, 331711.0, 59291.0, 16227.0, 5893.0, 2384.0, 1183.0, 570.0, 341.0, 184.0, 122.0, 83.0, 61.0, 47.0, 27.0, 31.0, 20.0, 9.0, 14.0, 5.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-1.9111328125, -1.856292724609375, -1.80145263671875, -1.746612548828125, -1.6917724609375, -1.636932373046875, -1.58209228515625, -1.527252197265625, -1.472412109375, -1.417572021484375, -1.36273193359375, -1.307891845703125, -1.2530517578125, -1.198211669921875, -1.14337158203125, -1.088531494140625, -1.03369140625, -0.978851318359375, -0.92401123046875, -0.869171142578125, -0.8143310546875, -0.759490966796875, -0.70465087890625, -0.649810791015625, -0.594970703125, -0.540130615234375, -0.48529052734375, -0.430450439453125, -0.3756103515625, -0.320770263671875, -0.26593017578125, -0.211090087890625, -0.15625, -0.101409912109375, -0.04656982421875, 0.008270263671875, 0.0631103515625, 0.117950439453125, 0.17279052734375, 0.227630615234375, 0.282470703125, 0.337310791015625, 0.39215087890625, 0.446990966796875, 0.5018310546875, 0.556671142578125, 0.61151123046875, 0.666351318359375, 0.72119140625, 0.776031494140625, 0.83087158203125, 0.885711669921875, 0.9405517578125, 0.995391845703125, 1.05023193359375, 1.105072021484375, 1.159912109375, 1.214752197265625, 1.26959228515625, 1.324432373046875, 1.3792724609375, 1.434112548828125, 1.48895263671875, 1.543792724609375, 1.5986328125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 4.0, 11.0, 11.0, 23.0, 25.0, 32.0, 37.0, 46.0, 66.0, 77.0, 82.0, 110.0, 95.0, 84.0, 67.0, 50.0, 39.0, 24.0, 23.0, 17.0, 6.0, 12.0, 9.0, 9.0, 4.0, 4.0, 8.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.501953125, -1.45849609375, -1.4150390625, -1.37158203125, -1.328125, -1.28466796875, -1.2412109375, -1.19775390625, -1.154296875, -1.11083984375, -1.0673828125, -1.02392578125, -0.98046875, -0.93701171875, -0.8935546875, -0.85009765625, -0.806640625, -0.76318359375, -0.7197265625, -0.67626953125, -0.6328125, -0.58935546875, -0.5458984375, -0.50244140625, -0.458984375, -0.41552734375, -0.3720703125, -0.32861328125, -0.28515625, -0.24169921875, -0.1982421875, -0.15478515625, -0.111328125, -0.06787109375, -0.0244140625, 0.01904296875, 0.0625, 0.10595703125, 0.1494140625, 0.19287109375, 0.236328125, 0.27978515625, 0.3232421875, 0.36669921875, 0.41015625, 0.45361328125, 0.4970703125, 0.54052734375, 0.583984375, 0.62744140625, 0.6708984375, 0.71435546875, 0.7578125, 0.80126953125, 0.8447265625, 0.88818359375, 0.931640625, 0.97509765625, 1.0185546875, 1.06201171875, 1.10546875, 1.14892578125, 1.1923828125, 1.23583984375, 1.279296875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 5.0, 9.0, 22.0, 33.0, 36.0, 69.0, 105.0, 102.0, 108.0, 130.0, 117.0, 76.0, 51.0, 45.0, 26.0, 16.0, 6.0, 6.0, 7.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.722097396850586, -10.182842254638672, -9.643587112426758, -9.104331970214844, -8.56507682800293, -8.025821685791016, -7.486565589904785, -6.947310447692871, -6.408055305480957, -5.868800163269043, -5.329545021057129, -4.790289402008057, -4.251034259796143, -3.7117791175842285, -3.1725237369537354, -2.633268356323242, -2.094013214111328, -1.5547579526901245, -1.015502691268921, -0.4762474298477173, 0.06300783157348633, 0.6022629737854004, 1.1415183544158936, 1.6807737350463867, 2.220028877258301, 2.759284019470215, 3.298539400100708, 3.837794780731201, 4.377049922943115, 4.916305065155029, 5.455560684204102, 5.994815826416016, 6.534069061279297, 7.073324203491211, 7.612579345703125, 8.151834487915039, 8.691089630126953, 9.230344772338867, 9.769600868225098, 10.308856010437012, 10.848111152648926, 11.38736629486084, 11.926621437072754, 12.465876579284668, 13.005132675170898, 13.544387817382812, 14.083642959594727, 14.62289810180664, 15.162153244018555, 15.701408386230469, 16.240663528442383, 16.779918670654297, 17.31917381286621, 17.858428955078125, 18.39768409729004, 18.936939239501953, 19.4761962890625, 20.015451431274414, 20.554706573486328, 21.093961715698242, 21.633216857910156, 22.17247200012207, 22.711727142333984, 23.25098419189453, 23.790237426757812]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 9.0, 7.0, 12.0, 10.0, 9.0, 10.0, 15.0, 14.0, 30.0, 20.0, 32.0, 35.0, 33.0, 32.0, 41.0, 50.0, 54.0, 55.0, 49.0, 55.0, 70.0, 43.0, 53.0, 28.0, 32.0, 32.0, 35.0, 26.0, 29.0, 19.0, 12.0, 11.0, 14.0, 5.0, 6.0, 9.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-17.026798248291016, -16.4853515625, -15.943904876708984, -15.402458190917969, -14.861011505126953, -14.319564819335938, -13.778119087219238, -13.236672401428223, -12.695225715637207, -12.153779029846191, -11.612332344055176, -11.07088565826416, -10.529439926147461, -9.987993240356445, -9.44654655456543, -8.905099868774414, -8.363653182983398, -7.822206497192383, -7.280759811401367, -6.73931360244751, -6.197866916656494, -5.6564202308654785, -5.114974021911621, -4.5735273361206055, -4.03208065032959, -3.490633964538574, -2.9491875171661377, -2.407741069793701, -1.8662943840026855, -1.32484769821167, -0.7834012508392334, -0.24195480346679688, 0.29949188232421875, 0.8409384489059448, 1.382385015487671, 1.923831582069397, 2.465278148651123, 3.0067248344421387, 3.548171281814575, 4.089617729187012, 4.631064414978027, 5.172511100769043, 5.713957786560059, 6.255403995513916, 6.796850681304932, 7.338297367095947, 7.879743576049805, 8.42119026184082, 8.962636947631836, 9.504083633422852, 10.045530319213867, 10.586977005004883, 11.128423690795898, 11.669870376586914, 12.211316108703613, 12.752762794494629, 13.294209480285645, 13.83565616607666, 14.377102851867676, 14.918549537658691, 15.45999526977539, 16.001441955566406, 16.542888641357422, 17.084335327148438, 17.625782012939453]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 11.0, 11.0, 15.0, 20.0, 19.0, 35.0, 56.0, 57.0, 98.0, 146.0, 278.0, 615.0, 2009.0, 9011.0, 97024.0, 3994020.0, 80603.0, 7795.0, 1597.0, 498.0, 156.0, 77.0, 59.0, 20.0, 26.0, 9.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-11.53125, -11.27764892578125, -11.0240478515625, -10.77044677734375, -10.516845703125, -10.26324462890625, -10.0096435546875, -9.75604248046875, -9.50244140625, -9.24884033203125, -8.9952392578125, -8.74163818359375, -8.488037109375, -8.23443603515625, -7.9808349609375, -7.72723388671875, -7.4736328125, -7.22003173828125, -6.9664306640625, -6.71282958984375, -6.459228515625, -6.20562744140625, -5.9520263671875, -5.69842529296875, -5.44482421875, -5.19122314453125, -4.9376220703125, -4.68402099609375, -4.430419921875, -4.17681884765625, -3.9232177734375, -3.66961669921875, -3.416015625, -3.16241455078125, -2.9088134765625, -2.65521240234375, -2.401611328125, -2.14801025390625, -1.8944091796875, -1.64080810546875, -1.38720703125, -1.13360595703125, -0.8800048828125, -0.62640380859375, -0.372802734375, -0.11920166015625, 0.1343994140625, 0.38800048828125, 0.6416015625, 0.89520263671875, 1.1488037109375, 1.40240478515625, 1.656005859375, 1.90960693359375, 2.1632080078125, 2.41680908203125, 2.67041015625, 2.92401123046875, 3.1776123046875, 3.43121337890625, 3.684814453125, 3.93841552734375, 4.1920166015625, 4.44561767578125, 4.69921875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 10.0, 20.0, 23.0, 34.0, 39.0, 49.0, 55.0, 69.0, 82.0, 100.0, 98.0, 87.0, 79.0, 74.0, 52.0, 40.0, 28.0, 22.0, 16.0, 16.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.322265625, -1.29150390625, -1.2607421875, -1.22998046875, -1.19921875, -1.16845703125, -1.1376953125, -1.10693359375, -1.076171875, -1.04541015625, -1.0146484375, -0.98388671875, -0.953125, -0.92236328125, -0.8916015625, -0.86083984375, -0.830078125, -0.79931640625, -0.7685546875, -0.73779296875, -0.70703125, -0.67626953125, -0.6455078125, -0.61474609375, -0.583984375, -0.55322265625, -0.5224609375, -0.49169921875, -0.4609375, -0.43017578125, -0.3994140625, -0.36865234375, -0.337890625, -0.30712890625, -0.2763671875, -0.24560546875, -0.21484375, -0.18408203125, -0.1533203125, -0.12255859375, -0.091796875, -0.06103515625, -0.0302734375, 0.00048828125, 0.03125, 0.06201171875, 0.0927734375, 0.12353515625, 0.154296875, 0.18505859375, 0.2158203125, 0.24658203125, 0.27734375, 0.30810546875, 0.3388671875, 0.36962890625, 0.400390625, 0.43115234375, 0.4619140625, 0.49267578125, 0.5234375, 0.55419921875, 0.5849609375, 0.61572265625, 0.646484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 11.0, 14.0, 6.0, 16.0, 17.0, 26.0, 19.0, 30.0, 48.0, 65.0, 138.0, 260.0, 705.0, 2730.0, 17599.0, 3870188.0, 291616.0, 8397.0, 1640.0, 417.0, 142.0, 65.0, 41.0, 23.0, 22.0, 16.0, 10.0, 4.0, 7.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9921875, -10.6236572265625, -10.255126953125, -9.8865966796875, -9.51806640625, -9.1495361328125, -8.781005859375, -8.4124755859375, -8.0439453125, -7.6754150390625, -7.306884765625, -6.9383544921875, -6.56982421875, -6.2012939453125, -5.832763671875, -5.4642333984375, -5.095703125, -4.7271728515625, -4.358642578125, -3.9901123046875, -3.62158203125, -3.2530517578125, -2.884521484375, -2.5159912109375, -2.1474609375, -1.7789306640625, -1.410400390625, -1.0418701171875, -0.67333984375, -0.3048095703125, 0.063720703125, 0.4322509765625, 0.80078125, 1.1693115234375, 1.537841796875, 1.9063720703125, 2.27490234375, 2.6434326171875, 3.011962890625, 3.3804931640625, 3.7490234375, 4.1175537109375, 4.486083984375, 4.8546142578125, 5.22314453125, 5.5916748046875, 5.960205078125, 6.3287353515625, 6.697265625, 7.0657958984375, 7.434326171875, 7.8028564453125, 8.17138671875, 8.5399169921875, 8.908447265625, 9.2769775390625, 9.6455078125, 10.0140380859375, 10.382568359375, 10.7510986328125, 11.11962890625, 11.4881591796875, 11.856689453125, 12.2252197265625, 12.59375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 9.0, 34.0, 76.0, 347.0, 2772.0, 636.0, 123.0, 40.0, 16.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0], "bins": [-7.88671875, -7.7340545654296875, -7.581390380859375, -7.4287261962890625, -7.27606201171875, -7.1233978271484375, -6.970733642578125, -6.8180694580078125, -6.6654052734375, -6.5127410888671875, -6.360076904296875, -6.2074127197265625, -6.05474853515625, -5.9020843505859375, -5.749420166015625, -5.5967559814453125, -5.444091796875, -5.2914276123046875, -5.138763427734375, -4.9860992431640625, -4.83343505859375, -4.6807708740234375, -4.528106689453125, -4.3754425048828125, -4.2227783203125, -4.0701141357421875, -3.917449951171875, -3.7647857666015625, -3.61212158203125, -3.4594573974609375, -3.306793212890625, -3.1541290283203125, -3.00146484375, -2.8488006591796875, -2.696136474609375, -2.5434722900390625, -2.39080810546875, -2.2381439208984375, -2.085479736328125, -1.9328155517578125, -1.7801513671875, -1.6274871826171875, -1.474822998046875, -1.3221588134765625, -1.16949462890625, -1.0168304443359375, -0.864166259765625, -0.7115020751953125, -0.558837890625, -0.4061737060546875, -0.253509521484375, -0.1008453369140625, 0.05181884765625, 0.2044830322265625, 0.357147216796875, 0.5098114013671875, 0.6624755859375, 0.8151397705078125, 0.967803955078125, 1.1204681396484375, 1.27313232421875, 1.4257965087890625, 1.578460693359375, 1.7311248779296875, 1.8837890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 10.0, 9.0, 22.0, 38.0, 85.0, 171.0, 187.0, 204.0, 116.0, 76.0, 40.0, 20.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.689665794372559, -15.226458549499512, -14.763252258300781, -14.300045013427734, -13.836837768554688, -13.37363052368164, -12.910423278808594, -12.447216987609863, -11.984009742736816, -11.52080249786377, -11.057596206665039, -10.594388961791992, -10.131181716918945, -9.667974472045898, -9.204767227172852, -8.741560935974121, -8.278353691101074, -7.815146446228027, -7.351939678192139, -6.88873291015625, -6.425525665283203, -5.962318420410156, -5.499111652374268, -5.035904884338379, -4.572697639465332, -4.109490394592285, -3.6462836265563965, -3.1830766201019287, -2.719869613647461, -2.256662607192993, -1.7934556007385254, -1.3302485942840576, -0.8670425415039062, -0.4038355350494385, 0.0593714714050293, 0.5225784778594971, 0.9857854843139648, 1.4489924907684326, 1.9121994972229004, 2.375406503677368, 2.838613510131836, 3.3018205165863037, 3.7650275230407715, 4.22823429107666, 4.691441535949707, 5.154648780822754, 5.617855548858643, 6.081062316894531, 6.544269561767578, 7.007476806640625, 7.470683574676514, 7.933890342712402, 8.39709758758545, 8.860304832458496, 9.323511123657227, 9.786718368530273, 10.24992561340332, 10.713132858276367, 11.176340103149414, 11.639546394348145, 12.102753639221191, 12.565960884094238, 13.029167175292969, 13.492374420166016, 13.955581665039062]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 1.0, 3.0, 7.0, 16.0, 19.0, 31.0, 25.0, 48.0, 70.0, 68.0, 77.0, 78.0, 88.0, 89.0, 84.0, 70.0, 65.0, 55.0, 36.0, 21.0, 16.0, 10.0, 9.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-11.889753341674805, -11.560273170471191, -11.230792999267578, -10.901312828063965, -10.571832656860352, -10.242353439331055, -9.912873268127441, -9.583393096923828, -9.253912925720215, -8.924432754516602, -8.594952583312988, -8.265472412109375, -7.93599271774292, -7.606512546539307, -7.277032852172852, -6.947552680969238, -6.618072509765625, -6.288592338562012, -5.959112167358398, -5.629632472991943, -5.30015230178833, -4.970672130584717, -4.641192436218262, -4.311712265014648, -3.982232093811035, -3.652751922607422, -3.3232719898223877, -2.9937920570373535, -2.6643118858337402, -2.334831714630127, -2.0053517818450928, -1.6758718490600586, -1.3463916778564453, -1.0169116258621216, -0.6874315738677979, -0.3579515218734741, -0.02847146987915039, 0.30100858211517334, 0.6304886341094971, 0.9599685668945312, 1.2894487380981445, 1.6189287900924683, 1.948408842086792, 2.277888774871826, 2.6073689460754395, 2.9368491172790527, 3.266329050064087, 3.595808982849121, 3.9252891540527344, 4.254769325256348, 4.584249496459961, 4.913729190826416, 5.243209362030029, 5.572689533233643, 5.902169227600098, 6.231649398803711, 6.561129570007324, 6.8906097412109375, 7.220089912414551, 7.549569606781006, 7.879049777984619, 8.208529472351074, 8.538009643554688, 8.8674898147583, 9.196969985961914]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 2.0, 3.0, 10.0, 12.0, 22.0, 18.0, 23.0, 40.0, 45.0, 70.0, 109.0, 198.0, 474.0, 1113.0, 3723.0, 17215.0, 113454.0, 635405.0, 236543.0, 31290.0, 5872.0, 1627.0, 596.0, 250.0, 141.0, 90.0, 59.0, 36.0, 31.0, 20.0, 13.0, 12.0, 6.0, 6.0, 11.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.45703125, -6.28094482421875, -6.1048583984375, -5.92877197265625, -5.752685546875, -5.57659912109375, -5.4005126953125, -5.22442626953125, -5.04833984375, -4.87225341796875, -4.6961669921875, -4.52008056640625, -4.343994140625, -4.16790771484375, -3.9918212890625, -3.81573486328125, -3.6396484375, -3.46356201171875, -3.2874755859375, -3.11138916015625, -2.935302734375, -2.75921630859375, -2.5831298828125, -2.40704345703125, -2.23095703125, -2.05487060546875, -1.8787841796875, -1.70269775390625, -1.526611328125, -1.35052490234375, -1.1744384765625, -0.99835205078125, -0.822265625, -0.64617919921875, -0.4700927734375, -0.29400634765625, -0.117919921875, 0.05816650390625, 0.2342529296875, 0.41033935546875, 0.58642578125, 0.76251220703125, 0.9385986328125, 1.11468505859375, 1.290771484375, 1.46685791015625, 1.6429443359375, 1.81903076171875, 1.9951171875, 2.17120361328125, 2.3472900390625, 2.52337646484375, 2.699462890625, 2.87554931640625, 3.0516357421875, 3.22772216796875, 3.40380859375, 3.57989501953125, 3.7559814453125, 3.93206787109375, 4.108154296875, 4.28424072265625, 4.4603271484375, 4.63641357421875, 4.8125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 16.0, 12.0, 13.0, 38.0, 44.0, 42.0, 70.0, 76.0, 99.0, 82.0, 95.0, 79.0, 102.0, 57.0, 52.0, 34.0, 22.0, 21.0, 25.0, 6.0, 7.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.384765625, -1.3532943725585938, -1.3218231201171875, -1.2903518676757812, -1.258880615234375, -1.2274093627929688, -1.1959381103515625, -1.1644668579101562, -1.13299560546875, -1.1015243530273438, -1.0700531005859375, -1.0385818481445312, -1.007110595703125, -0.9756393432617188, -0.9441680908203125, -0.9126968383789062, -0.8812255859375, -0.8497543334960938, -0.8182830810546875, -0.7868118286132812, -0.755340576171875, -0.7238693237304688, -0.6923980712890625, -0.6609268188476562, -0.62945556640625, -0.5979843139648438, -0.5665130615234375, -0.5350418090820312, -0.503570556640625, -0.47209930419921875, -0.4406280517578125, -0.40915679931640625, -0.377685546875, -0.34621429443359375, -0.3147430419921875, -0.28327178955078125, -0.251800537109375, -0.22032928466796875, -0.1888580322265625, -0.15738677978515625, -0.12591552734375, -0.09444427490234375, -0.0629730224609375, -0.03150177001953125, -3.0517578125e-05, 0.03144073486328125, 0.0629119873046875, 0.09438323974609375, 0.1258544921875, 0.15732574462890625, 0.1887969970703125, 0.22026824951171875, 0.251739501953125, 0.28321075439453125, 0.3146820068359375, 0.34615325927734375, 0.37762451171875, 0.40909576416015625, 0.4405670166015625, 0.47203826904296875, 0.503509521484375, 0.5349807739257812, 0.5664520263671875, 0.5979232788085938, 0.62939453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 10.0, 18.0, 23.0, 26.0, 30.0, 31.0, 61.0, 145.0, 253.0, 496.0, 1046.0, 2438.0, 7133.0, 26212.0, 113594.0, 428364.0, 353486.0, 85350.0, 20238.0, 5768.0, 2002.0, 875.0, 379.0, 229.0, 114.0, 89.0, 46.0, 24.0, 11.0, 11.0, 11.0, 12.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.673828125, -3.568572998046875, -3.46331787109375, -3.358062744140625, -3.2528076171875, -3.147552490234375, -3.04229736328125, -2.937042236328125, -2.831787109375, -2.726531982421875, -2.62127685546875, -2.516021728515625, -2.4107666015625, -2.305511474609375, -2.20025634765625, -2.095001220703125, -1.98974609375, -1.884490966796875, -1.77923583984375, -1.673980712890625, -1.5687255859375, -1.463470458984375, -1.35821533203125, -1.252960205078125, -1.147705078125, -1.042449951171875, -0.93719482421875, -0.831939697265625, -0.7266845703125, -0.621429443359375, -0.51617431640625, -0.410919189453125, -0.3056640625, -0.200408935546875, -0.09515380859375, 0.010101318359375, 0.1153564453125, 0.220611572265625, 0.32586669921875, 0.431121826171875, 0.536376953125, 0.641632080078125, 0.74688720703125, 0.852142333984375, 0.9573974609375, 1.062652587890625, 1.16790771484375, 1.273162841796875, 1.37841796875, 1.483673095703125, 1.58892822265625, 1.694183349609375, 1.7994384765625, 1.904693603515625, 2.00994873046875, 2.115203857421875, 2.220458984375, 2.325714111328125, 2.43096923828125, 2.536224365234375, 2.6414794921875, 2.746734619140625, 2.85198974609375, 2.957244873046875, 3.0625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 7.0, 11.0, 8.0, 12.0, 15.0, 16.0, 23.0, 27.0, 31.0, 43.0, 50.0, 39.0, 48.0, 39.0, 47.0, 49.0, 60.0, 58.0, 49.0, 38.0, 45.0, 41.0, 40.0, 36.0, 32.0, 25.0, 27.0, 16.0, 20.0, 9.0, 8.0, 6.0, 3.0, 7.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.119140625, -3.033233642578125, -2.94732666015625, -2.861419677734375, -2.7755126953125, -2.689605712890625, -2.60369873046875, -2.517791748046875, -2.431884765625, -2.345977783203125, -2.26007080078125, -2.174163818359375, -2.0882568359375, -2.002349853515625, -1.91644287109375, -1.830535888671875, -1.74462890625, -1.658721923828125, -1.57281494140625, -1.486907958984375, -1.4010009765625, -1.315093994140625, -1.22918701171875, -1.143280029296875, -1.057373046875, -0.971466064453125, -0.88555908203125, -0.799652099609375, -0.7137451171875, -0.627838134765625, -0.54193115234375, -0.456024169921875, -0.3701171875, -0.284210205078125, -0.19830322265625, -0.112396240234375, -0.0264892578125, 0.059417724609375, 0.14532470703125, 0.231231689453125, 0.317138671875, 0.403045654296875, 0.48895263671875, 0.574859619140625, 0.6607666015625, 0.746673583984375, 0.83258056640625, 0.918487548828125, 1.00439453125, 1.090301513671875, 1.17620849609375, 1.262115478515625, 1.3480224609375, 1.433929443359375, 1.51983642578125, 1.605743408203125, 1.691650390625, 1.777557373046875, 1.86346435546875, 1.949371337890625, 2.0352783203125, 2.121185302734375, 2.20709228515625, 2.292999267578125, 2.37890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 8.0, 12.0, 21.0, 23.0, 32.0, 70.0, 69.0, 133.0, 209.0, 353.0, 635.0, 1230.0, 2626.0, 6622.0, 54734.0, 918279.0, 51640.0, 6551.0, 2506.0, 1235.0, 630.0, 312.0, 220.0, 143.0, 67.0, 55.0, 42.0, 27.0, 14.0, 11.0, 6.0, 7.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.92578125, -5.74884033203125, -5.5718994140625, -5.39495849609375, -5.218017578125, -5.04107666015625, -4.8641357421875, -4.68719482421875, -4.51025390625, -4.33331298828125, -4.1563720703125, -3.97943115234375, -3.802490234375, -3.62554931640625, -3.4486083984375, -3.27166748046875, -3.0947265625, -2.91778564453125, -2.7408447265625, -2.56390380859375, -2.386962890625, -2.21002197265625, -2.0330810546875, -1.85614013671875, -1.67919921875, -1.50225830078125, -1.3253173828125, -1.14837646484375, -0.971435546875, -0.79449462890625, -0.6175537109375, -0.44061279296875, -0.263671875, -0.08673095703125, 0.0902099609375, 0.26715087890625, 0.444091796875, 0.62103271484375, 0.7979736328125, 0.97491455078125, 1.15185546875, 1.32879638671875, 1.5057373046875, 1.68267822265625, 1.859619140625, 2.03656005859375, 2.2135009765625, 2.39044189453125, 2.5673828125, 2.74432373046875, 2.9212646484375, 3.09820556640625, 3.275146484375, 3.45208740234375, 3.6290283203125, 3.80596923828125, 3.98291015625, 4.15985107421875, 4.3367919921875, 4.51373291015625, 4.690673828125, 4.86761474609375, 5.0445556640625, 5.22149658203125, 5.3984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 9.0, 11.0, 8.0, 16.0, 19.0, 24.0, 23.0, 17.0, 26.0, 43.0, 47.0, 61.0, 87.0, 125.0, 101.0, 84.0, 64.0, 42.0, 33.0, 26.0, 23.0, 19.0, 11.0, 15.0, 13.0, 9.0, 6.0, 11.0, 3.0, 4.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017571449279785156, -0.0001693814992904663, -0.00016304850578308105, -0.0001567155122756958, -0.00015038251876831055, -0.0001440495252609253, -0.00013771653175354004, -0.00013138353824615479, -0.00012505054473876953, -0.00011871755123138428, -0.00011238455772399902, -0.00010605156421661377, -9.971857070922852e-05, -9.338557720184326e-05, -8.705258369445801e-05, -8.071959018707275e-05, -7.43865966796875e-05, -6.805360317230225e-05, -6.172060966491699e-05, -5.538761615753174e-05, -4.9054622650146484e-05, -4.272162914276123e-05, -3.6388635635375977e-05, -3.0055642127990723e-05, -2.372264862060547e-05, -1.7389655113220215e-05, -1.1056661605834961e-05, -4.723668098449707e-06, 1.6093254089355469e-06, 7.9423189163208e-06, 1.4275312423706055e-05, 2.060830593109131e-05, 2.6941299438476562e-05, 3.3274292945861816e-05, 3.960728645324707e-05, 4.5940279960632324e-05, 5.227327346801758e-05, 5.860626697540283e-05, 6.493926048278809e-05, 7.127225399017334e-05, 7.76052474975586e-05, 8.393824100494385e-05, 9.02712345123291e-05, 9.660422801971436e-05, 0.00010293722152709961, 0.00010927021503448486, 0.00011560320854187012, 0.00012193620204925537, 0.00012826919555664062, 0.00013460218906402588, 0.00014093518257141113, 0.0001472681760787964, 0.00015360116958618164, 0.0001599341630935669, 0.00016626715660095215, 0.0001726001501083374, 0.00017893314361572266, 0.0001852661371231079, 0.00019159913063049316, 0.00019793212413787842, 0.00020426511764526367, 0.00021059811115264893, 0.00021693110466003418, 0.00022326409816741943, 0.0002295970916748047]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 7.0, 12.0, 25.0, 28.0, 38.0, 59.0, 107.0, 197.0, 394.0, 952.0, 2874.0, 14428.0, 706096.0, 309382.0, 10080.0, 2298.0, 827.0, 311.0, 191.0, 83.0, 57.0, 43.0, 28.0, 7.0, 12.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.64453125, -5.42669677734375, -5.2088623046875, -4.99102783203125, -4.773193359375, -4.55535888671875, -4.3375244140625, -4.11968994140625, -3.90185546875, -3.68402099609375, -3.4661865234375, -3.24835205078125, -3.030517578125, -2.81268310546875, -2.5948486328125, -2.37701416015625, -2.1591796875, -1.94134521484375, -1.7235107421875, -1.50567626953125, -1.287841796875, -1.07000732421875, -0.8521728515625, -0.63433837890625, -0.41650390625, -0.19866943359375, 0.0191650390625, 0.23699951171875, 0.454833984375, 0.67266845703125, 0.8905029296875, 1.10833740234375, 1.326171875, 1.54400634765625, 1.7618408203125, 1.97967529296875, 2.197509765625, 2.41534423828125, 2.6331787109375, 2.85101318359375, 3.06884765625, 3.28668212890625, 3.5045166015625, 3.72235107421875, 3.940185546875, 4.15802001953125, 4.3758544921875, 4.59368896484375, 4.8115234375, 5.02935791015625, 5.2471923828125, 5.46502685546875, 5.682861328125, 5.90069580078125, 6.1185302734375, 6.33636474609375, 6.55419921875, 6.77203369140625, 6.9898681640625, 7.20770263671875, 7.425537109375, 7.64337158203125, 7.8612060546875, 8.07904052734375, 8.296875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 5.0, 20.0, 34.0, 94.0, 161.0, 227.0, 219.0, 109.0, 54.0, 35.0, 13.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.984375, -3.8453369140625, -3.706298828125, -3.5672607421875, -3.42822265625, -3.2891845703125, -3.150146484375, -3.0111083984375, -2.8720703125, -2.7330322265625, -2.593994140625, -2.4549560546875, -2.31591796875, -2.1768798828125, -2.037841796875, -1.8988037109375, -1.759765625, -1.6207275390625, -1.481689453125, -1.3426513671875, -1.20361328125, -1.0645751953125, -0.925537109375, -0.7864990234375, -0.6474609375, -0.5084228515625, -0.369384765625, -0.2303466796875, -0.09130859375, 0.0477294921875, 0.186767578125, 0.3258056640625, 0.46484375, 0.6038818359375, 0.742919921875, 0.8819580078125, 1.02099609375, 1.1600341796875, 1.299072265625, 1.4381103515625, 1.5771484375, 1.7161865234375, 1.855224609375, 1.9942626953125, 2.13330078125, 2.2723388671875, 2.411376953125, 2.5504150390625, 2.689453125, 2.8284912109375, 2.967529296875, 3.1065673828125, 3.24560546875, 3.3846435546875, 3.523681640625, 3.6627197265625, 3.8017578125, 3.9407958984375, 4.079833984375, 4.2188720703125, 4.35791015625, 4.4969482421875, 4.635986328125, 4.7750244140625, 4.9140625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 8.0, 24.0, 59.0, 119.0, 213.0, 266.0, 174.0, 89.0, 28.0, 16.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.492610931396484, -43.027252197265625, -41.5618896484375, -40.096527099609375, -38.631168365478516, -37.165809631347656, -35.70044708251953, -34.235084533691406, -32.76972579956055, -31.304365158081055, -29.839004516601562, -28.37364387512207, -26.908283233642578, -25.442922592163086, -23.977561950683594, -22.5122013092041, -21.04684066772461, -19.581480026245117, -18.116119384765625, -16.650758743286133, -15.18539810180664, -13.720037460327148, -12.254676818847656, -10.789316177368164, -9.323955535888672, -7.85859489440918, -6.3932342529296875, -4.927873611450195, -3.462512969970703, -1.997152328491211, -0.5317916870117188, 0.9335689544677734, 2.39892578125, 3.864286422729492, 5.329647064208984, 6.795007705688477, 8.260368347167969, 9.725728988647461, 11.191089630126953, 12.656450271606445, 14.121810913085938, 15.58717155456543, 17.052532196044922, 18.517892837524414, 19.983253479003906, 21.4486141204834, 22.91397476196289, 24.379335403442383, 25.844696044921875, 27.310056686401367, 28.77541732788086, 30.24077796936035, 31.706138610839844, 33.17150115966797, 34.63685989379883, 36.10221862792969, 37.56758117675781, 39.03294372558594, 40.4983024597168, 41.963661193847656, 43.42902374267578, 44.894386291503906, 46.359745025634766, 47.825103759765625, 49.29046630859375]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 7.0, 2.0, 5.0, 8.0, 11.0, 14.0, 17.0, 14.0, 26.0, 22.0, 36.0, 36.0, 40.0, 39.0, 66.0, 56.0, 46.0, 43.0, 58.0, 61.0, 58.0, 53.0, 47.0, 49.0, 24.0, 28.0, 24.0, 19.0, 23.0, 25.0, 10.0, 11.0, 13.0, 4.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.824080467224121, -14.27914810180664, -13.734216690063477, -13.189284324645996, -12.644352912902832, -12.099420547485352, -11.554489135742188, -11.009556770324707, -10.464624404907227, -9.919692039489746, -9.374760627746582, -8.829828262329102, -8.284896850585938, -7.739964485168457, -7.195032596588135, -6.6501007080078125, -6.105169296264648, -5.560237407684326, -5.015305519104004, -4.470373153686523, -3.9254415035247803, -3.380509614944458, -2.8355774879455566, -2.2906455993652344, -1.745713710784912, -1.2007818222045898, -0.655849814414978, -0.11091780662536621, 0.43401408195495605, 0.9789459705352783, 1.5238780975341797, 2.068809986114502, 2.613740921020508, 3.15867280960083, 3.7036046981811523, 4.248537063598633, 4.793468475341797, 5.338400840759277, 5.8833327293396, 6.428264617919922, 6.973196506500244, 7.518128395080566, 8.063060760498047, 8.607992172241211, 9.152924537658691, 9.697855949401855, 10.242788314819336, 10.7877197265625, 11.33265209197998, 11.877584457397461, 12.422515869140625, 12.967448234558105, 13.51237964630127, 14.05731201171875, 14.602243423461914, 15.147175788879395, 15.692108154296875, 16.23703956604004, 16.781972885131836, 17.326904296875, 17.871835708618164, 18.416767120361328, 18.961700439453125, 19.50663185119629, 20.051563262939453]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 17.0, 22.0, 36.0, 53.0, 91.0, 173.0, 339.0, 1445.0, 10943.0, 2590471.0, 1578242.0, 10393.0, 1378.0, 307.0, 137.0, 90.0, 56.0, 29.0, 24.0, 9.0, 9.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8203125, -11.538818359375, -11.25732421875, -10.975830078125, -10.6943359375, -10.412841796875, -10.13134765625, -9.849853515625, -9.568359375, -9.286865234375, -9.00537109375, -8.723876953125, -8.4423828125, -8.160888671875, -7.87939453125, -7.597900390625, -7.31640625, -7.034912109375, -6.75341796875, -6.471923828125, -6.1904296875, -5.908935546875, -5.62744140625, -5.345947265625, -5.064453125, -4.782958984375, -4.50146484375, -4.219970703125, -3.9384765625, -3.656982421875, -3.37548828125, -3.093994140625, -2.8125, -2.531005859375, -2.24951171875, -1.968017578125, -1.6865234375, -1.405029296875, -1.12353515625, -0.842041015625, -0.560546875, -0.279052734375, 0.00244140625, 0.283935546875, 0.5654296875, 0.846923828125, 1.12841796875, 1.409912109375, 1.69140625, 1.972900390625, 2.25439453125, 2.535888671875, 2.8173828125, 3.098876953125, 3.38037109375, 3.661865234375, 3.943359375, 4.224853515625, 4.50634765625, 4.787841796875, 5.0693359375, 5.350830078125, 5.63232421875, 5.913818359375, 6.1953125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 4.0, 7.0, 10.0, 8.0, 16.0, 23.0, 44.0, 48.0, 69.0, 70.0, 81.0, 96.0, 83.0, 85.0, 86.0, 71.0, 58.0, 42.0, 40.0, 17.0, 20.0, 12.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.4013671875, -1.3690109252929688, -1.3366546630859375, -1.3042984008789062, -1.271942138671875, -1.2395858764648438, -1.2072296142578125, -1.1748733520507812, -1.14251708984375, -1.1101608276367188, -1.0778045654296875, -1.0454483032226562, -1.013092041015625, -0.9807357788085938, -0.9483795166015625, -0.9160232543945312, -0.8836669921875, -0.8513107299804688, -0.8189544677734375, -0.7865982055664062, -0.754241943359375, -0.7218856811523438, -0.6895294189453125, -0.6571731567382812, -0.62481689453125, -0.5924606323242188, -0.5601043701171875, -0.5277481079101562, -0.495391845703125, -0.46303558349609375, -0.4306793212890625, -0.39832305908203125, -0.365966796875, -0.33361053466796875, -0.3012542724609375, -0.26889801025390625, -0.236541748046875, -0.20418548583984375, -0.1718292236328125, -0.13947296142578125, -0.10711669921875, -0.07476043701171875, -0.0424041748046875, -0.01004791259765625, 0.022308349609375, 0.05466461181640625, 0.0870208740234375, 0.11937713623046875, 0.1517333984375, 0.18408966064453125, 0.2164459228515625, 0.24880218505859375, 0.281158447265625, 0.31351470947265625, 0.3458709716796875, 0.37822723388671875, 0.41058349609375, 0.44293975830078125, 0.4752960205078125, 0.5076522827148438, 0.540008544921875, 0.5723648071289062, 0.6047210693359375, 0.6370773315429688, 0.66943359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 0.0, 0.0, 6.0, 6.0, 10.0, 17.0, 17.0, 21.0, 35.0, 33.0, 38.0, 55.0, 88.0, 225.0, 928.0, 8983.0, 724341.0, 3442518.0, 14963.0, 1354.0, 253.0, 121.0, 45.0, 39.0, 24.0, 34.0, 32.0, 31.0, 20.0, 14.0, 15.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.73828125, -7.44158935546875, -7.1448974609375, -6.84820556640625, -6.551513671875, -6.25482177734375, -5.9581298828125, -5.66143798828125, -5.36474609375, -5.06805419921875, -4.7713623046875, -4.47467041015625, -4.177978515625, -3.88128662109375, -3.5845947265625, -3.28790283203125, -2.9912109375, -2.69451904296875, -2.3978271484375, -2.10113525390625, -1.804443359375, -1.50775146484375, -1.2110595703125, -0.91436767578125, -0.61767578125, -0.32098388671875, -0.0242919921875, 0.27239990234375, 0.569091796875, 0.86578369140625, 1.1624755859375, 1.45916748046875, 1.755859375, 2.05255126953125, 2.3492431640625, 2.64593505859375, 2.942626953125, 3.23931884765625, 3.5360107421875, 3.83270263671875, 4.12939453125, 4.42608642578125, 4.7227783203125, 5.01947021484375, 5.316162109375, 5.61285400390625, 5.9095458984375, 6.20623779296875, 6.5029296875, 6.79962158203125, 7.0963134765625, 7.39300537109375, 7.689697265625, 7.98638916015625, 8.2830810546875, 8.57977294921875, 8.87646484375, 9.17315673828125, 9.4698486328125, 9.76654052734375, 10.063232421875, 10.35992431640625, 10.6566162109375, 10.95330810546875, 11.25]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 11.0, 17.0, 33.0, 57.0, 122.0, 439.0, 2285.0, 741.0, 203.0, 76.0, 39.0, 26.0, 13.0, 10.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.56640625, -1.490570068359375, -1.41473388671875, -1.338897705078125, -1.2630615234375, -1.187225341796875, -1.11138916015625, -1.035552978515625, -0.959716796875, -0.883880615234375, -0.80804443359375, -0.732208251953125, -0.6563720703125, -0.580535888671875, -0.50469970703125, -0.428863525390625, -0.35302734375, -0.277191162109375, -0.20135498046875, -0.125518798828125, -0.0496826171875, 0.026153564453125, 0.10198974609375, 0.177825927734375, 0.253662109375, 0.329498291015625, 0.40533447265625, 0.481170654296875, 0.5570068359375, 0.632843017578125, 0.70867919921875, 0.784515380859375, 0.8603515625, 0.936187744140625, 1.01202392578125, 1.087860107421875, 1.1636962890625, 1.239532470703125, 1.31536865234375, 1.391204833984375, 1.467041015625, 1.542877197265625, 1.61871337890625, 1.694549560546875, 1.7703857421875, 1.846221923828125, 1.92205810546875, 1.997894287109375, 2.07373046875, 2.149566650390625, 2.22540283203125, 2.301239013671875, 2.3770751953125, 2.452911376953125, 2.52874755859375, 2.604583740234375, 2.680419921875, 2.756256103515625, 2.83209228515625, 2.907928466796875, 2.9837646484375, 3.059600830078125, 3.13543701171875, 3.211273193359375, 3.287109375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 33.0, 67.0, 194.0, 317.0, 223.0, 113.0, 32.0, 12.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.651105880737305, -5.05836296081543, -4.465620040893555, -3.8728771209716797, -3.2801342010498047, -2.6873912811279297, -2.0946483612060547, -1.5019054412841797, -0.9091625213623047, -0.3164196014404297, 0.2763233184814453, 0.8690662384033203, 1.4618091583251953, 2.0545520782470703, 2.6472949981689453, 3.2400379180908203, 3.8327808380126953, 4.42552375793457, 5.018266677856445, 5.61100959777832, 6.203752517700195, 6.79649543762207, 7.389238357543945, 7.98198127746582, 8.574724197387695, 9.16746711730957, 9.760210037231445, 10.35295295715332, 10.945695877075195, 11.53843879699707, 12.131181716918945, 12.72392463684082, 13.316665649414062, 13.909408569335938, 14.502151489257812, 15.094894409179688, 15.687637329101562, 16.280380249023438, 16.873123168945312, 17.465866088867188, 18.058609008789062, 18.651351928710938, 19.244094848632812, 19.836837768554688, 20.429580688476562, 21.022323608398438, 21.615066528320312, 22.207809448242188, 22.800552368164062, 23.393295288085938, 23.986038208007812, 24.578781127929688, 25.171524047851562, 25.764266967773438, 26.357009887695312, 26.949752807617188, 27.542495727539062, 28.135238647460938, 28.727981567382812, 29.320724487304688, 29.913467407226562, 30.506210327148438, 31.098953247070312, 31.691696166992188, 32.28443908691406]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 26.0, 32.0, 53.0, 95.0, 137.0, 146.0, 159.0, 126.0, 111.0, 61.0, 29.0, 18.0, 8.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.374794960021973, -12.915046691894531, -12.455297470092773, -11.995549201965332, -11.53580093383789, -11.07605266571045, -10.616304397583008, -10.15655517578125, -9.696806907653809, -9.237058639526367, -8.77730941772461, -8.317561149597168, -7.857812881469727, -7.398064613342285, -6.9383158683776855, -6.478567123413086, -6.0188188552856445, -5.559070587158203, -5.0993218421936035, -4.639573097229004, -4.1798248291015625, -3.720076322555542, -3.2603278160095215, -2.800579309463501, -2.3408308029174805, -1.88108229637146, -1.4213337898254395, -0.961585283279419, -0.5018367767333984, -0.04208827018737793, 0.4176602363586426, 0.8774087429046631, 1.337158203125, 1.7969067096710205, 2.256655216217041, 2.7164037227630615, 3.176152229309082, 3.6359007358551025, 4.095649242401123, 4.555397987365723, 5.015146255493164, 5.4748945236206055, 5.934643268585205, 6.394392013549805, 6.854140281677246, 7.3138885498046875, 7.773637294769287, 8.233386039733887, 8.693134307861328, 9.15288257598877, 9.612630844116211, 10.072380065917969, 10.53212833404541, 10.991876602172852, 11.45162582397461, 11.91137409210205, 12.371122360229492, 12.830870628356934, 13.290618896484375, 13.750368118286133, 14.210116386413574, 14.669864654541016, 15.129613876342773, 15.589362144470215, 16.049110412597656]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 7.0, 11.0, 10.0, 11.0, 18.0, 46.0, 53.0, 66.0, 101.0, 156.0, 232.0, 412.0, 719.0, 1249.0, 2396.0, 4645.0, 9956.0, 22559.0, 54316.0, 137887.0, 302398.0, 290400.0, 129449.0, 51261.0, 21204.0, 9387.0, 4424.0, 2198.0, 1124.0, 653.0, 419.0, 270.0, 166.0, 94.0, 71.0, 43.0, 50.0, 15.0, 15.0, 12.0, 8.0, 12.0, 4.0, 3.0, 5.0, 5.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.630859375, -2.548553466796875, -2.46624755859375, -2.383941650390625, -2.3016357421875, -2.219329833984375, -2.13702392578125, -2.054718017578125, -1.972412109375, -1.890106201171875, -1.80780029296875, -1.725494384765625, -1.6431884765625, -1.560882568359375, -1.47857666015625, -1.396270751953125, -1.31396484375, -1.231658935546875, -1.14935302734375, -1.067047119140625, -0.9847412109375, -0.902435302734375, -0.82012939453125, -0.737823486328125, -0.655517578125, -0.573211669921875, -0.49090576171875, -0.408599853515625, -0.3262939453125, -0.243988037109375, -0.16168212890625, -0.079376220703125, 0.0029296875, 0.085235595703125, 0.16754150390625, 0.249847412109375, 0.3321533203125, 0.414459228515625, 0.49676513671875, 0.579071044921875, 0.661376953125, 0.743682861328125, 0.82598876953125, 0.908294677734375, 0.9906005859375, 1.072906494140625, 1.15521240234375, 1.237518310546875, 1.31982421875, 1.402130126953125, 1.48443603515625, 1.566741943359375, 1.6490478515625, 1.731353759765625, 1.81365966796875, 1.895965576171875, 1.978271484375, 2.060577392578125, 2.14288330078125, 2.225189208984375, 2.3074951171875, 2.389801025390625, 2.47210693359375, 2.554412841796875, 2.63671875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 5.0, 5.0, 5.0, 9.0, 11.0, 14.0, 26.0, 32.0, 42.0, 37.0, 36.0, 52.0, 55.0, 55.0, 62.0, 56.0, 59.0, 62.0, 53.0, 58.0, 48.0, 29.0, 39.0, 31.0, 28.0, 22.0, 14.0, 14.0, 11.0, 7.0, 6.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7578125, -0.7360763549804688, -0.7143402099609375, -0.6926040649414062, -0.670867919921875, -0.6491317749023438, -0.6273956298828125, -0.6056594848632812, -0.58392333984375, -0.5621871948242188, -0.5404510498046875, -0.5187149047851562, -0.496978759765625, -0.47524261474609375, -0.4535064697265625, -0.43177032470703125, -0.4100341796875, -0.38829803466796875, -0.3665618896484375, -0.34482574462890625, -0.323089599609375, -0.30135345458984375, -0.2796173095703125, -0.25788116455078125, -0.23614501953125, -0.21440887451171875, -0.1926727294921875, -0.17093658447265625, -0.149200439453125, -0.12746429443359375, -0.1057281494140625, -0.08399200439453125, -0.062255859375, -0.04051971435546875, -0.0187835693359375, 0.00295257568359375, 0.024688720703125, 0.04642486572265625, 0.0681610107421875, 0.08989715576171875, 0.11163330078125, 0.13336944580078125, 0.1551055908203125, 0.17684173583984375, 0.198577880859375, 0.22031402587890625, 0.2420501708984375, 0.26378631591796875, 0.2855224609375, 0.30725860595703125, 0.3289947509765625, 0.35073089599609375, 0.372467041015625, 0.39420318603515625, 0.4159393310546875, 0.43767547607421875, 0.45941162109375, 0.48114776611328125, 0.5028839111328125, 0.5246200561523438, 0.546356201171875, 0.5680923461914062, 0.5898284912109375, 0.6115646362304688, 0.63330078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 4.0, 9.0, 9.0, 13.0, 25.0, 31.0, 34.0, 57.0, 71.0, 94.0, 121.0, 171.0, 276.0, 449.0, 691.0, 1365.0, 2827.0, 7296.0, 20412.0, 61251.0, 180612.0, 383029.0, 253135.0, 88790.0, 29401.0, 10268.0, 3913.0, 1771.0, 852.0, 501.0, 302.0, 203.0, 163.0, 108.0, 76.0, 57.0, 44.0, 25.0, 19.0, 24.0, 12.0, 7.0, 8.0, 5.0, 8.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.35546875, -2.2733154296875, -2.191162109375, -2.1090087890625, -2.02685546875, -1.9447021484375, -1.862548828125, -1.7803955078125, -1.6982421875, -1.6160888671875, -1.533935546875, -1.4517822265625, -1.36962890625, -1.2874755859375, -1.205322265625, -1.1231689453125, -1.041015625, -0.9588623046875, -0.876708984375, -0.7945556640625, -0.71240234375, -0.6302490234375, -0.548095703125, -0.4659423828125, -0.3837890625, -0.3016357421875, -0.219482421875, -0.1373291015625, -0.05517578125, 0.0269775390625, 0.109130859375, 0.1912841796875, 0.2734375, 0.3555908203125, 0.437744140625, 0.5198974609375, 0.60205078125, 0.6842041015625, 0.766357421875, 0.8485107421875, 0.9306640625, 1.0128173828125, 1.094970703125, 1.1771240234375, 1.25927734375, 1.3414306640625, 1.423583984375, 1.5057373046875, 1.587890625, 1.6700439453125, 1.752197265625, 1.8343505859375, 1.91650390625, 1.9986572265625, 2.080810546875, 2.1629638671875, 2.2451171875, 2.3272705078125, 2.409423828125, 2.4915771484375, 2.57373046875, 2.6558837890625, 2.738037109375, 2.8201904296875, 2.90234375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 9.0, 8.0, 11.0, 8.0, 18.0, 26.0, 25.0, 27.0, 29.0, 40.0, 21.0, 33.0, 33.0, 45.0, 36.0, 48.0, 53.0, 44.0, 54.0, 45.0, 43.0, 40.0, 35.0, 38.0, 31.0, 25.0, 28.0, 24.0, 18.0, 22.0, 14.0, 12.0, 9.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.732421875, -2.65264892578125, -2.5728759765625, -2.49310302734375, -2.413330078125, -2.33355712890625, -2.2537841796875, -2.17401123046875, -2.09423828125, -2.01446533203125, -1.9346923828125, -1.85491943359375, -1.775146484375, -1.69537353515625, -1.6156005859375, -1.53582763671875, -1.4560546875, -1.37628173828125, -1.2965087890625, -1.21673583984375, -1.136962890625, -1.05718994140625, -0.9774169921875, -0.89764404296875, -0.81787109375, -0.73809814453125, -0.6583251953125, -0.57855224609375, -0.498779296875, -0.41900634765625, -0.3392333984375, -0.25946044921875, -0.1796875, -0.09991455078125, -0.0201416015625, 0.05963134765625, 0.139404296875, 0.21917724609375, 0.2989501953125, 0.37872314453125, 0.45849609375, 0.53826904296875, 0.6180419921875, 0.69781494140625, 0.777587890625, 0.85736083984375, 0.9371337890625, 1.01690673828125, 1.0966796875, 1.17645263671875, 1.2562255859375, 1.33599853515625, 1.415771484375, 1.49554443359375, 1.5753173828125, 1.65509033203125, 1.73486328125, 1.81463623046875, 1.8944091796875, 1.97418212890625, 2.053955078125, 2.13372802734375, 2.2135009765625, 2.29327392578125, 2.373046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 11.0, 6.0, 8.0, 15.0, 26.0, 37.0, 59.0, 130.0, 306.0, 740.0, 2000.0, 6538.0, 29883.0, 278460.0, 653647.0, 60821.0, 10972.0, 3070.0, 995.0, 416.0, 181.0, 90.0, 44.0, 28.0, 21.0, 10.0, 8.0, 8.0, 7.0, 2.0, 4.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1640625, -3.065765380859375, -2.96746826171875, -2.869171142578125, -2.7708740234375, -2.672576904296875, -2.57427978515625, -2.475982666015625, -2.377685546875, -2.279388427734375, -2.18109130859375, -2.082794189453125, -1.9844970703125, -1.886199951171875, -1.78790283203125, -1.689605712890625, -1.59130859375, -1.493011474609375, -1.39471435546875, -1.296417236328125, -1.1981201171875, -1.099822998046875, -1.00152587890625, -0.903228759765625, -0.804931640625, -0.706634521484375, -0.60833740234375, -0.510040283203125, -0.4117431640625, -0.313446044921875, -0.21514892578125, -0.116851806640625, -0.0185546875, 0.079742431640625, 0.17803955078125, 0.276336669921875, 0.3746337890625, 0.472930908203125, 0.57122802734375, 0.669525146484375, 0.767822265625, 0.866119384765625, 0.96441650390625, 1.062713623046875, 1.1610107421875, 1.259307861328125, 1.35760498046875, 1.455902099609375, 1.55419921875, 1.652496337890625, 1.75079345703125, 1.849090576171875, 1.9473876953125, 2.045684814453125, 2.14398193359375, 2.242279052734375, 2.340576171875, 2.438873291015625, 2.53717041015625, 2.635467529296875, 2.7337646484375, 2.832061767578125, 2.93035888671875, 3.028656005859375, 3.126953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 4.0, 0.0, 8.0, 3.0, 5.0, 10.0, 6.0, 12.0, 19.0, 25.0, 21.0, 22.0, 33.0, 31.0, 38.0, 38.0, 63.0, 81.0, 100.0, 90.0, 78.0, 53.0, 43.0, 33.0, 29.0, 32.0, 21.0, 15.0, 13.0, 15.0, 13.0, 9.0, 8.0, 9.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00022423267364501953, -0.0002177748829126358, -0.00021131709218025208, -0.00020485930144786835, -0.00019840151071548462, -0.0001919437199831009, -0.00018548592925071716, -0.00017902813851833344, -0.0001725703477859497, -0.00016611255705356598, -0.00015965476632118225, -0.00015319697558879852, -0.0001467391848564148, -0.00014028139412403107, -0.00013382360339164734, -0.0001273658126592636, -0.00012090802192687988, -0.00011445023119449615, -0.00010799244046211243, -0.0001015346497297287, -9.507685899734497e-05, -8.861906826496124e-05, -8.216127753257751e-05, -7.570348680019379e-05, -6.924569606781006e-05, -6.278790533542633e-05, -5.63301146030426e-05, -4.9872323870658875e-05, -4.3414533138275146e-05, -3.695674240589142e-05, -3.049895167350769e-05, -2.4041160941123962e-05, -1.7583370208740234e-05, -1.1125579476356506e-05, -4.667788743972778e-06, 1.7900019884109497e-06, 8.247792720794678e-06, 1.4705583453178406e-05, 2.1163374185562134e-05, 2.7621164917945862e-05, 3.407895565032959e-05, 4.053674638271332e-05, 4.6994537115097046e-05, 5.3452327847480774e-05, 5.99101185798645e-05, 6.636790931224823e-05, 7.282570004463196e-05, 7.928349077701569e-05, 8.574128150939941e-05, 9.219907224178314e-05, 9.865686297416687e-05, 0.0001051146537065506, 0.00011157244443893433, 0.00011803023517131805, 0.00012448802590370178, 0.0001309458166360855, 0.00013740360736846924, 0.00014386139810085297, 0.0001503191888332367, 0.00015677697956562042, 0.00016323477029800415, 0.00016969256103038788, 0.0001761503517627716, 0.00018260814249515533, 0.00018906593322753906]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 4.0, 8.0, 8.0, 9.0, 16.0, 22.0, 23.0, 30.0, 52.0, 103.0, 125.0, 254.0, 442.0, 874.0, 1764.0, 3896.0, 10284.0, 33631.0, 178168.0, 662049.0, 116322.0, 25666.0, 8293.0, 3292.0, 1493.0, 744.0, 398.0, 230.0, 109.0, 82.0, 59.0, 24.0, 24.0, 15.0, 14.0, 7.0, 6.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.533203125, -2.449859619140625, -2.36651611328125, -2.283172607421875, -2.1998291015625, -2.116485595703125, -2.03314208984375, -1.949798583984375, -1.866455078125, -1.783111572265625, -1.69976806640625, -1.616424560546875, -1.5330810546875, -1.449737548828125, -1.36639404296875, -1.283050537109375, -1.19970703125, -1.116363525390625, -1.03302001953125, -0.949676513671875, -0.8663330078125, -0.782989501953125, -0.69964599609375, -0.616302490234375, -0.532958984375, -0.449615478515625, -0.36627197265625, -0.282928466796875, -0.1995849609375, -0.116241455078125, -0.03289794921875, 0.050445556640625, 0.1337890625, 0.217132568359375, 0.30047607421875, 0.383819580078125, 0.4671630859375, 0.550506591796875, 0.63385009765625, 0.717193603515625, 0.800537109375, 0.883880615234375, 0.96722412109375, 1.050567626953125, 1.1339111328125, 1.217254638671875, 1.30059814453125, 1.383941650390625, 1.46728515625, 1.550628662109375, 1.63397216796875, 1.717315673828125, 1.8006591796875, 1.884002685546875, 1.96734619140625, 2.050689697265625, 2.134033203125, 2.217376708984375, 2.30072021484375, 2.384063720703125, 2.4674072265625, 2.550750732421875, 2.63409423828125, 2.717437744140625, 2.80078125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 7.0, 12.0, 15.0, 12.0, 16.0, 28.0, 28.0, 29.0, 70.0, 79.0, 103.0, 128.0, 110.0, 89.0, 56.0, 49.0, 37.0, 20.0, 20.0, 19.0, 14.0, 11.0, 8.0, 9.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-2.44140625, -2.3764801025390625, -2.311553955078125, -2.2466278076171875, -2.18170166015625, -2.1167755126953125, -2.051849365234375, -1.9869232177734375, -1.9219970703125, -1.8570709228515625, -1.792144775390625, -1.7272186279296875, -1.66229248046875, -1.5973663330078125, -1.532440185546875, -1.4675140380859375, -1.402587890625, -1.3376617431640625, -1.272735595703125, -1.2078094482421875, -1.14288330078125, -1.0779571533203125, -1.013031005859375, -0.9481048583984375, -0.8831787109375, -0.8182525634765625, -0.753326416015625, -0.6884002685546875, -0.62347412109375, -0.5585479736328125, -0.493621826171875, -0.4286956787109375, -0.36376953125, -0.2988433837890625, -0.233917236328125, -0.1689910888671875, -0.10406494140625, -0.0391387939453125, 0.025787353515625, 0.0907135009765625, 0.1556396484375, 0.2205657958984375, 0.285491943359375, 0.3504180908203125, 0.41534423828125, 0.4802703857421875, 0.545196533203125, 0.6101226806640625, 0.675048828125, 0.7399749755859375, 0.804901123046875, 0.8698272705078125, 0.93475341796875, 0.9996795654296875, 1.064605712890625, 1.1295318603515625, 1.1944580078125, 1.2593841552734375, 1.324310302734375, 1.3892364501953125, 1.45416259765625, 1.5190887451171875, 1.584014892578125, 1.6489410400390625, 1.7138671875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 15.0, 52.0, 86.0, 169.0, 237.0, 216.0, 115.0, 43.0, 30.0, 16.0, 11.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.099685668945312, -17.79871940612793, -16.497753143310547, -15.19678783416748, -13.895821571350098, -12.594855308532715, -11.293889999389648, -9.992923736572266, -8.691957473754883, -7.3909912109375, -6.090025424957275, -4.789059638977051, -3.488093376159668, -2.187127113342285, -0.8861613273620605, 0.41480445861816406, 1.7157707214355469, 3.0167367458343506, 4.317702770233154, 5.618668556213379, 6.919634819030762, 8.220601081848145, 9.521566390991211, 10.822532653808594, 12.123498916625977, 13.42446517944336, 14.725431442260742, 16.026397705078125, 17.327362060546875, 18.62833023071289, 19.92929458618164, 21.230260848999023, 22.531227111816406, 23.83219337463379, 25.133159637451172, 26.434125900268555, 27.735092163085938, 29.036056518554688, 30.33702278137207, 31.637989044189453, 32.93895721435547, 34.23992156982422, 35.540889739990234, 36.841854095458984, 38.142822265625, 39.44378662109375, 40.744754791259766, 42.045719146728516, 43.346683502197266, 44.647647857666016, 45.94861602783203, 47.24958038330078, 48.5505485534668, 49.85151290893555, 51.15248107910156, 52.45344543457031, 53.75440979003906, 55.05537414550781, 56.35634231567383, 57.65730667114258, 58.958274841308594, 60.259239196777344, 61.56020736694336, 62.86117172241211, 64.16213989257812]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 7.0, 2.0, 6.0, 6.0, 10.0, 17.0, 15.0, 15.0, 17.0, 27.0, 26.0, 23.0, 34.0, 46.0, 39.0, 45.0, 41.0, 49.0, 38.0, 48.0, 43.0, 56.0, 48.0, 50.0, 49.0, 30.0, 25.0, 25.0, 43.0, 17.0, 18.0, 16.0, 16.0, 9.0, 12.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.334754943847656, -13.865535736083984, -13.396317481994629, -12.927098274230957, -12.457880020141602, -11.98866081237793, -11.519441604614258, -11.050222396850586, -10.58100414276123, -10.111784934997559, -9.642566680908203, -9.173347473144531, -8.70412826538086, -8.234910011291504, -7.765690803527832, -7.296472072601318, -6.827253341674805, -6.358034610748291, -5.888815879821777, -5.4195966720581055, -4.950377941131592, -4.481159210205078, -4.011940002441406, -3.5427212715148926, -3.073502540588379, -2.6042838096618652, -2.1350648403167725, -1.6658459901809692, -1.196627140045166, -0.7274084091186523, -0.25818943977355957, 0.2110295295715332, 0.6802492141723633, 1.1494680643081665, 1.6186869144439697, 2.0879058837890625, 2.557124614715576, 3.02634334564209, 3.4955623149871826, 3.9647812843322754, 4.434000015258789, 4.903218746185303, 5.372437477111816, 5.841656684875488, 6.310875415802002, 6.780094146728516, 7.2493133544921875, 7.718532085418701, 8.187750816345215, 8.656970024108887, 9.126188278198242, 9.595407485961914, 10.064626693725586, 10.533844947814941, 11.003064155578613, 11.472282409667969, 11.94150161743164, 12.410720825195312, 12.879939079284668, 13.34915828704834, 13.818376541137695, 14.287595748901367, 14.756814956665039, 15.226034164428711, 15.695252418518066]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 8.0, 16.0, 15.0, 33.0, 45.0, 71.0, 79.0, 152.0, 285.0, 464.0, 1009.0, 2259.0, 6353.0, 23361.0, 161044.0, 3745566.0, 214097.0, 27509.0, 7072.0, 2485.0, 1052.0, 530.0, 278.0, 169.0, 101.0, 73.0, 35.0, 28.0, 18.0, 20.0, 14.0, 7.0, 7.0, 7.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.2578125, -4.12286376953125, -3.9879150390625, -3.85296630859375, -3.718017578125, -3.58306884765625, -3.4481201171875, -3.31317138671875, -3.17822265625, -3.04327392578125, -2.9083251953125, -2.77337646484375, -2.638427734375, -2.50347900390625, -2.3685302734375, -2.23358154296875, -2.0986328125, -1.96368408203125, -1.8287353515625, -1.69378662109375, -1.558837890625, -1.42388916015625, -1.2889404296875, -1.15399169921875, -1.01904296875, -0.88409423828125, -0.7491455078125, -0.61419677734375, -0.479248046875, -0.34429931640625, -0.2093505859375, -0.07440185546875, 0.060546875, 0.19549560546875, 0.3304443359375, 0.46539306640625, 0.600341796875, 0.73529052734375, 0.8702392578125, 1.00518798828125, 1.14013671875, 1.27508544921875, 1.4100341796875, 1.54498291015625, 1.679931640625, 1.81488037109375, 1.9498291015625, 2.08477783203125, 2.2197265625, 2.35467529296875, 2.4896240234375, 2.62457275390625, 2.759521484375, 2.89447021484375, 3.0294189453125, 3.16436767578125, 3.29931640625, 3.43426513671875, 3.5692138671875, 3.70416259765625, 3.839111328125, 3.97406005859375, 4.1090087890625, 4.24395751953125, 4.37890625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 7.0, 11.0, 8.0, 12.0, 13.0, 18.0, 27.0, 28.0, 27.0, 38.0, 34.0, 42.0, 50.0, 44.0, 48.0, 44.0, 40.0, 52.0, 49.0, 51.0, 39.0, 35.0, 45.0, 40.0, 30.0, 25.0, 26.0, 20.0, 23.0, 18.0, 10.0, 9.0, 6.0, 3.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.72607421875, -0.7057266235351562, -0.6853790283203125, -0.6650314331054688, -0.644683837890625, -0.6243362426757812, -0.6039886474609375, -0.5836410522460938, -0.56329345703125, -0.5429458618164062, -0.5225982666015625, -0.5022506713867188, -0.481903076171875, -0.46155548095703125, -0.4412078857421875, -0.42086029052734375, -0.4005126953125, -0.38016510009765625, -0.3598175048828125, -0.33946990966796875, -0.319122314453125, -0.29877471923828125, -0.2784271240234375, -0.25807952880859375, -0.23773193359375, -0.21738433837890625, -0.1970367431640625, -0.17668914794921875, -0.156341552734375, -0.13599395751953125, -0.1156463623046875, -0.09529876708984375, -0.074951171875, -0.05460357666015625, -0.0342559814453125, -0.01390838623046875, 0.006439208984375, 0.02678680419921875, 0.0471343994140625, 0.06748199462890625, 0.08782958984375, 0.10817718505859375, 0.1285247802734375, 0.14887237548828125, 0.169219970703125, 0.18956756591796875, 0.2099151611328125, 0.23026275634765625, 0.2506103515625, 0.27095794677734375, 0.2913055419921875, 0.31165313720703125, 0.332000732421875, 0.35234832763671875, 0.3726959228515625, 0.39304351806640625, 0.41339111328125, 0.43373870849609375, 0.4540863037109375, 0.47443389892578125, 0.494781494140625, 0.5151290893554688, 0.5354766845703125, 0.5558242797851562, 0.576171875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 7.0, 10.0, 13.0, 26.0, 24.0, 42.0, 65.0, 115.0, 225.0, 437.0, 850.0, 1874.0, 4181.0, 10054.0, 29771.0, 119524.0, 1169427.0, 2627208.0, 169716.0, 38446.0, 12580.0, 5067.0, 2200.0, 1098.0, 589.0, 305.0, 188.0, 88.0, 49.0, 34.0, 22.0, 11.0, 4.0, 5.0, 11.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-3.62109375, -3.52606201171875, -3.4310302734375, -3.33599853515625, -3.240966796875, -3.14593505859375, -3.0509033203125, -2.95587158203125, -2.86083984375, -2.76580810546875, -2.6707763671875, -2.57574462890625, -2.480712890625, -2.38568115234375, -2.2906494140625, -2.19561767578125, -2.1005859375, -2.00555419921875, -1.9105224609375, -1.81549072265625, -1.720458984375, -1.62542724609375, -1.5303955078125, -1.43536376953125, -1.34033203125, -1.24530029296875, -1.1502685546875, -1.05523681640625, -0.960205078125, -0.86517333984375, -0.7701416015625, -0.67510986328125, -0.580078125, -0.48504638671875, -0.3900146484375, -0.29498291015625, -0.199951171875, -0.10491943359375, -0.0098876953125, 0.08514404296875, 0.18017578125, 0.27520751953125, 0.3702392578125, 0.46527099609375, 0.560302734375, 0.65533447265625, 0.7503662109375, 0.84539794921875, 0.9404296875, 1.03546142578125, 1.1304931640625, 1.22552490234375, 1.320556640625, 1.41558837890625, 1.5106201171875, 1.60565185546875, 1.70068359375, 1.79571533203125, 1.8907470703125, 1.98577880859375, 2.080810546875, 2.17584228515625, 2.2708740234375, 2.36590576171875, 2.4609375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 4.0, 5.0, 5.0, 8.0, 12.0, 21.0, 21.0, 32.0, 42.0, 60.0, 93.0, 142.0, 250.0, 593.0, 1324.0, 674.0, 273.0, 147.0, 100.0, 94.0, 38.0, 34.0, 25.0, 15.0, 13.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2001953125, -1.156707763671875, -1.11322021484375, -1.069732666015625, -1.0262451171875, -0.982757568359375, -0.93927001953125, -0.895782470703125, -0.852294921875, -0.808807373046875, -0.76531982421875, -0.721832275390625, -0.6783447265625, -0.634857177734375, -0.59136962890625, -0.547882080078125, -0.50439453125, -0.460906982421875, -0.41741943359375, -0.373931884765625, -0.3304443359375, -0.286956787109375, -0.24346923828125, -0.199981689453125, -0.156494140625, -0.113006591796875, -0.06951904296875, -0.026031494140625, 0.0174560546875, 0.060943603515625, 0.10443115234375, 0.147918701171875, 0.19140625, 0.234893798828125, 0.27838134765625, 0.321868896484375, 0.3653564453125, 0.408843994140625, 0.45233154296875, 0.495819091796875, 0.539306640625, 0.582794189453125, 0.62628173828125, 0.669769287109375, 0.7132568359375, 0.756744384765625, 0.80023193359375, 0.843719482421875, 0.88720703125, 0.930694580078125, 0.97418212890625, 1.017669677734375, 1.0611572265625, 1.104644775390625, 1.14813232421875, 1.191619873046875, 1.235107421875, 1.278594970703125, 1.32208251953125, 1.365570068359375, 1.4090576171875, 1.452545166015625, 1.49603271484375, 1.539520263671875, 1.5830078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 8.0, 18.0, 26.0, 52.0, 90.0, 135.0, 180.0, 174.0, 138.0, 67.0, 56.0, 29.0, 10.0, 3.0, 6.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.113005638122559, -9.689754486083984, -9.26650333404541, -8.843252182006836, -8.420000076293945, -7.996748924255371, -7.573497772216797, -7.150246620178223, -6.72699499130249, -6.303743839263916, -5.880492210388184, -5.457241058349609, -5.033989906311035, -4.610738277435303, -4.1874871253967285, -3.764235734939575, -3.340984344482422, -2.9177329540252686, -2.4944815635681152, -2.071230411529541, -1.6479790210723877, -1.2247276306152344, -0.8014764785766602, -0.37822508811950684, 0.045026302337646484, 0.46827763319015503, 0.8915289640426636, 1.3147802352905273, 1.7380316257476807, 2.161283016204834, 2.584534168243408, 3.0077855587005615, 3.4310359954833984, 3.8542873859405518, 4.277538776397705, 4.700789928436279, 5.124041557312012, 5.547292709350586, 5.97054386138916, 6.393795013427734, 6.817046642303467, 7.240297794342041, 7.663549423217773, 8.086800575256348, 8.510051727294922, 8.933303833007812, 9.35655403137207, 9.779806137084961, 10.203057289123535, 10.62630844116211, 11.049559593200684, 11.472810745239258, 11.896062850952148, 12.319314002990723, 12.742565155029297, 13.165816307067871, 13.589067459106445, 14.01231861114502, 14.435569763183594, 14.858821868896484, 15.282073020935059, 15.705324172973633, 16.12857437133789, 16.55182647705078, 16.975078582763672]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 7.0, 14.0, 19.0, 30.0, 20.0, 51.0, 56.0, 62.0, 76.0, 86.0, 103.0, 76.0, 74.0, 68.0, 67.0, 42.0, 35.0, 33.0, 24.0, 15.0, 19.0, 8.0, 7.0, 4.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.524771690368652, -9.216562271118164, -8.908352851867676, -8.600143432617188, -8.291933059692383, -7.983724117279053, -7.675514221191406, -7.367304801940918, -7.05909538269043, -6.750885963439941, -6.442676544189453, -6.134466648101807, -5.826257228851318, -5.51804780960083, -5.209837913513184, -4.901628494262695, -4.593419075012207, -4.285209655761719, -3.9769999980926514, -3.668790340423584, -3.3605809211730957, -3.0523715019226074, -2.74416184425354, -2.4359521865844727, -2.1277427673339844, -1.8195332288742065, -1.5113236904144287, -1.2031141519546509, -0.894904613494873, -0.5866950750350952, -0.2784855365753174, 0.02972412109375, 0.3379335403442383, 0.6461430788040161, 0.954352617263794, 1.2625621557235718, 1.5707716941833496, 1.8789812326431274, 2.1871907711029053, 2.4954004287719727, 2.803609848022461, 3.111819267272949, 3.4200289249420166, 3.728238582611084, 4.036448001861572, 4.3446574211120605, 4.652867317199707, 4.961076736450195, 5.269286155700684, 5.577495574951172, 5.88570499420166, 6.193914890289307, 6.502124309539795, 6.810333728790283, 7.11854362487793, 7.426753044128418, 7.734962463378906, 8.043171882629395, 8.351381301879883, 8.659590721130371, 8.96780014038086, 9.276010513305664, 9.584219932556152, 9.89242935180664, 10.200638771057129]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 4.0, 10.0, 7.0, 10.0, 15.0, 23.0, 45.0, 68.0, 95.0, 148.0, 214.0, 295.0, 474.0, 896.0, 1445.0, 2748.0, 5471.0, 11897.0, 27688.0, 71569.0, 197918.0, 381617.0, 213631.0, 77299.0, 29665.0, 12719.0, 5773.0, 2905.0, 1554.0, 843.0, 545.0, 327.0, 214.0, 125.0, 99.0, 75.0, 38.0, 33.0, 11.0, 17.0, 8.0, 6.0, 4.0, 2.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.439453125, -2.353973388671875, -2.26849365234375, -2.183013916015625, -2.0975341796875, -2.012054443359375, -1.92657470703125, -1.841094970703125, -1.755615234375, -1.670135498046875, -1.58465576171875, -1.499176025390625, -1.4136962890625, -1.328216552734375, -1.24273681640625, -1.157257080078125, -1.07177734375, -0.986297607421875, -0.90081787109375, -0.815338134765625, -0.7298583984375, -0.644378662109375, -0.55889892578125, -0.473419189453125, -0.387939453125, -0.302459716796875, -0.21697998046875, -0.131500244140625, -0.0460205078125, 0.039459228515625, 0.12493896484375, 0.210418701171875, 0.2958984375, 0.381378173828125, 0.46685791015625, 0.552337646484375, 0.6378173828125, 0.723297119140625, 0.80877685546875, 0.894256591796875, 0.979736328125, 1.065216064453125, 1.15069580078125, 1.236175537109375, 1.3216552734375, 1.407135009765625, 1.49261474609375, 1.578094482421875, 1.66357421875, 1.749053955078125, 1.83453369140625, 1.920013427734375, 2.0054931640625, 2.090972900390625, 2.17645263671875, 2.261932373046875, 2.347412109375, 2.432891845703125, 2.51837158203125, 2.603851318359375, 2.6893310546875, 2.774810791015625, 2.86029052734375, 2.945770263671875, 3.03125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 7.0, 5.0, 4.0, 5.0, 10.0, 12.0, 13.0, 10.0, 19.0, 12.0, 22.0, 30.0, 30.0, 31.0, 37.0, 37.0, 45.0, 50.0, 36.0, 37.0, 43.0, 48.0, 50.0, 38.0, 43.0, 31.0, 41.0, 22.0, 34.0, 31.0, 20.0, 27.0, 16.0, 16.0, 13.0, 14.0, 14.0, 12.0, 6.0, 7.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.623046875, -0.6042327880859375, -0.585418701171875, -0.5666046142578125, -0.54779052734375, -0.5289764404296875, -0.510162353515625, -0.4913482666015625, -0.4725341796875, -0.4537200927734375, -0.434906005859375, -0.4160919189453125, -0.39727783203125, -0.3784637451171875, -0.359649658203125, -0.3408355712890625, -0.322021484375, -0.3032073974609375, -0.284393310546875, -0.2655792236328125, -0.24676513671875, -0.2279510498046875, -0.209136962890625, -0.1903228759765625, -0.1715087890625, -0.1526947021484375, -0.133880615234375, -0.1150665283203125, -0.09625244140625, -0.0774383544921875, -0.058624267578125, -0.0398101806640625, -0.02099609375, -0.0021820068359375, 0.016632080078125, 0.0354461669921875, 0.05426025390625, 0.0730743408203125, 0.091888427734375, 0.1107025146484375, 0.1295166015625, 0.1483306884765625, 0.167144775390625, 0.1859588623046875, 0.20477294921875, 0.2235870361328125, 0.242401123046875, 0.2612152099609375, 0.280029296875, 0.2988433837890625, 0.317657470703125, 0.3364715576171875, 0.35528564453125, 0.3740997314453125, 0.392913818359375, 0.4117279052734375, 0.4305419921875, 0.4493560791015625, 0.468170166015625, 0.4869842529296875, 0.50579833984375, 0.5246124267578125, 0.543426513671875, 0.5622406005859375, 0.5810546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 14.0, 12.0, 17.0, 19.0, 32.0, 36.0, 58.0, 112.0, 123.0, 239.0, 410.0, 759.0, 1513.0, 3383.0, 9050.0, 28550.0, 112999.0, 436888.0, 340067.0, 79870.0, 21359.0, 7146.0, 2862.0, 1312.0, 672.0, 368.0, 223.0, 149.0, 80.0, 63.0, 42.0, 32.0, 16.0, 18.0, 19.0, 10.0, 8.0, 9.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.443359375, -3.328125, -3.212890625, -3.09765625, -2.982421875, -2.8671875, -2.751953125, -2.63671875, -2.521484375, -2.40625, -2.291015625, -2.17578125, -2.060546875, -1.9453125, -1.830078125, -1.71484375, -1.599609375, -1.484375, -1.369140625, -1.25390625, -1.138671875, -1.0234375, -0.908203125, -0.79296875, -0.677734375, -0.5625, -0.447265625, -0.33203125, -0.216796875, -0.1015625, 0.013671875, 0.12890625, 0.244140625, 0.359375, 0.474609375, 0.58984375, 0.705078125, 0.8203125, 0.935546875, 1.05078125, 1.166015625, 1.28125, 1.396484375, 1.51171875, 1.626953125, 1.7421875, 1.857421875, 1.97265625, 2.087890625, 2.203125, 2.318359375, 2.43359375, 2.548828125, 2.6640625, 2.779296875, 2.89453125, 3.009765625, 3.125, 3.240234375, 3.35546875, 3.470703125, 3.5859375, 3.701171875, 3.81640625, 3.931640625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 11.0, 7.0, 6.0, 8.0, 15.0, 14.0, 25.0, 29.0, 27.0, 37.0, 37.0, 53.0, 56.0, 45.0, 51.0, 72.0, 46.0, 49.0, 66.0, 49.0, 48.0, 38.0, 40.0, 33.0, 32.0, 31.0, 18.0, 9.0, 12.0, 9.0, 4.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.939453125, -3.824127197265625, -3.70880126953125, -3.593475341796875, -3.4781494140625, -3.362823486328125, -3.24749755859375, -3.132171630859375, -3.016845703125, -2.901519775390625, -2.78619384765625, -2.670867919921875, -2.5555419921875, -2.440216064453125, -2.32489013671875, -2.209564208984375, -2.09423828125, -1.978912353515625, -1.86358642578125, -1.748260498046875, -1.6329345703125, -1.517608642578125, -1.40228271484375, -1.286956787109375, -1.171630859375, -1.056304931640625, -0.94097900390625, -0.825653076171875, -0.7103271484375, -0.595001220703125, -0.47967529296875, -0.364349365234375, -0.2490234375, -0.133697509765625, -0.01837158203125, 0.096954345703125, 0.2122802734375, 0.327606201171875, 0.44293212890625, 0.558258056640625, 0.673583984375, 0.788909912109375, 0.90423583984375, 1.019561767578125, 1.1348876953125, 1.250213623046875, 1.36553955078125, 1.480865478515625, 1.59619140625, 1.711517333984375, 1.82684326171875, 1.942169189453125, 2.0574951171875, 2.172821044921875, 2.28814697265625, 2.403472900390625, 2.518798828125, 2.634124755859375, 2.74945068359375, 2.864776611328125, 2.9801025390625, 3.095428466796875, 3.21075439453125, 3.326080322265625, 3.44140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 9.0, 10.0, 17.0, 44.0, 70.0, 108.0, 210.0, 510.0, 1259.0, 5696.0, 57079.0, 895896.0, 78001.0, 7080.0, 1488.0, 554.0, 225.0, 134.0, 58.0, 32.0, 28.0, 16.0, 12.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.953125, -4.796142578125, -4.63916015625, -4.482177734375, -4.3251953125, -4.168212890625, -4.01123046875, -3.854248046875, -3.697265625, -3.540283203125, -3.38330078125, -3.226318359375, -3.0693359375, -2.912353515625, -2.75537109375, -2.598388671875, -2.44140625, -2.284423828125, -2.12744140625, -1.970458984375, -1.8134765625, -1.656494140625, -1.49951171875, -1.342529296875, -1.185546875, -1.028564453125, -0.87158203125, -0.714599609375, -0.5576171875, -0.400634765625, -0.24365234375, -0.086669921875, 0.0703125, 0.227294921875, 0.38427734375, 0.541259765625, 0.6982421875, 0.855224609375, 1.01220703125, 1.169189453125, 1.326171875, 1.483154296875, 1.64013671875, 1.797119140625, 1.9541015625, 2.111083984375, 2.26806640625, 2.425048828125, 2.58203125, 2.739013671875, 2.89599609375, 3.052978515625, 3.2099609375, 3.366943359375, 3.52392578125, 3.680908203125, 3.837890625, 3.994873046875, 4.15185546875, 4.308837890625, 4.4658203125, 4.622802734375, 4.77978515625, 4.936767578125, 5.09375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 7.0, 10.0, 8.0, 13.0, 21.0, 33.0, 44.0, 100.0, 231.0, 278.0, 100.0, 38.0, 33.0, 15.0, 20.0, 9.0, 7.0, 4.0, 2.0, 4.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038242340087890625, -0.00037153810262680054, -0.0003606528043746948, -0.0003497675061225891, -0.0003388822078704834, -0.0003279969096183777, -0.00031711161136627197, -0.00030622631311416626, -0.00029534101486206055, -0.00028445571660995483, -0.0002735704183578491, -0.0002626851201057434, -0.0002517998218536377, -0.00024091452360153198, -0.00023002922534942627, -0.00021914392709732056, -0.00020825862884521484, -0.00019737333059310913, -0.00018648803234100342, -0.0001756027340888977, -0.000164717435836792, -0.00015383213758468628, -0.00014294683933258057, -0.00013206154108047485, -0.00012117624282836914, -0.00011029094457626343, -9.940564632415771e-05, -8.8520348072052e-05, -7.763504981994629e-05, -6.674975156784058e-05, -5.586445331573486e-05, -4.497915506362915e-05, -3.409385681152344e-05, -2.3208558559417725e-05, -1.2323260307312012e-05, -1.4379620552062988e-06, 9.447336196899414e-06, 2.0332634449005127e-05, 3.121793270111084e-05, 4.210323095321655e-05, 5.2988529205322266e-05, 6.387382745742798e-05, 7.475912570953369e-05, 8.56444239616394e-05, 9.652972221374512e-05, 0.00010741502046585083, 0.00011830031871795654, 0.00012918561697006226, 0.00014007091522216797, 0.00015095621347427368, 0.0001618415117263794, 0.0001727268099784851, 0.00018361210823059082, 0.00019449740648269653, 0.00020538270473480225, 0.00021626800298690796, 0.00022715330123901367, 0.00023803859949111938, 0.0002489238977432251, 0.0002598091959953308, 0.0002706944942474365, 0.00028157979249954224, 0.00029246509075164795, 0.00030335038900375366, 0.0003142356872558594]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 8.0, 10.0, 10.0, 14.0, 25.0, 36.0, 48.0, 66.0, 111.0, 179.0, 298.0, 530.0, 1066.0, 2425.0, 5705.0, 17567.0, 81927.0, 752892.0, 147697.0, 24560.0, 7629.0, 2904.0, 1293.0, 644.0, 382.0, 189.0, 104.0, 61.0, 45.0, 41.0, 21.0, 19.0, 11.0, 4.0, 8.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.48828125, -3.390380859375, -3.29248046875, -3.194580078125, -3.0966796875, -2.998779296875, -2.90087890625, -2.802978515625, -2.705078125, -2.607177734375, -2.50927734375, -2.411376953125, -2.3134765625, -2.215576171875, -2.11767578125, -2.019775390625, -1.921875, -1.823974609375, -1.72607421875, -1.628173828125, -1.5302734375, -1.432373046875, -1.33447265625, -1.236572265625, -1.138671875, -1.040771484375, -0.94287109375, -0.844970703125, -0.7470703125, -0.649169921875, -0.55126953125, -0.453369140625, -0.35546875, -0.257568359375, -0.15966796875, -0.061767578125, 0.0361328125, 0.134033203125, 0.23193359375, 0.329833984375, 0.427734375, 0.525634765625, 0.62353515625, 0.721435546875, 0.8193359375, 0.917236328125, 1.01513671875, 1.113037109375, 1.2109375, 1.308837890625, 1.40673828125, 1.504638671875, 1.6025390625, 1.700439453125, 1.79833984375, 1.896240234375, 1.994140625, 2.092041015625, 2.18994140625, 2.287841796875, 2.3857421875, 2.483642578125, 2.58154296875, 2.679443359375, 2.77734375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 9.0, 14.0, 18.0, 23.0, 53.0, 88.0, 175.0, 246.0, 160.0, 77.0, 43.0, 25.0, 12.0, 17.0, 8.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.83984375, -4.71405029296875, -4.5882568359375, -4.46246337890625, -4.336669921875, -4.21087646484375, -4.0850830078125, -3.95928955078125, -3.83349609375, -3.70770263671875, -3.5819091796875, -3.45611572265625, -3.330322265625, -3.20452880859375, -3.0787353515625, -2.95294189453125, -2.8271484375, -2.70135498046875, -2.5755615234375, -2.44976806640625, -2.323974609375, -2.19818115234375, -2.0723876953125, -1.94659423828125, -1.82080078125, -1.69500732421875, -1.5692138671875, -1.44342041015625, -1.317626953125, -1.19183349609375, -1.0660400390625, -0.94024658203125, -0.814453125, -0.68865966796875, -0.5628662109375, -0.43707275390625, -0.311279296875, -0.18548583984375, -0.0596923828125, 0.06610107421875, 0.19189453125, 0.31768798828125, 0.4434814453125, 0.56927490234375, 0.695068359375, 0.82086181640625, 0.9466552734375, 1.07244873046875, 1.1982421875, 1.32403564453125, 1.4498291015625, 1.57562255859375, 1.701416015625, 1.82720947265625, 1.9530029296875, 2.07879638671875, 2.20458984375, 2.33038330078125, 2.4561767578125, 2.58197021484375, 2.707763671875, 2.83355712890625, 2.9593505859375, 3.08514404296875, 3.2109375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 13.0, 16.0, 36.0, 61.0, 126.0, 166.0, 187.0, 175.0, 101.0, 57.0, 27.0, 17.0, 3.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.942989349365234, -33.79560470581055, -32.648216247558594, -31.500831604003906, -30.35344696044922, -29.2060604095459, -28.058673858642578, -26.91128921508789, -25.76390266418457, -24.61651611328125, -23.469131469726562, -22.321744918823242, -21.174358367919922, -20.026973724365234, -18.879587173461914, -17.732200622558594, -16.584815979003906, -15.437430381774902, -14.290044784545898, -13.142658233642578, -11.995272636413574, -10.84788703918457, -9.70050048828125, -8.553114891052246, -7.405729293823242, -6.258343696594238, -5.110957622528076, -3.963571786880493, -2.81618595123291, -1.6688003540039062, -0.5214142799377441, 0.625971794128418, 1.7733535766601562, 2.9207394123077393, 4.068125247955322, 5.215511322021484, 6.362896919250488, 7.510282516479492, 8.657669067382812, 9.805054664611816, 10.95244026184082, 12.099825859069824, 13.247211456298828, 14.394598007202148, 15.541983604431152, 16.689369201660156, 17.836755752563477, 18.984142303466797, 20.131526947021484, 21.278913497924805, 22.426298141479492, 23.573684692382812, 24.7210693359375, 25.86845588684082, 27.01584243774414, 28.163227081298828, 29.31061363220215, 30.45800018310547, 31.605384826660156, 32.752769470214844, 33.9001579284668, 35.047542572021484, 36.19492721557617, 37.342315673828125, 38.48970031738281]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 6.0, 15.0, 6.0, 11.0, 18.0, 28.0, 25.0, 28.0, 33.0, 34.0, 31.0, 38.0, 53.0, 51.0, 66.0, 58.0, 55.0, 46.0, 43.0, 45.0, 40.0, 39.0, 40.0, 33.0, 32.0, 34.0, 24.0, 13.0, 11.0, 14.0, 9.0, 5.0, 4.0, 7.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.499977111816406, -13.898889541625977, -13.29780101776123, -12.696712493896484, -12.095624923706055, -11.494537353515625, -10.893448829650879, -10.292360305786133, -9.691272735595703, -9.090185165405273, -8.489096641540527, -7.8880085945129395, -7.286920547485352, -6.685832500457764, -6.084744453430176, -5.483656406402588, -4.882568359375, -4.281480312347412, -3.680392265319824, -3.0793042182922363, -2.4782161712646484, -1.8771281242370605, -1.2760400772094727, -0.6749520301818848, -0.07386398315429688, 0.527224063873291, 1.128312110900879, 1.7294001579284668, 2.3304882049560547, 2.9315762519836426, 3.5326642990112305, 4.133752346038818, 4.734840393066406, 5.335928440093994, 5.937016487121582, 6.53810453414917, 7.139192581176758, 7.740280628204346, 8.341368675231934, 8.94245719909668, 9.54354476928711, 10.144632339477539, 10.745720863342285, 11.346809387207031, 11.947896957397461, 12.54898452758789, 13.150073051452637, 13.751161575317383, 14.352249145507812, 14.953336715698242, 15.554425239562988, 16.155513763427734, 16.756601333618164, 17.357688903808594, 17.958778381347656, 18.559865951538086, 19.160953521728516, 19.762041091918945, 20.363128662109375, 20.964218139648438, 21.565305709838867, 22.166393280029297, 22.76748275756836, 23.36857032775879, 23.96965789794922]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 4.0, 3.0, 16.0, 16.0, 22.0, 26.0, 45.0, 68.0, 114.0, 192.0, 274.0, 523.0, 986.0, 1724.0, 3608.0, 8297.0, 22168.0, 80820.0, 1698588.0, 2254521.0, 82602.0, 22853.0, 8581.0, 3856.0, 1892.0, 1024.0, 515.0, 325.0, 202.0, 129.0, 81.0, 52.0, 42.0, 25.0, 22.0, 17.0, 12.0, 13.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.84375, -2.73846435546875, -2.6331787109375, -2.52789306640625, -2.422607421875, -2.31732177734375, -2.2120361328125, -2.10675048828125, -2.00146484375, -1.89617919921875, -1.7908935546875, -1.68560791015625, -1.580322265625, -1.47503662109375, -1.3697509765625, -1.26446533203125, -1.1591796875, -1.05389404296875, -0.9486083984375, -0.84332275390625, -0.738037109375, -0.63275146484375, -0.5274658203125, -0.42218017578125, -0.31689453125, -0.21160888671875, -0.1063232421875, -0.00103759765625, 0.104248046875, 0.20953369140625, 0.3148193359375, 0.42010498046875, 0.525390625, 0.63067626953125, 0.7359619140625, 0.84124755859375, 0.946533203125, 1.05181884765625, 1.1571044921875, 1.26239013671875, 1.36767578125, 1.47296142578125, 1.5782470703125, 1.68353271484375, 1.788818359375, 1.89410400390625, 1.9993896484375, 2.10467529296875, 2.2099609375, 2.31524658203125, 2.4205322265625, 2.52581787109375, 2.631103515625, 2.73638916015625, 2.8416748046875, 2.94696044921875, 3.05224609375, 3.15753173828125, 3.2628173828125, 3.36810302734375, 3.473388671875, 3.57867431640625, 3.6839599609375, 3.78924560546875, 3.89453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 10.0, 17.0, 19.0, 19.0, 25.0, 35.0, 62.0, 62.0, 63.0, 57.0, 80.0, 80.0, 61.0, 70.0, 65.0, 50.0, 56.0, 32.0, 35.0, 25.0, 24.0, 16.0, 9.0, 10.0, 8.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86328125, -0.8267974853515625, -0.790313720703125, -0.7538299560546875, -0.71734619140625, -0.6808624267578125, -0.644378662109375, -0.6078948974609375, -0.5714111328125, -0.5349273681640625, -0.498443603515625, -0.4619598388671875, -0.42547607421875, -0.3889923095703125, -0.352508544921875, -0.3160247802734375, -0.279541015625, -0.2430572509765625, -0.206573486328125, -0.1700897216796875, -0.13360595703125, -0.0971221923828125, -0.060638427734375, -0.0241546630859375, 0.0123291015625, 0.0488128662109375, 0.085296630859375, 0.1217803955078125, 0.15826416015625, 0.1947479248046875, 0.231231689453125, 0.2677154541015625, 0.30419921875, 0.3406829833984375, 0.377166748046875, 0.4136505126953125, 0.45013427734375, 0.4866180419921875, 0.523101806640625, 0.5595855712890625, 0.5960693359375, 0.6325531005859375, 0.669036865234375, 0.7055206298828125, 0.74200439453125, 0.7784881591796875, 0.814971923828125, 0.8514556884765625, 0.887939453125, 0.9244232177734375, 0.960906982421875, 0.9973907470703125, 1.03387451171875, 1.0703582763671875, 1.106842041015625, 1.1433258056640625, 1.1798095703125, 1.2162933349609375, 1.252777099609375, 1.2892608642578125, 1.32574462890625, 1.3622283935546875, 1.398712158203125, 1.4351959228515625, 1.4716796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 8.0, 5.0, 9.0, 14.0, 21.0, 27.0, 54.0, 69.0, 103.0, 213.0, 344.0, 593.0, 1171.0, 2342.0, 5282.0, 12841.0, 40296.0, 209152.0, 3443203.0, 392847.0, 56768.0, 16604.0, 6329.0, 2829.0, 1437.0, 722.0, 382.0, 260.0, 134.0, 71.0, 68.0, 27.0, 16.0, 9.0, 12.0, 6.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-3.55859375, -3.446075439453125, -3.33355712890625, -3.221038818359375, -3.1085205078125, -2.996002197265625, -2.88348388671875, -2.770965576171875, -2.658447265625, -2.545928955078125, -2.43341064453125, -2.320892333984375, -2.2083740234375, -2.095855712890625, -1.98333740234375, -1.870819091796875, -1.75830078125, -1.645782470703125, -1.53326416015625, -1.420745849609375, -1.3082275390625, -1.195709228515625, -1.08319091796875, -0.970672607421875, -0.858154296875, -0.745635986328125, -0.63311767578125, -0.520599365234375, -0.4080810546875, -0.295562744140625, -0.18304443359375, -0.070526123046875, 0.0419921875, 0.154510498046875, 0.26702880859375, 0.379547119140625, 0.4920654296875, 0.604583740234375, 0.71710205078125, 0.829620361328125, 0.942138671875, 1.054656982421875, 1.16717529296875, 1.279693603515625, 1.3922119140625, 1.504730224609375, 1.61724853515625, 1.729766845703125, 1.84228515625, 1.954803466796875, 2.06732177734375, 2.179840087890625, 2.2923583984375, 2.404876708984375, 2.51739501953125, 2.629913330078125, 2.742431640625, 2.854949951171875, 2.96746826171875, 3.079986572265625, 3.1925048828125, 3.305023193359375, 3.41754150390625, 3.530059814453125, 3.642578125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 10.0, 16.0, 22.0, 33.0, 61.0, 76.0, 184.0, 545.0, 2024.0, 602.0, 228.0, 107.0, 44.0, 34.0, 28.0, 10.0, 11.0, 8.0, 8.0, 5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.314453125, -2.251129150390625, -2.18780517578125, -2.124481201171875, -2.0611572265625, -1.997833251953125, -1.93450927734375, -1.871185302734375, -1.807861328125, -1.744537353515625, -1.68121337890625, -1.617889404296875, -1.5545654296875, -1.491241455078125, -1.42791748046875, -1.364593505859375, -1.30126953125, -1.237945556640625, -1.17462158203125, -1.111297607421875, -1.0479736328125, -0.984649658203125, -0.92132568359375, -0.858001708984375, -0.794677734375, -0.731353759765625, -0.66802978515625, -0.604705810546875, -0.5413818359375, -0.478057861328125, -0.41473388671875, -0.351409912109375, -0.2880859375, -0.224761962890625, -0.16143798828125, -0.098114013671875, -0.0347900390625, 0.028533935546875, 0.09185791015625, 0.155181884765625, 0.218505859375, 0.281829833984375, 0.34515380859375, 0.408477783203125, 0.4718017578125, 0.535125732421875, 0.59844970703125, 0.661773681640625, 0.72509765625, 0.788421630859375, 0.85174560546875, 0.915069580078125, 0.9783935546875, 1.041717529296875, 1.10504150390625, 1.168365478515625, 1.231689453125, 1.295013427734375, 1.35833740234375, 1.421661376953125, 1.4849853515625, 1.548309326171875, 1.61163330078125, 1.674957275390625, 1.73828125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 10.0, 25.0, 33.0, 60.0, 147.0, 215.0, 221.0, 157.0, 69.0, 39.0, 7.0, 6.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.352341651916504, -8.879697799682617, -8.407052993774414, -7.934409141540527, -7.461765289306641, -6.989120960235596, -6.516476631164551, -6.043832778930664, -5.571188449859619, -5.098544120788574, -4.6259002685546875, -4.153255939483643, -3.6806118488311768, -3.207967758178711, -2.735323429107666, -2.2626793384552, -1.7900352478027344, -1.3173911571502686, -0.8447469472885132, -0.3721027374267578, 0.10054135322570801, 0.5731854438781738, 1.0458297729492188, 1.5184738636016846, 1.9911179542541504, 2.463762044906616, 2.936406135559082, 3.409050464630127, 3.8816945552825928, 4.354338645935059, 4.8269829750061035, 5.299627304077148, 5.772272109985352, 6.2449164390563965, 6.717560291290283, 7.190204620361328, 7.662848472595215, 8.135492324829102, 8.608137130737305, 9.080780982971191, 9.553424835205078, 10.026068687438965, 10.498713493347168, 10.971357345581055, 11.444001197814941, 11.916645050048828, 12.389289855957031, 12.861933708190918, 13.334578514099121, 13.807222366333008, 14.279867172241211, 14.752511024475098, 15.225154876708984, 15.697799682617188, 16.17044448852539, 16.64308738708496, 17.115732192993164, 17.588376998901367, 18.061019897460938, 18.53366470336914, 19.006309509277344, 19.478952407836914, 19.951597213745117, 20.42424201965332, 20.89688491821289]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 16.0, 19.0, 20.0, 25.0, 39.0, 43.0, 51.0, 60.0, 46.0, 74.0, 69.0, 78.0, 73.0, 55.0, 53.0, 63.0, 38.0, 41.0, 32.0, 26.0, 19.0, 19.0, 7.0, 7.0, 6.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.600971221923828, -8.388124465942383, -8.175278663635254, -7.962431907653809, -7.7495856285095215, -7.536739349365234, -7.323893070220947, -7.11104679107666, -6.898200035095215, -6.685353755950928, -6.472507476806641, -6.259660720825195, -6.046814441680908, -5.833968162536621, -5.621121883392334, -5.408275604248047, -5.19542932510376, -4.982583045959473, -4.7697367668151855, -4.556890487670898, -4.344043731689453, -4.131197452545166, -3.918351173400879, -3.705504894256592, -3.4926583766937256, -3.2798120975494385, -3.0669655799865723, -2.854119300842285, -2.641273021697998, -2.428426504135132, -2.2155802249908447, -2.0027337074279785, -1.7898879051208496, -1.577041506767273, -1.3641951084136963, -1.1513488292694092, -0.9385024309158325, -0.7256560325622559, -0.5128097534179688, -0.2999633550643921, -0.08711695671081543, 0.12572941184043884, 0.3385757803916931, 0.551422119140625, 0.7642685174942017, 0.9771149158477783, 1.1899611949920654, 1.402807593345642, 1.6156539916992188, 1.8285003900527954, 2.041346788406372, 2.254193067550659, 2.4670395851135254, 2.6798858642578125, 2.8927321434020996, 3.1055784225463867, 3.318424940109253, 3.53127121925354, 3.7441177368164062, 3.9569640159606934, 4.1698102951049805, 4.382657051086426, 4.595502853393555, 4.808349609375, 5.021195888519287]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 4.0, 4.0, 8.0, 8.0, 11.0, 8.0, 9.0, 19.0, 22.0, 39.0, 50.0, 85.0, 182.0, 342.0, 673.0, 1601.0, 3950.0, 11307.0, 35233.0, 117022.0, 358178.0, 353469.0, 113906.0, 34323.0, 11075.0, 3983.0, 1608.0, 692.0, 299.0, 162.0, 93.0, 50.0, 31.0, 21.0, 16.0, 15.0, 15.0, 9.0, 7.0, 9.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.384765625, -3.278961181640625, -3.17315673828125, -3.067352294921875, -2.9615478515625, -2.855743408203125, -2.74993896484375, -2.644134521484375, -2.538330078125, -2.432525634765625, -2.32672119140625, -2.220916748046875, -2.1151123046875, -2.009307861328125, -1.90350341796875, -1.797698974609375, -1.69189453125, -1.586090087890625, -1.48028564453125, -1.374481201171875, -1.2686767578125, -1.162872314453125, -1.05706787109375, -0.951263427734375, -0.845458984375, -0.739654541015625, -0.63385009765625, -0.528045654296875, -0.4222412109375, -0.316436767578125, -0.21063232421875, -0.104827880859375, 0.0009765625, 0.106781005859375, 0.21258544921875, 0.318389892578125, 0.4241943359375, 0.529998779296875, 0.63580322265625, 0.741607666015625, 0.847412109375, 0.953216552734375, 1.05902099609375, 1.164825439453125, 1.2706298828125, 1.376434326171875, 1.48223876953125, 1.588043212890625, 1.69384765625, 1.799652099609375, 1.90545654296875, 2.011260986328125, 2.1170654296875, 2.222869873046875, 2.32867431640625, 2.434478759765625, 2.540283203125, 2.646087646484375, 2.75189208984375, 2.857696533203125, 2.9635009765625, 3.069305419921875, 3.17510986328125, 3.280914306640625, 3.38671875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 5.0, 8.0, 7.0, 13.0, 10.0, 7.0, 12.0, 18.0, 23.0, 15.0, 25.0, 30.0, 45.0, 46.0, 33.0, 33.0, 54.0, 57.0, 42.0, 46.0, 42.0, 36.0, 45.0, 36.0, 48.0, 43.0, 33.0, 31.0, 20.0, 26.0, 16.0, 17.0, 11.0, 11.0, 19.0, 12.0, 9.0, 2.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.826171875, -0.8028411865234375, -0.779510498046875, -0.7561798095703125, -0.73284912109375, -0.7095184326171875, -0.686187744140625, -0.6628570556640625, -0.6395263671875, -0.6161956787109375, -0.592864990234375, -0.5695343017578125, -0.54620361328125, -0.5228729248046875, -0.499542236328125, -0.4762115478515625, -0.452880859375, -0.4295501708984375, -0.406219482421875, -0.3828887939453125, -0.35955810546875, -0.3362274169921875, -0.312896728515625, -0.2895660400390625, -0.2662353515625, -0.2429046630859375, -0.219573974609375, -0.1962432861328125, -0.17291259765625, -0.1495819091796875, -0.126251220703125, -0.1029205322265625, -0.07958984375, -0.0562591552734375, -0.032928466796875, -0.0095977783203125, 0.01373291015625, 0.0370635986328125, 0.060394287109375, 0.0837249755859375, 0.1070556640625, 0.1303863525390625, 0.153717041015625, 0.1770477294921875, 0.20037841796875, 0.2237091064453125, 0.247039794921875, 0.2703704833984375, 0.293701171875, 0.3170318603515625, 0.340362548828125, 0.3636932373046875, 0.38702392578125, 0.4103546142578125, 0.433685302734375, 0.4570159912109375, 0.4803466796875, 0.5036773681640625, 0.527008056640625, 0.5503387451171875, 0.57366943359375, 0.5970001220703125, 0.620330810546875, 0.6436614990234375, 0.6669921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 6.0, 9.0, 6.0, 14.0, 14.0, 17.0, 28.0, 27.0, 45.0, 54.0, 95.0, 145.0, 238.0, 379.0, 756.0, 1359.0, 2991.0, 7031.0, 17459.0, 45279.0, 122911.0, 313992.0, 326504.0, 129182.0, 47367.0, 18405.0, 7594.0, 3331.0, 1480.0, 711.0, 376.0, 249.0, 145.0, 94.0, 61.0, 49.0, 39.0, 27.0, 22.0, 19.0, 7.0, 8.0, 9.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.51171875, -2.428070068359375, -2.34442138671875, -2.260772705078125, -2.1771240234375, -2.093475341796875, -2.00982666015625, -1.926177978515625, -1.842529296875, -1.758880615234375, -1.67523193359375, -1.591583251953125, -1.5079345703125, -1.424285888671875, -1.34063720703125, -1.256988525390625, -1.17333984375, -1.089691162109375, -1.00604248046875, -0.922393798828125, -0.8387451171875, -0.755096435546875, -0.67144775390625, -0.587799072265625, -0.504150390625, -0.420501708984375, -0.33685302734375, -0.253204345703125, -0.1695556640625, -0.085906982421875, -0.00225830078125, 0.081390380859375, 0.1650390625, 0.248687744140625, 0.33233642578125, 0.415985107421875, 0.4996337890625, 0.583282470703125, 0.66693115234375, 0.750579833984375, 0.834228515625, 0.917877197265625, 1.00152587890625, 1.085174560546875, 1.1688232421875, 1.252471923828125, 1.33612060546875, 1.419769287109375, 1.50341796875, 1.587066650390625, 1.67071533203125, 1.754364013671875, 1.8380126953125, 1.921661376953125, 2.00531005859375, 2.088958740234375, 2.172607421875, 2.256256103515625, 2.33990478515625, 2.423553466796875, 2.5072021484375, 2.590850830078125, 2.67449951171875, 2.758148193359375, 2.841796875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 7.0, 6.0, 5.0, 3.0, 11.0, 9.0, 11.0, 18.0, 14.0, 15.0, 21.0, 35.0, 29.0, 33.0, 35.0, 38.0, 39.0, 40.0, 47.0, 28.0, 41.0, 34.0, 28.0, 43.0, 33.0, 38.0, 40.0, 21.0, 39.0, 38.0, 29.0, 16.0, 32.0, 16.0, 27.0, 15.0, 12.0, 11.0, 3.0, 11.0, 7.0, 5.0, 3.0, 7.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.033203125, -2.94403076171875, -2.8548583984375, -2.76568603515625, -2.676513671875, -2.58734130859375, -2.4981689453125, -2.40899658203125, -2.31982421875, -2.23065185546875, -2.1414794921875, -2.05230712890625, -1.963134765625, -1.87396240234375, -1.7847900390625, -1.69561767578125, -1.6064453125, -1.51727294921875, -1.4281005859375, -1.33892822265625, -1.249755859375, -1.16058349609375, -1.0714111328125, -0.98223876953125, -0.89306640625, -0.80389404296875, -0.7147216796875, -0.62554931640625, -0.536376953125, -0.44720458984375, -0.3580322265625, -0.26885986328125, -0.1796875, -0.09051513671875, -0.0013427734375, 0.08782958984375, 0.177001953125, 0.26617431640625, 0.3553466796875, 0.44451904296875, 0.53369140625, 0.62286376953125, 0.7120361328125, 0.80120849609375, 0.890380859375, 0.97955322265625, 1.0687255859375, 1.15789794921875, 1.2470703125, 1.33624267578125, 1.4254150390625, 1.51458740234375, 1.603759765625, 1.69293212890625, 1.7821044921875, 1.87127685546875, 1.96044921875, 2.04962158203125, 2.1387939453125, 2.22796630859375, 2.317138671875, 2.40631103515625, 2.4954833984375, 2.58465576171875, 2.673828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 1.0, 5.0, 9.0, 9.0, 11.0, 18.0, 27.0, 49.0, 90.0, 132.0, 230.0, 539.0, 1207.0, 3788.0, 14450.0, 81596.0, 610028.0, 287010.0, 37538.0, 7767.0, 2333.0, 868.0, 359.0, 206.0, 104.0, 73.0, 34.0, 24.0, 16.0, 7.0, 13.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4462890625, -1.3902130126953125, -1.334136962890625, -1.2780609130859375, -1.22198486328125, -1.1659088134765625, -1.109832763671875, -1.0537567138671875, -0.9976806640625, -0.9416046142578125, -0.885528564453125, -0.8294525146484375, -0.77337646484375, -0.7173004150390625, -0.661224365234375, -0.6051483154296875, -0.549072265625, -0.4929962158203125, -0.436920166015625, -0.3808441162109375, -0.32476806640625, -0.2686920166015625, -0.212615966796875, -0.1565399169921875, -0.1004638671875, -0.0443878173828125, 0.011688232421875, 0.0677642822265625, 0.12384033203125, 0.1799163818359375, 0.235992431640625, 0.2920684814453125, 0.34814453125, 0.4042205810546875, 0.460296630859375, 0.5163726806640625, 0.57244873046875, 0.6285247802734375, 0.684600830078125, 0.7406768798828125, 0.7967529296875, 0.8528289794921875, 0.908905029296875, 0.9649810791015625, 1.02105712890625, 1.0771331787109375, 1.133209228515625, 1.1892852783203125, 1.245361328125, 1.3014373779296875, 1.357513427734375, 1.4135894775390625, 1.46966552734375, 1.5257415771484375, 1.581817626953125, 1.6378936767578125, 1.6939697265625, 1.7500457763671875, 1.806121826171875, 1.8621978759765625, 1.91827392578125, 1.9743499755859375, 2.030426025390625, 2.0865020751953125, 2.142578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 8.0, 9.0, 8.0, 10.0, 18.0, 28.0, 24.0, 47.0, 79.0, 145.0, 215.0, 154.0, 78.0, 57.0, 35.0, 19.0, 17.0, 9.0, 12.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00031113624572753906, -0.0003032684326171875, -0.00029540061950683594, -0.0002875328063964844, -0.0002796649932861328, -0.00027179718017578125, -0.0002639293670654297, -0.0002560615539550781, -0.00024819374084472656, -0.000240325927734375, -0.00023245811462402344, -0.00022459030151367188, -0.0002167224884033203, -0.00020885467529296875, -0.0002009868621826172, -0.00019311904907226562, -0.00018525123596191406, -0.0001773834228515625, -0.00016951560974121094, -0.00016164779663085938, -0.0001537799835205078, -0.00014591217041015625, -0.0001380443572998047, -0.00013017654418945312, -0.00012230873107910156, -0.00011444091796875, -0.00010657310485839844, -9.870529174804688e-05, -9.083747863769531e-05, -8.296966552734375e-05, -7.510185241699219e-05, -6.723403930664062e-05, -5.936622619628906e-05, -5.14984130859375e-05, -4.363059997558594e-05, -3.5762786865234375e-05, -2.7894973754882812e-05, -2.002716064453125e-05, -1.2159347534179688e-05, -4.291534423828125e-06, 3.5762786865234375e-06, 1.1444091796875e-05, 1.9311904907226562e-05, 2.7179718017578125e-05, 3.504753112792969e-05, 4.291534423828125e-05, 5.078315734863281e-05, 5.8650970458984375e-05, 6.651878356933594e-05, 7.43865966796875e-05, 8.225440979003906e-05, 9.012222290039062e-05, 9.799003601074219e-05, 0.00010585784912109375, 0.00011372566223144531, 0.00012159347534179688, 0.00012946128845214844, 0.0001373291015625, 0.00014519691467285156, 0.00015306472778320312, 0.0001609325408935547, 0.00016880035400390625, 0.0001766681671142578, 0.00018453598022460938, 0.00019240379333496094]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 8.0, 5.0, 11.0, 12.0, 16.0, 26.0, 27.0, 45.0, 54.0, 75.0, 126.0, 204.0, 408.0, 707.0, 1595.0, 3764.0, 11675.0, 49952.0, 330894.0, 539195.0, 83217.0, 17254.0, 5210.0, 1992.0, 904.0, 489.0, 247.0, 128.0, 91.0, 47.0, 38.0, 36.0, 26.0, 20.0, 13.0, 7.0, 8.0, 7.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2431640625, -1.1973724365234375, -1.151580810546875, -1.1057891845703125, -1.05999755859375, -1.0142059326171875, -0.968414306640625, -0.9226226806640625, -0.8768310546875, -0.8310394287109375, -0.785247802734375, -0.7394561767578125, -0.69366455078125, -0.6478729248046875, -0.602081298828125, -0.5562896728515625, -0.510498046875, -0.4647064208984375, -0.418914794921875, -0.3731231689453125, -0.32733154296875, -0.2815399169921875, -0.235748291015625, -0.1899566650390625, -0.1441650390625, -0.0983734130859375, -0.052581787109375, -0.0067901611328125, 0.03900146484375, 0.0847930908203125, 0.130584716796875, 0.1763763427734375, 0.22216796875, 0.2679595947265625, 0.313751220703125, 0.3595428466796875, 0.40533447265625, 0.4511260986328125, 0.496917724609375, 0.5427093505859375, 0.5885009765625, 0.6342926025390625, 0.680084228515625, 0.7258758544921875, 0.77166748046875, 0.8174591064453125, 0.863250732421875, 0.9090423583984375, 0.954833984375, 1.0006256103515625, 1.046417236328125, 1.0922088623046875, 1.13800048828125, 1.1837921142578125, 1.229583740234375, 1.2753753662109375, 1.3211669921875, 1.3669586181640625, 1.412750244140625, 1.4585418701171875, 1.50433349609375, 1.5501251220703125, 1.595916748046875, 1.6417083740234375, 1.6875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 11.0, 16.0, 27.0, 33.0, 33.0, 52.0, 81.0, 113.0, 104.0, 126.0, 111.0, 85.0, 53.0, 57.0, 26.0, 17.0, 9.0, 11.0, 4.0, 9.0, 4.0, 5.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.37890625, -1.329681396484375, -1.28045654296875, -1.231231689453125, -1.1820068359375, -1.132781982421875, -1.08355712890625, -1.034332275390625, -0.985107421875, -0.935882568359375, -0.88665771484375, -0.837432861328125, -0.7882080078125, -0.738983154296875, -0.68975830078125, -0.640533447265625, -0.59130859375, -0.542083740234375, -0.49285888671875, -0.443634033203125, -0.3944091796875, -0.345184326171875, -0.29595947265625, -0.246734619140625, -0.197509765625, -0.148284912109375, -0.09906005859375, -0.049835205078125, -0.0006103515625, 0.048614501953125, 0.09783935546875, 0.147064208984375, 0.1962890625, 0.245513916015625, 0.29473876953125, 0.343963623046875, 0.3931884765625, 0.442413330078125, 0.49163818359375, 0.540863037109375, 0.590087890625, 0.639312744140625, 0.68853759765625, 0.737762451171875, 0.7869873046875, 0.836212158203125, 0.88543701171875, 0.934661865234375, 0.98388671875, 1.033111572265625, 1.08233642578125, 1.131561279296875, 1.1807861328125, 1.230010986328125, 1.27923583984375, 1.328460693359375, 1.377685546875, 1.426910400390625, 1.47613525390625, 1.525360107421875, 1.5745849609375, 1.623809814453125, 1.67303466796875, 1.722259521484375, 1.771484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 10.0, 17.0, 39.0, 82.0, 160.0, 256.0, 211.0, 122.0, 62.0, 27.0, 17.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.6652603149414, -64.37455749511719, -63.0838508605957, -61.79314422607422, -60.502437591552734, -59.21173095703125, -57.92102813720703, -56.63032150268555, -55.33961486816406, -54.04890823364258, -52.75820541381836, -51.467498779296875, -50.17679214477539, -48.886085510253906, -47.59538269042969, -46.3046760559082, -45.01396942138672, -43.723262786865234, -42.432559967041016, -41.14185333251953, -39.85114669799805, -38.56044006347656, -37.269737243652344, -35.97903060913086, -34.68832778930664, -33.397621154785156, -32.10691833496094, -30.816211700439453, -29.52550506591797, -28.234800338745117, -26.944095611572266, -25.65338897705078, -24.362680435180664, -23.071975708007812, -21.781269073486328, -20.490564346313477, -19.199857711791992, -17.90915298461914, -16.618446350097656, -15.327741622924805, -14.037035942077637, -12.746330261230469, -11.4556245803833, -10.164918899536133, -8.874214172363281, -7.583508014678955, -6.292802810668945, -5.002097129821777, -3.7113914489746094, -2.4206857681274414, -1.1299803256988525, 0.16072511672973633, 1.4514307975769043, 2.7421364784240723, 4.032841682434082, 5.32354736328125, 6.614253044128418, 7.904958724975586, 9.195664405822754, 10.486370086669922, 11.777074813842773, 13.067781448364258, 14.35848617553711, 15.649191856384277, 16.939897537231445]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 9.0, 5.0, 13.0, 11.0, 15.0, 21.0, 17.0, 18.0, 24.0, 24.0, 33.0, 34.0, 33.0, 39.0, 54.0, 44.0, 48.0, 54.0, 42.0, 48.0, 46.0, 54.0, 48.0, 29.0, 21.0, 25.0, 39.0, 25.0, 23.0, 15.0, 21.0, 12.0, 18.0, 10.0, 9.0, 3.0, 7.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.654991149902344, -14.152769088745117, -13.65054702758789, -13.148324012756348, -12.646101951599121, -12.143879890441895, -11.641656875610352, -11.139434814453125, -10.637212753295898, -10.134990692138672, -9.632768630981445, -9.130545616149902, -8.628323554992676, -8.12610149383545, -7.6238789558410645, -7.12165641784668, -6.619434356689453, -6.117212295532227, -5.614989757537842, -5.112767219543457, -4.6105451583862305, -4.108323097229004, -3.606100559234619, -3.1038782596588135, -2.601655960083008, -2.099433660507202, -1.5972113609313965, -1.0949890613555908, -0.5927667617797852, -0.09054446220397949, 0.41167783737182617, 0.9139001369476318, 1.4161224365234375, 1.9183447360992432, 2.420567035675049, 2.9227893352508545, 3.42501163482666, 3.927233934402466, 4.4294562339782715, 4.931678771972656, 5.433900833129883, 5.936122894287109, 6.438345432281494, 6.940567970275879, 7.4427900314331055, 7.945012092590332, 8.447235107421875, 8.949457168579102, 9.451679229736328, 9.953901290893555, 10.456123352050781, 10.958346366882324, 11.46056842803955, 11.962790489196777, 12.46501350402832, 12.967235565185547, 13.469457626342773, 13.9716796875, 14.473901748657227, 14.97612476348877, 15.478346824645996, 15.980568885803223, 16.482791900634766, 16.985013961791992, 17.48723602294922]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 9.0, 7.0, 11.0, 24.0, 21.0, 37.0, 43.0, 61.0, 111.0, 194.0, 296.0, 463.0, 805.0, 1380.0, 2312.0, 4322.0, 8832.0, 21784.0, 79913.0, 3719501.0, 285721.0, 39881.0, 14005.0, 6410.0, 3338.0, 1879.0, 1112.0, 664.0, 405.0, 245.0, 173.0, 106.0, 56.0, 54.0, 31.0, 23.0, 20.0, 9.0, 6.0, 5.0, 5.0, 0.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.57421875, -4.40948486328125, -4.2447509765625, -4.08001708984375, -3.915283203125, -3.75054931640625, -3.5858154296875, -3.42108154296875, -3.25634765625, -3.09161376953125, -2.9268798828125, -2.76214599609375, -2.597412109375, -2.43267822265625, -2.2679443359375, -2.10321044921875, -1.9384765625, -1.77374267578125, -1.6090087890625, -1.44427490234375, -1.279541015625, -1.11480712890625, -0.9500732421875, -0.78533935546875, -0.62060546875, -0.45587158203125, -0.2911376953125, -0.12640380859375, 0.038330078125, 0.20306396484375, 0.3677978515625, 0.53253173828125, 0.697265625, 0.86199951171875, 1.0267333984375, 1.19146728515625, 1.356201171875, 1.52093505859375, 1.6856689453125, 1.85040283203125, 2.01513671875, 2.17987060546875, 2.3446044921875, 2.50933837890625, 2.674072265625, 2.83880615234375, 3.0035400390625, 3.16827392578125, 3.3330078125, 3.49774169921875, 3.6624755859375, 3.82720947265625, 3.991943359375, 4.15667724609375, 4.3214111328125, 4.48614501953125, 4.65087890625, 4.81561279296875, 4.9803466796875, 5.14508056640625, 5.309814453125, 5.47454833984375, 5.6392822265625, 5.80401611328125, 5.96875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 6.0, 3.0, 6.0, 7.0, 11.0, 7.0, 8.0, 9.0, 8.0, 16.0, 20.0, 16.0, 18.0, 22.0, 32.0, 36.0, 32.0, 38.0, 36.0, 30.0, 44.0, 30.0, 42.0, 44.0, 28.0, 27.0, 37.0, 29.0, 36.0, 32.0, 36.0, 23.0, 20.0, 29.0, 19.0, 20.0, 24.0, 18.0, 15.0, 18.0, 14.0, 15.0, 7.0, 8.0, 7.0, 5.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6484375, -0.6275482177734375, -0.606658935546875, -0.5857696533203125, -0.56488037109375, -0.5439910888671875, -0.523101806640625, -0.5022125244140625, -0.4813232421875, -0.4604339599609375, -0.439544677734375, -0.4186553955078125, -0.39776611328125, -0.3768768310546875, -0.355987548828125, -0.3350982666015625, -0.314208984375, -0.2933197021484375, -0.272430419921875, -0.2515411376953125, -0.23065185546875, -0.2097625732421875, -0.188873291015625, -0.1679840087890625, -0.1470947265625, -0.1262054443359375, -0.105316162109375, -0.0844268798828125, -0.06353759765625, -0.0426483154296875, -0.021759033203125, -0.0008697509765625, 0.02001953125, 0.0409088134765625, 0.061798095703125, 0.0826873779296875, 0.10357666015625, 0.1244659423828125, 0.145355224609375, 0.1662445068359375, 0.1871337890625, 0.2080230712890625, 0.228912353515625, 0.2498016357421875, 0.27069091796875, 0.2915802001953125, 0.312469482421875, 0.3333587646484375, 0.354248046875, 0.3751373291015625, 0.396026611328125, 0.4169158935546875, 0.43780517578125, 0.4586944580078125, 0.479583740234375, 0.5004730224609375, 0.5213623046875, 0.5422515869140625, 0.563140869140625, 0.5840301513671875, 0.60491943359375, 0.6258087158203125, 0.646697998046875, 0.6675872802734375, 0.6884765625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 8.0, 9.0, 16.0, 13.0, 20.0, 31.0, 54.0, 81.0, 97.0, 146.0, 230.0, 361.0, 611.0, 902.0, 1677.0, 2912.0, 6051.0, 13692.0, 36661.0, 134912.0, 3467759.0, 419278.0, 67721.0, 22255.0, 9043.0, 4176.0, 2164.0, 1256.0, 781.0, 457.0, 285.0, 184.0, 127.0, 99.0, 52.0, 50.0, 27.0, 20.0, 19.0, 9.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-4.125, -4.0096435546875, -3.894287109375, -3.7789306640625, -3.66357421875, -3.5482177734375, -3.432861328125, -3.3175048828125, -3.2021484375, -3.0867919921875, -2.971435546875, -2.8560791015625, -2.74072265625, -2.6253662109375, -2.510009765625, -2.3946533203125, -2.279296875, -2.1639404296875, -2.048583984375, -1.9332275390625, -1.81787109375, -1.7025146484375, -1.587158203125, -1.4718017578125, -1.3564453125, -1.2410888671875, -1.125732421875, -1.0103759765625, -0.89501953125, -0.7796630859375, -0.664306640625, -0.5489501953125, -0.43359375, -0.3182373046875, -0.202880859375, -0.0875244140625, 0.02783203125, 0.1431884765625, 0.258544921875, 0.3739013671875, 0.4892578125, 0.6046142578125, 0.719970703125, 0.8353271484375, 0.95068359375, 1.0660400390625, 1.181396484375, 1.2967529296875, 1.412109375, 1.5274658203125, 1.642822265625, 1.7581787109375, 1.87353515625, 1.9888916015625, 2.104248046875, 2.2196044921875, 2.3349609375, 2.4503173828125, 2.565673828125, 2.6810302734375, 2.79638671875, 2.9117431640625, 3.027099609375, 3.1424560546875, 3.2578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 11.0, 7.0, 7.0, 14.0, 35.0, 38.0, 85.0, 135.0, 506.0, 2708.0, 265.0, 100.0, 56.0, 43.0, 22.0, 13.0, 8.0, 7.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03515625, -1.954681396484375, -1.87420654296875, -1.793731689453125, -1.7132568359375, -1.632781982421875, -1.55230712890625, -1.471832275390625, -1.391357421875, -1.310882568359375, -1.23040771484375, -1.149932861328125, -1.0694580078125, -0.988983154296875, -0.90850830078125, -0.828033447265625, -0.74755859375, -0.667083740234375, -0.58660888671875, -0.506134033203125, -0.4256591796875, -0.345184326171875, -0.26470947265625, -0.184234619140625, -0.103759765625, -0.023284912109375, 0.05718994140625, 0.137664794921875, 0.2181396484375, 0.298614501953125, 0.37908935546875, 0.459564208984375, 0.5400390625, 0.620513916015625, 0.70098876953125, 0.781463623046875, 0.8619384765625, 0.942413330078125, 1.02288818359375, 1.103363037109375, 1.183837890625, 1.264312744140625, 1.34478759765625, 1.425262451171875, 1.5057373046875, 1.586212158203125, 1.66668701171875, 1.747161865234375, 1.82763671875, 1.908111572265625, 1.98858642578125, 2.069061279296875, 2.1495361328125, 2.230010986328125, 2.31048583984375, 2.390960693359375, 2.471435546875, 2.551910400390625, 2.63238525390625, 2.712860107421875, 2.7933349609375, 2.873809814453125, 2.95428466796875, 3.034759521484375, 3.115234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 46.0, 236.0, 429.0, 223.0, 44.0, 18.0, 8.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.411914825439453, -25.545486450195312, -24.679058074951172, -23.81262969970703, -22.94620132446289, -22.07977294921875, -21.21334457397461, -20.34691619873047, -19.480487823486328, -18.614059448242188, -17.747631072998047, -16.881202697753906, -16.014774322509766, -15.148345947265625, -14.281917572021484, -13.415489196777344, -12.549060821533203, -11.682632446289062, -10.816204071044922, -9.949775695800781, -9.08334732055664, -8.2169189453125, -7.350490570068359, -6.484062194824219, -5.617633819580078, -4.7512054443359375, -3.884777069091797, -3.0183486938476562, -2.1519203186035156, -1.285491943359375, -0.4190635681152344, 0.44736480712890625, 1.313791275024414, 2.1802196502685547, 3.0466480255126953, 3.913076400756836, 4.779504776000977, 5.645933151245117, 6.512361526489258, 7.378789901733398, 8.245218276977539, 9.11164665222168, 9.97807502746582, 10.844503402709961, 11.710931777954102, 12.577360153198242, 13.443788528442383, 14.310216903686523, 15.176645278930664, 16.043073654174805, 16.909502029418945, 17.775930404663086, 18.642358779907227, 19.508787155151367, 20.375215530395508, 21.24164390563965, 22.10807228088379, 22.97450065612793, 23.84092903137207, 24.70735740661621, 25.57378578186035, 26.440214157104492, 27.306642532348633, 28.173070907592773, 29.039499282836914]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 7.0, 3.0, 4.0, 4.0, 12.0, 8.0, 15.0, 17.0, 24.0, 21.0, 38.0, 32.0, 43.0, 48.0, 36.0, 50.0, 46.0, 45.0, 54.0, 44.0, 47.0, 38.0, 49.0, 53.0, 39.0, 41.0, 32.0, 33.0, 21.0, 19.0, 14.0, 14.0, 9.0, 12.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.664700508117676, -5.494636535644531, -5.324573040008545, -5.1545090675354, -4.984445095062256, -4.8143815994262695, -4.644317626953125, -4.4742536544799805, -4.304189682006836, -4.134125709533691, -3.964061975479126, -3.7939982414245605, -3.623934268951416, -3.4538705348968506, -3.283806800842285, -3.1137428283691406, -2.9436793327331543, -2.773615598678589, -2.6035516262054443, -2.433487892150879, -2.2634239196777344, -2.093360185623169, -1.9232964515686035, -1.7532325983047485, -1.5831687450408936, -1.4131048917770386, -1.2430410385131836, -1.0729773044586182, -0.9029134511947632, -0.7328495979309082, -0.5627858638763428, -0.3927220106124878, -0.2226581573486328, -0.05259433388710022, 0.11746948957443237, 0.2875332832336426, 0.45759713649749756, 0.6276609897613525, 0.797724723815918, 0.967788577079773, 1.137852430343628, 1.307916283607483, 1.477980136871338, 1.6480438709259033, 1.8181077241897583, 1.9881715774536133, 2.1582353115081787, 2.328299045562744, 2.4983630180358887, 2.668426752090454, 2.8384907245635986, 3.008554458618164, 3.1786184310913086, 3.348682165145874, 3.5187458992004395, 3.688809871673584, 3.8588736057281494, 4.028937339782715, 4.199001312255859, 4.369065284729004, 4.53912878036499, 4.709192752838135, 4.879256248474121, 5.049320220947266, 5.21938419342041]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 7.0, 12.0, 12.0, 15.0, 25.0, 60.0, 64.0, 122.0, 179.0, 315.0, 523.0, 953.0, 1859.0, 3945.0, 8979.0, 22668.0, 64593.0, 205858.0, 430035.0, 204136.0, 64447.0, 22794.0, 8923.0, 3967.0, 1851.0, 934.0, 505.0, 294.0, 178.0, 101.0, 69.0, 49.0, 33.0, 14.0, 12.0, 11.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.59765625, -4.4561767578125, -4.314697265625, -4.1732177734375, -4.03173828125, -3.8902587890625, -3.748779296875, -3.6072998046875, -3.4658203125, -3.3243408203125, -3.182861328125, -3.0413818359375, -2.89990234375, -2.7584228515625, -2.616943359375, -2.4754638671875, -2.333984375, -2.1925048828125, -2.051025390625, -1.9095458984375, -1.76806640625, -1.6265869140625, -1.485107421875, -1.3436279296875, -1.2021484375, -1.0606689453125, -0.919189453125, -0.7777099609375, -0.63623046875, -0.4947509765625, -0.353271484375, -0.2117919921875, -0.0703125, 0.0711669921875, 0.212646484375, 0.3541259765625, 0.49560546875, 0.6370849609375, 0.778564453125, 0.9200439453125, 1.0615234375, 1.2030029296875, 1.344482421875, 1.4859619140625, 1.62744140625, 1.7689208984375, 1.910400390625, 2.0518798828125, 2.193359375, 2.3348388671875, 2.476318359375, 2.6177978515625, 2.75927734375, 2.9007568359375, 3.042236328125, 3.1837158203125, 3.3251953125, 3.4666748046875, 3.608154296875, 3.7496337890625, 3.89111328125, 4.0325927734375, 4.174072265625, 4.3155517578125, 4.45703125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 9.0, 10.0, 3.0, 14.0, 14.0, 13.0, 21.0, 18.0, 27.0, 29.0, 34.0, 35.0, 31.0, 33.0, 42.0, 47.0, 46.0, 38.0, 37.0, 42.0, 35.0, 44.0, 26.0, 32.0, 32.0, 31.0, 31.0, 31.0, 26.0, 22.0, 18.0, 17.0, 11.0, 17.0, 10.0, 15.0, 13.0, 8.0, 8.0, 7.0, 4.0, 5.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70068359375, -0.6773605346679688, -0.6540374755859375, -0.6307144165039062, -0.607391357421875, -0.5840682983398438, -0.5607452392578125, -0.5374221801757812, -0.51409912109375, -0.49077606201171875, -0.4674530029296875, -0.44412994384765625, -0.420806884765625, -0.39748382568359375, -0.3741607666015625, -0.35083770751953125, -0.3275146484375, -0.30419158935546875, -0.2808685302734375, -0.25754547119140625, -0.234222412109375, -0.21089935302734375, -0.1875762939453125, -0.16425323486328125, -0.14093017578125, -0.11760711669921875, -0.0942840576171875, -0.07096099853515625, -0.047637939453125, -0.02431488037109375, -0.0009918212890625, 0.02233123779296875, 0.045654296875, 0.06897735595703125, 0.0923004150390625, 0.11562347412109375, 0.138946533203125, 0.16226959228515625, 0.1855926513671875, 0.20891571044921875, 0.23223876953125, 0.25556182861328125, 0.2788848876953125, 0.30220794677734375, 0.325531005859375, 0.34885406494140625, 0.3721771240234375, 0.39550018310546875, 0.4188232421875, 0.44214630126953125, 0.4654693603515625, 0.48879241943359375, 0.512115478515625, 0.5354385375976562, 0.5587615966796875, 0.5820846557617188, 0.60540771484375, 0.6287307739257812, 0.6520538330078125, 0.6753768920898438, 0.698699951171875, 0.7220230102539062, 0.7453460693359375, 0.7686691284179688, 0.7919921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 6.0, 14.0, 20.0, 18.0, 23.0, 63.0, 71.0, 109.0, 162.0, 292.0, 474.0, 845.0, 1575.0, 3293.0, 7746.0, 20313.0, 62020.0, 207686.0, 442757.0, 204736.0, 61633.0, 20179.0, 7546.0, 3339.0, 1579.0, 812.0, 425.0, 293.0, 160.0, 99.0, 82.0, 49.0, 51.0, 19.0, 12.0, 7.0, 16.0, 7.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.298828125, -3.194091796875, -3.08935546875, -2.984619140625, -2.8798828125, -2.775146484375, -2.67041015625, -2.565673828125, -2.4609375, -2.356201171875, -2.25146484375, -2.146728515625, -2.0419921875, -1.937255859375, -1.83251953125, -1.727783203125, -1.623046875, -1.518310546875, -1.41357421875, -1.308837890625, -1.2041015625, -1.099365234375, -0.99462890625, -0.889892578125, -0.78515625, -0.680419921875, -0.57568359375, -0.470947265625, -0.3662109375, -0.261474609375, -0.15673828125, -0.052001953125, 0.052734375, 0.157470703125, 0.26220703125, 0.366943359375, 0.4716796875, 0.576416015625, 0.68115234375, 0.785888671875, 0.890625, 0.995361328125, 1.10009765625, 1.204833984375, 1.3095703125, 1.414306640625, 1.51904296875, 1.623779296875, 1.728515625, 1.833251953125, 1.93798828125, 2.042724609375, 2.1474609375, 2.252197265625, 2.35693359375, 2.461669921875, 2.56640625, 2.671142578125, 2.77587890625, 2.880615234375, 2.9853515625, 3.090087890625, 3.19482421875, 3.299560546875, 3.404296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 4.0, 6.0, 10.0, 3.0, 7.0, 8.0, 12.0, 17.0, 26.0, 35.0, 36.0, 38.0, 46.0, 62.0, 58.0, 54.0, 78.0, 63.0, 68.0, 52.0, 54.0, 53.0, 35.0, 40.0, 29.0, 21.0, 25.0, 17.0, 13.0, 8.0, 10.0, 5.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.97265625, -4.79754638671875, -4.6224365234375, -4.44732666015625, -4.272216796875, -4.09710693359375, -3.9219970703125, -3.74688720703125, -3.57177734375, -3.39666748046875, -3.2215576171875, -3.04644775390625, -2.871337890625, -2.69622802734375, -2.5211181640625, -2.34600830078125, -2.1708984375, -1.99578857421875, -1.8206787109375, -1.64556884765625, -1.470458984375, -1.29534912109375, -1.1202392578125, -0.94512939453125, -0.77001953125, -0.59490966796875, -0.4197998046875, -0.24468994140625, -0.069580078125, 0.10552978515625, 0.2806396484375, 0.45574951171875, 0.630859375, 0.80596923828125, 0.9810791015625, 1.15618896484375, 1.331298828125, 1.50640869140625, 1.6815185546875, 1.85662841796875, 2.03173828125, 2.20684814453125, 2.3819580078125, 2.55706787109375, 2.732177734375, 2.90728759765625, 3.0823974609375, 3.25750732421875, 3.4326171875, 3.60772705078125, 3.7828369140625, 3.95794677734375, 4.133056640625, 4.30816650390625, 4.4832763671875, 4.65838623046875, 4.83349609375, 5.00860595703125, 5.1837158203125, 5.35882568359375, 5.533935546875, 5.70904541015625, 5.8841552734375, 6.05926513671875, 6.234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 11.0, 14.0, 16.0, 19.0, 40.0, 75.0, 126.0, 267.0, 532.0, 1081.0, 2945.0, 8542.0, 33019.0, 207007.0, 667933.0, 97831.0, 19565.0, 5662.0, 2129.0, 867.0, 396.0, 206.0, 92.0, 68.0, 32.0, 29.0, 16.0, 7.0, 7.0, 7.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.787109375, -2.6981201171875, -2.609130859375, -2.5201416015625, -2.43115234375, -2.3421630859375, -2.253173828125, -2.1641845703125, -2.0751953125, -1.9862060546875, -1.897216796875, -1.8082275390625, -1.71923828125, -1.6302490234375, -1.541259765625, -1.4522705078125, -1.36328125, -1.2742919921875, -1.185302734375, -1.0963134765625, -1.00732421875, -0.9183349609375, -0.829345703125, -0.7403564453125, -0.6513671875, -0.5623779296875, -0.473388671875, -0.3843994140625, -0.29541015625, -0.2064208984375, -0.117431640625, -0.0284423828125, 0.060546875, 0.1495361328125, 0.238525390625, 0.3275146484375, 0.41650390625, 0.5054931640625, 0.594482421875, 0.6834716796875, 0.7724609375, 0.8614501953125, 0.950439453125, 1.0394287109375, 1.12841796875, 1.2174072265625, 1.306396484375, 1.3953857421875, 1.484375, 1.5733642578125, 1.662353515625, 1.7513427734375, 1.84033203125, 1.9293212890625, 2.018310546875, 2.1072998046875, 2.1962890625, 2.2852783203125, 2.374267578125, 2.4632568359375, 2.55224609375, 2.6412353515625, 2.730224609375, 2.8192138671875, 2.908203125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 9.0, 9.0, 11.0, 13.0, 17.0, 18.0, 22.0, 34.0, 43.0, 50.0, 85.0, 161.0, 161.0, 115.0, 64.0, 57.0, 35.0, 23.0, 16.0, 15.0, 9.0, 12.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003292560577392578, -0.00032059475779533386, -0.0003119334578514099, -0.00030327215790748596, -0.000294610857963562, -0.00028594955801963806, -0.0002772882580757141, -0.00026862695813179016, -0.0002599656581878662, -0.00025130435824394226, -0.0002426430583000183, -0.00023398175835609436, -0.0002253204584121704, -0.00021665915846824646, -0.0002079978585243225, -0.00019933655858039856, -0.0001906752586364746, -0.00018201395869255066, -0.0001733526587486267, -0.00016469135880470276, -0.0001560300588607788, -0.00014736875891685486, -0.0001387074589729309, -0.00013004615902900696, -0.00012138485908508301, -0.00011272355914115906, -0.00010406225919723511, -9.540095925331116e-05, -8.673965930938721e-05, -7.807835936546326e-05, -6.94170594215393e-05, -6.0755759477615356e-05, -5.2094459533691406e-05, -4.3433159589767456e-05, -3.4771859645843506e-05, -2.6110559701919556e-05, -1.7449259757995605e-05, -8.787959814071655e-06, -1.2665987014770508e-07, 8.534640073776245e-06, 1.7195940017700195e-05, 2.5857239961624146e-05, 3.4518539905548096e-05, 4.3179839849472046e-05, 5.1841139793395996e-05, 6.0502439737319946e-05, 6.91637396812439e-05, 7.782503962516785e-05, 8.64863395690918e-05, 9.514763951301575e-05, 0.0001038089394569397, 0.00011247023940086365, 0.0001211315393447876, 0.00012979283928871155, 0.0001384541392326355, 0.00014711543917655945, 0.0001557767391204834, 0.00016443803906440735, 0.0001730993390083313, 0.00018176063895225525, 0.0001904219388961792, 0.00019908323884010315, 0.0002077445387840271, 0.00021640583872795105, 0.000225067138671875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 10.0, 7.0, 7.0, 15.0, 19.0, 34.0, 45.0, 70.0, 136.0, 223.0, 464.0, 875.0, 1860.0, 4460.0, 14697.0, 81819.0, 702598.0, 202963.0, 26513.0, 6745.0, 2538.0, 1143.0, 579.0, 280.0, 166.0, 103.0, 64.0, 31.0, 16.0, 15.0, 20.0, 9.0, 10.0, 3.0, 7.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.626953125, -3.516021728515625, -3.40509033203125, -3.294158935546875, -3.1832275390625, -3.072296142578125, -2.96136474609375, -2.850433349609375, -2.739501953125, -2.628570556640625, -2.51763916015625, -2.406707763671875, -2.2957763671875, -2.184844970703125, -2.07391357421875, -1.962982177734375, -1.85205078125, -1.741119384765625, -1.63018798828125, -1.519256591796875, -1.4083251953125, -1.297393798828125, -1.18646240234375, -1.075531005859375, -0.964599609375, -0.853668212890625, -0.74273681640625, -0.631805419921875, -0.5208740234375, -0.409942626953125, -0.29901123046875, -0.188079833984375, -0.0771484375, 0.033782958984375, 0.14471435546875, 0.255645751953125, 0.3665771484375, 0.477508544921875, 0.58843994140625, 0.699371337890625, 0.810302734375, 0.921234130859375, 1.03216552734375, 1.143096923828125, 1.2540283203125, 1.364959716796875, 1.47589111328125, 1.586822509765625, 1.69775390625, 1.808685302734375, 1.91961669921875, 2.030548095703125, 2.1414794921875, 2.252410888671875, 2.36334228515625, 2.474273681640625, 2.585205078125, 2.696136474609375, 2.80706787109375, 2.917999267578125, 3.0289306640625, 3.139862060546875, 3.25079345703125, 3.361724853515625, 3.47265625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 7.0, 9.0, 9.0, 10.0, 31.0, 23.0, 39.0, 44.0, 71.0, 105.0, 139.0, 134.0, 97.0, 63.0, 58.0, 35.0, 41.0, 17.0, 15.0, 5.0, 5.0, 10.0, 4.0, 6.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.43359375, -3.322357177734375, -3.21112060546875, -3.099884033203125, -2.9886474609375, -2.877410888671875, -2.76617431640625, -2.654937744140625, -2.543701171875, -2.432464599609375, -2.32122802734375, -2.209991455078125, -2.0987548828125, -1.987518310546875, -1.87628173828125, -1.765045166015625, -1.65380859375, -1.542572021484375, -1.43133544921875, -1.320098876953125, -1.2088623046875, -1.097625732421875, -0.98638916015625, -0.875152587890625, -0.763916015625, -0.652679443359375, -0.54144287109375, -0.430206298828125, -0.3189697265625, -0.207733154296875, -0.09649658203125, 0.014739990234375, 0.1259765625, 0.237213134765625, 0.34844970703125, 0.459686279296875, 0.5709228515625, 0.682159423828125, 0.79339599609375, 0.904632568359375, 1.015869140625, 1.127105712890625, 1.23834228515625, 1.349578857421875, 1.4608154296875, 1.572052001953125, 1.68328857421875, 1.794525146484375, 1.90576171875, 2.016998291015625, 2.12823486328125, 2.239471435546875, 2.3507080078125, 2.461944580078125, 2.57318115234375, 2.684417724609375, 2.795654296875, 2.906890869140625, 3.01812744140625, 3.129364013671875, 3.2406005859375, 3.351837158203125, 3.46307373046875, 3.574310302734375, 3.685546875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 7.0, 8.0, 14.0, 25.0, 28.0, 24.0, 37.0, 71.0, 66.0, 89.0, 97.0, 112.0, 79.0, 83.0, 71.0, 41.0, 46.0, 29.0, 17.0, 15.0, 11.0, 9.0, 4.0, 5.0, 6.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.12528610229492, -31.358671188354492, -30.592056274414062, -29.825439453125, -29.05882453918457, -28.29220962524414, -27.525592803955078, -26.75897789001465, -25.99236297607422, -25.22574806213379, -24.45913314819336, -23.692516326904297, -22.925901412963867, -22.159286499023438, -21.392669677734375, -20.626054763793945, -19.859439849853516, -19.092824935913086, -18.326210021972656, -17.559593200683594, -16.792978286743164, -16.026363372802734, -15.259747505187988, -14.493131637573242, -13.726516723632812, -12.959901809692383, -12.193285942077637, -11.42667007446289, -10.660055160522461, -9.893440246582031, -9.126824378967285, -8.360208511352539, -7.593591690063477, -6.826976299285889, -6.060360908508301, -5.293745517730713, -4.527130126953125, -3.760514736175537, -2.993899345397949, -2.2272839546203613, -1.4606685638427734, -0.6940531730651855, 0.07256221771240234, 0.8391776084899902, 1.6057929992675781, 2.372408390045166, 3.139023780822754, 3.905639171600342, 4.67225456237793, 5.438869953155518, 6.2054853439331055, 6.972100734710693, 7.738716125488281, 8.505331039428711, 9.271946907043457, 10.038562774658203, 10.805177688598633, 11.571792602539062, 12.338408470153809, 13.105024337768555, 13.871639251708984, 14.638254165649414, 15.40487003326416, 16.171485900878906, 16.938100814819336]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 12.0, 13.0, 17.0, 15.0, 11.0, 28.0, 30.0, 34.0, 44.0, 35.0, 33.0, 52.0, 50.0, 48.0, 55.0, 46.0, 52.0, 53.0, 42.0, 51.0, 45.0, 29.0, 44.0, 30.0, 33.0, 20.0, 22.0, 13.0, 10.0, 7.0, 5.0, 7.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.421762466430664, -30.480783462524414, -29.539804458618164, -28.598827362060547, -27.657848358154297, -26.716869354248047, -25.775890350341797, -24.834911346435547, -23.893932342529297, -22.952953338623047, -22.011974334716797, -21.070995330810547, -20.13001823425293, -19.18903923034668, -18.24806022644043, -17.30708122253418, -16.366104125976562, -15.425125122070312, -14.484147071838379, -13.543168067932129, -12.602190017700195, -11.661211013793945, -10.720232009887695, -9.779253005981445, -8.838274955749512, -7.89729642868042, -6.956317901611328, -6.015338897705078, -5.074360370635986, -4.1333818435668945, -3.1924028396606445, -2.2514243125915527, -1.3104476928710938, -0.3694690465927124, 0.571509599685669, 1.5124883651733398, 2.4534668922424316, 3.3944454193115234, 4.335424423217773, 5.276402950286865, 6.217381477355957, 7.158360004425049, 8.09933853149414, 9.04031753540039, 9.98129653930664, 10.922274589538574, 11.863253593444824, 12.804231643676758, 13.745210647583008, 14.686189651489258, 15.627167701721191, 16.568145751953125, 17.509124755859375, 18.450103759765625, 19.391082763671875, 20.332061767578125, 21.273040771484375, 22.214019775390625, 23.154998779296875, 24.095977783203125, 25.036954879760742, 25.977933883666992, 26.918912887573242, 27.859891891479492, 28.80086898803711]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 10.0, 14.0, 15.0, 23.0, 30.0, 38.0, 59.0, 100.0, 131.0, 217.0, 328.0, 464.0, 841.0, 1389.0, 2464.0, 4276.0, 8494.0, 17810.0, 43426.0, 136921.0, 1072540.0, 2630708.0, 177276.0, 52584.0, 21340.0, 9954.0, 5332.0, 2955.0, 1645.0, 1006.0, 647.0, 402.0, 277.0, 166.0, 106.0, 82.0, 53.0, 38.0, 33.0, 28.0, 18.0, 13.0, 11.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.29296875, -3.17144775390625, -3.0499267578125, -2.92840576171875, -2.806884765625, -2.68536376953125, -2.5638427734375, -2.44232177734375, -2.32080078125, -2.19927978515625, -2.0777587890625, -1.95623779296875, -1.834716796875, -1.71319580078125, -1.5916748046875, -1.47015380859375, -1.3486328125, -1.22711181640625, -1.1055908203125, -0.98406982421875, -0.862548828125, -0.74102783203125, -0.6195068359375, -0.49798583984375, -0.37646484375, -0.25494384765625, -0.1334228515625, -0.01190185546875, 0.109619140625, 0.23114013671875, 0.3526611328125, 0.47418212890625, 0.595703125, 0.71722412109375, 0.8387451171875, 0.96026611328125, 1.081787109375, 1.20330810546875, 1.3248291015625, 1.44635009765625, 1.56787109375, 1.68939208984375, 1.8109130859375, 1.93243408203125, 2.053955078125, 2.17547607421875, 2.2969970703125, 2.41851806640625, 2.5400390625, 2.66156005859375, 2.7830810546875, 2.90460205078125, 3.026123046875, 3.14764404296875, 3.2691650390625, 3.39068603515625, 3.51220703125, 3.63372802734375, 3.7552490234375, 3.87677001953125, 3.998291015625, 4.11981201171875, 4.2413330078125, 4.36285400390625, 4.484375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 5.0, 4.0, 10.0, 11.0, 8.0, 9.0, 16.0, 17.0, 18.0, 16.0, 28.0, 18.0, 35.0, 33.0, 40.0, 38.0, 42.0, 39.0, 43.0, 42.0, 39.0, 33.0, 41.0, 45.0, 41.0, 31.0, 29.0, 29.0, 29.0, 20.0, 22.0, 15.0, 21.0, 19.0, 15.0, 10.0, 13.0, 13.0, 11.0, 8.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8544921875, -0.82684326171875, -0.7991943359375, -0.77154541015625, -0.743896484375, -0.71624755859375, -0.6885986328125, -0.66094970703125, -0.63330078125, -0.60565185546875, -0.5780029296875, -0.55035400390625, -0.522705078125, -0.49505615234375, -0.4674072265625, -0.43975830078125, -0.412109375, -0.38446044921875, -0.3568115234375, -0.32916259765625, -0.301513671875, -0.27386474609375, -0.2462158203125, -0.21856689453125, -0.19091796875, -0.16326904296875, -0.1356201171875, -0.10797119140625, -0.080322265625, -0.05267333984375, -0.0250244140625, 0.00262451171875, 0.0302734375, 0.05792236328125, 0.0855712890625, 0.11322021484375, 0.140869140625, 0.16851806640625, 0.1961669921875, 0.22381591796875, 0.25146484375, 0.27911376953125, 0.3067626953125, 0.33441162109375, 0.362060546875, 0.38970947265625, 0.4173583984375, 0.44500732421875, 0.47265625, 0.50030517578125, 0.5279541015625, 0.55560302734375, 0.583251953125, 0.61090087890625, 0.6385498046875, 0.66619873046875, 0.69384765625, 0.72149658203125, 0.7491455078125, 0.77679443359375, 0.804443359375, 0.83209228515625, 0.8597412109375, 0.88739013671875, 0.9150390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 9.0, 8.0, 7.0, 14.0, 25.0, 24.0, 32.0, 57.0, 81.0, 142.0, 200.0, 319.0, 504.0, 900.0, 1669.0, 3293.0, 7254.0, 18500.0, 57641.0, 264932.0, 3104641.0, 592917.0, 94262.0, 27229.0, 10207.0, 4492.0, 2129.0, 1086.0, 633.0, 385.0, 252.0, 157.0, 89.0, 53.0, 52.0, 26.0, 16.0, 16.0, 9.0, 9.0, 6.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.611328125, -3.475982666015625, -3.34063720703125, -3.205291748046875, -3.0699462890625, -2.934600830078125, -2.79925537109375, -2.663909912109375, -2.528564453125, -2.393218994140625, -2.25787353515625, -2.122528076171875, -1.9871826171875, -1.851837158203125, -1.71649169921875, -1.581146240234375, -1.44580078125, -1.310455322265625, -1.17510986328125, -1.039764404296875, -0.9044189453125, -0.769073486328125, -0.63372802734375, -0.498382568359375, -0.363037109375, -0.227691650390625, -0.09234619140625, 0.042999267578125, 0.1783447265625, 0.313690185546875, 0.44903564453125, 0.584381103515625, 0.7197265625, 0.855072021484375, 0.99041748046875, 1.125762939453125, 1.2611083984375, 1.396453857421875, 1.53179931640625, 1.667144775390625, 1.802490234375, 1.937835693359375, 2.07318115234375, 2.208526611328125, 2.3438720703125, 2.479217529296875, 2.61456298828125, 2.749908447265625, 2.88525390625, 3.020599365234375, 3.15594482421875, 3.291290283203125, 3.4266357421875, 3.561981201171875, 3.69732666015625, 3.832672119140625, 3.968017578125, 4.103363037109375, 4.23870849609375, 4.374053955078125, 4.5093994140625, 4.644744873046875, 4.78009033203125, 4.915435791015625, 5.05078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 7.0, 8.0, 10.0, 17.0, 19.0, 22.0, 27.0, 52.0, 92.0, 123.0, 201.0, 473.0, 1647.0, 702.0, 255.0, 139.0, 83.0, 63.0, 36.0, 29.0, 11.0, 12.0, 6.0, 13.0, 7.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.095703125, -2.9947509765625, -2.893798828125, -2.7928466796875, -2.69189453125, -2.5909423828125, -2.489990234375, -2.3890380859375, -2.2880859375, -2.1871337890625, -2.086181640625, -1.9852294921875, -1.88427734375, -1.7833251953125, -1.682373046875, -1.5814208984375, -1.48046875, -1.3795166015625, -1.278564453125, -1.1776123046875, -1.07666015625, -0.9757080078125, -0.874755859375, -0.7738037109375, -0.6728515625, -0.5718994140625, -0.470947265625, -0.3699951171875, -0.26904296875, -0.1680908203125, -0.067138671875, 0.0338134765625, 0.134765625, 0.2357177734375, 0.336669921875, 0.4376220703125, 0.53857421875, 0.6395263671875, 0.740478515625, 0.8414306640625, 0.9423828125, 1.0433349609375, 1.144287109375, 1.2452392578125, 1.34619140625, 1.4471435546875, 1.548095703125, 1.6490478515625, 1.75, 1.8509521484375, 1.951904296875, 2.0528564453125, 2.15380859375, 2.2547607421875, 2.355712890625, 2.4566650390625, 2.5576171875, 2.6585693359375, 2.759521484375, 2.8604736328125, 2.96142578125, 3.0623779296875, 3.163330078125, 3.2642822265625, 3.365234375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 23.0, 61.0, 166.0, 336.0, 237.0, 98.0, 49.0, 20.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.527830123901367, -22.09633445739746, -20.664838790893555, -19.23334503173828, -17.801849365234375, -16.37035369873047, -14.938858032226562, -13.507362365722656, -12.07586669921875, -10.644371032714844, -9.212875366210938, -7.781380653381348, -6.349884986877441, -4.918389320373535, -3.4868946075439453, -2.055398941040039, -0.6239032745361328, 0.8075921535491943, 2.2390875816345215, 3.6705827713012695, 5.102078437805176, 6.533574104309082, 7.965068817138672, 9.396564483642578, 10.828060150146484, 12.25955581665039, 13.691051483154297, 15.122546195983887, 16.55404281616211, 17.985538482666016, 19.41703224182129, 20.848527908325195, 22.28002166748047, 23.711517333984375, 25.14301300048828, 26.574508666992188, 28.006004333496094, 29.4375, 30.868993759155273, 32.30049133300781, 33.73198699951172, 35.163482666015625, 36.59497833251953, 38.02647399902344, 39.457969665527344, 40.88946533203125, 42.320960998535156, 43.75245666503906, 45.1839485168457, 46.61544418334961, 48.046939849853516, 49.47843551635742, 50.90993118286133, 52.341426849365234, 53.772918701171875, 55.20441436767578, 56.63591003417969, 58.067405700683594, 59.4989013671875, 60.930397033691406, 62.36189270019531, 63.79338836669922, 65.22488403320312, 66.65637969970703, 68.08787536621094]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 1.0, 2.0, 7.0, 9.0, 5.0, 11.0, 11.0, 15.0, 15.0, 20.0, 22.0, 17.0, 20.0, 30.0, 48.0, 35.0, 32.0, 40.0, 47.0, 36.0, 45.0, 39.0, 38.0, 44.0, 43.0, 48.0, 42.0, 33.0, 28.0, 22.0, 24.0, 21.0, 24.0, 19.0, 21.0, 18.0, 9.0, 12.0, 8.0, 8.0, 8.0, 6.0, 5.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.787212371826172, -11.423974990844727, -11.060736656188965, -10.69749927520752, -10.334260940551758, -9.971023559570312, -9.607786178588867, -9.244547843933105, -8.881309509277344, -8.518072128295898, -8.154833793640137, -7.791596412658691, -7.42835807800293, -7.065120697021484, -6.701882839202881, -6.338644981384277, -5.975407600402832, -5.6121697425842285, -5.248931884765625, -4.88569450378418, -4.522456169128418, -4.159218788146973, -3.795980930328369, -3.4327430725097656, -3.069505214691162, -2.7062673568725586, -2.343029499053955, -1.9797918796539307, -1.6165540218353271, -1.2533161640167236, -0.8900785446166992, -0.5268406867980957, -0.16360187530517578, 0.19963592290878296, 0.5628737211227417, 0.9261114597320557, 1.2893493175506592, 1.6525871753692627, 2.015824794769287, 2.3790626525878906, 2.742300510406494, 3.1055383682250977, 3.468776226043701, 3.8320138454437256, 4.19525146484375, 4.558489799499512, 4.921727180480957, 5.2849650382995605, 5.648202896118164, 6.011440753936768, 6.374678611755371, 6.737915992736816, 7.101154327392578, 7.464391708374023, 7.827629566192627, 8.19086742401123, 8.554105758666992, 8.917343139648438, 9.2805814743042, 9.643818855285645, 10.007057189941406, 10.370294570922852, 10.733531951904297, 11.096770286560059, 11.460007667541504]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 15.0, 14.0, 24.0, 38.0, 48.0, 93.0, 128.0, 231.0, 382.0, 672.0, 1201.0, 2443.0, 4614.0, 9406.0, 19827.0, 43682.0, 99256.0, 206597.0, 282456.0, 201069.0, 95984.0, 42251.0, 19417.0, 9130.0, 4415.0, 2282.0, 1194.0, 687.0, 385.0, 212.0, 135.0, 92.0, 46.0, 37.0, 22.0, 21.0, 11.0, 8.0, 8.0, 1.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.033203125, -2.933685302734375, -2.83416748046875, -2.734649658203125, -2.6351318359375, -2.535614013671875, -2.43609619140625, -2.336578369140625, -2.237060546875, -2.137542724609375, -2.03802490234375, -1.938507080078125, -1.8389892578125, -1.739471435546875, -1.63995361328125, -1.540435791015625, -1.44091796875, -1.341400146484375, -1.24188232421875, -1.142364501953125, -1.0428466796875, -0.943328857421875, -0.84381103515625, -0.744293212890625, -0.644775390625, -0.545257568359375, -0.44573974609375, -0.346221923828125, -0.2467041015625, -0.147186279296875, -0.04766845703125, 0.051849365234375, 0.1513671875, 0.250885009765625, 0.35040283203125, 0.449920654296875, 0.5494384765625, 0.648956298828125, 0.74847412109375, 0.847991943359375, 0.947509765625, 1.047027587890625, 1.14654541015625, 1.246063232421875, 1.3455810546875, 1.445098876953125, 1.54461669921875, 1.644134521484375, 1.74365234375, 1.843170166015625, 1.94268798828125, 2.042205810546875, 2.1417236328125, 2.241241455078125, 2.34075927734375, 2.440277099609375, 2.539794921875, 2.639312744140625, 2.73883056640625, 2.838348388671875, 2.9378662109375, 3.037384033203125, 3.13690185546875, 3.236419677734375, 3.3359375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 4.0, 2.0, 4.0, 5.0, 6.0, 4.0, 7.0, 7.0, 13.0, 11.0, 16.0, 16.0, 16.0, 14.0, 30.0, 20.0, 35.0, 37.0, 30.0, 40.0, 38.0, 36.0, 40.0, 37.0, 37.0, 36.0, 36.0, 36.0, 42.0, 36.0, 31.0, 34.0, 23.0, 14.0, 18.0, 22.0, 25.0, 32.0, 14.0, 15.0, 15.0, 14.0, 8.0, 12.0, 10.0, 5.0, 9.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.0078125, -0.9761962890625, -0.944580078125, -0.9129638671875, -0.88134765625, -0.8497314453125, -0.818115234375, -0.7864990234375, -0.7548828125, -0.7232666015625, -0.691650390625, -0.6600341796875, -0.62841796875, -0.5968017578125, -0.565185546875, -0.5335693359375, -0.501953125, -0.4703369140625, -0.438720703125, -0.4071044921875, -0.37548828125, -0.3438720703125, -0.312255859375, -0.2806396484375, -0.2490234375, -0.2174072265625, -0.185791015625, -0.1541748046875, -0.12255859375, -0.0909423828125, -0.059326171875, -0.0277099609375, 0.00390625, 0.0355224609375, 0.067138671875, 0.0987548828125, 0.13037109375, 0.1619873046875, 0.193603515625, 0.2252197265625, 0.2568359375, 0.2884521484375, 0.320068359375, 0.3516845703125, 0.38330078125, 0.4149169921875, 0.446533203125, 0.4781494140625, 0.509765625, 0.5413818359375, 0.572998046875, 0.6046142578125, 0.63623046875, 0.6678466796875, 0.699462890625, 0.7310791015625, 0.7626953125, 0.7943115234375, 0.825927734375, 0.8575439453125, 0.88916015625, 0.9207763671875, 0.952392578125, 0.9840087890625, 1.015625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 3.0, 4.0, 4.0, 10.0, 7.0, 22.0, 27.0, 45.0, 54.0, 85.0, 136.0, 200.0, 318.0, 591.0, 1071.0, 2104.0, 4874.0, 12254.0, 33221.0, 105615.0, 314704.0, 368245.0, 136620.0, 42396.0, 14775.0, 5690.0, 2484.0, 1313.0, 665.0, 367.0, 208.0, 166.0, 86.0, 64.0, 40.0, 30.0, 16.0, 14.0, 7.0, 8.0, 6.0, 9.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3203125, -5.16876220703125, -5.0172119140625, -4.86566162109375, -4.714111328125, -4.56256103515625, -4.4110107421875, -4.25946044921875, -4.10791015625, -3.95635986328125, -3.8048095703125, -3.65325927734375, -3.501708984375, -3.35015869140625, -3.1986083984375, -3.04705810546875, -2.8955078125, -2.74395751953125, -2.5924072265625, -2.44085693359375, -2.289306640625, -2.13775634765625, -1.9862060546875, -1.83465576171875, -1.68310546875, -1.53155517578125, -1.3800048828125, -1.22845458984375, -1.076904296875, -0.92535400390625, -0.7738037109375, -0.62225341796875, -0.470703125, -0.31915283203125, -0.1676025390625, -0.01605224609375, 0.135498046875, 0.28704833984375, 0.4385986328125, 0.59014892578125, 0.74169921875, 0.89324951171875, 1.0447998046875, 1.19635009765625, 1.347900390625, 1.49945068359375, 1.6510009765625, 1.80255126953125, 1.9541015625, 2.10565185546875, 2.2572021484375, 2.40875244140625, 2.560302734375, 2.71185302734375, 2.8634033203125, 3.01495361328125, 3.16650390625, 3.31805419921875, 3.4696044921875, 3.62115478515625, 3.772705078125, 3.92425537109375, 4.0758056640625, 4.22735595703125, 4.37890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 7.0, 3.0, 11.0, 13.0, 13.0, 17.0, 24.0, 22.0, 22.0, 33.0, 35.0, 40.0, 39.0, 40.0, 44.0, 45.0, 48.0, 47.0, 61.0, 41.0, 43.0, 54.0, 32.0, 30.0, 31.0, 33.0, 28.0, 27.0, 17.0, 18.0, 14.0, 12.0, 11.0, 9.0, 7.0, 9.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.35546875, -7.10565185546875, -6.8558349609375, -6.60601806640625, -6.356201171875, -6.10638427734375, -5.8565673828125, -5.60675048828125, -5.35693359375, -5.10711669921875, -4.8572998046875, -4.60748291015625, -4.357666015625, -4.10784912109375, -3.8580322265625, -3.60821533203125, -3.3583984375, -3.10858154296875, -2.8587646484375, -2.60894775390625, -2.359130859375, -2.10931396484375, -1.8594970703125, -1.60968017578125, -1.35986328125, -1.11004638671875, -0.8602294921875, -0.61041259765625, -0.360595703125, -0.11077880859375, 0.1390380859375, 0.38885498046875, 0.638671875, 0.88848876953125, 1.1383056640625, 1.38812255859375, 1.637939453125, 1.88775634765625, 2.1375732421875, 2.38739013671875, 2.63720703125, 2.88702392578125, 3.1368408203125, 3.38665771484375, 3.636474609375, 3.88629150390625, 4.1361083984375, 4.38592529296875, 4.6357421875, 4.88555908203125, 5.1353759765625, 5.38519287109375, 5.635009765625, 5.88482666015625, 6.1346435546875, 6.38446044921875, 6.63427734375, 6.88409423828125, 7.1339111328125, 7.38372802734375, 7.633544921875, 7.88336181640625, 8.1331787109375, 8.38299560546875, 8.6328125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 5.0, 2.0, 7.0, 11.0, 14.0, 27.0, 26.0, 53.0, 91.0, 109.0, 201.0, 374.0, 881.0, 2421.0, 9557.0, 79560.0, 800324.0, 136543.0, 13316.0, 2994.0, 1085.0, 398.0, 196.0, 122.0, 87.0, 43.0, 35.0, 24.0, 17.0, 13.0, 8.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.03125, -5.8341064453125, -5.636962890625, -5.4398193359375, -5.24267578125, -5.0455322265625, -4.848388671875, -4.6512451171875, -4.4541015625, -4.2569580078125, -4.059814453125, -3.8626708984375, -3.66552734375, -3.4683837890625, -3.271240234375, -3.0740966796875, -2.876953125, -2.6798095703125, -2.482666015625, -2.2855224609375, -2.08837890625, -1.8912353515625, -1.694091796875, -1.4969482421875, -1.2998046875, -1.1026611328125, -0.905517578125, -0.7083740234375, -0.51123046875, -0.3140869140625, -0.116943359375, 0.0802001953125, 0.27734375, 0.4744873046875, 0.671630859375, 0.8687744140625, 1.06591796875, 1.2630615234375, 1.460205078125, 1.6573486328125, 1.8544921875, 2.0516357421875, 2.248779296875, 2.4459228515625, 2.64306640625, 2.8402099609375, 3.037353515625, 3.2344970703125, 3.431640625, 3.6287841796875, 3.825927734375, 4.0230712890625, 4.22021484375, 4.4173583984375, 4.614501953125, 4.8116455078125, 5.0087890625, 5.2059326171875, 5.403076171875, 5.6002197265625, 5.79736328125, 5.9945068359375, 6.191650390625, 6.3887939453125, 6.5859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 7.0, 3.0, 16.0, 13.0, 32.0, 36.0, 104.0, 159.0, 201.0, 191.0, 106.0, 65.0, 29.0, 18.0, 9.0, 9.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007901191711425781, -0.0007666125893592834, -0.0007431060075759888, -0.0007195994257926941, -0.0006960928440093994, -0.0006725862622261047, -0.0006490796804428101, -0.0006255730986595154, -0.0006020665168762207, -0.000578559935092926, -0.0005550533533096313, -0.0005315467715263367, -0.000508040189743042, -0.0004845336079597473, -0.00046102702617645264, -0.00043752044439315796, -0.0004140138626098633, -0.0003905072808265686, -0.0003670006990432739, -0.00034349411725997925, -0.00031998753547668457, -0.0002964809536933899, -0.0002729743719100952, -0.00024946779012680054, -0.00022596120834350586, -0.00020245462656021118, -0.0001789480447769165, -0.00015544146299362183, -0.00013193488121032715, -0.00010842829942703247, -8.492171764373779e-05, -6.141513586044312e-05, -3.790855407714844e-05, -1.440197229385376e-05, 9.104609489440918e-06, 3.2611191272735596e-05, 5.6117773056030273e-05, 7.962435483932495e-05, 0.00010313093662261963, 0.0001266375184059143, 0.00015014410018920898, 0.00017365068197250366, 0.00019715726375579834, 0.00022066384553909302, 0.0002441704273223877, 0.0002676770091056824, 0.00029118359088897705, 0.00031469017267227173, 0.0003381967544555664, 0.0003617033362388611, 0.00038520991802215576, 0.00040871649980545044, 0.0004322230815887451, 0.0004557296633720398, 0.00047923624515533447, 0.0005027428269386292, 0.0005262494087219238, 0.0005497559905052185, 0.0005732625722885132, 0.0005967691540718079, 0.0006202757358551025, 0.0006437823176383972, 0.0006672888994216919, 0.0006907954812049866, 0.0007143020629882812]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 12.0, 11.0, 12.0, 13.0, 25.0, 33.0, 55.0, 62.0, 102.0, 189.0, 289.0, 467.0, 833.0, 1658.0, 3562.0, 9608.0, 39276.0, 293594.0, 586928.0, 85565.0, 16183.0, 5190.0, 2241.0, 1070.0, 554.0, 360.0, 227.0, 147.0, 93.0, 55.0, 44.0, 26.0, 15.0, 14.0, 9.0, 6.0, 7.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.8668212890625, -3.729736328125, -3.5926513671875, -3.45556640625, -3.3184814453125, -3.181396484375, -3.0443115234375, -2.9072265625, -2.7701416015625, -2.633056640625, -2.4959716796875, -2.35888671875, -2.2218017578125, -2.084716796875, -1.9476318359375, -1.810546875, -1.6734619140625, -1.536376953125, -1.3992919921875, -1.26220703125, -1.1251220703125, -0.988037109375, -0.8509521484375, -0.7138671875, -0.5767822265625, -0.439697265625, -0.3026123046875, -0.16552734375, -0.0284423828125, 0.108642578125, 0.2457275390625, 0.3828125, 0.5198974609375, 0.656982421875, 0.7940673828125, 0.93115234375, 1.0682373046875, 1.205322265625, 1.3424072265625, 1.4794921875, 1.6165771484375, 1.753662109375, 1.8907470703125, 2.02783203125, 2.1649169921875, 2.302001953125, 2.4390869140625, 2.576171875, 2.7132568359375, 2.850341796875, 2.9874267578125, 3.12451171875, 3.2615966796875, 3.398681640625, 3.5357666015625, 3.6728515625, 3.8099365234375, 3.947021484375, 4.0841064453125, 4.22119140625, 4.3582763671875, 4.495361328125, 4.6324462890625, 4.76953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 4.0, 3.0, 13.0, 9.0, 24.0, 24.0, 58.0, 77.0, 96.0, 152.0, 153.0, 109.0, 103.0, 53.0, 31.0, 33.0, 20.0, 8.0, 5.0, 7.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.27734375, -6.0697021484375, -5.862060546875, -5.6544189453125, -5.44677734375, -5.2391357421875, -5.031494140625, -4.8238525390625, -4.6162109375, -4.4085693359375, -4.200927734375, -3.9932861328125, -3.78564453125, -3.5780029296875, -3.370361328125, -3.1627197265625, -2.955078125, -2.7474365234375, -2.539794921875, -2.3321533203125, -2.12451171875, -1.9168701171875, -1.709228515625, -1.5015869140625, -1.2939453125, -1.0863037109375, -0.878662109375, -0.6710205078125, -0.46337890625, -0.2557373046875, -0.048095703125, 0.1595458984375, 0.3671875, 0.5748291015625, 0.782470703125, 0.9901123046875, 1.19775390625, 1.4053955078125, 1.613037109375, 1.8206787109375, 2.0283203125, 2.2359619140625, 2.443603515625, 2.6512451171875, 2.85888671875, 3.0665283203125, 3.274169921875, 3.4818115234375, 3.689453125, 3.8970947265625, 4.104736328125, 4.3123779296875, 4.52001953125, 4.7276611328125, 4.935302734375, 5.1429443359375, 5.3505859375, 5.5582275390625, 5.765869140625, 5.9735107421875, 6.18115234375, 6.3887939453125, 6.596435546875, 6.8040771484375, 7.01171875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 10.0, 19.0, 27.0, 32.0, 67.0, 121.0, 159.0, 165.0, 156.0, 108.0, 60.0, 35.0, 13.0, 11.0, 3.0, 4.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.730405807495117, -28.601125717163086, -26.471845626831055, -24.34256362915039, -22.21328353881836, -20.084003448486328, -17.954723358154297, -15.825443267822266, -13.696163177490234, -11.566883087158203, -9.437602996826172, -7.308321952819824, -5.179041862487793, -3.0497617721557617, -0.9204807281494141, 1.2087993621826172, 3.3380794525146484, 5.46735954284668, 7.596640110015869, 9.725920677185059, 11.85520076751709, 13.984480857849121, 16.11376190185547, 18.2430419921875, 20.37232208251953, 22.501602172851562, 24.630882263183594, 26.760162353515625, 28.889442443847656, 31.018722534179688, 33.14800262451172, 35.27728271484375, 37.40656280517578, 39.53584289550781, 41.665122985839844, 43.794403076171875, 45.923683166503906, 48.05296325683594, 50.18224334716797, 52.3115234375, 54.44080352783203, 56.57008361816406, 58.699363708496094, 60.828643798828125, 62.957923889160156, 65.08720397949219, 67.21648406982422, 69.34576416015625, 71.47505187988281, 73.60433197021484, 75.73361206054688, 77.8628921508789, 79.99217224121094, 82.12145233154297, 84.250732421875, 86.38001251220703, 88.50929260253906, 90.6385726928711, 92.76785278320312, 94.89713287353516, 97.02641296386719, 99.15569305419922, 101.28497314453125, 103.41425323486328, 105.54353332519531]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 8.0, 8.0, 13.0, 13.0, 18.0, 17.0, 17.0, 42.0, 27.0, 36.0, 47.0, 57.0, 42.0, 54.0, 66.0, 61.0, 38.0, 76.0, 49.0, 45.0, 41.0, 40.0, 38.0, 32.0, 21.0, 14.0, 11.0, 14.0, 9.0, 8.0, 4.0, 6.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.27193832397461, -55.65666580200195, -54.04138946533203, -52.426116943359375, -50.81084442138672, -49.1955680847168, -47.58029556274414, -45.96501922607422, -44.34974670410156, -42.734474182128906, -41.119197845458984, -39.50392532348633, -37.888648986816406, -36.27337646484375, -34.658103942871094, -33.04283142089844, -31.427555084228516, -29.812280654907227, -28.197006225585938, -26.58173370361328, -24.966459274291992, -23.351184844970703, -21.735912322998047, -20.120637893676758, -18.50536346435547, -16.89008903503418, -15.274815559387207, -13.659542083740234, -12.044267654418945, -10.428993225097656, -8.813719749450684, -7.198446273803711, -5.5831756591796875, -3.9679017066955566, -2.352627754211426, -0.7373538017272949, 0.8779201507568359, 2.493194580078125, 4.108468055725098, 5.72374153137207, 7.339015960693359, 8.954290390014648, 10.569563865661621, 12.184837341308594, 13.800111770629883, 15.415386199951172, 17.030658721923828, 18.645933151245117, 20.261207580566406, 21.876482009887695, 23.491756439208984, 25.10702896118164, 26.72230339050293, 28.33757781982422, 29.952850341796875, 31.568124771118164, 33.18339920043945, 34.79867172241211, 36.41394805908203, 38.02922058105469, 39.644493103027344, 41.259769439697266, 42.87504196166992, 44.490318298339844, 46.1055908203125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 4.0, 4.0, 3.0, 9.0, 8.0, 12.0, 31.0, 31.0, 69.0, 80.0, 118.0, 253.0, 346.0, 675.0, 1434.0, 3247.0, 9830.0, 62027.0, 4024493.0, 74170.0, 10756.0, 3446.0, 1476.0, 754.0, 394.0, 238.0, 135.0, 84.0, 46.0, 36.0, 16.0, 21.0, 10.0, 13.0, 2.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3828125, -5.179931640625, -4.97705078125, -4.774169921875, -4.5712890625, -4.368408203125, -4.16552734375, -3.962646484375, -3.759765625, -3.556884765625, -3.35400390625, -3.151123046875, -2.9482421875, -2.745361328125, -2.54248046875, -2.339599609375, -2.13671875, -1.933837890625, -1.73095703125, -1.528076171875, -1.3251953125, -1.122314453125, -0.91943359375, -0.716552734375, -0.513671875, -0.310791015625, -0.10791015625, 0.094970703125, 0.2978515625, 0.500732421875, 0.70361328125, 0.906494140625, 1.109375, 1.312255859375, 1.51513671875, 1.718017578125, 1.9208984375, 2.123779296875, 2.32666015625, 2.529541015625, 2.732421875, 2.935302734375, 3.13818359375, 3.341064453125, 3.5439453125, 3.746826171875, 3.94970703125, 4.152587890625, 4.35546875, 4.558349609375, 4.76123046875, 4.964111328125, 5.1669921875, 5.369873046875, 5.57275390625, 5.775634765625, 5.978515625, 6.181396484375, 6.38427734375, 6.587158203125, 6.7900390625, 6.992919921875, 7.19580078125, 7.398681640625, 7.6015625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 7.0, 11.0, 10.0, 13.0, 23.0, 21.0, 27.0, 33.0, 39.0, 37.0, 55.0, 49.0, 59.0, 59.0, 67.0, 53.0, 43.0, 58.0, 53.0, 49.0, 35.0, 31.0, 43.0, 36.0, 19.0, 15.0, 10.0, 9.0, 4.0, 6.0, 2.0, 5.0, 3.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.162109375, -2.1000823974609375, -2.038055419921875, -1.9760284423828125, -1.91400146484375, -1.8519744873046875, -1.789947509765625, -1.7279205322265625, -1.6658935546875, -1.6038665771484375, -1.541839599609375, -1.4798126220703125, -1.41778564453125, -1.3557586669921875, -1.293731689453125, -1.2317047119140625, -1.169677734375, -1.1076507568359375, -1.045623779296875, -0.9835968017578125, -0.92156982421875, -0.8595428466796875, -0.797515869140625, -0.7354888916015625, -0.6734619140625, -0.6114349365234375, -0.549407958984375, -0.4873809814453125, -0.42535400390625, -0.3633270263671875, -0.301300048828125, -0.2392730712890625, -0.17724609375, -0.1152191162109375, -0.053192138671875, 0.0088348388671875, 0.07086181640625, 0.1328887939453125, 0.194915771484375, 0.2569427490234375, 0.3189697265625, 0.3809967041015625, 0.443023681640625, 0.5050506591796875, 0.56707763671875, 0.6291046142578125, 0.691131591796875, 0.7531585693359375, 0.815185546875, 0.8772125244140625, 0.939239501953125, 1.0012664794921875, 1.06329345703125, 1.1253204345703125, 1.187347412109375, 1.2493743896484375, 1.3114013671875, 1.3734283447265625, 1.435455322265625, 1.4974822998046875, 1.55950927734375, 1.6215362548828125, 1.683563232421875, 1.7455902099609375, 1.8076171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 7.0, 5.0, 10.0, 11.0, 22.0, 37.0, 40.0, 34.0, 44.0, 82.0, 109.0, 148.0, 198.0, 329.0, 385.0, 602.0, 934.0, 1605.0, 3027.0, 6950.0, 22671.0, 204157.0, 3875535.0, 55122.0, 12053.0, 4375.0, 2119.0, 1222.0, 763.0, 513.0, 348.0, 209.0, 168.0, 120.0, 88.0, 64.0, 45.0, 38.0, 21.0, 25.0, 10.0, 16.0, 4.0, 11.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.53125, -6.34600830078125, -6.1607666015625, -5.97552490234375, -5.790283203125, -5.60504150390625, -5.4197998046875, -5.23455810546875, -5.04931640625, -4.86407470703125, -4.6788330078125, -4.49359130859375, -4.308349609375, -4.12310791015625, -3.9378662109375, -3.75262451171875, -3.5673828125, -3.38214111328125, -3.1968994140625, -3.01165771484375, -2.826416015625, -2.64117431640625, -2.4559326171875, -2.27069091796875, -2.08544921875, -1.90020751953125, -1.7149658203125, -1.52972412109375, -1.344482421875, -1.15924072265625, -0.9739990234375, -0.78875732421875, -0.603515625, -0.41827392578125, -0.2330322265625, -0.04779052734375, 0.137451171875, 0.32269287109375, 0.5079345703125, 0.69317626953125, 0.87841796875, 1.06365966796875, 1.2489013671875, 1.43414306640625, 1.619384765625, 1.80462646484375, 1.9898681640625, 2.17510986328125, 2.3603515625, 2.54559326171875, 2.7308349609375, 2.91607666015625, 3.101318359375, 3.28656005859375, 3.4718017578125, 3.65704345703125, 3.84228515625, 4.02752685546875, 4.2127685546875, 4.39801025390625, 4.583251953125, 4.76849365234375, 4.9537353515625, 5.13897705078125, 5.32421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 13.0, 15.0, 36.0, 102.0, 1034.0, 2704.0, 89.0, 34.0, 16.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.255859375, -2.183135986328125, -2.11041259765625, -2.037689208984375, -1.9649658203125, -1.892242431640625, -1.81951904296875, -1.746795654296875, -1.674072265625, -1.601348876953125, -1.52862548828125, -1.455902099609375, -1.3831787109375, -1.310455322265625, -1.23773193359375, -1.165008544921875, -1.09228515625, -1.019561767578125, -0.94683837890625, -0.874114990234375, -0.8013916015625, -0.728668212890625, -0.65594482421875, -0.583221435546875, -0.510498046875, -0.437774658203125, -0.36505126953125, -0.292327880859375, -0.2196044921875, -0.146881103515625, -0.07415771484375, -0.001434326171875, 0.0712890625, 0.144012451171875, 0.21673583984375, 0.289459228515625, 0.3621826171875, 0.434906005859375, 0.50762939453125, 0.580352783203125, 0.653076171875, 0.725799560546875, 0.79852294921875, 0.871246337890625, 0.9439697265625, 1.016693115234375, 1.08941650390625, 1.162139892578125, 1.23486328125, 1.307586669921875, 1.38031005859375, 1.453033447265625, 1.5257568359375, 1.598480224609375, 1.67120361328125, 1.743927001953125, 1.816650390625, 1.889373779296875, 1.96209716796875, 2.034820556640625, 2.1075439453125, 2.180267333984375, 2.25299072265625, 2.325714111328125, 2.3984375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 7.0, 4.0, 10.0, 34.0, 64.0, 191.0, 263.0, 243.0, 133.0, 43.0, 16.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8220269680023193, -3.451220750808716, -3.0804147720336914, -2.709608554840088, -2.3388023376464844, -1.9679961204528809, -1.5971901416778564, -1.226383924484253, -0.8555777072906494, -0.4847715497016907, -0.11396539211273193, 0.25684070587158203, 0.6276469230651855, 0.9984531402587891, 1.3692591190338135, 1.740065336227417, 2.1108715534210205, 2.481677770614624, 2.8524837493896484, 3.223289966583252, 3.5940961837768555, 3.964902400970459, 4.3357086181640625, 4.706514358520508, 5.0773210525512695, 5.448127269744873, 5.818933486938477, 6.189739227294922, 6.560545921325684, 6.931351661682129, 7.302157878875732, 7.672964096069336, 8.043769836425781, 8.414575576782227, 8.785382270812988, 9.156188011169434, 9.526994705200195, 9.89780044555664, 10.268606185913086, 10.639412879943848, 11.01021957397461, 11.381025314331055, 11.751832008361816, 12.122637748718262, 12.493444442749023, 12.864250183105469, 13.235055923461914, 13.605862617492676, 13.976668357849121, 14.347474098205566, 14.718280792236328, 15.089086532592773, 15.459893226623535, 15.83069896697998, 16.201505661010742, 16.572311401367188, 16.943117141723633, 17.313922882080078, 17.684728622436523, 18.0555362701416, 18.426342010498047, 18.797147750854492, 19.167953491210938, 19.538761138916016, 19.90956687927246]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 9.0, 9.0, 12.0, 11.0, 14.0, 15.0, 24.0, 20.0, 22.0, 35.0, 29.0, 34.0, 32.0, 46.0, 37.0, 42.0, 50.0, 46.0, 52.0, 47.0, 39.0, 48.0, 36.0, 32.0, 44.0, 28.0, 40.0, 22.0, 15.0, 23.0, 18.0, 13.0, 13.0, 13.0, 4.0, 4.0, 6.0, 3.0, 1.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.6612911224365234, -3.5487639904022217, -3.436236619949341, -3.323709487915039, -3.2111823558807373, -3.0986552238464355, -2.9861278533935547, -2.873600721359253, -2.761073589324951, -2.6485464572906494, -2.5360190868377686, -2.423491954803467, -2.310964822769165, -2.1984376907348633, -2.0859103202819824, -1.9733831882476807, -1.8608559370040894, -1.748328685760498, -1.6358015537261963, -1.523274302482605, -1.4107471704483032, -1.298219919204712, -1.1856927871704102, -1.0731655359268188, -0.9606383442878723, -0.8481111526489258, -0.7355839610099792, -0.6230567693710327, -0.5105295181274414, -0.3980023264884949, -0.28547513484954834, -0.1729479432106018, -0.06042075157165527, 0.05210644751787186, 0.164633646607399, 0.2771608531475067, 0.38968804478645325, 0.5022152662277222, 0.6147424578666687, 0.7272696495056152, 0.8397968411445618, 0.9523240327835083, 1.0648512840270996, 1.1773784160614014, 1.2899056673049927, 1.402432918548584, 1.5149600505828857, 1.6274871826171875, 1.7400144338607788, 1.8525416851043701, 1.9650688171386719, 2.0775959491729736, 2.1901233196258545, 2.3026504516601562, 2.415177583694458, 2.5277047157287598, 2.6402320861816406, 2.7527592182159424, 2.8652865886688232, 2.977813720703125, 3.0903408527374268, 3.2028679847717285, 3.3153953552246094, 3.427922487258911, 3.540449619293213]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 4.0, 7.0, 9.0, 10.0, 23.0, 16.0, 41.0, 41.0, 50.0, 85.0, 169.0, 231.0, 398.0, 789.0, 1463.0, 3252.0, 7298.0, 18680.0, 51518.0, 144463.0, 318638.0, 299438.0, 127300.0, 45374.0, 16734.0, 6650.0, 2794.0, 1344.0, 667.0, 400.0, 209.0, 120.0, 99.0, 73.0, 40.0, 36.0, 23.0, 12.0, 11.0, 8.0, 6.0, 9.0, 2.0, 5.0, 3.0, 2.0, 1.0, 5.0, 1.0, 3.0], "bins": [-4.30859375, -4.185272216796875, -4.06195068359375, -3.938629150390625, -3.8153076171875, -3.691986083984375, -3.56866455078125, -3.445343017578125, -3.322021484375, -3.198699951171875, -3.07537841796875, -2.952056884765625, -2.8287353515625, -2.705413818359375, -2.58209228515625, -2.458770751953125, -2.33544921875, -2.212127685546875, -2.08880615234375, -1.965484619140625, -1.8421630859375, -1.718841552734375, -1.59552001953125, -1.472198486328125, -1.348876953125, -1.225555419921875, -1.10223388671875, -0.978912353515625, -0.8555908203125, -0.732269287109375, -0.60894775390625, -0.485626220703125, -0.3623046875, -0.238983154296875, -0.11566162109375, 0.007659912109375, 0.1309814453125, 0.254302978515625, 0.37762451171875, 0.500946044921875, 0.624267578125, 0.747589111328125, 0.87091064453125, 0.994232177734375, 1.1175537109375, 1.240875244140625, 1.36419677734375, 1.487518310546875, 1.61083984375, 1.734161376953125, 1.85748291015625, 1.980804443359375, 2.1041259765625, 2.227447509765625, 2.35076904296875, 2.474090576171875, 2.597412109375, 2.720733642578125, 2.84405517578125, 2.967376708984375, 3.0906982421875, 3.214019775390625, 3.33734130859375, 3.460662841796875, 3.583984375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 7.0, 5.0, 5.0, 7.0, 13.0, 13.0, 16.0, 20.0, 29.0, 32.0, 31.0, 29.0, 36.0, 42.0, 42.0, 56.0, 56.0, 46.0, 46.0, 54.0, 47.0, 47.0, 48.0, 43.0, 24.0, 28.0, 33.0, 27.0, 30.0, 19.0, 13.0, 9.0, 9.0, 5.0, 4.0, 4.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6259765625, -1.5720672607421875, -1.518157958984375, -1.4642486572265625, -1.41033935546875, -1.3564300537109375, -1.302520751953125, -1.2486114501953125, -1.1947021484375, -1.1407928466796875, -1.086883544921875, -1.0329742431640625, -0.97906494140625, -0.9251556396484375, -0.871246337890625, -0.8173370361328125, -0.763427734375, -0.7095184326171875, -0.655609130859375, -0.6016998291015625, -0.54779052734375, -0.4938812255859375, -0.439971923828125, -0.3860626220703125, -0.3321533203125, -0.2782440185546875, -0.224334716796875, -0.1704254150390625, -0.11651611328125, -0.0626068115234375, -0.008697509765625, 0.0452117919921875, 0.09912109375, 0.1530303955078125, 0.206939697265625, 0.2608489990234375, 0.31475830078125, 0.3686676025390625, 0.422576904296875, 0.4764862060546875, 0.5303955078125, 0.5843048095703125, 0.638214111328125, 0.6921234130859375, 0.74603271484375, 0.7999420166015625, 0.853851318359375, 0.9077606201171875, 0.961669921875, 1.0155792236328125, 1.069488525390625, 1.1233978271484375, 1.17730712890625, 1.2312164306640625, 1.285125732421875, 1.3390350341796875, 1.3929443359375, 1.4468536376953125, 1.500762939453125, 1.5546722412109375, 1.60858154296875, 1.6624908447265625, 1.716400146484375, 1.7703094482421875, 1.82421875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 5.0, 0.0, 2.0, 10.0, 12.0, 16.0, 18.0, 26.0, 36.0, 60.0, 82.0, 140.0, 271.0, 444.0, 829.0, 1748.0, 3814.0, 9522.0, 26879.0, 87248.0, 304243.0, 419360.0, 131937.0, 38815.0, 13218.0, 5147.0, 2268.0, 1090.0, 568.0, 282.0, 143.0, 96.0, 76.0, 47.0, 23.0, 22.0, 11.0, 14.0, 6.0, 6.0, 4.0, 3.0, 4.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.95703125, -4.80291748046875, -4.6488037109375, -4.49468994140625, -4.340576171875, -4.18646240234375, -4.0323486328125, -3.87823486328125, -3.72412109375, -3.57000732421875, -3.4158935546875, -3.26177978515625, -3.107666015625, -2.95355224609375, -2.7994384765625, -2.64532470703125, -2.4912109375, -2.33709716796875, -2.1829833984375, -2.02886962890625, -1.874755859375, -1.72064208984375, -1.5665283203125, -1.41241455078125, -1.25830078125, -1.10418701171875, -0.9500732421875, -0.79595947265625, -0.641845703125, -0.48773193359375, -0.3336181640625, -0.17950439453125, -0.025390625, 0.12872314453125, 0.2828369140625, 0.43695068359375, 0.591064453125, 0.74517822265625, 0.8992919921875, 1.05340576171875, 1.20751953125, 1.36163330078125, 1.5157470703125, 1.66986083984375, 1.823974609375, 1.97808837890625, 2.1322021484375, 2.28631591796875, 2.4404296875, 2.59454345703125, 2.7486572265625, 2.90277099609375, 3.056884765625, 3.21099853515625, 3.3651123046875, 3.51922607421875, 3.67333984375, 3.82745361328125, 3.9815673828125, 4.13568115234375, 4.289794921875, 4.44390869140625, 4.5980224609375, 4.75213623046875, 4.90625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 3.0, 16.0, 17.0, 9.0, 20.0, 25.0, 21.0, 27.0, 33.0, 41.0, 38.0, 39.0, 53.0, 40.0, 39.0, 45.0, 42.0, 52.0, 47.0, 53.0, 36.0, 42.0, 38.0, 24.0, 27.0, 29.0, 24.0, 18.0, 23.0, 10.0, 13.0, 15.0, 9.0, 6.0, 6.0, 1.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.109375, -8.7899169921875, -8.470458984375, -8.1510009765625, -7.83154296875, -7.5120849609375, -7.192626953125, -6.8731689453125, -6.5537109375, -6.2342529296875, -5.914794921875, -5.5953369140625, -5.27587890625, -4.9564208984375, -4.636962890625, -4.3175048828125, -3.998046875, -3.6785888671875, -3.359130859375, -3.0396728515625, -2.72021484375, -2.4007568359375, -2.081298828125, -1.7618408203125, -1.4423828125, -1.1229248046875, -0.803466796875, -0.4840087890625, -0.16455078125, 0.1549072265625, 0.474365234375, 0.7938232421875, 1.11328125, 1.4327392578125, 1.752197265625, 2.0716552734375, 2.39111328125, 2.7105712890625, 3.030029296875, 3.3494873046875, 3.6689453125, 3.9884033203125, 4.307861328125, 4.6273193359375, 4.94677734375, 5.2662353515625, 5.585693359375, 5.9051513671875, 6.224609375, 6.5440673828125, 6.863525390625, 7.1829833984375, 7.50244140625, 7.8218994140625, 8.141357421875, 8.4608154296875, 8.7802734375, 9.0997314453125, 9.419189453125, 9.7386474609375, 10.05810546875, 10.3775634765625, 10.697021484375, 11.0164794921875, 11.3359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 13.0, 12.0, 20.0, 21.0, 42.0, 63.0, 122.0, 247.0, 577.0, 1571.0, 6040.0, 41354.0, 774498.0, 204895.0, 14233.0, 3083.0, 938.0, 401.0, 169.0, 77.0, 50.0, 33.0, 21.0, 12.0, 15.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.60546875, -5.4232177734375, -5.240966796875, -5.0587158203125, -4.87646484375, -4.6942138671875, -4.511962890625, -4.3297119140625, -4.1474609375, -3.9652099609375, -3.782958984375, -3.6007080078125, -3.41845703125, -3.2362060546875, -3.053955078125, -2.8717041015625, -2.689453125, -2.5072021484375, -2.324951171875, -2.1427001953125, -1.96044921875, -1.7781982421875, -1.595947265625, -1.4136962890625, -1.2314453125, -1.0491943359375, -0.866943359375, -0.6846923828125, -0.50244140625, -0.3201904296875, -0.137939453125, 0.0443115234375, 0.2265625, 0.4088134765625, 0.591064453125, 0.7733154296875, 0.95556640625, 1.1378173828125, 1.320068359375, 1.5023193359375, 1.6845703125, 1.8668212890625, 2.049072265625, 2.2313232421875, 2.41357421875, 2.5958251953125, 2.778076171875, 2.9603271484375, 3.142578125, 3.3248291015625, 3.507080078125, 3.6893310546875, 3.87158203125, 4.0538330078125, 4.236083984375, 4.4183349609375, 4.6005859375, 4.7828369140625, 4.965087890625, 5.1473388671875, 5.32958984375, 5.5118408203125, 5.694091796875, 5.8763427734375, 6.05859375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 4.0, 4.0, 13.0, 14.0, 21.0, 28.0, 35.0, 44.0, 52.0, 76.0, 78.0, 105.0, 100.0, 84.0, 88.0, 69.0, 47.0, 25.0, 33.0, 18.0, 15.0, 16.0, 9.0, 3.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021469593048095703, -0.00020546279847621918, -0.00019622966647148132, -0.00018699653446674347, -0.00017776340246200562, -0.00016853027045726776, -0.0001592971384525299, -0.00015006400644779205, -0.0001408308744430542, -0.00013159774243831635, -0.0001223646104335785, -0.00011313147842884064, -0.00010389834642410278, -9.466521441936493e-05, -8.543208241462708e-05, -7.619895040988922e-05, -6.696581840515137e-05, -5.773268640041351e-05, -4.849955439567566e-05, -3.9266422390937805e-05, -3.003329038619995e-05, -2.0800158381462097e-05, -1.1567026376724243e-05, -2.333894371986389e-06, 6.899237632751465e-06, 1.613236963748932e-05, 2.5365501642227173e-05, 3.459863364696503e-05, 4.383176565170288e-05, 5.3064897656440735e-05, 6.229802966117859e-05, 7.153116166591644e-05, 8.07642936706543e-05, 8.999742567539215e-05, 9.923055768013e-05, 0.00010846368968486786, 0.00011769682168960571, 0.00012692995369434357, 0.00013616308569908142, 0.00014539621770381927, 0.00015462934970855713, 0.00016386248171329498, 0.00017309561371803284, 0.0001823287457227707, 0.00019156187772750854, 0.0002007950097322464, 0.00021002814173698425, 0.0002192612737417221, 0.00022849440574645996, 0.00023772753775119781, 0.00024696066975593567, 0.0002561938017606735, 0.0002654269337654114, 0.00027466006577014923, 0.0002838931977748871, 0.00029312632977962494, 0.0003023594617843628, 0.00031159259378910065, 0.0003208257257938385, 0.00033005885779857635, 0.0003392919898033142, 0.00034852512180805206, 0.0003577582538127899, 0.00036699138581752777, 0.0003762245178222656]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 8.0, 6.0, 14.0, 8.0, 13.0, 22.0, 26.0, 43.0, 64.0, 106.0, 224.0, 401.0, 851.0, 2021.0, 5392.0, 19395.0, 144778.0, 733782.0, 115627.0, 17192.0, 5067.0, 1790.0, 789.0, 381.0, 220.0, 116.0, 73.0, 53.0, 28.0, 11.0, 14.0, 3.0, 11.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.1953125, -4.069915771484375, -3.94451904296875, -3.819122314453125, -3.6937255859375, -3.568328857421875, -3.44293212890625, -3.317535400390625, -3.192138671875, -3.066741943359375, -2.94134521484375, -2.815948486328125, -2.6905517578125, -2.565155029296875, -2.43975830078125, -2.314361572265625, -2.18896484375, -2.063568115234375, -1.93817138671875, -1.812774658203125, -1.6873779296875, -1.561981201171875, -1.43658447265625, -1.311187744140625, -1.185791015625, -1.060394287109375, -0.93499755859375, -0.809600830078125, -0.6842041015625, -0.558807373046875, -0.43341064453125, -0.308013916015625, -0.1826171875, -0.057220458984375, 0.06817626953125, 0.193572998046875, 0.3189697265625, 0.444366455078125, 0.56976318359375, 0.695159912109375, 0.820556640625, 0.945953369140625, 1.07135009765625, 1.196746826171875, 1.3221435546875, 1.447540283203125, 1.57293701171875, 1.698333740234375, 1.82373046875, 1.949127197265625, 2.07452392578125, 2.199920654296875, 2.3253173828125, 2.450714111328125, 2.57611083984375, 2.701507568359375, 2.826904296875, 2.952301025390625, 3.07769775390625, 3.203094482421875, 3.3284912109375, 3.453887939453125, 3.57928466796875, 3.704681396484375, 3.830078125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 4.0, 9.0, 12.0, 16.0, 16.0, 20.0, 46.0, 84.0, 115.0, 155.0, 155.0, 133.0, 79.0, 52.0, 26.0, 18.0, 10.0, 9.0, 6.0, 5.0, 7.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.6505126953125, -4.449462890625, -4.2484130859375, -4.04736328125, -3.8463134765625, -3.645263671875, -3.4442138671875, -3.2431640625, -3.0421142578125, -2.841064453125, -2.6400146484375, -2.43896484375, -2.2379150390625, -2.036865234375, -1.8358154296875, -1.634765625, -1.4337158203125, -1.232666015625, -1.0316162109375, -0.83056640625, -0.6295166015625, -0.428466796875, -0.2274169921875, -0.0263671875, 0.1746826171875, 0.375732421875, 0.5767822265625, 0.77783203125, 0.9788818359375, 1.179931640625, 1.3809814453125, 1.58203125, 1.7830810546875, 1.984130859375, 2.1851806640625, 2.38623046875, 2.5872802734375, 2.788330078125, 2.9893798828125, 3.1904296875, 3.3914794921875, 3.592529296875, 3.7935791015625, 3.99462890625, 4.1956787109375, 4.396728515625, 4.5977783203125, 4.798828125, 4.9998779296875, 5.200927734375, 5.4019775390625, 5.60302734375, 5.8040771484375, 6.005126953125, 6.2061767578125, 6.4072265625, 6.6082763671875, 6.809326171875, 7.0103759765625, 7.21142578125, 7.4124755859375, 7.613525390625, 7.8145751953125, 8.015625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 33.0, 134.0, 358.0, 286.0, 136.0, 36.0, 10.0, 8.0, 8.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-226.37408447265625, -221.8329620361328, -217.29185485839844, -212.750732421875, -208.20962524414062, -203.6685028076172, -199.1273956298828, -194.58627319335938, -190.045166015625, -185.50404357910156, -180.9629364013672, -176.42181396484375, -171.88070678710938, -167.33958435058594, -162.79847717285156, -158.25735473632812, -153.7162322998047, -149.17510986328125, -144.63400268554688, -140.09288024902344, -135.55177307128906, -131.01065063476562, -126.46953582763672, -121.92842102050781, -117.3873062133789, -112.84619140625, -108.3050765991211, -103.76396179199219, -99.22283935546875, -94.68173217773438, -90.14060974121094, -85.59949493408203, -81.05838012695312, -76.51726531982422, -71.97615051269531, -67.4350357055664, -62.893917083740234, -58.35280227661133, -53.811683654785156, -49.27056884765625, -44.729454040527344, -40.18833923339844, -35.64722442626953, -31.10610580444336, -26.564990997314453, -22.023876190185547, -17.482759475708008, -12.941642761230469, -8.400527954101562, -3.85941219329834, 0.6817035675048828, 5.2228193283081055, 9.763935089111328, 14.305049896240234, 18.846166610717773, 23.387283325195312, 27.92839813232422, 32.469512939453125, 37.01062774658203, 41.5517463684082, 46.09286117553711, 50.633975982666016, 55.17509460449219, 59.716209411621094, 64.25732421875]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 3.0, 6.0, 5.0, 6.0, 10.0, 12.0, 19.0, 20.0, 14.0, 26.0, 36.0, 30.0, 27.0, 47.0, 45.0, 52.0, 41.0, 43.0, 53.0, 54.0, 48.0, 52.0, 45.0, 49.0, 36.0, 30.0, 27.0, 18.0, 16.0, 23.0, 19.0, 22.0, 9.0, 8.0, 10.0, 6.0, 7.0, 5.0, 6.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-52.898746490478516, -51.378990173339844, -49.85923767089844, -48.339481353759766, -46.81972885131836, -45.29997253417969, -43.78022003173828, -42.26046371459961, -40.7407112121582, -39.22095489501953, -37.701202392578125, -36.18144607543945, -34.66169357299805, -33.141937255859375, -31.62218475341797, -30.102428436279297, -28.582674026489258, -27.06291961669922, -25.54316520690918, -24.02341079711914, -22.5036563873291, -20.983901977539062, -19.46414566040039, -17.944393157958984, -16.424636840820312, -14.904882431030273, -13.385128021240234, -11.865373611450195, -10.345619201660156, -8.825864791870117, -7.306109428405762, -5.786355018615723, -4.2666015625, -2.746847152709961, -1.2270925045013428, 0.2926621437072754, 1.8124165534973145, 3.3321709632873535, 4.851925849914551, 6.37168025970459, 7.891434669494629, 9.411189079284668, 10.930943489074707, 12.450698852539062, 13.970453262329102, 15.49020767211914, 17.00996208190918, 18.52971649169922, 20.049470901489258, 21.569225311279297, 23.088979721069336, 24.608734130859375, 26.128488540649414, 27.648242950439453, 29.167999267578125, 30.68775177001953, 32.2075080871582, 33.727264404296875, 35.24701690673828, 36.76677322387695, 38.28652572631836, 39.80628204345703, 41.32603454589844, 42.84579086303711, 44.365543365478516]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 3.0, 5.0, 12.0, 11.0, 22.0, 30.0, 46.0, 88.0, 141.0, 235.0, 403.0, 891.0, 2157.0, 6943.0, 51736.0, 4066063.0, 54345.0, 7154.0, 2157.0, 838.0, 416.0, 235.0, 134.0, 75.0, 49.0, 33.0, 13.0, 13.0, 9.0, 8.0, 1.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.67578125, -6.40338134765625, -6.1309814453125, -5.85858154296875, -5.586181640625, -5.31378173828125, -5.0413818359375, -4.76898193359375, -4.49658203125, -4.22418212890625, -3.9517822265625, -3.67938232421875, -3.406982421875, -3.13458251953125, -2.8621826171875, -2.58978271484375, -2.3173828125, -2.04498291015625, -1.7725830078125, -1.50018310546875, -1.227783203125, -0.95538330078125, -0.6829833984375, -0.41058349609375, -0.13818359375, 0.13421630859375, 0.4066162109375, 0.67901611328125, 0.951416015625, 1.22381591796875, 1.4962158203125, 1.76861572265625, 2.041015625, 2.31341552734375, 2.5858154296875, 2.85821533203125, 3.130615234375, 3.40301513671875, 3.6754150390625, 3.94781494140625, 4.22021484375, 4.49261474609375, 4.7650146484375, 5.03741455078125, 5.309814453125, 5.58221435546875, 5.8546142578125, 6.12701416015625, 6.3994140625, 6.67181396484375, 6.9442138671875, 7.21661376953125, 7.489013671875, 7.76141357421875, 8.0338134765625, 8.30621337890625, 8.57861328125, 8.85101318359375, 9.1234130859375, 9.39581298828125, 9.668212890625, 9.94061279296875, 10.2130126953125, 10.48541259765625, 10.7578125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 4.0, 13.0, 14.0, 21.0, 31.0, 28.0, 43.0, 48.0, 74.0, 81.0, 78.0, 75.0, 81.0, 62.0, 84.0, 60.0, 55.0, 40.0, 39.0, 15.0, 12.0, 20.0, 5.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.3984375, -3.30328369140625, -3.2081298828125, -3.11297607421875, -3.017822265625, -2.92266845703125, -2.8275146484375, -2.73236083984375, -2.63720703125, -2.54205322265625, -2.4468994140625, -2.35174560546875, -2.256591796875, -2.16143798828125, -2.0662841796875, -1.97113037109375, -1.8759765625, -1.78082275390625, -1.6856689453125, -1.59051513671875, -1.495361328125, -1.40020751953125, -1.3050537109375, -1.20989990234375, -1.11474609375, -1.01959228515625, -0.9244384765625, -0.82928466796875, -0.734130859375, -0.63897705078125, -0.5438232421875, -0.44866943359375, -0.353515625, -0.25836181640625, -0.1632080078125, -0.06805419921875, 0.027099609375, 0.12225341796875, 0.2174072265625, 0.31256103515625, 0.40771484375, 0.50286865234375, 0.5980224609375, 0.69317626953125, 0.788330078125, 0.88348388671875, 0.9786376953125, 1.07379150390625, 1.1689453125, 1.26409912109375, 1.3592529296875, 1.45440673828125, 1.549560546875, 1.64471435546875, 1.7398681640625, 1.83502197265625, 1.93017578125, 2.02532958984375, 2.1204833984375, 2.21563720703125, 2.310791015625, 2.40594482421875, 2.5010986328125, 2.59625244140625, 2.69140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 7.0, 10.0, 10.0, 15.0, 18.0, 40.0, 42.0, 47.0, 75.0, 99.0, 157.0, 213.0, 345.0, 497.0, 746.0, 1056.0, 1789.0, 2900.0, 5813.0, 12725.0, 38579.0, 258623.0, 3694376.0, 127397.0, 26957.0, 10108.0, 4710.0, 2437.0, 1483.0, 936.0, 672.0, 428.0, 299.0, 212.0, 159.0, 110.0, 62.0, 45.0, 26.0, 18.0, 25.0, 8.0, 9.0, 1.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.97265625, -2.85540771484375, -2.7381591796875, -2.62091064453125, -2.503662109375, -2.38641357421875, -2.2691650390625, -2.15191650390625, -2.03466796875, -1.91741943359375, -1.8001708984375, -1.68292236328125, -1.565673828125, -1.44842529296875, -1.3311767578125, -1.21392822265625, -1.0966796875, -0.97943115234375, -0.8621826171875, -0.74493408203125, -0.627685546875, -0.51043701171875, -0.3931884765625, -0.27593994140625, -0.15869140625, -0.04144287109375, 0.0758056640625, 0.19305419921875, 0.310302734375, 0.42755126953125, 0.5447998046875, 0.66204833984375, 0.779296875, 0.89654541015625, 1.0137939453125, 1.13104248046875, 1.248291015625, 1.36553955078125, 1.4827880859375, 1.60003662109375, 1.71728515625, 1.83453369140625, 1.9517822265625, 2.06903076171875, 2.186279296875, 2.30352783203125, 2.4207763671875, 2.53802490234375, 2.6552734375, 2.77252197265625, 2.8897705078125, 3.00701904296875, 3.124267578125, 3.24151611328125, 3.3587646484375, 3.47601318359375, 3.59326171875, 3.71051025390625, 3.8277587890625, 3.94500732421875, 4.062255859375, 4.17950439453125, 4.2967529296875, 4.41400146484375, 4.53125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 3.0, 14.0, 23.0, 25.0, 64.0, 157.0, 443.0, 2780.0, 282.0, 119.0, 48.0, 27.0, 12.0, 16.0, 10.0, 4.0, 7.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5947265625, -1.5508575439453125, -1.506988525390625, -1.4631195068359375, -1.41925048828125, -1.3753814697265625, -1.331512451171875, -1.2876434326171875, -1.2437744140625, -1.1999053955078125, -1.156036376953125, -1.1121673583984375, -1.06829833984375, -1.0244293212890625, -0.980560302734375, -0.9366912841796875, -0.892822265625, -0.8489532470703125, -0.805084228515625, -0.7612152099609375, -0.71734619140625, -0.6734771728515625, -0.629608154296875, -0.5857391357421875, -0.5418701171875, -0.4980010986328125, -0.454132080078125, -0.4102630615234375, -0.36639404296875, -0.3225250244140625, -0.278656005859375, -0.2347869873046875, -0.19091796875, -0.1470489501953125, -0.103179931640625, -0.0593109130859375, -0.01544189453125, 0.0284271240234375, 0.072296142578125, 0.1161651611328125, 0.1600341796875, 0.2039031982421875, 0.247772216796875, 0.2916412353515625, 0.33551025390625, 0.3793792724609375, 0.423248291015625, 0.4671173095703125, 0.510986328125, 0.5548553466796875, 0.598724365234375, 0.6425933837890625, 0.68646240234375, 0.7303314208984375, 0.774200439453125, 0.8180694580078125, 0.8619384765625, 0.9058074951171875, 0.949676513671875, 0.9935455322265625, 1.03741455078125, 1.0812835693359375, 1.125152587890625, 1.1690216064453125, 1.212890625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 17.0, 37.0, 40.0, 110.0, 151.0, 200.0, 177.0, 113.0, 69.0, 44.0, 11.0, 14.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.874142646789551, -5.622077465057373, -5.370012283325195, -5.117947578430176, -4.865882396697998, -4.61381721496582, -4.361752510070801, -4.109687328338623, -3.8576221466064453, -3.6055569648742676, -3.353492021560669, -3.1014270782470703, -2.8493618965148926, -2.597296714782715, -2.345231771469116, -2.0931668281555176, -1.8411016464233398, -1.5890365839004517, -1.3369715213775635, -1.0849064588546753, -0.8328413963317871, -0.5807763338088989, -0.32871127128601074, -0.07664620876312256, 0.17541885375976562, 0.4274839162826538, 0.679548978805542, 0.9316140413284302, 1.1836791038513184, 1.4357441663742065, 1.6878092288970947, 1.939874291419983, 2.1919403076171875, 2.4440054893493652, 2.696070432662964, 2.9481353759765625, 3.2002005577087402, 3.452265739440918, 3.7043306827545166, 3.9563956260681152, 4.208460807800293, 4.460525989532471, 4.712591171264648, 4.964655876159668, 5.216721057891846, 5.468786239624023, 5.720850944519043, 5.972916126251221, 6.224981307983398, 6.477046489715576, 6.729111671447754, 6.981176376342773, 7.233241558074951, 7.485306739807129, 7.737371444702148, 7.989436626434326, 8.241501808166504, 8.493566513061523, 8.74563217163086, 8.997696876525879, 9.249761581420898, 9.501827239990234, 9.753891944885254, 10.00595760345459, 10.25802230834961]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 9.0, 8.0, 9.0, 10.0, 8.0, 13.0, 23.0, 18.0, 24.0, 24.0, 26.0, 28.0, 41.0, 38.0, 34.0, 49.0, 54.0, 46.0, 47.0, 44.0, 46.0, 48.0, 27.0, 35.0, 40.0, 39.0, 35.0, 23.0, 26.0, 22.0, 21.0, 15.0, 16.0, 9.0, 9.0, 7.0, 10.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-3.3077476024627686, -3.2072198390960693, -3.106692314147949, -3.00616455078125, -2.905636787414551, -2.8051090240478516, -2.7045812606811523, -2.6040537357330322, -2.503525972366333, -2.402998208999634, -2.3024706840515137, -2.2019429206848145, -2.1014151573181152, -2.000887393951416, -1.9003597497940063, -1.7998321056365967, -1.6993043422698975, -1.5987765789031982, -1.4982489347457886, -1.397721290588379, -1.2971935272216797, -1.1966657638549805, -1.0961381196975708, -0.9956104159355164, -0.8950827121734619, -0.7945550084114075, -0.694027304649353, -0.5934996008872986, -0.49297189712524414, -0.3924441933631897, -0.29191648960113525, -0.1913887858390808, -0.09086084365844727, 0.009666860103607178, 0.11019456386566162, 0.21072226762771606, 0.3112499713897705, 0.41177767515182495, 0.5123053789138794, 0.6128330826759338, 0.7133607864379883, 0.8138884902000427, 0.9144161939620972, 1.0149438381195068, 1.115471601486206, 1.2159993648529053, 1.316527009010315, 1.4170546531677246, 1.5175824165344238, 1.618110179901123, 1.7186378240585327, 1.8191654682159424, 1.9196932315826416, 2.020220994949341, 2.120748519897461, 2.22127628326416, 2.3218040466308594, 2.4223318099975586, 2.522859573364258, 2.623387098312378, 2.723914861679077, 2.8244426250457764, 2.9249701499938965, 3.0254979133605957, 3.126025676727295]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 6.0, 7.0, 14.0, 19.0, 24.0, 33.0, 72.0, 102.0, 173.0, 289.0, 571.0, 1080.0, 2327.0, 5643.0, 16412.0, 56860.0, 223638.0, 465565.0, 200274.0, 51050.0, 14835.0, 5123.0, 2119.0, 1027.0, 515.0, 294.0, 164.0, 120.0, 60.0, 43.0, 22.0, 17.0, 15.0, 7.0, 8.0, 4.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.16796875, -4.0311279296875, -3.894287109375, -3.7574462890625, -3.62060546875, -3.4837646484375, -3.346923828125, -3.2100830078125, -3.0732421875, -2.9364013671875, -2.799560546875, -2.6627197265625, -2.52587890625, -2.3890380859375, -2.252197265625, -2.1153564453125, -1.978515625, -1.8416748046875, -1.704833984375, -1.5679931640625, -1.43115234375, -1.2943115234375, -1.157470703125, -1.0206298828125, -0.8837890625, -0.7469482421875, -0.610107421875, -0.4732666015625, -0.33642578125, -0.1995849609375, -0.062744140625, 0.0740966796875, 0.2109375, 0.3477783203125, 0.484619140625, 0.6214599609375, 0.75830078125, 0.8951416015625, 1.031982421875, 1.1688232421875, 1.3056640625, 1.4425048828125, 1.579345703125, 1.7161865234375, 1.85302734375, 1.9898681640625, 2.126708984375, 2.2635498046875, 2.400390625, 2.5372314453125, 2.674072265625, 2.8109130859375, 2.94775390625, 3.0845947265625, 3.221435546875, 3.3582763671875, 3.4951171875, 3.6319580078125, 3.768798828125, 3.9056396484375, 4.04248046875, 4.1793212890625, 4.316162109375, 4.4530029296875, 4.58984375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 7.0, 6.0, 11.0, 14.0, 18.0, 22.0, 29.0, 37.0, 38.0, 47.0, 82.0, 70.0, 73.0, 79.0, 64.0, 75.0, 59.0, 68.0, 47.0, 47.0, 28.0, 26.0, 19.0, 12.0, 12.0, 4.0, 3.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0703125, -2.981353759765625, -2.89239501953125, -2.803436279296875, -2.7144775390625, -2.625518798828125, -2.53656005859375, -2.447601318359375, -2.358642578125, -2.269683837890625, -2.18072509765625, -2.091766357421875, -2.0028076171875, -1.913848876953125, -1.82489013671875, -1.735931396484375, -1.64697265625, -1.558013916015625, -1.46905517578125, -1.380096435546875, -1.2911376953125, -1.202178955078125, -1.11322021484375, -1.024261474609375, -0.935302734375, -0.846343994140625, -0.75738525390625, -0.668426513671875, -0.5794677734375, -0.490509033203125, -0.40155029296875, -0.312591552734375, -0.2236328125, -0.134674072265625, -0.04571533203125, 0.043243408203125, 0.1322021484375, 0.221160888671875, 0.31011962890625, 0.399078369140625, 0.488037109375, 0.576995849609375, 0.66595458984375, 0.754913330078125, 0.8438720703125, 0.932830810546875, 1.02178955078125, 1.110748291015625, 1.19970703125, 1.288665771484375, 1.37762451171875, 1.466583251953125, 1.5555419921875, 1.644500732421875, 1.73345947265625, 1.822418212890625, 1.911376953125, 2.000335693359375, 2.08929443359375, 2.178253173828125, 2.2672119140625, 2.356170654296875, 2.44512939453125, 2.534088134765625, 2.623046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 5.0, 1.0, 10.0, 22.0, 23.0, 33.0, 46.0, 85.0, 126.0, 199.0, 370.0, 622.0, 1183.0, 3302.0, 11621.0, 58330.0, 399641.0, 480843.0, 71510.0, 13706.0, 3759.0, 1464.0, 662.0, 369.0, 215.0, 139.0, 95.0, 51.0, 31.0, 24.0, 19.0, 17.0, 6.0, 5.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.06640625, -6.87042236328125, -6.6744384765625, -6.47845458984375, -6.282470703125, -6.08648681640625, -5.8905029296875, -5.69451904296875, -5.49853515625, -5.30255126953125, -5.1065673828125, -4.91058349609375, -4.714599609375, -4.51861572265625, -4.3226318359375, -4.12664794921875, -3.9306640625, -3.73468017578125, -3.5386962890625, -3.34271240234375, -3.146728515625, -2.95074462890625, -2.7547607421875, -2.55877685546875, -2.36279296875, -2.16680908203125, -1.9708251953125, -1.77484130859375, -1.578857421875, -1.38287353515625, -1.1868896484375, -0.99090576171875, -0.794921875, -0.59893798828125, -0.4029541015625, -0.20697021484375, -0.010986328125, 0.18499755859375, 0.3809814453125, 0.57696533203125, 0.77294921875, 0.96893310546875, 1.1649169921875, 1.36090087890625, 1.556884765625, 1.75286865234375, 1.9488525390625, 2.14483642578125, 2.3408203125, 2.53680419921875, 2.7327880859375, 2.92877197265625, 3.124755859375, 3.32073974609375, 3.5167236328125, 3.71270751953125, 3.90869140625, 4.10467529296875, 4.3006591796875, 4.49664306640625, 4.692626953125, 4.88861083984375, 5.0845947265625, 5.28057861328125, 5.4765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 9.0, 8.0, 10.0, 10.0, 15.0, 21.0, 30.0, 38.0, 23.0, 43.0, 41.0, 43.0, 56.0, 70.0, 46.0, 62.0, 69.0, 52.0, 54.0, 51.0, 45.0, 36.0, 36.0, 24.0, 17.0, 18.0, 11.0, 10.0, 15.0, 7.0, 7.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6875, -11.33447265625, -10.9814453125, -10.62841796875, -10.275390625, -9.92236328125, -9.5693359375, -9.21630859375, -8.86328125, -8.51025390625, -8.1572265625, -7.80419921875, -7.451171875, -7.09814453125, -6.7451171875, -6.39208984375, -6.0390625, -5.68603515625, -5.3330078125, -4.97998046875, -4.626953125, -4.27392578125, -3.9208984375, -3.56787109375, -3.21484375, -2.86181640625, -2.5087890625, -2.15576171875, -1.802734375, -1.44970703125, -1.0966796875, -0.74365234375, -0.390625, -0.03759765625, 0.3154296875, 0.66845703125, 1.021484375, 1.37451171875, 1.7275390625, 2.08056640625, 2.43359375, 2.78662109375, 3.1396484375, 3.49267578125, 3.845703125, 4.19873046875, 4.5517578125, 4.90478515625, 5.2578125, 5.61083984375, 5.9638671875, 6.31689453125, 6.669921875, 7.02294921875, 7.3759765625, 7.72900390625, 8.08203125, 8.43505859375, 8.7880859375, 9.14111328125, 9.494140625, 9.84716796875, 10.2001953125, 10.55322265625, 10.90625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 4.0, 12.0, 10.0, 14.0, 27.0, 38.0, 61.0, 103.0, 189.0, 441.0, 1338.0, 5703.0, 76162.0, 883987.0, 72918.0, 5403.0, 1227.0, 472.0, 191.0, 109.0, 51.0, 31.0, 24.0, 15.0, 12.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.265625, -6.0985107421875, -5.931396484375, -5.7642822265625, -5.59716796875, -5.4300537109375, -5.262939453125, -5.0958251953125, -4.9287109375, -4.7615966796875, -4.594482421875, -4.4273681640625, -4.26025390625, -4.0931396484375, -3.926025390625, -3.7589111328125, -3.591796875, -3.4246826171875, -3.257568359375, -3.0904541015625, -2.92333984375, -2.7562255859375, -2.589111328125, -2.4219970703125, -2.2548828125, -2.0877685546875, -1.920654296875, -1.7535400390625, -1.58642578125, -1.4193115234375, -1.252197265625, -1.0850830078125, -0.91796875, -0.7508544921875, -0.583740234375, -0.4166259765625, -0.24951171875, -0.0823974609375, 0.084716796875, 0.2518310546875, 0.4189453125, 0.5860595703125, 0.753173828125, 0.9202880859375, 1.08740234375, 1.2545166015625, 1.421630859375, 1.5887451171875, 1.755859375, 1.9229736328125, 2.090087890625, 2.2572021484375, 2.42431640625, 2.5914306640625, 2.758544921875, 2.9256591796875, 3.0927734375, 3.2598876953125, 3.427001953125, 3.5941162109375, 3.76123046875, 3.9283447265625, 4.095458984375, 4.2625732421875, 4.4296875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 4.0, 3.0, 5.0, 14.0, 12.0, 14.0, 16.0, 22.0, 22.0, 48.0, 55.0, 71.0, 73.0, 95.0, 88.0, 81.0, 77.0, 68.0, 59.0, 41.0, 34.0, 18.0, 19.0, 13.0, 20.0, 2.0, 6.0, 3.0, 3.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002999305725097656, -0.00029190070927143097, -0.0002838708460330963, -0.00027584098279476166, -0.000267811119556427, -0.00025978125631809235, -0.0002517513930797577, -0.00024372152984142303, -0.00023569166660308838, -0.00022766180336475372, -0.00021963194012641907, -0.0002116020768880844, -0.00020357221364974976, -0.0001955423504114151, -0.00018751248717308044, -0.0001794826239347458, -0.00017145276069641113, -0.00016342289745807648, -0.00015539303421974182, -0.00014736317098140717, -0.0001393333077430725, -0.00013130344450473785, -0.0001232735812664032, -0.00011524371802806854, -0.00010721385478973389, -9.918399155139923e-05, -9.115412831306458e-05, -8.312426507472992e-05, -7.509440183639526e-05, -6.706453859806061e-05, -5.903467535972595e-05, -5.1004812121391296e-05, -4.297494888305664e-05, -3.4945085644721985e-05, -2.691522240638733e-05, -1.8885359168052673e-05, -1.0855495929718018e-05, -2.825632691383362e-06, 5.204230546951294e-06, 1.323409378528595e-05, 2.1263957023620605e-05, 2.929382026195526e-05, 3.732368350028992e-05, 4.535354673862457e-05, 5.338340997695923e-05, 6.141327321529388e-05, 6.944313645362854e-05, 7.74729996919632e-05, 8.550286293029785e-05, 9.353272616863251e-05, 0.00010156258940696716, 0.00010959245264530182, 0.00011762231588363647, 0.00012565217912197113, 0.00013368204236030579, 0.00014171190559864044, 0.0001497417688369751, 0.00015777163207530975, 0.0001658014953136444, 0.00017383135855197906, 0.00018186122179031372, 0.00018989108502864838, 0.00019792094826698303, 0.0002059508115053177, 0.00021398067474365234]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 5.0, 6.0, 12.0, 10.0, 25.0, 34.0, 70.0, 93.0, 189.0, 371.0, 972.0, 3485.0, 24701.0, 563039.0, 430911.0, 19947.0, 3048.0, 848.0, 350.0, 202.0, 90.0, 43.0, 41.0, 19.0, 13.0, 9.0, 7.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.578125, -5.43115234375, -5.2841796875, -5.13720703125, -4.990234375, -4.84326171875, -4.6962890625, -4.54931640625, -4.40234375, -4.25537109375, -4.1083984375, -3.96142578125, -3.814453125, -3.66748046875, -3.5205078125, -3.37353515625, -3.2265625, -3.07958984375, -2.9326171875, -2.78564453125, -2.638671875, -2.49169921875, -2.3447265625, -2.19775390625, -2.05078125, -1.90380859375, -1.7568359375, -1.60986328125, -1.462890625, -1.31591796875, -1.1689453125, -1.02197265625, -0.875, -0.72802734375, -0.5810546875, -0.43408203125, -0.287109375, -0.14013671875, 0.0068359375, 0.15380859375, 0.30078125, 0.44775390625, 0.5947265625, 0.74169921875, 0.888671875, 1.03564453125, 1.1826171875, 1.32958984375, 1.4765625, 1.62353515625, 1.7705078125, 1.91748046875, 2.064453125, 2.21142578125, 2.3583984375, 2.50537109375, 2.65234375, 2.79931640625, 2.9462890625, 3.09326171875, 3.240234375, 3.38720703125, 3.5341796875, 3.68115234375, 3.828125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 1.0, 5.0, 5.0, 3.0, 8.0, 14.0, 19.0, 41.0, 38.0, 62.0, 56.0, 70.0, 74.0, 90.0, 93.0, 86.0, 67.0, 54.0, 47.0, 44.0, 22.0, 28.0, 11.0, 11.0, 11.0, 8.0, 4.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.263671875, -2.165313720703125, -2.06695556640625, -1.968597412109375, -1.8702392578125, -1.771881103515625, -1.67352294921875, -1.575164794921875, -1.476806640625, -1.378448486328125, -1.28009033203125, -1.181732177734375, -1.0833740234375, -0.985015869140625, -0.88665771484375, -0.788299560546875, -0.68994140625, -0.591583251953125, -0.49322509765625, -0.394866943359375, -0.2965087890625, -0.198150634765625, -0.09979248046875, -0.001434326171875, 0.096923828125, 0.195281982421875, 0.29364013671875, 0.391998291015625, 0.4903564453125, 0.588714599609375, 0.68707275390625, 0.785430908203125, 0.8837890625, 0.982147216796875, 1.08050537109375, 1.178863525390625, 1.2772216796875, 1.375579833984375, 1.47393798828125, 1.572296142578125, 1.670654296875, 1.769012451171875, 1.86737060546875, 1.965728759765625, 2.0640869140625, 2.162445068359375, 2.26080322265625, 2.359161376953125, 2.45751953125, 2.555877685546875, 2.65423583984375, 2.752593994140625, 2.8509521484375, 2.949310302734375, 3.04766845703125, 3.146026611328125, 3.244384765625, 3.342742919921875, 3.44110107421875, 3.539459228515625, 3.6378173828125, 3.736175537109375, 3.83453369140625, 3.932891845703125, 4.03125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 19.0, 80.0, 233.0, 345.0, 218.0, 81.0, 17.0, 7.0, 7.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.898380279541016, -39.17774200439453, -35.45710754394531, -31.73647117614746, -28.01583480834961, -24.295198440551758, -20.574562072753906, -16.853925704956055, -13.133289337158203, -9.412652969360352, -5.6920166015625, -1.9713802337646484, 1.7492561340332031, 5.469892501831055, 9.190528869628906, 12.911165237426758, 16.63180160522461, 20.35243797302246, 24.073074340820312, 27.793710708618164, 31.514347076416016, 35.2349853515625, 38.95561981201172, 42.67625427246094, 46.39689254760742, 50.117530822753906, 53.838165283203125, 57.558799743652344, 61.27943801879883, 65.00007629394531, 68.72071075439453, 72.44134521484375, 76.1619873046875, 79.88262176513672, 83.60325622558594, 87.32389831542969, 91.0445327758789, 94.76516723632812, 98.48580932617188, 102.2064437866211, 105.92707824707031, 109.64771270751953, 113.36834716796875, 117.0889892578125, 120.80962371826172, 124.53025817871094, 128.2509002685547, 131.97152709960938, 135.69216918945312, 139.41281127929688, 143.13343811035156, 146.8540802001953, 150.57470703125, 154.29534912109375, 158.0159912109375, 161.7366180419922, 165.45726013183594, 169.1779022216797, 172.89852905273438, 176.61917114257812, 180.33981323242188, 184.06044006347656, 187.7810821533203, 191.501708984375, 195.22235107421875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 4.0, 8.0, 12.0, 9.0, 20.0, 24.0, 19.0, 33.0, 25.0, 29.0, 37.0, 46.0, 49.0, 55.0, 52.0, 53.0, 44.0, 63.0, 45.0, 48.0, 40.0, 43.0, 42.0, 32.0, 35.0, 25.0, 17.0, 15.0, 10.0, 15.0, 7.0, 7.0, 7.0, 8.0, 2.0, 4.0, 5.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.49346923828125, -40.08780288696289, -38.68213653564453, -37.27647018432617, -35.87080383300781, -34.46514129638672, -33.05947494506836, -31.65380859375, -30.24814224243164, -28.84247589111328, -27.436809539794922, -26.031145095825195, -24.625478744506836, -23.219812393188477, -21.81414794921875, -20.40848159790039, -19.00281524658203, -17.597148895263672, -16.191482543945312, -14.785818099975586, -13.380151748657227, -11.974485397338867, -10.568819999694824, -9.163154602050781, -7.757488250732422, -6.351822376251221, -4.9461565017700195, -3.5404906272888184, -2.134824752807617, -0.729158878326416, 0.6765069961547852, 2.082172393798828, 3.487834930419922, 4.893500804901123, 6.299166679382324, 7.704832553863525, 9.110498428344727, 10.516164779663086, 11.921830177307129, 13.327495574951172, 14.733161926269531, 16.13882827758789, 17.54449462890625, 18.950159072875977, 20.355825424194336, 21.761491775512695, 23.167156219482422, 24.57282257080078, 25.97848892211914, 27.3841552734375, 28.78982162475586, 30.195486068725586, 31.601152420043945, 33.00681686401367, 34.41248321533203, 35.81814956665039, 37.22381591796875, 38.62948226928711, 40.03514862060547, 41.44081497192383, 42.84648132324219, 44.25214385986328, 45.65781021118164, 47.0634765625, 48.46914291381836]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 8.0, 14.0, 13.0, 34.0, 33.0, 69.0, 83.0, 138.0, 269.0, 424.0, 946.0, 2228.0, 5833.0, 22570.0, 248599.0, 3865696.0, 34547.0, 7730.0, 2686.0, 1163.0, 524.0, 281.0, 150.0, 84.0, 52.0, 37.0, 21.0, 14.0, 8.0, 6.0, 1.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.1796875, -6.017578125, -5.85546875, -5.693359375, -5.53125, -5.369140625, -5.20703125, -5.044921875, -4.8828125, -4.720703125, -4.55859375, -4.396484375, -4.234375, -4.072265625, -3.91015625, -3.748046875, -3.5859375, -3.423828125, -3.26171875, -3.099609375, -2.9375, -2.775390625, -2.61328125, -2.451171875, -2.2890625, -2.126953125, -1.96484375, -1.802734375, -1.640625, -1.478515625, -1.31640625, -1.154296875, -0.9921875, -0.830078125, -0.66796875, -0.505859375, -0.34375, -0.181640625, -0.01953125, 0.142578125, 0.3046875, 0.466796875, 0.62890625, 0.791015625, 0.953125, 1.115234375, 1.27734375, 1.439453125, 1.6015625, 1.763671875, 1.92578125, 2.087890625, 2.25, 2.412109375, 2.57421875, 2.736328125, 2.8984375, 3.060546875, 3.22265625, 3.384765625, 3.546875, 3.708984375, 3.87109375, 4.033203125, 4.1953125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 8.0, 6.0, 15.0, 9.0, 20.0, 28.0, 39.0, 46.0, 37.0, 56.0, 66.0, 67.0, 89.0, 60.0, 68.0, 83.0, 53.0, 53.0, 52.0, 22.0, 30.0, 17.0, 25.0, 12.0, 14.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.783203125, -2.69952392578125, -2.6158447265625, -2.53216552734375, -2.448486328125, -2.36480712890625, -2.2811279296875, -2.19744873046875, -2.11376953125, -2.03009033203125, -1.9464111328125, -1.86273193359375, -1.779052734375, -1.69537353515625, -1.6116943359375, -1.52801513671875, -1.4443359375, -1.36065673828125, -1.2769775390625, -1.19329833984375, -1.109619140625, -1.02593994140625, -0.9422607421875, -0.85858154296875, -0.77490234375, -0.69122314453125, -0.6075439453125, -0.52386474609375, -0.440185546875, -0.35650634765625, -0.2728271484375, -0.18914794921875, -0.10546875, -0.02178955078125, 0.0618896484375, 0.14556884765625, 0.229248046875, 0.31292724609375, 0.3966064453125, 0.48028564453125, 0.56396484375, 0.64764404296875, 0.7313232421875, 0.81500244140625, 0.898681640625, 0.98236083984375, 1.0660400390625, 1.14971923828125, 1.2333984375, 1.31707763671875, 1.4007568359375, 1.48443603515625, 1.568115234375, 1.65179443359375, 1.7354736328125, 1.81915283203125, 1.90283203125, 1.98651123046875, 2.0701904296875, 2.15386962890625, 2.237548828125, 2.32122802734375, 2.4049072265625, 2.48858642578125, 2.572265625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 6.0, 8.0, 19.0, 18.0, 32.0, 44.0, 63.0, 88.0, 145.0, 200.0, 260.0, 445.0, 735.0, 1288.0, 2183.0, 4433.0, 9860.0, 26330.0, 101420.0, 3712562.0, 260587.0, 45779.0, 14723.0, 6025.0, 2899.0, 1527.0, 923.0, 538.0, 348.0, 213.0, 194.0, 102.0, 85.0, 63.0, 38.0, 25.0, 20.0, 13.0, 12.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.470703125, -2.378265380859375, -2.28582763671875, -2.193389892578125, -2.1009521484375, -2.008514404296875, -1.91607666015625, -1.823638916015625, -1.731201171875, -1.638763427734375, -1.54632568359375, -1.453887939453125, -1.3614501953125, -1.269012451171875, -1.17657470703125, -1.084136962890625, -0.99169921875, -0.899261474609375, -0.80682373046875, -0.714385986328125, -0.6219482421875, -0.529510498046875, -0.43707275390625, -0.344635009765625, -0.252197265625, -0.159759521484375, -0.06732177734375, 0.025115966796875, 0.1175537109375, 0.209991455078125, 0.30242919921875, 0.394866943359375, 0.4873046875, 0.579742431640625, 0.67218017578125, 0.764617919921875, 0.8570556640625, 0.949493408203125, 1.04193115234375, 1.134368896484375, 1.226806640625, 1.319244384765625, 1.41168212890625, 1.504119873046875, 1.5965576171875, 1.688995361328125, 1.78143310546875, 1.873870849609375, 1.96630859375, 2.058746337890625, 2.15118408203125, 2.243621826171875, 2.3360595703125, 2.428497314453125, 2.52093505859375, 2.613372802734375, 2.705810546875, 2.798248291015625, 2.89068603515625, 2.983123779296875, 3.0755615234375, 3.167999267578125, 3.26043701171875, 3.352874755859375, 3.4453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 11.0, 10.0, 10.0, 14.0, 20.0, 31.0, 50.0, 89.0, 210.0, 2997.0, 353.0, 99.0, 73.0, 39.0, 26.0, 10.0, 11.0, 5.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.837890625, -0.8065643310546875, -0.775238037109375, -0.7439117431640625, -0.71258544921875, -0.6812591552734375, -0.649932861328125, -0.6186065673828125, -0.5872802734375, -0.5559539794921875, -0.524627685546875, -0.4933013916015625, -0.46197509765625, -0.4306488037109375, -0.399322509765625, -0.3679962158203125, -0.336669921875, -0.3053436279296875, -0.274017333984375, -0.2426910400390625, -0.21136474609375, -0.1800384521484375, -0.148712158203125, -0.1173858642578125, -0.0860595703125, -0.0547332763671875, -0.023406982421875, 0.0079193115234375, 0.03924560546875, 0.0705718994140625, 0.101898193359375, 0.1332244873046875, 0.16455078125, 0.1958770751953125, 0.227203369140625, 0.2585296630859375, 0.28985595703125, 0.3211822509765625, 0.352508544921875, 0.3838348388671875, 0.4151611328125, 0.4464874267578125, 0.477813720703125, 0.5091400146484375, 0.54046630859375, 0.5717926025390625, 0.603118896484375, 0.6344451904296875, 0.665771484375, 0.6970977783203125, 0.728424072265625, 0.7597503662109375, 0.79107666015625, 0.8224029541015625, 0.853729248046875, 0.8850555419921875, 0.9163818359375, 0.9477081298828125, 0.979034423828125, 1.0103607177734375, 1.04168701171875, 1.0730133056640625, 1.104339599609375, 1.1356658935546875, 1.1669921875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 4.0, 20.0, 20.0, 45.0, 64.0, 104.0, 107.0, 143.0, 150.0, 127.0, 91.0, 53.0, 33.0, 15.0, 12.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.966259956359863, -6.81903076171875, -6.671801567077637, -6.524571895599365, -6.377342700958252, -6.230113506317139, -6.082884311676025, -5.935655117034912, -5.788425445556641, -5.641196250915527, -5.493967056274414, -5.346737384796143, -5.199508190155029, -5.052278995513916, -4.905049800872803, -4.7578206062316895, -4.610591411590576, -4.463362216949463, -4.31613302230835, -4.168903350830078, -4.021674156188965, -3.8744449615478516, -3.7272157669067383, -3.579986572265625, -3.4327571392059326, -3.2855279445648193, -3.138298511505127, -2.9910693168640137, -2.8438401222229004, -2.696610689163208, -2.5493814945220947, -2.4021520614624023, -2.254922389984131, -2.1076931953430176, -1.9604637622833252, -1.813234567642212, -1.666005253791809, -1.5187759399414062, -1.371546745300293, -1.2243174314498901, -1.0770881175994873, -0.9298588037490845, -0.7826295495033264, -0.6354002952575684, -0.4881709814071655, -0.3409416675567627, -0.19371241331100464, -0.04648315906524658, 0.10074615478515625, 0.2479754388332367, 0.39520472288131714, 0.5424339771270752, 0.689663290977478, 0.8368926048278809, 0.9841218590736389, 1.131351113319397, 1.2785804271697998, 1.4258097410202026, 1.5730390548706055, 1.7202682495117188, 1.8674975633621216, 2.0147268772125244, 2.1619560718536377, 2.30918550491333, 2.4564146995544434]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 6.0, 8.0, 5.0, 5.0, 10.0, 10.0, 10.0, 12.0, 13.0, 19.0, 30.0, 16.0, 30.0, 32.0, 25.0, 42.0, 27.0, 28.0, 44.0, 52.0, 36.0, 40.0, 46.0, 48.0, 50.0, 44.0, 33.0, 38.0, 32.0, 33.0, 29.0, 29.0, 25.0, 22.0, 17.0, 12.0, 11.0, 6.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8987207412719727, -1.8339781761169434, -1.769235610961914, -1.7044931650161743, -1.639750599861145, -1.5750080347061157, -1.510265588760376, -1.4455230236053467, -1.3807804584503174, -1.316037893295288, -1.2512953281402588, -1.186552882194519, -1.1218103170394897, -1.0570677518844604, -0.9923252463340759, -0.9275827407836914, -0.8628401756286621, -0.7980976104736328, -0.7333551049232483, -0.6686125993728638, -0.6038700342178345, -0.5391274690628052, -0.47438496351242065, -0.40964242815971375, -0.34489989280700684, -0.2801573574542999, -0.21541482210159302, -0.1506722867488861, -0.0859297513961792, -0.02118721604347229, 0.04355531930923462, 0.10829785466194153, 0.17304039001464844, 0.23778292536735535, 0.30252546072006226, 0.36726799607276917, 0.4320105314254761, 0.496753066778183, 0.5614956021308899, 0.6262381076812744, 0.6909806728363037, 0.755723237991333, 0.8204657435417175, 0.885208249092102, 0.9499508142471313, 1.0146933794021606, 1.0794358253479004, 1.1441783905029297, 1.208920955657959, 1.2736635208129883, 1.3384060859680176, 1.4031485319137573, 1.4678910970687866, 1.532633662223816, 1.5973761081695557, 1.662118673324585, 1.7268612384796143, 1.7916038036346436, 1.8563463687896729, 1.9210888147354126, 1.985831379890442, 2.0505738258361816, 2.115316390991211, 2.1800589561462402, 2.2448015213012695]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 12.0, 17.0, 30.0, 46.0, 49.0, 82.0, 119.0, 167.0, 305.0, 441.0, 660.0, 1156.0, 2053.0, 3976.0, 7838.0, 17553.0, 40572.0, 105662.0, 256040.0, 329053.0, 167509.0, 65048.0, 26196.0, 11720.0, 5330.0, 2890.0, 1488.0, 904.0, 532.0, 358.0, 237.0, 130.0, 99.0, 67.0, 58.0, 24.0, 27.0, 25.0, 17.0, 11.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.560546875, -2.48114013671875, -2.4017333984375, -2.32232666015625, -2.242919921875, -2.16351318359375, -2.0841064453125, -2.00469970703125, -1.92529296875, -1.84588623046875, -1.7664794921875, -1.68707275390625, -1.607666015625, -1.52825927734375, -1.4488525390625, -1.36944580078125, -1.2900390625, -1.21063232421875, -1.1312255859375, -1.05181884765625, -0.972412109375, -0.89300537109375, -0.8135986328125, -0.73419189453125, -0.65478515625, -0.57537841796875, -0.4959716796875, -0.41656494140625, -0.337158203125, -0.25775146484375, -0.1783447265625, -0.09893798828125, -0.01953125, 0.05987548828125, 0.1392822265625, 0.21868896484375, 0.298095703125, 0.37750244140625, 0.4569091796875, 0.53631591796875, 0.61572265625, 0.69512939453125, 0.7745361328125, 0.85394287109375, 0.933349609375, 1.01275634765625, 1.0921630859375, 1.17156982421875, 1.2509765625, 1.33038330078125, 1.4097900390625, 1.48919677734375, 1.568603515625, 1.64801025390625, 1.7274169921875, 1.80682373046875, 1.88623046875, 1.96563720703125, 2.0450439453125, 2.12445068359375, 2.203857421875, 2.28326416015625, 2.3626708984375, 2.44207763671875, 2.521484375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 9.0, 13.0, 17.0, 26.0, 19.0, 41.0, 41.0, 34.0, 49.0, 69.0, 76.0, 58.0, 80.0, 73.0, 77.0, 70.0, 56.0, 42.0, 38.0, 28.0, 21.0, 17.0, 12.0, 10.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.998046875, -2.910797119140625, -2.82354736328125, -2.736297607421875, -2.6490478515625, -2.561798095703125, -2.47454833984375, -2.387298583984375, -2.300048828125, -2.212799072265625, -2.12554931640625, -2.038299560546875, -1.9510498046875, -1.863800048828125, -1.77655029296875, -1.689300537109375, -1.60205078125, -1.514801025390625, -1.42755126953125, -1.340301513671875, -1.2530517578125, -1.165802001953125, -1.07855224609375, -0.991302490234375, -0.904052734375, -0.816802978515625, -0.72955322265625, -0.642303466796875, -0.5550537109375, -0.467803955078125, -0.38055419921875, -0.293304443359375, -0.2060546875, -0.118804931640625, -0.03155517578125, 0.055694580078125, 0.1429443359375, 0.230194091796875, 0.31744384765625, 0.404693603515625, 0.491943359375, 0.579193115234375, 0.66644287109375, 0.753692626953125, 0.8409423828125, 0.928192138671875, 1.01544189453125, 1.102691650390625, 1.18994140625, 1.277191162109375, 1.36444091796875, 1.451690673828125, 1.5389404296875, 1.626190185546875, 1.71343994140625, 1.800689697265625, 1.887939453125, 1.975189208984375, 2.06243896484375, 2.149688720703125, 2.2369384765625, 2.324188232421875, 2.41143798828125, 2.498687744140625, 2.5859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 7.0, 3.0, 6.0, 8.0, 2.0, 14.0, 14.0, 22.0, 40.0, 52.0, 80.0, 138.0, 172.0, 267.0, 421.0, 722.0, 1708.0, 5186.0, 22386.0, 144453.0, 649234.0, 186272.0, 27480.0, 5894.0, 1883.0, 779.0, 449.0, 285.0, 171.0, 104.0, 84.0, 63.0, 36.0, 27.0, 24.0, 18.0, 10.0, 7.0, 11.0, 7.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.62109375, -5.4429931640625, -5.264892578125, -5.0867919921875, -4.90869140625, -4.7305908203125, -4.552490234375, -4.3743896484375, -4.1962890625, -4.0181884765625, -3.840087890625, -3.6619873046875, -3.48388671875, -3.3057861328125, -3.127685546875, -2.9495849609375, -2.771484375, -2.5933837890625, -2.415283203125, -2.2371826171875, -2.05908203125, -1.8809814453125, -1.702880859375, -1.5247802734375, -1.3466796875, -1.1685791015625, -0.990478515625, -0.8123779296875, -0.63427734375, -0.4561767578125, -0.278076171875, -0.0999755859375, 0.078125, 0.2562255859375, 0.434326171875, 0.6124267578125, 0.79052734375, 0.9686279296875, 1.146728515625, 1.3248291015625, 1.5029296875, 1.6810302734375, 1.859130859375, 2.0372314453125, 2.21533203125, 2.3934326171875, 2.571533203125, 2.7496337890625, 2.927734375, 3.1058349609375, 3.283935546875, 3.4620361328125, 3.64013671875, 3.8182373046875, 3.996337890625, 4.1744384765625, 4.3525390625, 4.5306396484375, 4.708740234375, 4.8868408203125, 5.06494140625, 5.2430419921875, 5.421142578125, 5.5992431640625, 5.77734375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 7.0, 4.0, 8.0, 10.0, 13.0, 17.0, 26.0, 15.0, 32.0, 32.0, 32.0, 33.0, 31.0, 34.0, 33.0, 27.0, 40.0, 37.0, 41.0, 38.0, 56.0, 40.0, 40.0, 41.0, 45.0, 40.0, 37.0, 30.0, 22.0, 21.0, 13.0, 15.0, 21.0, 11.0, 9.0, 12.0, 8.0, 9.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.276123046875, -8.99755859375, -8.718994140625, -8.4404296875, -8.161865234375, -7.88330078125, -7.604736328125, -7.326171875, -7.047607421875, -6.76904296875, -6.490478515625, -6.2119140625, -5.933349609375, -5.65478515625, -5.376220703125, -5.09765625, -4.819091796875, -4.54052734375, -4.261962890625, -3.9833984375, -3.704833984375, -3.42626953125, -3.147705078125, -2.869140625, -2.590576171875, -2.31201171875, -2.033447265625, -1.7548828125, -1.476318359375, -1.19775390625, -0.919189453125, -0.640625, -0.362060546875, -0.08349609375, 0.195068359375, 0.4736328125, 0.752197265625, 1.03076171875, 1.309326171875, 1.587890625, 1.866455078125, 2.14501953125, 2.423583984375, 2.7021484375, 2.980712890625, 3.25927734375, 3.537841796875, 3.81640625, 4.094970703125, 4.37353515625, 4.652099609375, 4.9306640625, 5.209228515625, 5.48779296875, 5.766357421875, 6.044921875, 6.323486328125, 6.60205078125, 6.880615234375, 7.1591796875, 7.437744140625, 7.71630859375, 7.994873046875, 8.2734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 14.0, 17.0, 80.0, 257.0, 2030.0, 767504.0, 276637.0, 1626.0, 235.0, 79.0, 26.0, 11.0, 10.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.796875, -15.302490234375, -14.80810546875, -14.313720703125, -13.8193359375, -13.324951171875, -12.83056640625, -12.336181640625, -11.841796875, -11.347412109375, -10.85302734375, -10.358642578125, -9.8642578125, -9.369873046875, -8.87548828125, -8.381103515625, -7.88671875, -7.392333984375, -6.89794921875, -6.403564453125, -5.9091796875, -5.414794921875, -4.92041015625, -4.426025390625, -3.931640625, -3.437255859375, -2.94287109375, -2.448486328125, -1.9541015625, -1.459716796875, -0.96533203125, -0.470947265625, 0.0234375, 0.517822265625, 1.01220703125, 1.506591796875, 2.0009765625, 2.495361328125, 2.98974609375, 3.484130859375, 3.978515625, 4.472900390625, 4.96728515625, 5.461669921875, 5.9560546875, 6.450439453125, 6.94482421875, 7.439208984375, 7.93359375, 8.427978515625, 8.92236328125, 9.416748046875, 9.9111328125, 10.405517578125, 10.89990234375, 11.394287109375, 11.888671875, 12.383056640625, 12.87744140625, 13.371826171875, 13.8662109375, 14.360595703125, 14.85498046875, 15.349365234375, 15.84375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 11.0, 15.0, 11.0, 17.0, 25.0, 35.0, 44.0, 65.0, 79.0, 105.0, 97.0, 114.0, 78.0, 74.0, 69.0, 39.0, 35.0, 21.0, 23.0, 9.0, 5.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00029850006103515625, -0.0002905651926994324, -0.0002826303243637085, -0.0002746954560279846, -0.00026676058769226074, -0.00025882571935653687, -0.000250890851020813, -0.0002429559826850891, -0.00023502111434936523, -0.00022708624601364136, -0.00021915137767791748, -0.0002112165093421936, -0.00020328164100646973, -0.00019534677267074585, -0.00018741190433502197, -0.0001794770359992981, -0.00017154216766357422, -0.00016360729932785034, -0.00015567243099212646, -0.0001477375626564026, -0.0001398026943206787, -0.00013186782598495483, -0.00012393295764923096, -0.00011599808931350708, -0.0001080632209777832, -0.00010012835264205933, -9.219348430633545e-05, -8.425861597061157e-05, -7.63237476348877e-05, -6.838887929916382e-05, -6.045401096343994e-05, -5.2519142627716064e-05, -4.458427429199219e-05, -3.664940595626831e-05, -2.8714537620544434e-05, -2.0779669284820557e-05, -1.284480094909668e-05, -4.909932613372803e-06, 3.0249357223510742e-06, 1.0959804058074951e-05, 1.8894672393798828e-05, 2.6829540729522705e-05, 3.476440906524658e-05, 4.269927740097046e-05, 5.0634145736694336e-05, 5.856901407241821e-05, 6.650388240814209e-05, 7.443875074386597e-05, 8.237361907958984e-05, 9.030848741531372e-05, 9.82433557510376e-05, 0.00010617822408676147, 0.00011411309242248535, 0.00012204796075820923, 0.0001299828290939331, 0.00013791769742965698, 0.00014585256576538086, 0.00015378743410110474, 0.0001617223024368286, 0.0001696571707725525, 0.00017759203910827637, 0.00018552690744400024, 0.00019346177577972412, 0.000201396644115448, 0.00020933151245117188]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 9.0, 19.0, 26.0, 49.0, 116.0, 222.0, 668.0, 2464.0, 22208.0, 891903.0, 123600.0, 5478.0, 1092.0, 349.0, 141.0, 72.0, 41.0, 27.0, 15.0, 11.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.171875, -4.98529052734375, -4.7987060546875, -4.61212158203125, -4.425537109375, -4.23895263671875, -4.0523681640625, -3.86578369140625, -3.67919921875, -3.49261474609375, -3.3060302734375, -3.11944580078125, -2.932861328125, -2.74627685546875, -2.5596923828125, -2.37310791015625, -2.1865234375, -1.99993896484375, -1.8133544921875, -1.62677001953125, -1.440185546875, -1.25360107421875, -1.0670166015625, -0.88043212890625, -0.69384765625, -0.50726318359375, -0.3206787109375, -0.13409423828125, 0.052490234375, 0.23907470703125, 0.4256591796875, 0.61224365234375, 0.798828125, 0.98541259765625, 1.1719970703125, 1.35858154296875, 1.545166015625, 1.73175048828125, 1.9183349609375, 2.10491943359375, 2.29150390625, 2.47808837890625, 2.6646728515625, 2.85125732421875, 3.037841796875, 3.22442626953125, 3.4110107421875, 3.59759521484375, 3.7841796875, 3.97076416015625, 4.1573486328125, 4.34393310546875, 4.530517578125, 4.71710205078125, 4.9036865234375, 5.09027099609375, 5.27685546875, 5.46343994140625, 5.6500244140625, 5.83660888671875, 6.023193359375, 6.20977783203125, 6.3963623046875, 6.58294677734375, 6.76953125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 8.0, 8.0, 10.0, 24.0, 45.0, 56.0, 104.0, 135.0, 168.0, 161.0, 118.0, 65.0, 40.0, 18.0, 19.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.49609375, -4.3128662109375, -4.129638671875, -3.9464111328125, -3.76318359375, -3.5799560546875, -3.396728515625, -3.2135009765625, -3.0302734375, -2.8470458984375, -2.663818359375, -2.4805908203125, -2.29736328125, -2.1141357421875, -1.930908203125, -1.7476806640625, -1.564453125, -1.3812255859375, -1.197998046875, -1.0147705078125, -0.83154296875, -0.6483154296875, -0.465087890625, -0.2818603515625, -0.0986328125, 0.0845947265625, 0.267822265625, 0.4510498046875, 0.63427734375, 0.8175048828125, 1.000732421875, 1.1839599609375, 1.3671875, 1.5504150390625, 1.733642578125, 1.9168701171875, 2.10009765625, 2.2833251953125, 2.466552734375, 2.6497802734375, 2.8330078125, 3.0162353515625, 3.199462890625, 3.3826904296875, 3.56591796875, 3.7491455078125, 3.932373046875, 4.1156005859375, 4.298828125, 4.4820556640625, 4.665283203125, 4.8485107421875, 5.03173828125, 5.2149658203125, 5.398193359375, 5.5814208984375, 5.7646484375, 5.9478759765625, 6.131103515625, 6.3143310546875, 6.49755859375, 6.6807861328125, 6.864013671875, 7.0472412109375, 7.23046875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 19.0, 69.0, 318.0, 452.0, 132.0, 16.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.0213623046875, -130.04624938964844, -125.07113647460938, -120.09602355957031, -115.12091064453125, -110.14579772949219, -105.17068481445312, -100.19557189941406, -95.220458984375, -90.24534606933594, -85.27023315429688, -80.29512023925781, -75.32000732421875, -70.34489440917969, -65.36978149414062, -60.39467239379883, -55.41956329345703, -50.44445037841797, -45.469337463378906, -40.494224548339844, -35.51911163330078, -30.54400062561035, -25.568889617919922, -20.59377670288086, -15.618663787841797, -10.643550872802734, -5.668438911437988, -0.6933269500732422, 4.28178596496582, 9.256898880004883, 14.232009887695312, 19.207122802734375, 24.182235717773438, 29.1573486328125, 34.13246154785156, 39.107574462890625, 44.08268737792969, 49.05780029296875, 54.03290939331055, 59.00802230834961, 63.98313522338867, 68.95824432373047, 73.93335723876953, 78.9084701538086, 83.88358306884766, 88.85869598388672, 93.83380889892578, 98.80892181396484, 103.7840347290039, 108.75914764404297, 113.73426055908203, 118.7093734741211, 123.68448638916016, 128.6595916748047, 133.63470458984375, 138.6098175048828, 143.58493041992188, 148.56004333496094, 153.53515625, 158.51026916503906, 163.48538208007812, 168.4604949951172, 173.43560791015625, 178.4107208251953, 183.38583374023438]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 9.0, 9.0, 6.0, 5.0, 6.0, 11.0, 13.0, 8.0, 19.0, 26.0, 22.0, 39.0, 22.0, 53.0, 42.0, 53.0, 50.0, 48.0, 59.0, 50.0, 54.0, 57.0, 45.0, 48.0, 47.0, 32.0, 31.0, 27.0, 26.0, 18.0, 8.0, 21.0, 11.0, 7.0, 5.0, 3.0, 2.0, 6.0, 6.0, 3.0, 0.0, 2.0, 3.0], "bins": [-60.720924377441406, -59.19747543334961, -57.67402267456055, -56.15057373046875, -54.62712478637695, -53.10367202758789, -51.580223083496094, -50.05677032470703, -48.533321380615234, -47.00987243652344, -45.486419677734375, -43.96297073364258, -42.43952178955078, -40.91606903076172, -39.39262008666992, -37.869171142578125, -36.34571838378906, -34.822269439697266, -33.2988166809082, -31.775367736816406, -30.251916885375977, -28.728466033935547, -27.20501708984375, -25.68156623840332, -24.158119201660156, -22.634668350219727, -21.11121940612793, -19.5877685546875, -18.06431770324707, -16.54086685180664, -15.017417907714844, -13.493967056274414, -11.970516204833984, -10.447066307067871, -8.923615455627441, -7.400165557861328, -5.876715183258057, -4.353264808654785, -2.829814910888672, -1.3063640594482422, 0.2170858383178711, 1.740536093711853, 3.263986349105835, 4.787436485290527, 6.310886859893799, 7.83433723449707, 9.357787132263184, 10.881237983703613, 12.404687881469727, 13.92813777923584, 15.45158863067627, 16.975038528442383, 18.498489379882812, 20.02193832397461, 21.54538917541504, 23.06884002685547, 24.592288970947266, 26.115739822387695, 27.639188766479492, 29.162639617919922, 30.68609046936035, 32.20954132080078, 33.73299026489258, 35.256439208984375, 36.77989196777344]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 6.0, 4.0, 11.0, 13.0, 30.0, 35.0, 36.0, 95.0, 155.0, 340.0, 749.0, 2193.0, 8290.0, 69649.0, 4038182.0, 63560.0, 7621.0, 2013.0, 715.0, 296.0, 125.0, 67.0, 29.0, 20.0, 16.0, 13.0, 7.0, 2.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.58203125, -6.37939453125, -6.1767578125, -5.97412109375, -5.771484375, -5.56884765625, -5.3662109375, -5.16357421875, -4.9609375, -4.75830078125, -4.5556640625, -4.35302734375, -4.150390625, -3.94775390625, -3.7451171875, -3.54248046875, -3.33984375, -3.13720703125, -2.9345703125, -2.73193359375, -2.529296875, -2.32666015625, -2.1240234375, -1.92138671875, -1.71875, -1.51611328125, -1.3134765625, -1.11083984375, -0.908203125, -0.70556640625, -0.5029296875, -0.30029296875, -0.09765625, 0.10498046875, 0.3076171875, 0.51025390625, 0.712890625, 0.91552734375, 1.1181640625, 1.32080078125, 1.5234375, 1.72607421875, 1.9287109375, 2.13134765625, 2.333984375, 2.53662109375, 2.7392578125, 2.94189453125, 3.14453125, 3.34716796875, 3.5498046875, 3.75244140625, 3.955078125, 4.15771484375, 4.3603515625, 4.56298828125, 4.765625, 4.96826171875, 5.1708984375, 5.37353515625, 5.576171875, 5.77880859375, 5.9814453125, 6.18408203125, 6.38671875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 11.0, 14.0, 20.0, 34.0, 51.0, 94.0, 89.0, 141.0, 121.0, 109.0, 120.0, 72.0, 48.0, 25.0, 18.0, 14.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.17578125, -6.035858154296875, -5.89593505859375, -5.756011962890625, -5.6160888671875, -5.476165771484375, -5.33624267578125, -5.196319580078125, -5.056396484375, -4.916473388671875, -4.77655029296875, -4.636627197265625, -4.4967041015625, -4.356781005859375, -4.21685791015625, -4.076934814453125, -3.93701171875, -3.797088623046875, -3.65716552734375, -3.517242431640625, -3.3773193359375, -3.237396240234375, -3.09747314453125, -2.957550048828125, -2.817626953125, -2.677703857421875, -2.53778076171875, -2.397857666015625, -2.2579345703125, -2.118011474609375, -1.97808837890625, -1.838165283203125, -1.6982421875, -1.558319091796875, -1.41839599609375, -1.278472900390625, -1.1385498046875, -0.998626708984375, -0.85870361328125, -0.718780517578125, -0.578857421875, -0.438934326171875, -0.29901123046875, -0.159088134765625, -0.0191650390625, 0.120758056640625, 0.26068115234375, 0.400604248046875, 0.54052734375, 0.680450439453125, 0.82037353515625, 0.960296630859375, 1.1002197265625, 1.240142822265625, 1.38006591796875, 1.519989013671875, 1.659912109375, 1.799835205078125, 1.93975830078125, 2.079681396484375, 2.2196044921875, 2.359527587890625, 2.49945068359375, 2.639373779296875, 2.779296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 4.0, 15.0, 15.0, 22.0, 21.0, 31.0, 31.0, 31.0, 46.0, 60.0, 111.0, 150.0, 376.0, 1299.0, 7069.0, 299632.0, 3869320.0, 13045.0, 1861.0, 493.0, 174.0, 124.0, 86.0, 39.0, 44.0, 34.0, 27.0, 26.0, 17.0, 19.0, 10.0, 12.0, 11.0, 3.0, 4.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.03125, -9.6982421875, -9.365234375, -9.0322265625, -8.69921875, -8.3662109375, -8.033203125, -7.7001953125, -7.3671875, -7.0341796875, -6.701171875, -6.3681640625, -6.03515625, -5.7021484375, -5.369140625, -5.0361328125, -4.703125, -4.3701171875, -4.037109375, -3.7041015625, -3.37109375, -3.0380859375, -2.705078125, -2.3720703125, -2.0390625, -1.7060546875, -1.373046875, -1.0400390625, -0.70703125, -0.3740234375, -0.041015625, 0.2919921875, 0.625, 0.9580078125, 1.291015625, 1.6240234375, 1.95703125, 2.2900390625, 2.623046875, 2.9560546875, 3.2890625, 3.6220703125, 3.955078125, 4.2880859375, 4.62109375, 4.9541015625, 5.287109375, 5.6201171875, 5.953125, 6.2861328125, 6.619140625, 6.9521484375, 7.28515625, 7.6181640625, 7.951171875, 8.2841796875, 8.6171875, 8.9501953125, 9.283203125, 9.6162109375, 9.94921875, 10.2822265625, 10.615234375, 10.9482421875, 11.28125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 5.0, 6.0, 14.0, 58.0, 299.0, 3342.0, 282.0, 52.0, 12.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.654296875, -1.480255126953125, -1.30621337890625, -1.132171630859375, -0.9581298828125, -0.784088134765625, -0.61004638671875, -0.436004638671875, -0.261962890625, -0.087921142578125, 0.08612060546875, 0.260162353515625, 0.4342041015625, 0.608245849609375, 0.78228759765625, 0.956329345703125, 1.13037109375, 1.304412841796875, 1.47845458984375, 1.652496337890625, 1.8265380859375, 2.000579833984375, 2.17462158203125, 2.348663330078125, 2.522705078125, 2.696746826171875, 2.87078857421875, 3.044830322265625, 3.2188720703125, 3.392913818359375, 3.56695556640625, 3.740997314453125, 3.9150390625, 4.089080810546875, 4.26312255859375, 4.437164306640625, 4.6112060546875, 4.785247802734375, 4.95928955078125, 5.133331298828125, 5.307373046875, 5.481414794921875, 5.65545654296875, 5.829498291015625, 6.0035400390625, 6.177581787109375, 6.35162353515625, 6.525665283203125, 6.69970703125, 6.873748779296875, 7.04779052734375, 7.221832275390625, 7.3958740234375, 7.569915771484375, 7.74395751953125, 7.917999267578125, 8.092041015625, 8.266082763671875, 8.44012451171875, 8.614166259765625, 8.7882080078125, 8.962249755859375, 9.13629150390625, 9.310333251953125, 9.484375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 6.0, 6.0, 22.0, 78.0, 223.0, 371.0, 205.0, 69.0, 19.0, 10.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.54205322265625, -12.776350021362305, -12.010647773742676, -11.24494457244873, -10.479242324829102, -9.713539123535156, -8.947835922241211, -8.182132720947266, -7.416430473327637, -6.65072774887085, -5.8850250244140625, -5.119321823120117, -4.35361909866333, -3.587916374206543, -2.8222131729125977, -2.0565104484558105, -1.2908077239990234, -0.5251048803329468, 0.24059796333312988, 1.006300926208496, 1.7720036506652832, 2.5377063751220703, 3.3034095764160156, 4.069112300872803, 4.83481502532959, 5.600517749786377, 6.366220474243164, 7.131923675537109, 7.8976263999938965, 8.663329124450684, 9.429032325744629, 10.194734573364258, 10.960437774658203, 11.726140975952148, 12.491843223571777, 13.257546424865723, 14.023248672485352, 14.788951873779297, 15.554655075073242, 16.320358276367188, 17.0860595703125, 17.851762771606445, 18.61746597290039, 19.383167266845703, 20.14887046813965, 20.914573669433594, 21.68027687072754, 22.445980072021484, 23.21168327331543, 23.977386474609375, 24.74308967590332, 25.508792877197266, 26.274494171142578, 27.040197372436523, 27.80590057373047, 28.571603775024414, 29.33730697631836, 30.103010177612305, 30.86871337890625, 31.634414672851562, 32.40011978149414, 33.16582107543945, 33.93152618408203, 34.697227478027344, 35.462928771972656]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 13.0, 7.0, 22.0, 26.0, 53.0, 61.0, 96.0, 114.0, 134.0, 110.0, 98.0, 95.0, 65.0, 33.0, 31.0, 16.0, 13.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.76545524597168, -18.240495681762695, -17.71553611755371, -17.190576553344727, -16.665616989135742, -16.140657424926758, -15.61569881439209, -15.090739250183105, -14.565779685974121, -14.040820121765137, -13.515860557556152, -12.990900993347168, -12.4659423828125, -11.940982818603516, -11.416023254394531, -10.891063690185547, -10.366104125976562, -9.841144561767578, -9.316184997558594, -8.79122543334961, -8.266265869140625, -7.741306781768799, -7.216347694396973, -6.691388130187988, -6.166428565979004, -5.6414690017700195, -5.116509437561035, -4.591550350189209, -4.066590785980225, -3.5416312217712402, -3.016671895980835, -2.4917125701904297, -1.9667530059814453, -1.4417935609817505, -0.9168341159820557, -0.39187467098236084, 0.13308477401733398, 0.6580443382263184, 1.1830036640167236, 1.707962989807129, 2.2329225540161133, 2.7578821182250977, 3.282841444015503, 3.807800769805908, 4.332760334014893, 4.857719898223877, 5.382678985595703, 5.9076385498046875, 6.432598114013672, 6.957557678222656, 7.482517242431641, 8.007476806640625, 8.53243637084961, 9.057395935058594, 9.582354545593262, 10.107314109802246, 10.63227367401123, 11.157233238220215, 11.6821928024292, 12.207152366638184, 12.732110977172852, 13.257070541381836, 13.78203010559082, 14.306989669799805, 14.831949234008789]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 5.0, 14.0, 9.0, 14.0, 30.0, 22.0, 61.0, 96.0, 130.0, 254.0, 527.0, 1266.0, 3941.0, 16376.0, 127981.0, 699923.0, 170622.0, 20069.0, 4394.0, 1513.0, 595.0, 269.0, 141.0, 82.0, 66.0, 38.0, 33.0, 17.0, 16.0, 8.0, 9.0, 9.0, 1.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.0625, -5.8502197265625, -5.637939453125, -5.4256591796875, -5.21337890625, -5.0010986328125, -4.788818359375, -4.5765380859375, -4.3642578125, -4.1519775390625, -3.939697265625, -3.7274169921875, -3.51513671875, -3.3028564453125, -3.090576171875, -2.8782958984375, -2.666015625, -2.4537353515625, -2.241455078125, -2.0291748046875, -1.81689453125, -1.6046142578125, -1.392333984375, -1.1800537109375, -0.9677734375, -0.7554931640625, -0.543212890625, -0.3309326171875, -0.11865234375, 0.0936279296875, 0.305908203125, 0.5181884765625, 0.73046875, 0.9427490234375, 1.155029296875, 1.3673095703125, 1.57958984375, 1.7918701171875, 2.004150390625, 2.2164306640625, 2.4287109375, 2.6409912109375, 2.853271484375, 3.0655517578125, 3.27783203125, 3.4901123046875, 3.702392578125, 3.9146728515625, 4.126953125, 4.3392333984375, 4.551513671875, 4.7637939453125, 4.97607421875, 5.1883544921875, 5.400634765625, 5.6129150390625, 5.8251953125, 6.0374755859375, 6.249755859375, 6.4620361328125, 6.67431640625, 6.8865966796875, 7.098876953125, 7.3111572265625, 7.5234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 17.0, 21.0, 40.0, 47.0, 65.0, 108.0, 113.0, 141.0, 128.0, 117.0, 76.0, 52.0, 32.0, 7.0, 12.0, 8.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75, -6.5975341796875, -6.445068359375, -6.2926025390625, -6.14013671875, -5.9876708984375, -5.835205078125, -5.6827392578125, -5.5302734375, -5.3778076171875, -5.225341796875, -5.0728759765625, -4.92041015625, -4.7679443359375, -4.615478515625, -4.4630126953125, -4.310546875, -4.1580810546875, -4.005615234375, -3.8531494140625, -3.70068359375, -3.5482177734375, -3.395751953125, -3.2432861328125, -3.0908203125, -2.9383544921875, -2.785888671875, -2.6334228515625, -2.48095703125, -2.3284912109375, -2.176025390625, -2.0235595703125, -1.87109375, -1.7186279296875, -1.566162109375, -1.4136962890625, -1.26123046875, -1.1087646484375, -0.956298828125, -0.8038330078125, -0.6513671875, -0.4989013671875, -0.346435546875, -0.1939697265625, -0.04150390625, 0.1109619140625, 0.263427734375, 0.4158935546875, 0.568359375, 0.7208251953125, 0.873291015625, 1.0257568359375, 1.17822265625, 1.3306884765625, 1.483154296875, 1.6356201171875, 1.7880859375, 1.9405517578125, 2.093017578125, 2.2454833984375, 2.39794921875, 2.5504150390625, 2.702880859375, 2.8553466796875, 3.0078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 2.0, 9.0, 9.0, 11.0, 22.0, 26.0, 46.0, 61.0, 134.0, 268.0, 565.0, 1509.0, 5620.0, 59122.0, 874039.0, 97002.0, 7041.0, 1645.0, 720.0, 300.0, 152.0, 79.0, 68.0, 25.0, 29.0, 15.0, 8.0, 10.0, 6.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.84375, -11.490966796875, -11.13818359375, -10.785400390625, -10.4326171875, -10.079833984375, -9.72705078125, -9.374267578125, -9.021484375, -8.668701171875, -8.31591796875, -7.963134765625, -7.6103515625, -7.257568359375, -6.90478515625, -6.552001953125, -6.19921875, -5.846435546875, -5.49365234375, -5.140869140625, -4.7880859375, -4.435302734375, -4.08251953125, -3.729736328125, -3.376953125, -3.024169921875, -2.67138671875, -2.318603515625, -1.9658203125, -1.613037109375, -1.26025390625, -0.907470703125, -0.5546875, -0.201904296875, 0.15087890625, 0.503662109375, 0.8564453125, 1.209228515625, 1.56201171875, 1.914794921875, 2.267578125, 2.620361328125, 2.97314453125, 3.325927734375, 3.6787109375, 4.031494140625, 4.38427734375, 4.737060546875, 5.08984375, 5.442626953125, 5.79541015625, 6.148193359375, 6.5009765625, 6.853759765625, 7.20654296875, 7.559326171875, 7.912109375, 8.264892578125, 8.61767578125, 8.970458984375, 9.3232421875, 9.676025390625, 10.02880859375, 10.381591796875, 10.734375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 7.0, 4.0, 10.0, 10.0, 26.0, 23.0, 27.0, 36.0, 39.0, 57.0, 59.0, 80.0, 62.0, 69.0, 79.0, 65.0, 82.0, 47.0, 45.0, 52.0, 25.0, 17.0, 25.0, 15.0, 10.0, 4.0, 5.0, 4.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.1328125, -13.713623046875, -13.29443359375, -12.875244140625, -12.4560546875, -12.036865234375, -11.61767578125, -11.198486328125, -10.779296875, -10.360107421875, -9.94091796875, -9.521728515625, -9.1025390625, -8.683349609375, -8.26416015625, -7.844970703125, -7.42578125, -7.006591796875, -6.58740234375, -6.168212890625, -5.7490234375, -5.329833984375, -4.91064453125, -4.491455078125, -4.072265625, -3.653076171875, -3.23388671875, -2.814697265625, -2.3955078125, -1.976318359375, -1.55712890625, -1.137939453125, -0.71875, -0.299560546875, 0.11962890625, 0.538818359375, 0.9580078125, 1.377197265625, 1.79638671875, 2.215576171875, 2.634765625, 3.053955078125, 3.47314453125, 3.892333984375, 4.3115234375, 4.730712890625, 5.14990234375, 5.569091796875, 5.98828125, 6.407470703125, 6.82666015625, 7.245849609375, 7.6650390625, 8.084228515625, 8.50341796875, 8.922607421875, 9.341796875, 9.760986328125, 10.18017578125, 10.599365234375, 11.0185546875, 11.437744140625, 11.85693359375, 12.276123046875, 12.6953125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 0.0, 6.0, 9.0, 12.0, 10.0, 15.0, 17.0, 26.0, 42.0, 44.0, 64.0, 106.0, 137.0, 290.0, 597.0, 1528.0, 5381.0, 33858.0, 601969.0, 373980.0, 23559.0, 4331.0, 1252.0, 543.0, 288.0, 148.0, 87.0, 64.0, 40.0, 33.0, 21.0, 24.0, 12.0, 12.0, 7.0, 10.0, 9.0, 6.0, 4.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.166015625, -3.075347900390625, -2.98468017578125, -2.894012451171875, -2.8033447265625, -2.712677001953125, -2.62200927734375, -2.531341552734375, -2.440673828125, -2.350006103515625, -2.25933837890625, -2.168670654296875, -2.0780029296875, -1.987335205078125, -1.89666748046875, -1.805999755859375, -1.71533203125, -1.624664306640625, -1.53399658203125, -1.443328857421875, -1.3526611328125, -1.261993408203125, -1.17132568359375, -1.080657958984375, -0.989990234375, -0.899322509765625, -0.80865478515625, -0.717987060546875, -0.6273193359375, -0.536651611328125, -0.44598388671875, -0.355316162109375, -0.2646484375, -0.173980712890625, -0.08331298828125, 0.007354736328125, 0.0980224609375, 0.188690185546875, 0.27935791015625, 0.370025634765625, 0.460693359375, 0.551361083984375, 0.64202880859375, 0.732696533203125, 0.8233642578125, 0.914031982421875, 1.00469970703125, 1.095367431640625, 1.18603515625, 1.276702880859375, 1.36737060546875, 1.458038330078125, 1.5487060546875, 1.639373779296875, 1.73004150390625, 1.820709228515625, 1.911376953125, 2.002044677734375, 2.09271240234375, 2.183380126953125, 2.2740478515625, 2.364715576171875, 2.45538330078125, 2.546051025390625, 2.63671875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 4.0, 6.0, 5.0, 6.0, 12.0, 13.0, 16.0, 43.0, 47.0, 63.0, 78.0, 124.0, 130.0, 115.0, 96.0, 57.0, 51.0, 34.0, 29.0, 18.0, 15.0, 8.0, 3.0, 7.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003662109375, -0.00035593658685684204, -0.0003456622362136841, -0.0003353878855705261, -0.00032511353492736816, -0.0003148391842842102, -0.00030456483364105225, -0.0002942904829978943, -0.00028401613235473633, -0.00027374178171157837, -0.0002634674310684204, -0.00025319308042526245, -0.0002429187297821045, -0.00023264437913894653, -0.00022237002849578857, -0.00021209567785263062, -0.00020182132720947266, -0.0001915469765663147, -0.00018127262592315674, -0.00017099827527999878, -0.00016072392463684082, -0.00015044957399368286, -0.0001401752233505249, -0.00012990087270736694, -0.00011962652206420898, -0.00010935217142105103, -9.907782077789307e-05, -8.880347013473511e-05, -7.852911949157715e-05, -6.825476884841919e-05, -5.798041820526123e-05, -4.770606756210327e-05, -3.743171691894531e-05, -2.7157366275787354e-05, -1.6883015632629395e-05, -6.6086649894714355e-06, 3.6656856536865234e-06, 1.3940036296844482e-05, 2.421438694000244e-05, 3.44887375831604e-05, 4.476308822631836e-05, 5.503743886947632e-05, 6.531178951263428e-05, 7.558614015579224e-05, 8.58604907989502e-05, 9.613484144210815e-05, 0.00010640919208526611, 0.00011668354272842407, 0.00012695789337158203, 0.00013723224401474, 0.00014750659465789795, 0.0001577809453010559, 0.00016805529594421387, 0.00017832964658737183, 0.00018860399723052979, 0.00019887834787368774, 0.0002091526985168457, 0.00021942704916000366, 0.00022970139980316162, 0.00023997575044631958, 0.00025025010108947754, 0.0002605244517326355, 0.00027079880237579346, 0.0002810731530189514, 0.0002913475036621094]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 6.0, 2.0, 3.0, 11.0, 8.0, 11.0, 19.0, 23.0, 36.0, 60.0, 90.0, 138.0, 302.0, 607.0, 1464.0, 4329.0, 20711.0, 395062.0, 590621.0, 26929.0, 5118.0, 1567.0, 702.0, 280.0, 160.0, 105.0, 57.0, 40.0, 25.0, 13.0, 16.0, 9.0, 8.0, 3.0, 9.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.1640625, -4.048583984375, -3.93310546875, -3.817626953125, -3.7021484375, -3.586669921875, -3.47119140625, -3.355712890625, -3.240234375, -3.124755859375, -3.00927734375, -2.893798828125, -2.7783203125, -2.662841796875, -2.54736328125, -2.431884765625, -2.31640625, -2.200927734375, -2.08544921875, -1.969970703125, -1.8544921875, -1.739013671875, -1.62353515625, -1.508056640625, -1.392578125, -1.277099609375, -1.16162109375, -1.046142578125, -0.9306640625, -0.815185546875, -0.69970703125, -0.584228515625, -0.46875, -0.353271484375, -0.23779296875, -0.122314453125, -0.0068359375, 0.108642578125, 0.22412109375, 0.339599609375, 0.455078125, 0.570556640625, 0.68603515625, 0.801513671875, 0.9169921875, 1.032470703125, 1.14794921875, 1.263427734375, 1.37890625, 1.494384765625, 1.60986328125, 1.725341796875, 1.8408203125, 1.956298828125, 2.07177734375, 2.187255859375, 2.302734375, 2.418212890625, 2.53369140625, 2.649169921875, 2.7646484375, 2.880126953125, 2.99560546875, 3.111083984375, 3.2265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 9.0, 15.0, 19.0, 27.0, 45.0, 52.0, 61.0, 77.0, 96.0, 109.0, 108.0, 81.0, 67.0, 59.0, 37.0, 36.0, 24.0, 21.0, 12.0, 9.0, 8.0, 1.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.611328125, -3.518707275390625, -3.42608642578125, -3.333465576171875, -3.2408447265625, -3.148223876953125, -3.05560302734375, -2.962982177734375, -2.870361328125, -2.777740478515625, -2.68511962890625, -2.592498779296875, -2.4998779296875, -2.407257080078125, -2.31463623046875, -2.222015380859375, -2.12939453125, -2.036773681640625, -1.94415283203125, -1.851531982421875, -1.7589111328125, -1.666290283203125, -1.57366943359375, -1.481048583984375, -1.388427734375, -1.295806884765625, -1.20318603515625, -1.110565185546875, -1.0179443359375, -0.925323486328125, -0.83270263671875, -0.740081787109375, -0.6474609375, -0.554840087890625, -0.46221923828125, -0.369598388671875, -0.2769775390625, -0.184356689453125, -0.09173583984375, 0.000885009765625, 0.093505859375, 0.186126708984375, 0.27874755859375, 0.371368408203125, 0.4639892578125, 0.556610107421875, 0.64923095703125, 0.741851806640625, 0.83447265625, 0.927093505859375, 1.01971435546875, 1.112335205078125, 1.2049560546875, 1.297576904296875, 1.39019775390625, 1.482818603515625, 1.575439453125, 1.668060302734375, 1.76068115234375, 1.853302001953125, 1.9459228515625, 2.038543701171875, 2.13116455078125, 2.223785400390625, 2.31640625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 4.0, 7.0, 12.0, 49.0, 102.0, 144.0, 183.0, 185.0, 126.0, 86.0, 37.0, 28.0, 11.0, 10.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.12635040283203, -50.168212890625, -48.2100715637207, -46.25193405151367, -44.293792724609375, -42.335655212402344, -40.37751388549805, -38.419376373291016, -36.46123504638672, -34.50309753417969, -32.54495620727539, -30.586816787719727, -28.628677368164062, -26.67053985595703, -24.712398529052734, -22.754261016845703, -20.79612159729004, -18.837982177734375, -16.87984275817871, -14.921703338623047, -12.963563919067383, -11.005425453186035, -9.047286033630371, -7.089146614074707, -5.131007194519043, -3.172867774963379, -1.214728593826294, 0.743410587310791, 2.701550006866455, 4.659688949584961, 6.617828369140625, 8.575967788696289, 10.534107208251953, 12.492246627807617, 14.450386047363281, 16.408525466918945, 18.36666488647461, 20.32480239868164, 22.282943725585938, 24.24108123779297, 26.199222564697266, 28.15736198425293, 30.115501403808594, 32.073638916015625, 34.03178024291992, 35.98991775512695, 37.94805908203125, 39.90619659423828, 41.86433410644531, 43.822471618652344, 45.78061294555664, 47.73875045776367, 49.69689178466797, 51.655029296875, 53.6131706237793, 55.57130813598633, 57.529449462890625, 59.487586975097656, 61.44572830200195, 63.403865814208984, 65.36200714111328, 67.32014465332031, 69.27828216552734, 71.2364273071289, 73.19456481933594]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 10.0, 3.0, 6.0, 10.0, 10.0, 16.0, 18.0, 17.0, 33.0, 28.0, 28.0, 51.0, 41.0, 45.0, 60.0, 46.0, 71.0, 68.0, 55.0, 61.0, 51.0, 46.0, 43.0, 40.0, 26.0, 31.0, 21.0, 14.0, 21.0, 8.0, 4.0, 11.0, 6.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.08018493652344, -34.44758605957031, -32.81499099731445, -31.182392120361328, -29.549795150756836, -27.917198181152344, -26.28459930419922, -24.652002334594727, -23.019405364990234, -21.386808395385742, -19.75421142578125, -18.121612548828125, -16.489015579223633, -14.85641860961914, -13.223820686340332, -11.591222763061523, -9.958625793457031, -8.326028823852539, -6.6934309005737305, -5.06083345413208, -3.4282360076904297, -1.7956390380859375, -0.1630411148071289, 1.4695568084716797, 3.102153778076172, 4.734751224517822, 6.367348670959473, 7.999946117401123, 9.632543563842773, 11.265140533447266, 12.897738456726074, 14.530336380004883, 16.162933349609375, 17.795530319213867, 19.42812728881836, 21.060726165771484, 22.693323135375977, 24.32592010498047, 25.958518981933594, 27.591115951538086, 29.223712921142578, 30.85630989074707, 32.48890686035156, 34.12150573730469, 35.75410461425781, 37.38669967651367, 39.0192985534668, 40.651893615722656, 42.28449249267578, 43.917091369628906, 45.549686431884766, 47.18228530883789, 48.81488037109375, 50.447479248046875, 52.080078125, 53.712677001953125, 55.345272064208984, 56.97787094116211, 58.61046600341797, 60.243064880371094, 61.87566375732422, 63.50825881958008, 65.14085388183594, 66.77345275878906, 68.40605163574219]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 0.0, 5.0, 0.0, 3.0, 6.0, 6.0, 12.0, 16.0, 10.0, 18.0, 34.0, 51.0, 69.0, 94.0, 160.0, 240.0, 455.0, 1086.0, 3219.0, 14250.0, 185141.0, 3901221.0, 74473.0, 9295.0, 2478.0, 902.0, 417.0, 225.0, 122.0, 95.0, 55.0, 35.0, 23.0, 19.0, 10.0, 8.0, 12.0, 2.0, 12.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0546875, -6.829833984375, -6.60498046875, -6.380126953125, -6.1552734375, -5.930419921875, -5.70556640625, -5.480712890625, -5.255859375, -5.031005859375, -4.80615234375, -4.581298828125, -4.3564453125, -4.131591796875, -3.90673828125, -3.681884765625, -3.45703125, -3.232177734375, -3.00732421875, -2.782470703125, -2.5576171875, -2.332763671875, -2.10791015625, -1.883056640625, -1.658203125, -1.433349609375, -1.20849609375, -0.983642578125, -0.7587890625, -0.533935546875, -0.30908203125, -0.084228515625, 0.140625, 0.365478515625, 0.59033203125, 0.815185546875, 1.0400390625, 1.264892578125, 1.48974609375, 1.714599609375, 1.939453125, 2.164306640625, 2.38916015625, 2.614013671875, 2.8388671875, 3.063720703125, 3.28857421875, 3.513427734375, 3.73828125, 3.963134765625, 4.18798828125, 4.412841796875, 4.6376953125, 4.862548828125, 5.08740234375, 5.312255859375, 5.537109375, 5.761962890625, 5.98681640625, 6.211669921875, 6.4365234375, 6.661376953125, 6.88623046875, 7.111083984375, 7.3359375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 18.0, 18.0, 40.0, 63.0, 45.0, 79.0, 109.0, 91.0, 122.0, 102.0, 94.0, 71.0, 43.0, 33.0, 27.0, 15.0, 14.0, 5.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.135589599609375, -4.02117919921875, -3.906768798828125, -3.7923583984375, -3.677947998046875, -3.56353759765625, -3.449127197265625, -3.334716796875, -3.220306396484375, -3.10589599609375, -2.991485595703125, -2.8770751953125, -2.762664794921875, -2.64825439453125, -2.533843994140625, -2.41943359375, -2.305023193359375, -2.19061279296875, -2.076202392578125, -1.9617919921875, -1.847381591796875, -1.73297119140625, -1.618560791015625, -1.504150390625, -1.389739990234375, -1.27532958984375, -1.160919189453125, -1.0465087890625, -0.932098388671875, -0.81768798828125, -0.703277587890625, -0.5888671875, -0.474456787109375, -0.36004638671875, -0.245635986328125, -0.1312255859375, -0.016815185546875, 0.09759521484375, 0.212005615234375, 0.326416015625, 0.440826416015625, 0.55523681640625, 0.669647216796875, 0.7840576171875, 0.898468017578125, 1.01287841796875, 1.127288818359375, 1.24169921875, 1.356109619140625, 1.47052001953125, 1.584930419921875, 1.6993408203125, 1.813751220703125, 1.92816162109375, 2.042572021484375, 2.156982421875, 2.271392822265625, 2.38580322265625, 2.500213623046875, 2.6146240234375, 2.729034423828125, 2.84344482421875, 2.957855224609375, 3.072265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 6.0, 9.0, 12.0, 17.0, 34.0, 29.0, 79.0, 155.0, 438.0, 1512.0, 6627.0, 51605.0, 3718904.0, 391294.0, 19093.0, 3168.0, 763.0, 276.0, 88.0, 43.0, 28.0, 19.0, 16.0, 16.0, 9.0, 9.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.0703125, -7.8314208984375, -7.592529296875, -7.3536376953125, -7.11474609375, -6.8758544921875, -6.636962890625, -6.3980712890625, -6.1591796875, -5.9202880859375, -5.681396484375, -5.4425048828125, -5.20361328125, -4.9647216796875, -4.725830078125, -4.4869384765625, -4.248046875, -4.0091552734375, -3.770263671875, -3.5313720703125, -3.29248046875, -3.0535888671875, -2.814697265625, -2.5758056640625, -2.3369140625, -2.0980224609375, -1.859130859375, -1.6202392578125, -1.38134765625, -1.1424560546875, -0.903564453125, -0.6646728515625, -0.42578125, -0.1868896484375, 0.052001953125, 0.2908935546875, 0.52978515625, 0.7686767578125, 1.007568359375, 1.2464599609375, 1.4853515625, 1.7242431640625, 1.963134765625, 2.2020263671875, 2.44091796875, 2.6798095703125, 2.918701171875, 3.1575927734375, 3.396484375, 3.6353759765625, 3.874267578125, 4.1131591796875, 4.35205078125, 4.5909423828125, 4.829833984375, 5.0687255859375, 5.3076171875, 5.5465087890625, 5.785400390625, 6.0242919921875, 6.26318359375, 6.5020751953125, 6.740966796875, 6.9798583984375, 7.21875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 7.0, 6.0, 7.0, 13.0, 12.0, 17.0, 15.0, 28.0, 43.0, 82.0, 169.0, 430.0, 1070.0, 1232.0, 457.0, 202.0, 91.0, 61.0, 38.0, 24.0, 19.0, 11.0, 11.0, 8.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.77734375, -6.60400390625, -6.4306640625, -6.25732421875, -6.083984375, -5.91064453125, -5.7373046875, -5.56396484375, -5.390625, -5.21728515625, -5.0439453125, -4.87060546875, -4.697265625, -4.52392578125, -4.3505859375, -4.17724609375, -4.00390625, -3.83056640625, -3.6572265625, -3.48388671875, -3.310546875, -3.13720703125, -2.9638671875, -2.79052734375, -2.6171875, -2.44384765625, -2.2705078125, -2.09716796875, -1.923828125, -1.75048828125, -1.5771484375, -1.40380859375, -1.23046875, -1.05712890625, -0.8837890625, -0.71044921875, -0.537109375, -0.36376953125, -0.1904296875, -0.01708984375, 0.15625, 0.32958984375, 0.5029296875, 0.67626953125, 0.849609375, 1.02294921875, 1.1962890625, 1.36962890625, 1.54296875, 1.71630859375, 1.8896484375, 2.06298828125, 2.236328125, 2.40966796875, 2.5830078125, 2.75634765625, 2.9296875, 3.10302734375, 3.2763671875, 3.44970703125, 3.623046875, 3.79638671875, 3.9697265625, 4.14306640625, 4.31640625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 11.0, 13.0, 14.0, 41.0, 95.0, 166.0, 205.0, 160.0, 148.0, 60.0, 42.0, 19.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.96563720703125, -46.63637161254883, -45.307106018066406, -43.977840423583984, -42.64857482910156, -41.31930923461914, -39.99004364013672, -38.6607780456543, -37.331512451171875, -36.00224685668945, -34.67298126220703, -33.34371566772461, -32.01445007324219, -30.685184478759766, -29.355918884277344, -28.026653289794922, -26.697385787963867, -25.368120193481445, -24.038854598999023, -22.7095890045166, -21.38032341003418, -20.051057815551758, -18.721790313720703, -17.39252471923828, -16.06325912475586, -14.733993530273438, -13.404727935791016, -12.075462341308594, -10.746196746826172, -9.41693115234375, -8.087664604187012, -6.75839900970459, -5.429134368896484, -4.0998687744140625, -2.7706029415130615, -1.4413371086120605, -0.11207151412963867, 1.2171940803527832, 2.5464601516723633, 3.875725746154785, 5.204991340637207, 6.534256935119629, 7.863522529602051, 9.192789077758789, 10.522054672241211, 11.851320266723633, 13.180585861206055, 14.509851455688477, 15.839117050170898, 17.16838264465332, 18.497648239135742, 19.826913833618164, 21.156179428100586, 22.485445022583008, 23.814712524414062, 25.143978118896484, 26.473243713378906, 27.802509307861328, 29.13177490234375, 30.461040496826172, 31.790306091308594, 33.119571685791016, 34.44883728027344, 35.77810287475586, 37.10736846923828]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 5.0, 6.0, 6.0, 9.0, 11.0, 17.0, 26.0, 22.0, 33.0, 38.0, 51.0, 44.0, 62.0, 54.0, 54.0, 60.0, 73.0, 62.0, 56.0, 60.0, 48.0, 43.0, 31.0, 31.0, 22.0, 26.0, 10.0, 16.0, 7.0, 9.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.02933692932129, -23.240867614746094, -22.4523983001709, -21.663928985595703, -20.875459671020508, -20.086990356445312, -19.29852294921875, -18.510051727294922, -17.72158432006836, -16.933115005493164, -16.14464569091797, -15.356176376342773, -14.567707061767578, -13.779237747192383, -12.990769386291504, -12.202300071716309, -11.413829803466797, -10.625360488891602, -9.836891174316406, -9.048421859741211, -8.259952545166016, -7.4714837074279785, -6.683014869689941, -5.894545555114746, -5.106076240539551, -4.3176069259643555, -3.5291378498077393, -2.740668773651123, -1.9521994590759277, -1.1637301445007324, -0.3752613067626953, 0.4132080078125, 1.2016754150390625, 1.9901446104049683, 2.778613805770874, 3.5670828819274902, 4.3555521965026855, 5.144021511077881, 5.932490348815918, 6.720959663391113, 7.509428977966309, 8.297898292541504, 9.0863676071167, 9.874835968017578, 10.663305282592773, 11.451774597167969, 12.240243911743164, 13.02871322631836, 13.817182540893555, 14.60565185546875, 15.394121170043945, 16.18259048461914, 16.971059799194336, 17.75952911376953, 18.547996520996094, 19.336467742919922, 20.124935150146484, 20.91340446472168, 21.701873779296875, 22.49034309387207, 23.278812408447266, 24.06728172302246, 24.855751037597656, 25.64421844482422, 26.432689666748047]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 21.0, 22.0, 29.0, 58.0, 126.0, 303.0, 771.0, 2124.0, 7700.0, 34289.0, 205251.0, 598459.0, 162123.0, 27972.0, 6212.0, 1827.0, 678.0, 280.0, 135.0, 77.0, 40.0, 16.0, 12.0, 5.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6328125, -5.46923828125, -5.3056640625, -5.14208984375, -4.978515625, -4.81494140625, -4.6513671875, -4.48779296875, -4.32421875, -4.16064453125, -3.9970703125, -3.83349609375, -3.669921875, -3.50634765625, -3.3427734375, -3.17919921875, -3.015625, -2.85205078125, -2.6884765625, -2.52490234375, -2.361328125, -2.19775390625, -2.0341796875, -1.87060546875, -1.70703125, -1.54345703125, -1.3798828125, -1.21630859375, -1.052734375, -0.88916015625, -0.7255859375, -0.56201171875, -0.3984375, -0.23486328125, -0.0712890625, 0.09228515625, 0.255859375, 0.41943359375, 0.5830078125, 0.74658203125, 0.91015625, 1.07373046875, 1.2373046875, 1.40087890625, 1.564453125, 1.72802734375, 1.8916015625, 2.05517578125, 2.21875, 2.38232421875, 2.5458984375, 2.70947265625, 2.873046875, 3.03662109375, 3.2001953125, 3.36376953125, 3.52734375, 3.69091796875, 3.8544921875, 4.01806640625, 4.181640625, 4.34521484375, 4.5087890625, 4.67236328125, 4.8359375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 10.0, 10.0, 12.0, 8.0, 15.0, 17.0, 18.0, 31.0, 31.0, 36.0, 51.0, 39.0, 46.0, 58.0, 49.0, 53.0, 59.0, 45.0, 56.0, 40.0, 32.0, 41.0, 44.0, 34.0, 28.0, 24.0, 26.0, 20.0, 8.0, 15.0, 7.0, 8.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7763671875, -1.7228546142578125, -1.669342041015625, -1.6158294677734375, -1.56231689453125, -1.5088043212890625, -1.455291748046875, -1.4017791748046875, -1.3482666015625, -1.2947540283203125, -1.241241455078125, -1.1877288818359375, -1.13421630859375, -1.0807037353515625, -1.027191162109375, -0.9736785888671875, -0.920166015625, -0.8666534423828125, -0.813140869140625, -0.7596282958984375, -0.70611572265625, -0.6526031494140625, -0.599090576171875, -0.5455780029296875, -0.4920654296875, -0.4385528564453125, -0.385040283203125, -0.3315277099609375, -0.27801513671875, -0.2245025634765625, -0.170989990234375, -0.1174774169921875, -0.06396484375, -0.0104522705078125, 0.043060302734375, 0.0965728759765625, 0.15008544921875, 0.2035980224609375, 0.257110595703125, 0.3106231689453125, 0.3641357421875, 0.4176483154296875, 0.471160888671875, 0.5246734619140625, 0.57818603515625, 0.6316986083984375, 0.685211181640625, 0.7387237548828125, 0.792236328125, 0.8457489013671875, 0.899261474609375, 0.9527740478515625, 1.00628662109375, 1.0597991943359375, 1.113311767578125, 1.1668243408203125, 1.2203369140625, 1.2738494873046875, 1.327362060546875, 1.3808746337890625, 1.43438720703125, 1.4878997802734375, 1.541412353515625, 1.5949249267578125, 1.6484375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 2.0, 6.0, 9.0, 22.0, 37.0, 59.0, 137.0, 235.0, 682.0, 2257.0, 22783.0, 972000.0, 45865.0, 3026.0, 789.0, 303.0, 143.0, 65.0, 32.0, 27.0, 19.0, 8.0, 6.0, 9.0, 5.0, 5.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.5, -15.99365234375, -15.4873046875, -14.98095703125, -14.474609375, -13.96826171875, -13.4619140625, -12.95556640625, -12.44921875, -11.94287109375, -11.4365234375, -10.93017578125, -10.423828125, -9.91748046875, -9.4111328125, -8.90478515625, -8.3984375, -7.89208984375, -7.3857421875, -6.87939453125, -6.373046875, -5.86669921875, -5.3603515625, -4.85400390625, -4.34765625, -3.84130859375, -3.3349609375, -2.82861328125, -2.322265625, -1.81591796875, -1.3095703125, -0.80322265625, -0.296875, 0.20947265625, 0.7158203125, 1.22216796875, 1.728515625, 2.23486328125, 2.7412109375, 3.24755859375, 3.75390625, 4.26025390625, 4.7666015625, 5.27294921875, 5.779296875, 6.28564453125, 6.7919921875, 7.29833984375, 7.8046875, 8.31103515625, 8.8173828125, 9.32373046875, 9.830078125, 10.33642578125, 10.8427734375, 11.34912109375, 11.85546875, 12.36181640625, 12.8681640625, 13.37451171875, 13.880859375, 14.38720703125, 14.8935546875, 15.39990234375, 15.90625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 9.0, 3.0, 5.0, 9.0, 5.0, 7.0, 10.0, 15.0, 25.0, 38.0, 28.0, 47.0, 40.0, 55.0, 68.0, 73.0, 63.0, 71.0, 70.0, 76.0, 52.0, 52.0, 36.0, 44.0, 20.0, 18.0, 21.0, 17.0, 12.0, 7.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3203125, -10.0228271484375, -9.725341796875, -9.4278564453125, -9.13037109375, -8.8328857421875, -8.535400390625, -8.2379150390625, -7.9404296875, -7.6429443359375, -7.345458984375, -7.0479736328125, -6.75048828125, -6.4530029296875, -6.155517578125, -5.8580322265625, -5.560546875, -5.2630615234375, -4.965576171875, -4.6680908203125, -4.37060546875, -4.0731201171875, -3.775634765625, -3.4781494140625, -3.1806640625, -2.8831787109375, -2.585693359375, -2.2882080078125, -1.99072265625, -1.6932373046875, -1.395751953125, -1.0982666015625, -0.80078125, -0.5032958984375, -0.205810546875, 0.0916748046875, 0.38916015625, 0.6866455078125, 0.984130859375, 1.2816162109375, 1.5791015625, 1.8765869140625, 2.174072265625, 2.4715576171875, 2.76904296875, 3.0665283203125, 3.364013671875, 3.6614990234375, 3.958984375, 4.2564697265625, 4.553955078125, 4.8514404296875, 5.14892578125, 5.4464111328125, 5.743896484375, 6.0413818359375, 6.3388671875, 6.6363525390625, 6.933837890625, 7.2313232421875, 7.52880859375, 7.8262939453125, 8.123779296875, 8.4212646484375, 8.71875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 8.0, 7.0, 8.0, 13.0, 19.0, 39.0, 54.0, 99.0, 203.0, 489.0, 1490.0, 8025.0, 251186.0, 770712.0, 13040.0, 1952.0, 588.0, 275.0, 135.0, 74.0, 43.0, 25.0, 16.0, 10.0, 6.0, 7.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.578125, -5.392822265625, -5.20751953125, -5.022216796875, -4.8369140625, -4.651611328125, -4.46630859375, -4.281005859375, -4.095703125, -3.910400390625, -3.72509765625, -3.539794921875, -3.3544921875, -3.169189453125, -2.98388671875, -2.798583984375, -2.61328125, -2.427978515625, -2.24267578125, -2.057373046875, -1.8720703125, -1.686767578125, -1.50146484375, -1.316162109375, -1.130859375, -0.945556640625, -0.76025390625, -0.574951171875, -0.3896484375, -0.204345703125, -0.01904296875, 0.166259765625, 0.3515625, 0.536865234375, 0.72216796875, 0.907470703125, 1.0927734375, 1.278076171875, 1.46337890625, 1.648681640625, 1.833984375, 2.019287109375, 2.20458984375, 2.389892578125, 2.5751953125, 2.760498046875, 2.94580078125, 3.131103515625, 3.31640625, 3.501708984375, 3.68701171875, 3.872314453125, 4.0576171875, 4.242919921875, 4.42822265625, 4.613525390625, 4.798828125, 4.984130859375, 5.16943359375, 5.354736328125, 5.5400390625, 5.725341796875, 5.91064453125, 6.095947265625, 6.28125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 7.0, 10.0, 20.0, 19.0, 25.0, 33.0, 44.0, 69.0, 88.0, 152.0, 140.0, 116.0, 60.0, 57.0, 29.0, 24.0, 15.0, 15.0, 12.0, 10.0, 14.0, 5.0, 7.0, 4.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00033664703369140625, -0.0003250502049922943, -0.0003134533762931824, -0.00030185654759407043, -0.0002902597188949585, -0.00027866289019584656, -0.0002670660614967346, -0.0002554692327976227, -0.00024387240409851074, -0.0002322755753993988, -0.00022067874670028687, -0.00020908191800117493, -0.000197485089302063, -0.00018588826060295105, -0.0001742914319038391, -0.00016269460320472717, -0.00015109777450561523, -0.0001395009458065033, -0.00012790411710739136, -0.00011630728840827942, -0.00010471045970916748, -9.311363101005554e-05, -8.15168023109436e-05, -6.991997361183167e-05, -5.8323144912719727e-05, -4.672631621360779e-05, -3.512948751449585e-05, -2.353265881538391e-05, -1.1935830116271973e-05, -3.390014171600342e-07, 1.1257827281951904e-05, 2.2854655981063843e-05, 3.445148468017578e-05, 4.604831337928772e-05, 5.764514207839966e-05, 6.92419707775116e-05, 8.083879947662354e-05, 9.243562817573547e-05, 0.00010403245687484741, 0.00011562928557395935, 0.0001272261142730713, 0.00013882294297218323, 0.00015041977167129517, 0.0001620166003704071, 0.00017361342906951904, 0.00018521025776863098, 0.00019680708646774292, 0.00020840391516685486, 0.0002200007438659668, 0.00023159757256507874, 0.00024319440126419067, 0.0002547912299633026, 0.00026638805866241455, 0.0002779848873615265, 0.00028958171606063843, 0.00030117854475975037, 0.0003127753734588623, 0.00032437220215797424, 0.0003359690308570862, 0.0003475658595561981, 0.00035916268825531006, 0.000370759516954422, 0.00038235634565353394, 0.0003939531743526459, 0.0004055500030517578]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 3.0, 6.0, 9.0, 8.0, 13.0, 17.0, 34.0, 45.0, 61.0, 105.0, 210.0, 449.0, 1052.0, 3463.0, 19843.0, 727253.0, 279176.0, 12465.0, 2592.0, 903.0, 391.0, 168.0, 108.0, 57.0, 35.0, 24.0, 20.0, 14.0, 5.0, 4.0, 7.0, 5.0, 0.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.30078125, -5.1396484375, -4.978515625, -4.8173828125, -4.65625, -4.4951171875, -4.333984375, -4.1728515625, -4.01171875, -3.8505859375, -3.689453125, -3.5283203125, -3.3671875, -3.2060546875, -3.044921875, -2.8837890625, -2.72265625, -2.5615234375, -2.400390625, -2.2392578125, -2.078125, -1.9169921875, -1.755859375, -1.5947265625, -1.43359375, -1.2724609375, -1.111328125, -0.9501953125, -0.7890625, -0.6279296875, -0.466796875, -0.3056640625, -0.14453125, 0.0166015625, 0.177734375, 0.3388671875, 0.5, 0.6611328125, 0.822265625, 0.9833984375, 1.14453125, 1.3056640625, 1.466796875, 1.6279296875, 1.7890625, 1.9501953125, 2.111328125, 2.2724609375, 2.43359375, 2.5947265625, 2.755859375, 2.9169921875, 3.078125, 3.2392578125, 3.400390625, 3.5615234375, 3.72265625, 3.8837890625, 4.044921875, 4.2060546875, 4.3671875, 4.5283203125, 4.689453125, 4.8505859375, 5.01171875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 6.0, 6.0, 16.0, 14.0, 29.0, 24.0, 40.0, 49.0, 79.0, 116.0, 134.0, 156.0, 89.0, 60.0, 43.0, 29.0, 29.0, 12.0, 12.0, 11.0, 9.0, 8.0, 1.0, 6.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.525390625, -3.410003662109375, -3.29461669921875, -3.179229736328125, -3.0638427734375, -2.948455810546875, -2.83306884765625, -2.717681884765625, -2.602294921875, -2.486907958984375, -2.37152099609375, -2.256134033203125, -2.1407470703125, -2.025360107421875, -1.90997314453125, -1.794586181640625, -1.67919921875, -1.563812255859375, -1.44842529296875, -1.333038330078125, -1.2176513671875, -1.102264404296875, -0.98687744140625, -0.871490478515625, -0.756103515625, -0.640716552734375, -0.52532958984375, -0.409942626953125, -0.2945556640625, -0.179168701171875, -0.06378173828125, 0.051605224609375, 0.1669921875, 0.282379150390625, 0.39776611328125, 0.513153076171875, 0.6285400390625, 0.743927001953125, 0.85931396484375, 0.974700927734375, 1.090087890625, 1.205474853515625, 1.32086181640625, 1.436248779296875, 1.5516357421875, 1.667022705078125, 1.78240966796875, 1.897796630859375, 2.01318359375, 2.128570556640625, 2.24395751953125, 2.359344482421875, 2.4747314453125, 2.590118408203125, 2.70550537109375, 2.820892333984375, 2.936279296875, 3.051666259765625, 3.16705322265625, 3.282440185546875, 3.3978271484375, 3.513214111328125, 3.62860107421875, 3.743988037109375, 3.859375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 10.0, 26.0, 72.0, 141.0, 245.0, 261.0, 132.0, 61.0, 22.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-77.70861053466797, -75.66587829589844, -73.6231460571289, -71.58041381835938, -69.53768920898438, -67.49495697021484, -65.45222473144531, -63.40949249267578, -61.36676025390625, -59.32402801513672, -57.28129959106445, -55.23856735229492, -53.19583511352539, -51.153106689453125, -49.110374450683594, -47.06764221191406, -45.0249137878418, -42.982181549072266, -40.939453125, -38.89672088623047, -36.85398864746094, -34.811256408691406, -32.76852798461914, -30.72579574584961, -28.68306541442871, -26.640335083007812, -24.59760284423828, -22.554872512817383, -20.512142181396484, -18.469409942626953, -16.426679611206055, -14.38394832611084, -12.34122085571289, -10.298489570617676, -8.255758285522461, -6.2130279541015625, -4.170296669006348, -2.127565383911133, -0.08483505249023438, 1.9578962326049805, 4.000627517700195, 6.04335880279541, 8.086090087890625, 10.128820419311523, 12.171551704406738, 14.214282989501953, 16.25701332092285, 18.29974365234375, 20.34247589111328, 22.38520622253418, 24.42793846130371, 26.47066879272461, 28.51340103149414, 30.55613136291504, 32.59886169433594, 34.64159393310547, 36.684326171875, 38.72705841064453, 40.7697868347168, 42.81251907348633, 44.85525131225586, 46.897979736328125, 48.940711975097656, 50.98344421386719, 53.02617263793945]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 6.0, 5.0, 5.0, 12.0, 20.0, 27.0, 23.0, 23.0, 19.0, 37.0, 47.0, 53.0, 37.0, 55.0, 64.0, 75.0, 67.0, 68.0, 52.0, 50.0, 35.0, 36.0, 44.0, 24.0, 25.0, 22.0, 19.0, 13.0, 8.0, 7.0, 5.0, 6.0, 5.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.19202423095703, -34.11357879638672, -33.035133361816406, -31.956687927246094, -30.87824249267578, -29.79979705810547, -28.721351623535156, -27.642906188964844, -26.56446075439453, -25.48601531982422, -24.407569885253906, -23.329124450683594, -22.25067901611328, -21.17223358154297, -20.093788146972656, -19.015342712402344, -17.93689727783203, -16.85845184326172, -15.780006408691406, -14.701560974121094, -13.623115539550781, -12.544670104980469, -11.466224670410156, -10.387779235839844, -9.309333801269531, -8.230888366699219, -7.152442932128906, -6.073997497558594, -4.995552062988281, -3.9171066284179688, -2.8386611938476562, -1.7602157592773438, -0.6817703247070312, 0.39667510986328125, 1.4751205444335938, 2.5535659790039062, 3.6320114135742188, 4.710456848144531, 5.788902282714844, 6.867347717285156, 7.945793151855469, 9.024238586425781, 10.102684020996094, 11.181129455566406, 12.259574890136719, 13.338020324707031, 14.416465759277344, 15.494911193847656, 16.57335662841797, 17.65180206298828, 18.730247497558594, 19.808692932128906, 20.88713836669922, 21.96558380126953, 23.044029235839844, 24.122474670410156, 25.20092010498047, 26.27936553955078, 27.357810974121094, 28.436256408691406, 29.51470184326172, 30.59314727783203, 31.671592712402344, 32.750038146972656, 33.82848358154297]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 3.0, 7.0, 7.0, 9.0, 3.0, 11.0, 27.0, 28.0, 30.0, 57.0, 122.0, 176.0, 326.0, 626.0, 1329.0, 3360.0, 9884.0, 44249.0, 686602.0, 3282091.0, 134402.0, 20643.0, 6138.0, 2214.0, 869.0, 461.0, 227.0, 145.0, 66.0, 50.0, 39.0, 26.0, 13.0, 8.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.375, -4.257568359375, -4.14013671875, -4.022705078125, -3.9052734375, -3.787841796875, -3.67041015625, -3.552978515625, -3.435546875, -3.318115234375, -3.20068359375, -3.083251953125, -2.9658203125, -2.848388671875, -2.73095703125, -2.613525390625, -2.49609375, -2.378662109375, -2.26123046875, -2.143798828125, -2.0263671875, -1.908935546875, -1.79150390625, -1.674072265625, -1.556640625, -1.439208984375, -1.32177734375, -1.204345703125, -1.0869140625, -0.969482421875, -0.85205078125, -0.734619140625, -0.6171875, -0.499755859375, -0.38232421875, -0.264892578125, -0.1474609375, -0.030029296875, 0.08740234375, 0.204833984375, 0.322265625, 0.439697265625, 0.55712890625, 0.674560546875, 0.7919921875, 0.909423828125, 1.02685546875, 1.144287109375, 1.26171875, 1.379150390625, 1.49658203125, 1.614013671875, 1.7314453125, 1.848876953125, 1.96630859375, 2.083740234375, 2.201171875, 2.318603515625, 2.43603515625, 2.553466796875, 2.6708984375, 2.788330078125, 2.90576171875, 3.023193359375, 3.140625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 15.0, 18.0, 39.0, 42.0, 60.0, 93.0, 133.0, 119.0, 129.0, 119.0, 91.0, 44.0, 47.0, 28.0, 16.0, 10.0, 6.0, 4.0, 0.0, 0.0, 3.0], "bins": [-6.19140625, -6.0696563720703125, -5.947906494140625, -5.8261566162109375, -5.70440673828125, -5.5826568603515625, -5.460906982421875, -5.3391571044921875, -5.2174072265625, -5.0956573486328125, -4.973907470703125, -4.8521575927734375, -4.73040771484375, -4.6086578369140625, -4.486907958984375, -4.3651580810546875, -4.243408203125, -4.1216583251953125, -3.999908447265625, -3.8781585693359375, -3.75640869140625, -3.6346588134765625, -3.512908935546875, -3.3911590576171875, -3.2694091796875, -3.1476593017578125, -3.025909423828125, -2.9041595458984375, -2.78240966796875, -2.6606597900390625, -2.538909912109375, -2.4171600341796875, -2.29541015625, -2.1736602783203125, -2.051910400390625, -1.9301605224609375, -1.80841064453125, -1.6866607666015625, -1.564910888671875, -1.4431610107421875, -1.3214111328125, -1.1996612548828125, -1.077911376953125, -0.9561614990234375, -0.83441162109375, -0.7126617431640625, -0.590911865234375, -0.4691619873046875, -0.347412109375, -0.2256622314453125, -0.103912353515625, 0.0178375244140625, 0.13958740234375, 0.2613372802734375, 0.383087158203125, 0.5048370361328125, 0.6265869140625, 0.7483367919921875, 0.870086669921875, 0.9918365478515625, 1.11358642578125, 1.2353363037109375, 1.357086181640625, 1.4788360595703125, 1.6005859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 2.0, 8.0, 6.0, 10.0, 19.0, 66.0, 128.0, 296.0, 697.0, 1839.0, 5666.0, 23095.0, 265956.0, 3706395.0, 162732.0, 19526.0, 5138.0, 1630.0, 633.0, 212.0, 105.0, 60.0, 17.0, 14.0, 5.0, 6.0, 4.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.58984375, -5.44049072265625, -5.2911376953125, -5.14178466796875, -4.992431640625, -4.84307861328125, -4.6937255859375, -4.54437255859375, -4.39501953125, -4.24566650390625, -4.0963134765625, -3.94696044921875, -3.797607421875, -3.64825439453125, -3.4989013671875, -3.34954833984375, -3.2001953125, -3.05084228515625, -2.9014892578125, -2.75213623046875, -2.602783203125, -2.45343017578125, -2.3040771484375, -2.15472412109375, -2.00537109375, -1.85601806640625, -1.7066650390625, -1.55731201171875, -1.407958984375, -1.25860595703125, -1.1092529296875, -0.95989990234375, -0.810546875, -0.66119384765625, -0.5118408203125, -0.36248779296875, -0.213134765625, -0.06378173828125, 0.0855712890625, 0.23492431640625, 0.38427734375, 0.53363037109375, 0.6829833984375, 0.83233642578125, 0.981689453125, 1.13104248046875, 1.2803955078125, 1.42974853515625, 1.5791015625, 1.72845458984375, 1.8778076171875, 2.02716064453125, 2.176513671875, 2.32586669921875, 2.4752197265625, 2.62457275390625, 2.77392578125, 2.92327880859375, 3.0726318359375, 3.22198486328125, 3.371337890625, 3.52069091796875, 3.6700439453125, 3.81939697265625, 3.96875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 4.0, 8.0, 17.0, 9.0, 30.0, 33.0, 48.0, 98.0, 189.0, 347.0, 749.0, 1019.0, 692.0, 330.0, 182.0, 94.0, 58.0, 42.0, 26.0, 17.0, 19.0, 12.0, 9.0, 4.0, 6.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-3.892578125, -3.782928466796875, -3.67327880859375, -3.563629150390625, -3.4539794921875, -3.344329833984375, -3.23468017578125, -3.125030517578125, -3.015380859375, -2.905731201171875, -2.79608154296875, -2.686431884765625, -2.5767822265625, -2.467132568359375, -2.35748291015625, -2.247833251953125, -2.13818359375, -2.028533935546875, -1.91888427734375, -1.809234619140625, -1.6995849609375, -1.589935302734375, -1.48028564453125, -1.370635986328125, -1.260986328125, -1.151336669921875, -1.04168701171875, -0.932037353515625, -0.8223876953125, -0.712738037109375, -0.60308837890625, -0.493438720703125, -0.3837890625, -0.274139404296875, -0.16448974609375, -0.054840087890625, 0.0548095703125, 0.164459228515625, 0.27410888671875, 0.383758544921875, 0.493408203125, 0.603057861328125, 0.71270751953125, 0.822357177734375, 0.9320068359375, 1.041656494140625, 1.15130615234375, 1.260955810546875, 1.37060546875, 1.480255126953125, 1.58990478515625, 1.699554443359375, 1.8092041015625, 1.918853759765625, 2.02850341796875, 2.138153076171875, 2.247802734375, 2.357452392578125, 2.46710205078125, 2.576751708984375, 2.6864013671875, 2.796051025390625, 2.90570068359375, 3.015350341796875, 3.125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 14.0, 23.0, 57.0, 133.0, 247.0, 261.0, 135.0, 72.0, 27.0, 10.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.351806640625, -31.060998916625977, -29.770191192626953, -28.47938346862793, -27.188575744628906, -25.897769927978516, -24.606962203979492, -23.31615447998047, -22.025346755981445, -20.734539031982422, -19.4437313079834, -18.152923583984375, -16.862117767333984, -15.571309089660645, -14.280502319335938, -12.989694595336914, -11.69888687133789, -10.408079147338867, -9.117271423339844, -7.826464653015137, -6.535656929016113, -5.24484920501709, -3.9540419578552246, -2.6632347106933594, -1.372426986694336, -0.0816195011138916, 1.2091879844665527, 2.499995470046997, 3.7908029556274414, 5.081610679626465, 6.37241792678833, 7.663225173950195, 8.954032897949219, 10.244840621948242, 11.535648345947266, 12.826455116271973, 14.117262840270996, 15.40807056427002, 16.698877334594727, 17.98968505859375, 19.280492782592773, 20.571300506591797, 21.86210823059082, 23.152915954589844, 24.443721771240234, 25.73453140258789, 27.02533721923828, 28.316144943237305, 29.606952667236328, 30.89776039123535, 32.188568115234375, 33.479373931884766, 34.77018356323242, 36.06098937988281, 37.35179901123047, 38.64260482788086, 39.93341064453125, 41.22421646118164, 42.5150260925293, 43.80583190917969, 45.096641540527344, 46.387447357177734, 47.67825698852539, 48.96906280517578, 50.25987243652344]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 6.0, 7.0, 12.0, 20.0, 18.0, 17.0, 41.0, 29.0, 51.0, 65.0, 70.0, 65.0, 90.0, 68.0, 69.0, 60.0, 48.0, 53.0, 53.0, 42.0, 26.0, 26.0, 17.0, 13.0, 12.0, 14.0, 7.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.75351333618164, -14.104641914367676, -13.455771446228027, -12.806900024414062, -12.158029556274414, -11.50915813446045, -10.860286712646484, -10.211416244506836, -9.562544822692871, -8.913673400878906, -8.264802932739258, -7.615931510925293, -6.967060565948486, -6.31818962097168, -5.669318199157715, -5.020447254180908, -4.371576309204102, -3.722705364227295, -3.073834180831909, -2.4249629974365234, -1.7760920524597168, -1.1272211074829102, -0.4783499240875244, 0.17052125930786133, 0.819392204284668, 1.4682632684707642, 2.1171343326568604, 2.766005516052246, 3.4148764610290527, 4.063747406005859, 4.712618827819824, 5.361489772796631, 6.010358810424805, 6.659229755401611, 7.308100700378418, 7.956972122192383, 8.605842590332031, 9.254714012145996, 9.903585433959961, 10.55245590209961, 11.201327323913574, 11.850198745727539, 12.499069213867188, 13.147940635681152, 13.796812057495117, 14.445682525634766, 15.09455394744873, 15.743425369262695, 16.392295837402344, 17.041166305541992, 17.690038681030273, 18.338909149169922, 18.98777961730957, 19.63665008544922, 20.2855224609375, 20.93439292907715, 21.583263397216797, 22.232133865356445, 22.881006240844727, 23.529876708984375, 24.178747177124023, 24.827617645263672, 25.476490020751953, 26.1253604888916, 26.774232864379883]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 8.0, 5.0, 12.0, 27.0, 36.0, 48.0, 68.0, 96.0, 137.0, 242.0, 418.0, 752.0, 1424.0, 3050.0, 7073.0, 17776.0, 49334.0, 153183.0, 403817.0, 273452.0, 87198.0, 30075.0, 11222.0, 4471.0, 2106.0, 1101.0, 574.0, 299.0, 189.0, 123.0, 78.0, 47.0, 33.0, 23.0, 14.0, 19.0, 12.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0], "bins": [-3.826171875, -3.727447509765625, -3.62872314453125, -3.529998779296875, -3.4312744140625, -3.332550048828125, -3.23382568359375, -3.135101318359375, -3.036376953125, -2.937652587890625, -2.83892822265625, -2.740203857421875, -2.6414794921875, -2.542755126953125, -2.44403076171875, -2.345306396484375, -2.24658203125, -2.147857666015625, -2.04913330078125, -1.950408935546875, -1.8516845703125, -1.752960205078125, -1.65423583984375, -1.555511474609375, -1.456787109375, -1.358062744140625, -1.25933837890625, -1.160614013671875, -1.0618896484375, -0.963165283203125, -0.86444091796875, -0.765716552734375, -0.6669921875, -0.568267822265625, -0.46954345703125, -0.370819091796875, -0.2720947265625, -0.173370361328125, -0.07464599609375, 0.024078369140625, 0.122802734375, 0.221527099609375, 0.32025146484375, 0.418975830078125, 0.5177001953125, 0.616424560546875, 0.71514892578125, 0.813873291015625, 0.91259765625, 1.011322021484375, 1.11004638671875, 1.208770751953125, 1.3074951171875, 1.406219482421875, 1.50494384765625, 1.603668212890625, 1.702392578125, 1.801116943359375, 1.89984130859375, 1.998565673828125, 2.0972900390625, 2.196014404296875, 2.29473876953125, 2.393463134765625, 2.4921875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 6.0, 6.0, 10.0, 9.0, 23.0, 16.0, 27.0, 27.0, 40.0, 57.0, 47.0, 48.0, 74.0, 71.0, 67.0, 66.0, 57.0, 48.0, 64.0, 54.0, 38.0, 31.0, 23.0, 37.0, 11.0, 13.0, 12.0, 10.0, 9.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.2988128662109375, -2.236297607421875, -2.1737823486328125, -2.11126708984375, -2.0487518310546875, -1.986236572265625, -1.9237213134765625, -1.8612060546875, -1.7986907958984375, -1.736175537109375, -1.6736602783203125, -1.61114501953125, -1.5486297607421875, -1.486114501953125, -1.4235992431640625, -1.361083984375, -1.2985687255859375, -1.236053466796875, -1.1735382080078125, -1.11102294921875, -1.0485076904296875, -0.985992431640625, -0.9234771728515625, -0.8609619140625, -0.7984466552734375, -0.735931396484375, -0.6734161376953125, -0.61090087890625, -0.5483856201171875, -0.485870361328125, -0.4233551025390625, -0.36083984375, -0.2983245849609375, -0.235809326171875, -0.1732940673828125, -0.11077880859375, -0.0482635498046875, 0.014251708984375, 0.0767669677734375, 0.1392822265625, 0.2017974853515625, 0.264312744140625, 0.3268280029296875, 0.38934326171875, 0.4518585205078125, 0.514373779296875, 0.5768890380859375, 0.639404296875, 0.7019195556640625, 0.764434814453125, 0.8269500732421875, 0.88946533203125, 0.9519805908203125, 1.014495849609375, 1.0770111083984375, 1.1395263671875, 1.2020416259765625, 1.264556884765625, 1.3270721435546875, 1.38958740234375, 1.4521026611328125, 1.514617919921875, 1.5771331787109375, 1.6396484375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 5.0, 9.0, 9.0, 13.0, 24.0, 25.0, 33.0, 59.0, 77.0, 167.0, 263.0, 481.0, 1089.0, 3687.0, 22363.0, 310428.0, 660873.0, 40662.0, 5424.0, 1476.0, 596.0, 320.0, 161.0, 100.0, 65.0, 43.0, 33.0, 16.0, 15.0, 14.0, 13.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.03125, -7.788818359375, -7.54638671875, -7.303955078125, -7.0615234375, -6.819091796875, -6.57666015625, -6.334228515625, -6.091796875, -5.849365234375, -5.60693359375, -5.364501953125, -5.1220703125, -4.879638671875, -4.63720703125, -4.394775390625, -4.15234375, -3.909912109375, -3.66748046875, -3.425048828125, -3.1826171875, -2.940185546875, -2.69775390625, -2.455322265625, -2.212890625, -1.970458984375, -1.72802734375, -1.485595703125, -1.2431640625, -1.000732421875, -0.75830078125, -0.515869140625, -0.2734375, -0.031005859375, 0.21142578125, 0.453857421875, 0.6962890625, 0.938720703125, 1.18115234375, 1.423583984375, 1.666015625, 1.908447265625, 2.15087890625, 2.393310546875, 2.6357421875, 2.878173828125, 3.12060546875, 3.363037109375, 3.60546875, 3.847900390625, 4.09033203125, 4.332763671875, 4.5751953125, 4.817626953125, 5.06005859375, 5.302490234375, 5.544921875, 5.787353515625, 6.02978515625, 6.272216796875, 6.5146484375, 6.757080078125, 6.99951171875, 7.241943359375, 7.484375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 9.0, 8.0, 6.0, 7.0, 12.0, 13.0, 19.0, 20.0, 27.0, 17.0, 31.0, 20.0, 31.0, 34.0, 41.0, 29.0, 36.0, 37.0, 54.0, 38.0, 59.0, 43.0, 45.0, 38.0, 36.0, 41.0, 28.0, 28.0, 33.0, 25.0, 20.0, 15.0, 19.0, 15.0, 14.0, 6.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.4844970703125, -4.324462890625, -4.1644287109375, -4.00439453125, -3.8443603515625, -3.684326171875, -3.5242919921875, -3.3642578125, -3.2042236328125, -3.044189453125, -2.8841552734375, -2.72412109375, -2.5640869140625, -2.404052734375, -2.2440185546875, -2.083984375, -1.9239501953125, -1.763916015625, -1.6038818359375, -1.44384765625, -1.2838134765625, -1.123779296875, -0.9637451171875, -0.8037109375, -0.6436767578125, -0.483642578125, -0.3236083984375, -0.16357421875, -0.0035400390625, 0.156494140625, 0.3165283203125, 0.4765625, 0.6365966796875, 0.796630859375, 0.9566650390625, 1.11669921875, 1.2767333984375, 1.436767578125, 1.5968017578125, 1.7568359375, 1.9168701171875, 2.076904296875, 2.2369384765625, 2.39697265625, 2.5570068359375, 2.717041015625, 2.8770751953125, 3.037109375, 3.1971435546875, 3.357177734375, 3.5172119140625, 3.67724609375, 3.8372802734375, 3.997314453125, 4.1573486328125, 4.3173828125, 4.4774169921875, 4.637451171875, 4.7974853515625, 4.95751953125, 5.1175537109375, 5.277587890625, 5.4376220703125, 5.59765625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 8.0, 14.0, 12.0, 30.0, 92.0, 330.0, 2507.0, 814417.0, 229010.0, 1748.0, 226.0, 75.0, 37.0, 11.0, 11.0, 6.0, 3.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.9375, -10.6243896484375, -10.311279296875, -9.9981689453125, -9.68505859375, -9.3719482421875, -9.058837890625, -8.7457275390625, -8.4326171875, -8.1195068359375, -7.806396484375, -7.4932861328125, -7.18017578125, -6.8670654296875, -6.553955078125, -6.2408447265625, -5.927734375, -5.6146240234375, -5.301513671875, -4.9884033203125, -4.67529296875, -4.3621826171875, -4.049072265625, -3.7359619140625, -3.4228515625, -3.1097412109375, -2.796630859375, -2.4835205078125, -2.17041015625, -1.8572998046875, -1.544189453125, -1.2310791015625, -0.91796875, -0.6048583984375, -0.291748046875, 0.0213623046875, 0.33447265625, 0.6475830078125, 0.960693359375, 1.2738037109375, 1.5869140625, 1.9000244140625, 2.213134765625, 2.5262451171875, 2.83935546875, 3.1524658203125, 3.465576171875, 3.7786865234375, 4.091796875, 4.4049072265625, 4.718017578125, 5.0311279296875, 5.34423828125, 5.6573486328125, 5.970458984375, 6.2835693359375, 6.5966796875, 6.9097900390625, 7.222900390625, 7.5360107421875, 7.84912109375, 8.1622314453125, 8.475341796875, 8.7884521484375, 9.1015625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 4.0, 9.0, 8.0, 13.0, 12.0, 13.0, 24.0, 22.0, 36.0, 59.0, 74.0, 93.0, 114.0, 123.0, 107.0, 77.0, 47.0, 42.0, 18.0, 25.0, 20.0, 9.0, 18.0, 8.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.00036144256591796875, -0.0003513917326927185, -0.00034134089946746826, -0.000331290066242218, -0.0003212392330169678, -0.00031118839979171753, -0.0003011375665664673, -0.00029108673334121704, -0.0002810359001159668, -0.00027098506689071655, -0.0002609342336654663, -0.00025088340044021606, -0.00024083256721496582, -0.00023078173398971558, -0.00022073090076446533, -0.0002106800675392151, -0.00020062923431396484, -0.0001905784010887146, -0.00018052756786346436, -0.0001704767346382141, -0.00016042590141296387, -0.00015037506818771362, -0.00014032423496246338, -0.00013027340173721313, -0.00012022256851196289, -0.00011017173528671265, -0.0001001209020614624, -9.007006883621216e-05, -8.001923561096191e-05, -6.996840238571167e-05, -5.9917569160461426e-05, -4.986673593521118e-05, -3.981590270996094e-05, -2.9765069484710693e-05, -1.971423625946045e-05, -9.663403034210205e-06, 3.8743019104003906e-07, 1.0438263416290283e-05, 2.0489096641540527e-05, 3.053992986679077e-05, 4.0590763092041016e-05, 5.064159631729126e-05, 6.0692429542541504e-05, 7.074326276779175e-05, 8.079409599304199e-05, 9.084492921829224e-05, 0.00010089576244354248, 0.00011094659566879272, 0.00012099742889404297, 0.0001310482621192932, 0.00014109909534454346, 0.0001511499285697937, 0.00016120076179504395, 0.0001712515950202942, 0.00018130242824554443, 0.00019135326147079468, 0.00020140409469604492, 0.00021145492792129517, 0.0002215057611465454, 0.00023155659437179565, 0.0002416074275970459, 0.00025165826082229614, 0.0002617090940475464, 0.00027175992727279663, 0.0002818107604980469]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 8.0, 10.0, 11.0, 13.0, 43.0, 66.0, 115.0, 246.0, 513.0, 1439.0, 5780.0, 50139.0, 880355.0, 98575.0, 8181.0, 1841.0, 655.0, 269.0, 121.0, 63.0, 39.0, 22.0, 16.0, 7.0, 5.0, 5.0, 8.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.75390625, -2.6419677734375, -2.530029296875, -2.4180908203125, -2.30615234375, -2.1942138671875, -2.082275390625, -1.9703369140625, -1.8583984375, -1.7464599609375, -1.634521484375, -1.5225830078125, -1.41064453125, -1.2987060546875, -1.186767578125, -1.0748291015625, -0.962890625, -0.8509521484375, -0.739013671875, -0.6270751953125, -0.51513671875, -0.4031982421875, -0.291259765625, -0.1793212890625, -0.0673828125, 0.0445556640625, 0.156494140625, 0.2684326171875, 0.38037109375, 0.4923095703125, 0.604248046875, 0.7161865234375, 0.828125, 0.9400634765625, 1.052001953125, 1.1639404296875, 1.27587890625, 1.3878173828125, 1.499755859375, 1.6116943359375, 1.7236328125, 1.8355712890625, 1.947509765625, 2.0594482421875, 2.17138671875, 2.2833251953125, 2.395263671875, 2.5072021484375, 2.619140625, 2.7310791015625, 2.843017578125, 2.9549560546875, 3.06689453125, 3.1788330078125, 3.290771484375, 3.4027099609375, 3.5146484375, 3.6265869140625, 3.738525390625, 3.8504638671875, 3.96240234375, 4.0743408203125, 4.186279296875, 4.2982177734375, 4.41015625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 12.0, 16.0, 20.0, 19.0, 21.0, 46.0, 50.0, 71.0, 87.0, 97.0, 86.0, 78.0, 88.0, 64.0, 65.0, 41.0, 29.0, 25.0, 21.0, 15.0, 11.0, 2.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5166015625, -1.4600067138671875, -1.403411865234375, -1.3468170166015625, -1.29022216796875, -1.2336273193359375, -1.177032470703125, -1.1204376220703125, -1.0638427734375, -1.0072479248046875, -0.950653076171875, -0.8940582275390625, -0.83746337890625, -0.7808685302734375, -0.724273681640625, -0.6676788330078125, -0.611083984375, -0.5544891357421875, -0.497894287109375, -0.4412994384765625, -0.38470458984375, -0.3281097412109375, -0.271514892578125, -0.2149200439453125, -0.1583251953125, -0.1017303466796875, -0.045135498046875, 0.0114593505859375, 0.06805419921875, 0.1246490478515625, 0.181243896484375, 0.2378387451171875, 0.29443359375, 0.3510284423828125, 0.407623291015625, 0.4642181396484375, 0.52081298828125, 0.5774078369140625, 0.634002685546875, 0.6905975341796875, 0.7471923828125, 0.8037872314453125, 0.860382080078125, 0.9169769287109375, 0.97357177734375, 1.0301666259765625, 1.086761474609375, 1.1433563232421875, 1.199951171875, 1.2565460205078125, 1.313140869140625, 1.3697357177734375, 1.42633056640625, 1.4829254150390625, 1.539520263671875, 1.5961151123046875, 1.6527099609375, 1.7093048095703125, 1.765899658203125, 1.8224945068359375, 1.87908935546875, 1.9356842041015625, 1.992279052734375, 2.0488739013671875, 2.10546875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 15.0, 45.0, 123.0, 369.0, 290.0, 105.0, 39.0, 4.0, 7.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.2984390258789, -80.83534240722656, -78.37224578857422, -75.90914916992188, -73.44605255126953, -70.98295593261719, -68.51985931396484, -66.0567626953125, -63.59366989135742, -61.13057327270508, -58.667476654052734, -56.20438003540039, -53.74128723144531, -51.27819061279297, -48.815093994140625, -46.35199737548828, -43.88890075683594, -41.425804138183594, -38.96270751953125, -36.499610900878906, -34.03651428222656, -31.57341957092285, -29.11032485961914, -26.647228240966797, -24.184131622314453, -21.72103500366211, -19.257938385009766, -16.794843673706055, -14.331747055053711, -11.868650436401367, -9.40555477142334, -6.9424591064453125, -4.479362487792969, -2.016266345977783, 0.44682979583740234, 2.909925937652588, 5.373022079467773, 7.836118698120117, 10.299214363098145, 12.762310028076172, 15.225406646728516, 17.68850326538086, 20.151599884033203, 22.614694595336914, 25.077791213989258, 27.5408878326416, 30.003982543945312, 32.467079162597656, 34.93017578125, 37.393272399902344, 39.85636901855469, 42.31946563720703, 44.782562255859375, 47.24565887451172, 49.7087516784668, 52.17184829711914, 54.634944915771484, 57.09804153442383, 59.56113815307617, 62.024234771728516, 64.4873275756836, 66.95042419433594, 69.41352081298828, 71.87661743164062, 74.33971405029297]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 1.0, 8.0, 4.0, 8.0, 11.0, 15.0, 17.0, 12.0, 14.0, 14.0, 21.0, 27.0, 35.0, 27.0, 28.0, 32.0, 39.0, 48.0, 45.0, 50.0, 74.0, 28.0, 52.0, 39.0, 34.0, 33.0, 45.0, 36.0, 25.0, 23.0, 28.0, 20.0, 30.0, 16.0, 9.0, 13.0, 11.0, 7.0, 3.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.85574722290039, -20.12257194519043, -19.38939666748047, -18.656221389770508, -17.923046112060547, -17.189868927001953, -16.456695556640625, -15.723518371582031, -14.99034309387207, -14.25716781616211, -13.523992538452148, -12.790817260742188, -12.05764102935791, -11.32446575164795, -10.591290473937988, -9.858114242553711, -9.124939918518066, -8.391764640808105, -7.658588886260986, -6.925413608551025, -6.192237854003906, -5.459062576293945, -4.725887298583984, -3.9927115440368652, -3.2595362663269043, -2.5263607501983643, -1.7931853532791138, -1.0600099563598633, -0.32683444023132324, 0.4063410758972168, 1.1395163536071777, 1.8726921081542969, 2.605867385864258, 3.339042901992798, 4.072218418121338, 4.805393695831299, 5.538569450378418, 6.271744728088379, 7.00492000579834, 7.738095760345459, 8.471271514892578, 9.204446792602539, 9.9376220703125, 10.670797348022461, 11.403973579406738, 12.1371488571167, 12.87032413482666, 13.603500366210938, 14.336674690246582, 15.069849967956543, 15.803025245666504, 16.53620147705078, 17.269376754760742, 18.002552032470703, 18.735727310180664, 19.468902587890625, 20.202077865600586, 20.935253143310547, 21.668428421020508, 22.40160369873047, 23.13477897644043, 23.86795425415039, 24.601131439208984, 25.334306716918945, 26.067481994628906]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 9.0, 17.0, 20.0, 36.0, 63.0, 126.0, 241.0, 538.0, 1290.0, 4065.0, 15713.0, 114993.0, 2860189.0, 1126398.0, 56294.0, 9833.0, 2600.0, 976.0, 413.0, 197.0, 101.0, 50.0, 44.0, 23.0, 13.0, 8.0, 7.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51171875, -4.39556884765625, -4.2794189453125, -4.16326904296875, -4.047119140625, -3.93096923828125, -3.8148193359375, -3.69866943359375, -3.58251953125, -3.46636962890625, -3.3502197265625, -3.23406982421875, -3.117919921875, -3.00177001953125, -2.8856201171875, -2.76947021484375, -2.6533203125, -2.53717041015625, -2.4210205078125, -2.30487060546875, -2.188720703125, -2.07257080078125, -1.9564208984375, -1.84027099609375, -1.72412109375, -1.60797119140625, -1.4918212890625, -1.37567138671875, -1.259521484375, -1.14337158203125, -1.0272216796875, -0.91107177734375, -0.794921875, -0.67877197265625, -0.5626220703125, -0.44647216796875, -0.330322265625, -0.21417236328125, -0.0980224609375, 0.01812744140625, 0.13427734375, 0.25042724609375, 0.3665771484375, 0.48272705078125, 0.598876953125, 0.71502685546875, 0.8311767578125, 0.94732666015625, 1.0634765625, 1.17962646484375, 1.2957763671875, 1.41192626953125, 1.528076171875, 1.64422607421875, 1.7603759765625, 1.87652587890625, 1.99267578125, 2.10882568359375, 2.2249755859375, 2.34112548828125, 2.457275390625, 2.57342529296875, 2.6895751953125, 2.80572509765625, 2.921875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 8.0, 11.0, 10.0, 21.0, 22.0, 18.0, 20.0, 24.0, 42.0, 35.0, 31.0, 38.0, 51.0, 52.0, 51.0, 67.0, 48.0, 45.0, 43.0, 35.0, 46.0, 46.0, 36.0, 32.0, 24.0, 28.0, 16.0, 26.0, 19.0, 22.0, 10.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5029296875, -1.4599761962890625, -1.417022705078125, -1.3740692138671875, -1.33111572265625, -1.2881622314453125, -1.245208740234375, -1.2022552490234375, -1.1593017578125, -1.1163482666015625, -1.073394775390625, -1.0304412841796875, -0.98748779296875, -0.9445343017578125, -0.901580810546875, -0.8586273193359375, -0.815673828125, -0.7727203369140625, -0.729766845703125, -0.6868133544921875, -0.64385986328125, -0.6009063720703125, -0.557952880859375, -0.5149993896484375, -0.4720458984375, -0.4290924072265625, -0.386138916015625, -0.3431854248046875, -0.30023193359375, -0.2572784423828125, -0.214324951171875, -0.1713714599609375, -0.12841796875, -0.0854644775390625, -0.042510986328125, 0.0004425048828125, 0.04339599609375, 0.0863494873046875, 0.129302978515625, 0.1722564697265625, 0.2152099609375, 0.2581634521484375, 0.301116943359375, 0.3440704345703125, 0.38702392578125, 0.4299774169921875, 0.472930908203125, 0.5158843994140625, 0.558837890625, 0.6017913818359375, 0.644744873046875, 0.6876983642578125, 0.73065185546875, 0.7736053466796875, 0.816558837890625, 0.8595123291015625, 0.9024658203125, 0.9454193115234375, 0.988372802734375, 1.0313262939453125, 1.07427978515625, 1.1172332763671875, 1.160186767578125, 1.2031402587890625, 1.24609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 8.0, 27.0, 41.0, 59.0, 119.0, 217.0, 436.0, 1184.0, 4319.0, 22164.0, 206626.0, 3552535.0, 364556.0, 33423.0, 5999.0, 1526.0, 516.0, 236.0, 106.0, 52.0, 28.0, 31.0, 18.0, 12.0, 12.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.21875, -5.0869140625, -4.955078125, -4.8232421875, -4.69140625, -4.5595703125, -4.427734375, -4.2958984375, -4.1640625, -4.0322265625, -3.900390625, -3.7685546875, -3.63671875, -3.5048828125, -3.373046875, -3.2412109375, -3.109375, -2.9775390625, -2.845703125, -2.7138671875, -2.58203125, -2.4501953125, -2.318359375, -2.1865234375, -2.0546875, -1.9228515625, -1.791015625, -1.6591796875, -1.52734375, -1.3955078125, -1.263671875, -1.1318359375, -1.0, -0.8681640625, -0.736328125, -0.6044921875, -0.47265625, -0.3408203125, -0.208984375, -0.0771484375, 0.0546875, 0.1865234375, 0.318359375, 0.4501953125, 0.58203125, 0.7138671875, 0.845703125, 0.9775390625, 1.109375, 1.2412109375, 1.373046875, 1.5048828125, 1.63671875, 1.7685546875, 1.900390625, 2.0322265625, 2.1640625, 2.2958984375, 2.427734375, 2.5595703125, 2.69140625, 2.8232421875, 2.955078125, 3.0869140625, 3.21875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 13.0, 16.0, 17.0, 30.0, 45.0, 66.0, 114.0, 204.0, 372.0, 651.0, 902.0, 677.0, 337.0, 194.0, 131.0, 71.0, 58.0, 43.0, 38.0, 20.0, 23.0, 10.0, 7.0, 4.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.21875, -4.103363037109375, -3.98797607421875, -3.872589111328125, -3.7572021484375, -3.641815185546875, -3.52642822265625, -3.411041259765625, -3.295654296875, -3.180267333984375, -3.06488037109375, -2.949493408203125, -2.8341064453125, -2.718719482421875, -2.60333251953125, -2.487945556640625, -2.37255859375, -2.257171630859375, -2.14178466796875, -2.026397705078125, -1.9110107421875, -1.795623779296875, -1.68023681640625, -1.564849853515625, -1.449462890625, -1.334075927734375, -1.21868896484375, -1.103302001953125, -0.9879150390625, -0.872528076171875, -0.75714111328125, -0.641754150390625, -0.5263671875, -0.410980224609375, -0.29559326171875, -0.180206298828125, -0.0648193359375, 0.050567626953125, 0.16595458984375, 0.281341552734375, 0.396728515625, 0.512115478515625, 0.62750244140625, 0.742889404296875, 0.8582763671875, 0.973663330078125, 1.08905029296875, 1.204437255859375, 1.31982421875, 1.435211181640625, 1.55059814453125, 1.665985107421875, 1.7813720703125, 1.896759033203125, 2.01214599609375, 2.127532958984375, 2.242919921875, 2.358306884765625, 2.47369384765625, 2.589080810546875, 2.7044677734375, 2.819854736328125, 2.93524169921875, 3.050628662109375, 3.166015625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 22.0, 35.0, 75.0, 111.0, 149.0, 201.0, 179.0, 92.0, 47.0, 40.0, 11.0, 6.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.58943557739258, -34.51499938964844, -33.44056701660156, -32.36613082885742, -31.291696548461914, -30.217262268066406, -29.142826080322266, -28.068391799926758, -26.99395751953125, -25.919523239135742, -24.8450870513916, -23.770652770996094, -22.696218490600586, -21.621784210205078, -20.547348022460938, -19.47291374206543, -18.39847755432129, -17.32404327392578, -16.24960708618164, -15.175172805786133, -14.100738525390625, -13.0263032913208, -11.951868057250977, -10.877433776855469, -9.802998542785645, -8.72856330871582, -7.6541290283203125, -6.579693794250488, -5.505259037017822, -4.430824279785156, -3.356389045715332, -2.281954288482666, -1.20751953125, -0.13308465480804443, 0.9413502216339111, 2.0157852172851562, 3.0902199745178223, 4.164654731750488, 5.2390899658203125, 6.3135247230529785, 7.3879594802856445, 8.462394714355469, 9.536828994750977, 10.6112642288208, 11.685699462890625, 12.760133743286133, 13.834568977355957, 14.909004211425781, 15.983438491821289, 17.057872772216797, 18.132308959960938, 19.206743240356445, 20.281177520751953, 21.355613708496094, 22.4300479888916, 23.50448226928711, 24.57891845703125, 25.653352737426758, 26.7277889251709, 27.802223205566406, 28.876657485961914, 29.951091766357422, 31.025527954101562, 32.0999641418457, 33.17439651489258]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 10.0, 14.0, 19.0, 18.0, 22.0, 29.0, 39.0, 52.0, 56.0, 66.0, 75.0, 71.0, 63.0, 60.0, 63.0, 67.0, 57.0, 48.0, 38.0, 30.0, 39.0, 17.0, 19.0, 12.0, 9.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.276994705200195, -13.583927154541016, -12.890860557556152, -12.197793960571289, -11.50472640991211, -10.81165885925293, -10.118592262268066, -9.425525665283203, -8.732458114624023, -8.039390563964844, -7.3463239669799805, -6.653256893157959, -5.9601898193359375, -5.267122745513916, -4.5740556716918945, -3.880988597869873, -3.1879215240478516, -2.49485445022583, -1.8017873764038086, -1.108720302581787, -0.4156532287597656, 0.27741384506225586, 0.9704809188842773, 1.6635479927062988, 2.3566150665283203, 3.049682140350342, 3.7427492141723633, 4.435816287994385, 5.128883361816406, 5.821950435638428, 6.515017509460449, 7.208084583282471, 7.901151657104492, 8.594219207763672, 9.287285804748535, 9.980352401733398, 10.673419952392578, 11.366487503051758, 12.059554100036621, 12.752620697021484, 13.445688247680664, 14.138755798339844, 14.831822395324707, 15.52488899230957, 16.21795654296875, 16.91102409362793, 17.60409164428711, 18.297157287597656, 18.990224838256836, 19.683292388916016, 20.376358032226562, 21.069425582885742, 21.762493133544922, 22.4555606842041, 23.14862823486328, 23.841693878173828, 24.534761428833008, 25.227828979492188, 25.920894622802734, 26.613962173461914, 27.307029724121094, 28.000097274780273, 28.693164825439453, 29.38623046875, 30.07929801940918]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 8.0, 14.0, 14.0, 23.0, 36.0, 64.0, 103.0, 223.0, 431.0, 1030.0, 3026.0, 11955.0, 72044.0, 445813.0, 428575.0, 68704.0, 11605.0, 2916.0, 1041.0, 463.0, 194.0, 125.0, 54.0, 34.0, 21.0, 11.0, 7.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25390625, -4.0902099609375, -3.926513671875, -3.7628173828125, -3.59912109375, -3.4354248046875, -3.271728515625, -3.1080322265625, -2.9443359375, -2.7806396484375, -2.616943359375, -2.4532470703125, -2.28955078125, -2.1258544921875, -1.962158203125, -1.7984619140625, -1.634765625, -1.4710693359375, -1.307373046875, -1.1436767578125, -0.97998046875, -0.8162841796875, -0.652587890625, -0.4888916015625, -0.3251953125, -0.1614990234375, 0.002197265625, 0.1658935546875, 0.32958984375, 0.4932861328125, 0.656982421875, 0.8206787109375, 0.984375, 1.1480712890625, 1.311767578125, 1.4754638671875, 1.63916015625, 1.8028564453125, 1.966552734375, 2.1302490234375, 2.2939453125, 2.4576416015625, 2.621337890625, 2.7850341796875, 2.94873046875, 3.1124267578125, 3.276123046875, 3.4398193359375, 3.603515625, 3.7672119140625, 3.930908203125, 4.0946044921875, 4.25830078125, 4.4219970703125, 4.585693359375, 4.7493896484375, 4.9130859375, 5.0767822265625, 5.240478515625, 5.4041748046875, 5.56787109375, 5.7315673828125, 5.895263671875, 6.0589599609375, 6.22265625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 10.0, 13.0, 18.0, 17.0, 24.0, 21.0, 37.0, 43.0, 42.0, 35.0, 39.0, 40.0, 52.0, 58.0, 54.0, 60.0, 46.0, 47.0, 52.0, 41.0, 42.0, 31.0, 34.0, 31.0, 26.0, 23.0, 18.0, 5.0, 12.0, 10.0, 7.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3037109375, -1.258270263671875, -1.21282958984375, -1.167388916015625, -1.1219482421875, -1.076507568359375, -1.03106689453125, -0.985626220703125, -0.940185546875, -0.894744873046875, -0.84930419921875, -0.803863525390625, -0.7584228515625, -0.712982177734375, -0.66754150390625, -0.622100830078125, -0.57666015625, -0.531219482421875, -0.48577880859375, -0.440338134765625, -0.3948974609375, -0.349456787109375, -0.30401611328125, -0.258575439453125, -0.213134765625, -0.167694091796875, -0.12225341796875, -0.076812744140625, -0.0313720703125, 0.014068603515625, 0.05950927734375, 0.104949951171875, 0.150390625, 0.195831298828125, 0.24127197265625, 0.286712646484375, 0.3321533203125, 0.377593994140625, 0.42303466796875, 0.468475341796875, 0.513916015625, 0.559356689453125, 0.60479736328125, 0.650238037109375, 0.6956787109375, 0.741119384765625, 0.78656005859375, 0.832000732421875, 0.87744140625, 0.922882080078125, 0.96832275390625, 1.013763427734375, 1.0592041015625, 1.104644775390625, 1.15008544921875, 1.195526123046875, 1.240966796875, 1.286407470703125, 1.33184814453125, 1.377288818359375, 1.4227294921875, 1.468170166015625, 1.51361083984375, 1.559051513671875, 1.6044921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 5.0, 8.0, 11.0, 16.0, 24.0, 36.0, 84.0, 108.0, 260.0, 584.0, 1580.0, 6807.0, 230386.0, 793115.0, 12032.0, 2082.0, 749.0, 320.0, 131.0, 83.0, 40.0, 36.0, 18.0, 13.0, 10.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0234375, -12.5762939453125, -12.129150390625, -11.6820068359375, -11.23486328125, -10.7877197265625, -10.340576171875, -9.8934326171875, -9.4462890625, -8.9991455078125, -8.552001953125, -8.1048583984375, -7.65771484375, -7.2105712890625, -6.763427734375, -6.3162841796875, -5.869140625, -5.4219970703125, -4.974853515625, -4.5277099609375, -4.08056640625, -3.6334228515625, -3.186279296875, -2.7391357421875, -2.2919921875, -1.8448486328125, -1.397705078125, -0.9505615234375, -0.50341796875, -0.0562744140625, 0.390869140625, 0.8380126953125, 1.28515625, 1.7322998046875, 2.179443359375, 2.6265869140625, 3.07373046875, 3.5208740234375, 3.968017578125, 4.4151611328125, 4.8623046875, 5.3094482421875, 5.756591796875, 6.2037353515625, 6.65087890625, 7.0980224609375, 7.545166015625, 7.9923095703125, 8.439453125, 8.8865966796875, 9.333740234375, 9.7808837890625, 10.22802734375, 10.6751708984375, 11.122314453125, 11.5694580078125, 12.0166015625, 12.4637451171875, 12.910888671875, 13.3580322265625, 13.80517578125, 14.2523193359375, 14.699462890625, 15.1466064453125, 15.59375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 4.0, 7.0, 14.0, 15.0, 13.0, 31.0, 21.0, 25.0, 27.0, 42.0, 46.0, 61.0, 59.0, 55.0, 57.0, 54.0, 52.0, 56.0, 64.0, 50.0, 51.0, 40.0, 29.0, 30.0, 23.0, 23.0, 10.0, 10.0, 9.0, 8.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.03515625, -4.81719970703125, -4.5992431640625, -4.38128662109375, -4.163330078125, -3.94537353515625, -3.7274169921875, -3.50946044921875, -3.29150390625, -3.07354736328125, -2.8555908203125, -2.63763427734375, -2.419677734375, -2.20172119140625, -1.9837646484375, -1.76580810546875, -1.5478515625, -1.32989501953125, -1.1119384765625, -0.89398193359375, -0.676025390625, -0.45806884765625, -0.2401123046875, -0.02215576171875, 0.19580078125, 0.41375732421875, 0.6317138671875, 0.84967041015625, 1.067626953125, 1.28558349609375, 1.5035400390625, 1.72149658203125, 1.939453125, 2.15740966796875, 2.3753662109375, 2.59332275390625, 2.811279296875, 3.02923583984375, 3.2471923828125, 3.46514892578125, 3.68310546875, 3.90106201171875, 4.1190185546875, 4.33697509765625, 4.554931640625, 4.77288818359375, 4.9908447265625, 5.20880126953125, 5.4267578125, 5.64471435546875, 5.8626708984375, 6.08062744140625, 6.298583984375, 6.51654052734375, 6.7344970703125, 6.95245361328125, 7.17041015625, 7.38836669921875, 7.6063232421875, 7.82427978515625, 8.042236328125, 8.26019287109375, 8.4781494140625, 8.69610595703125, 8.9140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 5.0, 5.0, 17.0, 10.0, 17.0, 26.0, 40.0, 40.0, 74.0, 108.0, 168.0, 332.0, 787.0, 2029.0, 7450.0, 62290.0, 884904.0, 77876.0, 8520.0, 2131.0, 777.0, 360.0, 198.0, 127.0, 68.0, 53.0, 39.0, 26.0, 13.0, 11.0, 9.0, 9.0, 6.0, 6.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.7799072265625, -2.678955078125, -2.5780029296875, -2.47705078125, -2.3760986328125, -2.275146484375, -2.1741943359375, -2.0732421875, -1.9722900390625, -1.871337890625, -1.7703857421875, -1.66943359375, -1.5684814453125, -1.467529296875, -1.3665771484375, -1.265625, -1.1646728515625, -1.063720703125, -0.9627685546875, -0.86181640625, -0.7608642578125, -0.659912109375, -0.5589599609375, -0.4580078125, -0.3570556640625, -0.256103515625, -0.1551513671875, -0.05419921875, 0.0467529296875, 0.147705078125, 0.2486572265625, 0.349609375, 0.4505615234375, 0.551513671875, 0.6524658203125, 0.75341796875, 0.8543701171875, 0.955322265625, 1.0562744140625, 1.1572265625, 1.2581787109375, 1.359130859375, 1.4600830078125, 1.56103515625, 1.6619873046875, 1.762939453125, 1.8638916015625, 1.96484375, 2.0657958984375, 2.166748046875, 2.2677001953125, 2.36865234375, 2.4696044921875, 2.570556640625, 2.6715087890625, 2.7724609375, 2.8734130859375, 2.974365234375, 3.0753173828125, 3.17626953125, 3.2772216796875, 3.378173828125, 3.4791259765625, 3.580078125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 8.0, 9.0, 2.0, 11.0, 16.0, 26.0, 37.0, 41.0, 59.0, 84.0, 133.0, 173.0, 107.0, 81.0, 57.0, 42.0, 38.0, 16.0, 20.0, 11.0, 8.0, 8.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003414154052734375, -0.0003260970115661621, -0.0003107786178588867, -0.00029546022415161133, -0.00028014183044433594, -0.00026482343673706055, -0.00024950504302978516, -0.00023418664932250977, -0.00021886825561523438, -0.00020354986190795898, -0.0001882314682006836, -0.0001729130744934082, -0.0001575946807861328, -0.00014227628707885742, -0.00012695789337158203, -0.00011163949966430664, -9.632110595703125e-05, -8.100271224975586e-05, -6.568431854248047e-05, -5.036592483520508e-05, -3.504753112792969e-05, -1.9729137420654297e-05, -4.410743713378906e-06, 1.0907649993896484e-05, 2.6226043701171875e-05, 4.1544437408447266e-05, 5.6862831115722656e-05, 7.218122482299805e-05, 8.749961853027344e-05, 0.00010281801223754883, 0.00011813640594482422, 0.0001334547996520996, 0.000148773193359375, 0.0001640915870666504, 0.00017940998077392578, 0.00019472837448120117, 0.00021004676818847656, 0.00022536516189575195, 0.00024068355560302734, 0.00025600194931030273, 0.0002713203430175781, 0.0002866387367248535, 0.0003019571304321289, 0.0003172755241394043, 0.0003325939178466797, 0.0003479123115539551, 0.00036323070526123047, 0.00037854909896850586, 0.00039386749267578125, 0.00040918588638305664, 0.00042450428009033203, 0.0004398226737976074, 0.0004551410675048828, 0.0004704594612121582, 0.0004857778549194336, 0.000501096248626709, 0.0005164146423339844, 0.0005317330360412598, 0.0005470514297485352, 0.0005623698234558105, 0.0005776882171630859, 0.0005930066108703613, 0.0006083250045776367, 0.0006236433982849121, 0.0006389617919921875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 11.0, 9.0, 14.0, 22.0, 27.0, 37.0, 52.0, 77.0, 95.0, 166.0, 241.0, 428.0, 840.0, 1799.0, 4738.0, 17008.0, 156208.0, 807145.0, 44796.0, 9070.0, 2935.0, 1226.0, 607.0, 350.0, 218.0, 125.0, 87.0, 52.0, 41.0, 33.0, 25.0, 11.0, 13.0, 12.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.072265625, -2.98516845703125, -2.8980712890625, -2.81097412109375, -2.723876953125, -2.63677978515625, -2.5496826171875, -2.46258544921875, -2.37548828125, -2.28839111328125, -2.2012939453125, -2.11419677734375, -2.027099609375, -1.94000244140625, -1.8529052734375, -1.76580810546875, -1.6787109375, -1.59161376953125, -1.5045166015625, -1.41741943359375, -1.330322265625, -1.24322509765625, -1.1561279296875, -1.06903076171875, -0.98193359375, -0.89483642578125, -0.8077392578125, -0.72064208984375, -0.633544921875, -0.54644775390625, -0.4593505859375, -0.37225341796875, -0.28515625, -0.19805908203125, -0.1109619140625, -0.02386474609375, 0.063232421875, 0.15032958984375, 0.2374267578125, 0.32452392578125, 0.41162109375, 0.49871826171875, 0.5858154296875, 0.67291259765625, 0.760009765625, 0.84710693359375, 0.9342041015625, 1.02130126953125, 1.1083984375, 1.19549560546875, 1.2825927734375, 1.36968994140625, 1.456787109375, 1.54388427734375, 1.6309814453125, 1.71807861328125, 1.80517578125, 1.89227294921875, 1.9793701171875, 2.06646728515625, 2.153564453125, 2.24066162109375, 2.3277587890625, 2.41485595703125, 2.501953125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 2.0, 6.0, 11.0, 11.0, 14.0, 17.0, 25.0, 36.0, 50.0, 73.0, 95.0, 142.0, 146.0, 114.0, 75.0, 55.0, 34.0, 24.0, 20.0, 13.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.884765625, -2.804931640625, -2.72509765625, -2.645263671875, -2.5654296875, -2.485595703125, -2.40576171875, -2.325927734375, -2.24609375, -2.166259765625, -2.08642578125, -2.006591796875, -1.9267578125, -1.846923828125, -1.76708984375, -1.687255859375, -1.607421875, -1.527587890625, -1.44775390625, -1.367919921875, -1.2880859375, -1.208251953125, -1.12841796875, -1.048583984375, -0.96875, -0.888916015625, -0.80908203125, -0.729248046875, -0.6494140625, -0.569580078125, -0.48974609375, -0.409912109375, -0.330078125, -0.250244140625, -0.17041015625, -0.090576171875, -0.0107421875, 0.069091796875, 0.14892578125, 0.228759765625, 0.30859375, 0.388427734375, 0.46826171875, 0.548095703125, 0.6279296875, 0.707763671875, 0.78759765625, 0.867431640625, 0.947265625, 1.027099609375, 1.10693359375, 1.186767578125, 1.2666015625, 1.346435546875, 1.42626953125, 1.506103515625, 1.5859375, 1.665771484375, 1.74560546875, 1.825439453125, 1.9052734375, 1.985107421875, 2.06494140625, 2.144775390625, 2.224609375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 18.0, 58.0, 176.0, 439.0, 203.0, 78.0, 17.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.66737365722656, -99.03453063964844, -96.40168762207031, -93.76885223388672, -91.1360092163086, -88.50316619873047, -85.87033081054688, -83.23748779296875, -80.60464477539062, -77.9718017578125, -75.33895874023438, -72.70612335205078, -70.07328033447266, -67.44043731689453, -64.80760192871094, -62.17475891113281, -59.54191589355469, -56.90907287597656, -54.2762336730957, -51.643394470214844, -49.01055145263672, -46.377708435058594, -43.744869232177734, -41.112030029296875, -38.47918701171875, -35.846343994140625, -33.213504791259766, -30.580663681030273, -27.94782257080078, -25.31498146057129, -22.682140350341797, -20.049299240112305, -17.416458129882812, -14.78361701965332, -12.150775909423828, -9.517934799194336, -6.885093688964844, -4.252252578735352, -1.6194114685058594, 1.0134296417236328, 3.646270751953125, 6.279111862182617, 8.91195297241211, 11.544794082641602, 14.177635192871094, 16.810476303100586, 19.443317413330078, 22.07615852355957, 24.708999633789062, 27.341840744018555, 29.974681854248047, 32.607521057128906, 35.24036407470703, 37.873207092285156, 40.506046295166016, 43.138885498046875, 45.771728515625, 48.404571533203125, 51.037410736083984, 53.670249938964844, 56.30309295654297, 58.935935974121094, 61.56877517700195, 64.20161437988281, 66.83445739746094]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 6.0, 9.0, 9.0, 15.0, 15.0, 15.0, 33.0, 22.0, 34.0, 27.0, 36.0, 46.0, 55.0, 83.0, 85.0, 77.0, 67.0, 61.0, 45.0, 38.0, 31.0, 44.0, 23.0, 26.0, 16.0, 20.0, 13.0, 14.0, 6.0, 8.0, 5.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.534469604492188, -29.731578826904297, -28.928686141967773, -28.125795364379883, -27.32290267944336, -26.52001190185547, -25.717119216918945, -24.914228439331055, -24.11133575439453, -23.30844497680664, -22.505552291870117, -21.702661514282227, -20.899768829345703, -20.096878051757812, -19.29398536682129, -18.4910945892334, -17.688201904296875, -16.885311126708984, -16.08241844177246, -15.279526710510254, -14.476634979248047, -13.673744201660156, -12.870851516723633, -12.067960739135742, -11.265069961547852, -10.462178230285645, -9.659286499023438, -8.85639476776123, -8.053503036499023, -7.250611782073975, -6.447720050811768, -5.6448283195495605, -4.841936111450195, -4.039044380187988, -3.2361526489257812, -2.4332611560821533, -1.6303694248199463, -0.8274779319763184, -0.024586200714111328, 0.7783055305480957, 1.5811972618103027, 2.3840889930725098, 3.186980724334717, 3.9898722171783447, 4.792763710021973, 5.59565544128418, 6.398547172546387, 7.201438903808594, 8.0043306350708, 8.807222366333008, 9.610114097595215, 10.413005828857422, 11.215897560119629, 12.018789291381836, 12.821680068969727, 13.62457275390625, 14.42746353149414, 15.230355262756348, 16.033246994018555, 16.836137771606445, 17.63903045654297, 18.44192123413086, 19.244813919067383, 20.047704696655273, 20.850597381591797]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 2.0, 7.0, 7.0, 10.0, 22.0, 34.0, 57.0, 70.0, 75.0, 137.0, 188.0, 304.0, 464.0, 817.0, 1613.0, 3315.0, 8019.0, 23531.0, 95089.0, 788036.0, 2773349.0, 410188.0, 60978.0, 16559.0, 5841.0, 2482.0, 1205.0, 609.0, 368.0, 246.0, 155.0, 127.0, 95.0, 58.0, 32.0, 29.0, 36.0, 23.0, 22.0, 13.0, 16.0, 12.0, 5.0, 7.0, 5.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-2.013671875, -1.947357177734375, -1.88104248046875, -1.814727783203125, -1.7484130859375, -1.682098388671875, -1.61578369140625, -1.549468994140625, -1.483154296875, -1.416839599609375, -1.35052490234375, -1.284210205078125, -1.2178955078125, -1.151580810546875, -1.08526611328125, -1.018951416015625, -0.95263671875, -0.886322021484375, -0.82000732421875, -0.753692626953125, -0.6873779296875, -0.621063232421875, -0.55474853515625, -0.488433837890625, -0.422119140625, -0.355804443359375, -0.28948974609375, -0.223175048828125, -0.1568603515625, -0.090545654296875, -0.02423095703125, 0.042083740234375, 0.1083984375, 0.174713134765625, 0.24102783203125, 0.307342529296875, 0.3736572265625, 0.439971923828125, 0.50628662109375, 0.572601318359375, 0.638916015625, 0.705230712890625, 0.77154541015625, 0.837860107421875, 0.9041748046875, 0.970489501953125, 1.03680419921875, 1.103118896484375, 1.16943359375, 1.235748291015625, 1.30206298828125, 1.368377685546875, 1.4346923828125, 1.501007080078125, 1.56732177734375, 1.633636474609375, 1.699951171875, 1.766265869140625, 1.83258056640625, 1.898895263671875, 1.9652099609375, 2.031524658203125, 2.09783935546875, 2.164154052734375, 2.23046875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 6.0, 5.0, 4.0, 9.0, 9.0, 18.0, 22.0, 25.0, 24.0, 35.0, 39.0, 38.0, 43.0, 49.0, 39.0, 66.0, 58.0, 54.0, 49.0, 64.0, 53.0, 47.0, 45.0, 41.0, 25.0, 26.0, 25.0, 15.0, 25.0, 11.0, 10.0, 8.0, 7.0, 2.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2060546875, -1.1601409912109375, -1.114227294921875, -1.0683135986328125, -1.02239990234375, -0.9764862060546875, -0.930572509765625, -0.8846588134765625, -0.8387451171875, -0.7928314208984375, -0.746917724609375, -0.7010040283203125, -0.65509033203125, -0.6091766357421875, -0.563262939453125, -0.5173492431640625, -0.471435546875, -0.4255218505859375, -0.379608154296875, -0.3336944580078125, -0.28778076171875, -0.2418670654296875, -0.195953369140625, -0.1500396728515625, -0.1041259765625, -0.0582122802734375, -0.012298583984375, 0.0336151123046875, 0.07952880859375, 0.1254425048828125, 0.171356201171875, 0.2172698974609375, 0.26318359375, 0.3090972900390625, 0.355010986328125, 0.4009246826171875, 0.44683837890625, 0.4927520751953125, 0.538665771484375, 0.5845794677734375, 0.6304931640625, 0.6764068603515625, 0.722320556640625, 0.7682342529296875, 0.81414794921875, 0.8600616455078125, 0.905975341796875, 0.9518890380859375, 0.997802734375, 1.0437164306640625, 1.089630126953125, 1.1355438232421875, 1.18145751953125, 1.2273712158203125, 1.273284912109375, 1.3191986083984375, 1.3651123046875, 1.4110260009765625, 1.456939697265625, 1.5028533935546875, 1.54876708984375, 1.5946807861328125, 1.640594482421875, 1.6865081787109375, 1.732421875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 3.0, 7.0, 9.0, 10.0, 20.0, 32.0, 48.0, 66.0, 120.0, 234.0, 324.0, 623.0, 1345.0, 3931.0, 17443.0, 144452.0, 3395848.0, 576157.0, 41739.0, 7658.0, 2063.0, 891.0, 490.0, 248.0, 188.0, 93.0, 75.0, 54.0, 31.0, 28.0, 23.0, 12.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.16015625, -4.0367431640625, -3.913330078125, -3.7899169921875, -3.66650390625, -3.5430908203125, -3.419677734375, -3.2962646484375, -3.1728515625, -3.0494384765625, -2.926025390625, -2.8026123046875, -2.67919921875, -2.5557861328125, -2.432373046875, -2.3089599609375, -2.185546875, -2.0621337890625, -1.938720703125, -1.8153076171875, -1.69189453125, -1.5684814453125, -1.445068359375, -1.3216552734375, -1.1982421875, -1.0748291015625, -0.951416015625, -0.8280029296875, -0.70458984375, -0.5811767578125, -0.457763671875, -0.3343505859375, -0.2109375, -0.0875244140625, 0.035888671875, 0.1593017578125, 0.28271484375, 0.4061279296875, 0.529541015625, 0.6529541015625, 0.7763671875, 0.8997802734375, 1.023193359375, 1.1466064453125, 1.27001953125, 1.3934326171875, 1.516845703125, 1.6402587890625, 1.763671875, 1.8870849609375, 2.010498046875, 2.1339111328125, 2.25732421875, 2.3807373046875, 2.504150390625, 2.6275634765625, 2.7509765625, 2.8743896484375, 2.997802734375, 3.1212158203125, 3.24462890625, 3.3680419921875, 3.491455078125, 3.6148681640625, 3.73828125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 7.0, 14.0, 14.0, 25.0, 65.0, 127.0, 319.0, 866.0, 1323.0, 758.0, 270.0, 130.0, 69.0, 35.0, 17.0, 14.0, 12.0, 7.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41796875, -5.239990234375, -5.06201171875, -4.884033203125, -4.7060546875, -4.528076171875, -4.35009765625, -4.172119140625, -3.994140625, -3.816162109375, -3.63818359375, -3.460205078125, -3.2822265625, -3.104248046875, -2.92626953125, -2.748291015625, -2.5703125, -2.392333984375, -2.21435546875, -2.036376953125, -1.8583984375, -1.680419921875, -1.50244140625, -1.324462890625, -1.146484375, -0.968505859375, -0.79052734375, -0.612548828125, -0.4345703125, -0.256591796875, -0.07861328125, 0.099365234375, 0.27734375, 0.455322265625, 0.63330078125, 0.811279296875, 0.9892578125, 1.167236328125, 1.34521484375, 1.523193359375, 1.701171875, 1.879150390625, 2.05712890625, 2.235107421875, 2.4130859375, 2.591064453125, 2.76904296875, 2.947021484375, 3.125, 3.302978515625, 3.48095703125, 3.658935546875, 3.8369140625, 4.014892578125, 4.19287109375, 4.370849609375, 4.548828125, 4.726806640625, 4.90478515625, 5.082763671875, 5.2607421875, 5.438720703125, 5.61669921875, 5.794677734375, 5.97265625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 8.0, 11.0, 28.0, 123.0, 321.0, 329.0, 131.0, 25.0, 8.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.04322814941406, -44.03514099121094, -42.02705001831055, -40.018959045410156, -38.01087188720703, -36.002784729003906, -33.994693756103516, -31.986604690551758, -29.978515625, -27.970426559448242, -25.962337493896484, -23.954248428344727, -21.94615936279297, -19.93807029724121, -17.929981231689453, -15.921892166137695, -13.913803100585938, -11.90571403503418, -9.897624969482422, -7.889535903930664, -5.881446838378906, -3.8733577728271484, -1.8652687072753906, 0.1428203582763672, 2.150909423828125, 4.158998489379883, 6.167087554931641, 8.175176620483398, 10.183265686035156, 12.191354751586914, 14.199443817138672, 16.20753288269043, 18.21562957763672, 20.223718643188477, 22.231807708740234, 24.239896774291992, 26.24798583984375, 28.256074905395508, 30.264163970947266, 32.272254943847656, 34.28034210205078, 36.288429260253906, 38.2965202331543, 40.30461120605469, 42.31269836425781, 44.32078552246094, 46.32887649536133, 48.33696746826172, 50.345054626464844, 52.35314178466797, 54.36123275756836, 56.36932373046875, 58.377410888671875, 60.385498046875, 62.39358901977539, 64.40167999267578, 66.4097671508789, 68.41785430908203, 70.42594909667969, 72.43403625488281, 74.44212341308594, 76.45021057128906, 78.45829772949219, 80.46639251708984, 82.47447967529297]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 9.0, 16.0, 15.0, 23.0, 45.0, 49.0, 56.0, 68.0, 91.0, 101.0, 84.0, 73.0, 96.0, 81.0, 45.0, 42.0, 34.0, 32.0, 21.0, 14.0, 8.0, 1.0, 1.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.83367919921875, -35.0432243347168, -34.25277328491211, -33.462318420410156, -32.67186737060547, -31.881412506103516, -31.090959548950195, -30.300506591796875, -29.510053634643555, -28.719600677490234, -27.929147720336914, -27.138694763183594, -26.34823989868164, -25.55778694152832, -24.767333984375, -23.97688102722168, -23.18642807006836, -22.39597511291504, -21.60552215576172, -20.8150691986084, -20.024616241455078, -19.234161376953125, -18.443708419799805, -17.653255462646484, -16.862802505493164, -16.072349548339844, -15.281896591186523, -14.491442680358887, -13.700989723205566, -12.910536766052246, -12.12008285522461, -11.329629898071289, -10.539176940917969, -9.748723983764648, -8.958271026611328, -8.167817115783691, -7.377364158630371, -6.586911201477051, -5.796457767486572, -5.006004333496094, -4.215551376342773, -3.425098180770874, -2.6346449851989746, -1.8441917896270752, -1.0537385940551758, -0.26328539848327637, 0.527167797088623, 1.3176212310791016, 2.108074188232422, 2.8985273838043213, 3.6889805793762207, 4.479434013366699, 5.2698869705200195, 6.06033992767334, 6.850793361663818, 7.641246795654297, 8.431699752807617, 9.222152709960938, 10.012605667114258, 10.803059577941895, 11.593512535095215, 12.383965492248535, 13.174419403076172, 13.964872360229492, 14.755325317382812]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 6.0, 0.0, 7.0, 4.0, 11.0, 17.0, 23.0, 37.0, 52.0, 70.0, 96.0, 140.0, 214.0, 365.0, 734.0, 1463.0, 3851.0, 11454.0, 42524.0, 186050.0, 517575.0, 214276.0, 49051.0, 12810.0, 4237.0, 1663.0, 735.0, 409.0, 253.0, 145.0, 75.0, 42.0, 54.0, 33.0, 21.0, 16.0, 9.0, 9.0, 12.0, 6.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.87890625, -3.755950927734375, -3.63299560546875, -3.510040283203125, -3.3870849609375, -3.264129638671875, -3.14117431640625, -3.018218994140625, -2.895263671875, -2.772308349609375, -2.64935302734375, -2.526397705078125, -2.4034423828125, -2.280487060546875, -2.15753173828125, -2.034576416015625, -1.91162109375, -1.788665771484375, -1.66571044921875, -1.542755126953125, -1.4197998046875, -1.296844482421875, -1.17388916015625, -1.050933837890625, -0.927978515625, -0.805023193359375, -0.68206787109375, -0.559112548828125, -0.4361572265625, -0.313201904296875, -0.19024658203125, -0.067291259765625, 0.0556640625, 0.178619384765625, 0.30157470703125, 0.424530029296875, 0.5474853515625, 0.670440673828125, 0.79339599609375, 0.916351318359375, 1.039306640625, 1.162261962890625, 1.28521728515625, 1.408172607421875, 1.5311279296875, 1.654083251953125, 1.77703857421875, 1.899993896484375, 2.02294921875, 2.145904541015625, 2.26885986328125, 2.391815185546875, 2.5147705078125, 2.637725830078125, 2.76068115234375, 2.883636474609375, 3.006591796875, 3.129547119140625, 3.25250244140625, 3.375457763671875, 3.4984130859375, 3.621368408203125, 3.74432373046875, 3.867279052734375, 3.990234375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 9.0, 10.0, 15.0, 16.0, 19.0, 30.0, 31.0, 36.0, 39.0, 32.0, 35.0, 39.0, 52.0, 46.0, 45.0, 45.0, 59.0, 40.0, 41.0, 51.0, 36.0, 45.0, 22.0, 41.0, 20.0, 29.0, 21.0, 13.0, 10.0, 15.0, 10.0, 6.0, 4.0, 8.0, 2.0, 5.0, 5.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.126953125, -1.087371826171875, -1.04779052734375, -1.008209228515625, -0.9686279296875, -0.929046630859375, -0.88946533203125, -0.849884033203125, -0.810302734375, -0.770721435546875, -0.73114013671875, -0.691558837890625, -0.6519775390625, -0.612396240234375, -0.57281494140625, -0.533233642578125, -0.49365234375, -0.454071044921875, -0.41448974609375, -0.374908447265625, -0.3353271484375, -0.295745849609375, -0.25616455078125, -0.216583251953125, -0.177001953125, -0.137420654296875, -0.09783935546875, -0.058258056640625, -0.0186767578125, 0.020904541015625, 0.06048583984375, 0.100067138671875, 0.1396484375, 0.179229736328125, 0.21881103515625, 0.258392333984375, 0.2979736328125, 0.337554931640625, 0.37713623046875, 0.416717529296875, 0.456298828125, 0.495880126953125, 0.53546142578125, 0.575042724609375, 0.6146240234375, 0.654205322265625, 0.69378662109375, 0.733367919921875, 0.77294921875, 0.812530517578125, 0.85211181640625, 0.891693115234375, 0.9312744140625, 0.970855712890625, 1.01043701171875, 1.050018310546875, 1.089599609375, 1.129180908203125, 1.16876220703125, 1.208343505859375, 1.2479248046875, 1.287506103515625, 1.32708740234375, 1.366668701171875, 1.40625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 3.0, 4.0, 7.0, 7.0, 12.0, 22.0, 21.0, 37.0, 47.0, 87.0, 129.0, 200.0, 336.0, 638.0, 1288.0, 3499.0, 12272.0, 119293.0, 828305.0, 68116.0, 8881.0, 2737.0, 1178.0, 585.0, 319.0, 180.0, 97.0, 89.0, 54.0, 33.0, 16.0, 18.0, 12.0, 5.0, 2.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8671875, -7.6083984375, -7.349609375, -7.0908203125, -6.83203125, -6.5732421875, -6.314453125, -6.0556640625, -5.796875, -5.5380859375, -5.279296875, -5.0205078125, -4.76171875, -4.5029296875, -4.244140625, -3.9853515625, -3.7265625, -3.4677734375, -3.208984375, -2.9501953125, -2.69140625, -2.4326171875, -2.173828125, -1.9150390625, -1.65625, -1.3974609375, -1.138671875, -0.8798828125, -0.62109375, -0.3623046875, -0.103515625, 0.1552734375, 0.4140625, 0.6728515625, 0.931640625, 1.1904296875, 1.44921875, 1.7080078125, 1.966796875, 2.2255859375, 2.484375, 2.7431640625, 3.001953125, 3.2607421875, 3.51953125, 3.7783203125, 4.037109375, 4.2958984375, 4.5546875, 4.8134765625, 5.072265625, 5.3310546875, 5.58984375, 5.8486328125, 6.107421875, 6.3662109375, 6.625, 6.8837890625, 7.142578125, 7.4013671875, 7.66015625, 7.9189453125, 8.177734375, 8.4365234375, 8.6953125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 14.0, 12.0, 25.0, 27.0, 31.0, 35.0, 28.0, 41.0, 49.0, 57.0, 58.0, 63.0, 61.0, 58.0, 56.0, 63.0, 50.0, 36.0, 48.0, 43.0, 26.0, 32.0, 16.0, 17.0, 14.0, 13.0, 5.0, 2.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.328125, -6.1346435546875, -5.941162109375, -5.7476806640625, -5.55419921875, -5.3607177734375, -5.167236328125, -4.9737548828125, -4.7802734375, -4.5867919921875, -4.393310546875, -4.1998291015625, -4.00634765625, -3.8128662109375, -3.619384765625, -3.4259033203125, -3.232421875, -3.0389404296875, -2.845458984375, -2.6519775390625, -2.45849609375, -2.2650146484375, -2.071533203125, -1.8780517578125, -1.6845703125, -1.4910888671875, -1.297607421875, -1.1041259765625, -0.91064453125, -0.7171630859375, -0.523681640625, -0.3302001953125, -0.13671875, 0.0567626953125, 0.250244140625, 0.4437255859375, 0.63720703125, 0.8306884765625, 1.024169921875, 1.2176513671875, 1.4111328125, 1.6046142578125, 1.798095703125, 1.9915771484375, 2.18505859375, 2.3785400390625, 2.572021484375, 2.7655029296875, 2.958984375, 3.1524658203125, 3.345947265625, 3.5394287109375, 3.73291015625, 3.9263916015625, 4.119873046875, 4.3133544921875, 4.5068359375, 4.7003173828125, 4.893798828125, 5.0872802734375, 5.28076171875, 5.4742431640625, 5.667724609375, 5.8612060546875, 6.0546875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 3.0, 9.0, 13.0, 7.0, 12.0, 16.0, 17.0, 28.0, 32.0, 67.0, 102.0, 152.0, 314.0, 784.0, 3133.0, 23496.0, 891274.0, 119110.0, 7446.0, 1508.0, 465.0, 210.0, 104.0, 66.0, 50.0, 33.0, 21.0, 21.0, 12.0, 8.0, 12.0, 5.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.2265625, -4.09747314453125, -3.9683837890625, -3.83929443359375, -3.710205078125, -3.58111572265625, -3.4520263671875, -3.32293701171875, -3.19384765625, -3.06475830078125, -2.9356689453125, -2.80657958984375, -2.677490234375, -2.54840087890625, -2.4193115234375, -2.29022216796875, -2.1611328125, -2.03204345703125, -1.9029541015625, -1.77386474609375, -1.644775390625, -1.51568603515625, -1.3865966796875, -1.25750732421875, -1.12841796875, -0.99932861328125, -0.8702392578125, -0.74114990234375, -0.612060546875, -0.48297119140625, -0.3538818359375, -0.22479248046875, -0.095703125, 0.03338623046875, 0.1624755859375, 0.29156494140625, 0.420654296875, 0.54974365234375, 0.6788330078125, 0.80792236328125, 0.93701171875, 1.06610107421875, 1.1951904296875, 1.32427978515625, 1.453369140625, 1.58245849609375, 1.7115478515625, 1.84063720703125, 1.9697265625, 2.09881591796875, 2.2279052734375, 2.35699462890625, 2.486083984375, 2.61517333984375, 2.7442626953125, 2.87335205078125, 3.00244140625, 3.13153076171875, 3.2606201171875, 3.38970947265625, 3.518798828125, 3.64788818359375, 3.7769775390625, 3.90606689453125, 4.03515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 4.0, 8.0, 22.0, 14.0, 27.0, 28.0, 30.0, 40.0, 80.0, 150.0, 147.0, 122.0, 86.0, 61.0, 45.0, 29.0, 22.0, 24.0, 14.0, 9.0, 3.0, 7.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005240440368652344, -0.0005097389221191406, -0.0004954338073730469, -0.0004811286926269531, -0.0004668235778808594, -0.0004525184631347656, -0.0004382133483886719, -0.0004239082336425781, -0.0004096031188964844, -0.0003952980041503906, -0.0003809928894042969, -0.0003666877746582031, -0.0003523826599121094, -0.0003380775451660156, -0.0003237724304199219, -0.0003094673156738281, -0.0002951622009277344, -0.0002808570861816406, -0.0002665519714355469, -0.0002522468566894531, -0.00023794174194335938, -0.00022363662719726562, -0.00020933151245117188, -0.00019502639770507812, -0.00018072128295898438, -0.00016641616821289062, -0.00015211105346679688, -0.00013780593872070312, -0.00012350082397460938, -0.00010919570922851562, -9.489059448242188e-05, -8.058547973632812e-05, -6.628036499023438e-05, -5.1975250244140625e-05, -3.7670135498046875e-05, -2.3365020751953125e-05, -9.059906005859375e-06, 5.245208740234375e-06, 1.9550323486328125e-05, 3.3855438232421875e-05, 4.8160552978515625e-05, 6.246566772460938e-05, 7.677078247070312e-05, 9.107589721679688e-05, 0.00010538101196289062, 0.00011968612670898438, 0.00013399124145507812, 0.00014829635620117188, 0.00016260147094726562, 0.00017690658569335938, 0.00019121170043945312, 0.00020551681518554688, 0.00021982192993164062, 0.00023412704467773438, 0.0002484321594238281, 0.0002627372741699219, 0.0002770423889160156, 0.0002913475036621094, 0.0003056526184082031, 0.0003199577331542969, 0.0003342628479003906, 0.0003485679626464844, 0.0003628730773925781, 0.0003771781921386719, 0.0003914833068847656]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 3.0, 5.0, 10.0, 11.0, 25.0, 36.0, 44.0, 64.0, 86.0, 124.0, 204.0, 367.0, 768.0, 1959.0, 5982.0, 24507.0, 355085.0, 619707.0, 28871.0, 6701.0, 2169.0, 859.0, 373.0, 199.0, 118.0, 80.0, 60.0, 38.0, 37.0, 23.0, 19.0, 10.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.98828125, -1.908905029296875, -1.82952880859375, -1.750152587890625, -1.6707763671875, -1.591400146484375, -1.51202392578125, -1.432647705078125, -1.353271484375, -1.273895263671875, -1.19451904296875, -1.115142822265625, -1.0357666015625, -0.956390380859375, -0.87701416015625, -0.797637939453125, -0.71826171875, -0.638885498046875, -0.55950927734375, -0.480133056640625, -0.4007568359375, -0.321380615234375, -0.24200439453125, -0.162628173828125, -0.083251953125, -0.003875732421875, 0.07550048828125, 0.154876708984375, 0.2342529296875, 0.313629150390625, 0.39300537109375, 0.472381591796875, 0.5517578125, 0.631134033203125, 0.71051025390625, 0.789886474609375, 0.8692626953125, 0.948638916015625, 1.02801513671875, 1.107391357421875, 1.186767578125, 1.266143798828125, 1.34552001953125, 1.424896240234375, 1.5042724609375, 1.583648681640625, 1.66302490234375, 1.742401123046875, 1.82177734375, 1.901153564453125, 1.98052978515625, 2.059906005859375, 2.1392822265625, 2.218658447265625, 2.29803466796875, 2.377410888671875, 2.456787109375, 2.536163330078125, 2.61553955078125, 2.694915771484375, 2.7742919921875, 2.853668212890625, 2.93304443359375, 3.012420654296875, 3.091796875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 11.0, 8.0, 12.0, 13.0, 14.0, 15.0, 32.0, 49.0, 65.0, 105.0, 122.0, 155.0, 114.0, 81.0, 68.0, 41.0, 20.0, 13.0, 14.0, 12.0, 9.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.26171875, -2.1959075927734375, -2.130096435546875, -2.0642852783203125, -1.99847412109375, -1.9326629638671875, -1.866851806640625, -1.8010406494140625, -1.7352294921875, -1.6694183349609375, -1.603607177734375, -1.5377960205078125, -1.47198486328125, -1.4061737060546875, -1.340362548828125, -1.2745513916015625, -1.208740234375, -1.1429290771484375, -1.077117919921875, -1.0113067626953125, -0.94549560546875, -0.8796844482421875, -0.813873291015625, -0.7480621337890625, -0.6822509765625, -0.6164398193359375, -0.550628662109375, -0.4848175048828125, -0.41900634765625, -0.3531951904296875, -0.287384033203125, -0.2215728759765625, -0.15576171875, -0.0899505615234375, -0.024139404296875, 0.0416717529296875, 0.10748291015625, 0.1732940673828125, 0.239105224609375, 0.3049163818359375, 0.3707275390625, 0.4365386962890625, 0.502349853515625, 0.5681610107421875, 0.63397216796875, 0.6997833251953125, 0.765594482421875, 0.8314056396484375, 0.897216796875, 0.9630279541015625, 1.028839111328125, 1.0946502685546875, 1.16046142578125, 1.2262725830078125, 1.292083740234375, 1.3578948974609375, 1.4237060546875, 1.4895172119140625, 1.555328369140625, 1.6211395263671875, 1.68695068359375, 1.7527618408203125, 1.818572998046875, 1.8843841552734375, 1.9501953125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 12.0, 25.0, 83.0, 224.0, 389.0, 170.0, 42.0, 21.0, 11.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.4411392211914, -85.22296905517578, -83.00479125976562, -80.78662109375, -78.56845092773438, -76.35027313232422, -74.1321029663086, -71.91393280029297, -69.69575500488281, -67.47758483886719, -65.25940704345703, -63.041236877441406, -60.823062896728516, -58.604888916015625, -56.38671875, -54.16854476928711, -51.950374603271484, -49.732200622558594, -47.51403045654297, -45.29585647583008, -43.07768249511719, -40.85951232910156, -38.64133834838867, -36.42316436767578, -34.204994201660156, -31.9868221282959, -29.768648147583008, -27.55047607421875, -25.33230209350586, -23.1141300201416, -20.895957946777344, -18.677783966064453, -16.459609985351562, -14.241436958312988, -12.023263931274414, -9.805091857910156, -7.586918830871582, -5.368745803833008, -3.15057373046875, -0.9324007034301758, 1.2857723236083984, 3.5039451122283936, 5.722117900848389, 7.940290451049805, 10.158463478088379, 12.376636505126953, 14.594808578491211, 16.81298065185547, 19.03115463256836, 21.249326705932617, 23.467500686645508, 25.685672760009766, 27.903846740722656, 30.122018814086914, 32.34019088745117, 34.55836486816406, 36.77653503417969, 38.99470901489258, 41.2128791809082, 43.431053161621094, 45.649227142333984, 47.867401123046875, 50.0855712890625, 52.30374526977539, 54.52191925048828]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 4.0, 10.0, 10.0, 11.0, 18.0, 16.0, 26.0, 27.0, 35.0, 49.0, 30.0, 41.0, 42.0, 69.0, 96.0, 91.0, 77.0, 57.0, 46.0, 45.0, 20.0, 38.0, 26.0, 23.0, 25.0, 11.0, 11.0, 11.0, 4.0, 8.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.34560203552246, -22.511781692504883, -21.677963256835938, -20.84414291381836, -20.010324478149414, -19.176504135131836, -18.34268569946289, -17.508865356445312, -16.675045013427734, -15.841225624084473, -15.007406234741211, -14.173585891723633, -13.339767456054688, -12.50594711303711, -11.672127723693848, -10.838308334350586, -10.00448989868164, -9.170670509338379, -8.336851119995117, -7.503031253814697, -6.6692118644714355, -5.835392475128174, -5.001572608947754, -4.167753219604492, -3.3339338302612305, -2.5001144409179688, -1.666294813156128, -0.8324751853942871, 0.0013442039489746094, 0.8351635932922363, 1.6689834594726562, 2.502802848815918, 3.336620330810547, 4.170439720153809, 5.00425910949707, 5.83807897567749, 6.671898365020752, 7.505717754364014, 8.339537620544434, 9.173357009887695, 10.007176399230957, 10.840995788574219, 11.67481517791748, 12.508634567260742, 13.34245491027832, 14.176273345947266, 15.010093688964844, 15.843913078308105, 16.677732467651367, 17.511552810668945, 18.34537124633789, 19.17919158935547, 20.013010025024414, 20.846830368041992, 21.680648803710938, 22.514469146728516, 23.348289489746094, 24.182109832763672, 25.015928268432617, 25.849748611450195, 26.68356704711914, 27.51738739013672, 28.351207733154297, 29.185026168823242, 30.018844604492188]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 4.0, 6.0, 5.0, 12.0, 14.0, 28.0, 40.0, 65.0, 90.0, 219.0, 454.0, 925.0, 2547.0, 9202.0, 73466.0, 3529342.0, 550632.0, 20478.0, 4077.0, 1274.0, 541.0, 329.0, 164.0, 118.0, 76.0, 50.0, 29.0, 17.0, 17.0, 12.0, 11.0, 12.0, 3.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1171875, -2.98016357421875, -2.8431396484375, -2.70611572265625, -2.569091796875, -2.43206787109375, -2.2950439453125, -2.15802001953125, -2.02099609375, -1.88397216796875, -1.7469482421875, -1.60992431640625, -1.472900390625, -1.33587646484375, -1.1988525390625, -1.06182861328125, -0.9248046875, -0.78778076171875, -0.6507568359375, -0.51373291015625, -0.376708984375, -0.23968505859375, -0.1026611328125, 0.03436279296875, 0.17138671875, 0.30841064453125, 0.4454345703125, 0.58245849609375, 0.719482421875, 0.85650634765625, 0.9935302734375, 1.13055419921875, 1.267578125, 1.40460205078125, 1.5416259765625, 1.67864990234375, 1.815673828125, 1.95269775390625, 2.0897216796875, 2.22674560546875, 2.36376953125, 2.50079345703125, 2.6378173828125, 2.77484130859375, 2.911865234375, 3.04888916015625, 3.1859130859375, 3.32293701171875, 3.4599609375, 3.59698486328125, 3.7340087890625, 3.87103271484375, 4.008056640625, 4.14508056640625, 4.2821044921875, 4.41912841796875, 4.55615234375, 4.69317626953125, 4.8302001953125, 4.96722412109375, 5.104248046875, 5.24127197265625, 5.3782958984375, 5.51531982421875, 5.65234375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 7.0, 11.0, 17.0, 18.0, 21.0, 43.0, 45.0, 75.0, 72.0, 74.0, 92.0, 82.0, 73.0, 82.0, 75.0, 39.0, 51.0, 35.0, 30.0, 19.0, 15.0, 10.0, 6.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.017578125, -1.953338623046875, -1.88909912109375, -1.824859619140625, -1.7606201171875, -1.696380615234375, -1.63214111328125, -1.567901611328125, -1.503662109375, -1.439422607421875, -1.37518310546875, -1.310943603515625, -1.2467041015625, -1.182464599609375, -1.11822509765625, -1.053985595703125, -0.98974609375, -0.925506591796875, -0.86126708984375, -0.797027587890625, -0.7327880859375, -0.668548583984375, -0.60430908203125, -0.540069580078125, -0.475830078125, -0.411590576171875, -0.34735107421875, -0.283111572265625, -0.2188720703125, -0.154632568359375, -0.09039306640625, -0.026153564453125, 0.0380859375, 0.102325439453125, 0.16656494140625, 0.230804443359375, 0.2950439453125, 0.359283447265625, 0.42352294921875, 0.487762451171875, 0.552001953125, 0.616241455078125, 0.68048095703125, 0.744720458984375, 0.8089599609375, 0.873199462890625, 0.93743896484375, 1.001678466796875, 1.06591796875, 1.130157470703125, 1.19439697265625, 1.258636474609375, 1.3228759765625, 1.387115478515625, 1.45135498046875, 1.515594482421875, 1.579833984375, 1.644073486328125, 1.70831298828125, 1.772552490234375, 1.8367919921875, 1.901031494140625, 1.96527099609375, 2.029510498046875, 2.09375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 12.0, 13.0, 12.0, 34.0, 53.0, 124.0, 231.0, 405.0, 780.0, 1539.0, 3441.0, 13092.0, 160743.0, 3871201.0, 124811.0, 11366.0, 3328.0, 1452.0, 747.0, 359.0, 207.0, 119.0, 62.0, 44.0, 30.0, 18.0, 12.0, 7.0, 3.0, 8.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.90625, -4.73974609375, -4.5732421875, -4.40673828125, -4.240234375, -4.07373046875, -3.9072265625, -3.74072265625, -3.57421875, -3.40771484375, -3.2412109375, -3.07470703125, -2.908203125, -2.74169921875, -2.5751953125, -2.40869140625, -2.2421875, -2.07568359375, -1.9091796875, -1.74267578125, -1.576171875, -1.40966796875, -1.2431640625, -1.07666015625, -0.91015625, -0.74365234375, -0.5771484375, -0.41064453125, -0.244140625, -0.07763671875, 0.0888671875, 0.25537109375, 0.421875, 0.58837890625, 0.7548828125, 0.92138671875, 1.087890625, 1.25439453125, 1.4208984375, 1.58740234375, 1.75390625, 1.92041015625, 2.0869140625, 2.25341796875, 2.419921875, 2.58642578125, 2.7529296875, 2.91943359375, 3.0859375, 3.25244140625, 3.4189453125, 3.58544921875, 3.751953125, 3.91845703125, 4.0849609375, 4.25146484375, 4.41796875, 4.58447265625, 4.7509765625, 4.91748046875, 5.083984375, 5.25048828125, 5.4169921875, 5.58349609375, 5.75]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 9.0, 12.0, 26.0, 42.0, 83.0, 139.0, 375.0, 919.0, 1324.0, 633.0, 249.0, 105.0, 59.0, 28.0, 18.0, 13.0, 10.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.96484375, -4.81103515625, -4.6572265625, -4.50341796875, -4.349609375, -4.19580078125, -4.0419921875, -3.88818359375, -3.734375, -3.58056640625, -3.4267578125, -3.27294921875, -3.119140625, -2.96533203125, -2.8115234375, -2.65771484375, -2.50390625, -2.35009765625, -2.1962890625, -2.04248046875, -1.888671875, -1.73486328125, -1.5810546875, -1.42724609375, -1.2734375, -1.11962890625, -0.9658203125, -0.81201171875, -0.658203125, -0.50439453125, -0.3505859375, -0.19677734375, -0.04296875, 0.11083984375, 0.2646484375, 0.41845703125, 0.572265625, 0.72607421875, 0.8798828125, 1.03369140625, 1.1875, 1.34130859375, 1.4951171875, 1.64892578125, 1.802734375, 1.95654296875, 2.1103515625, 2.26416015625, 2.41796875, 2.57177734375, 2.7255859375, 2.87939453125, 3.033203125, 3.18701171875, 3.3408203125, 3.49462890625, 3.6484375, 3.80224609375, 3.9560546875, 4.10986328125, 4.263671875, 4.41748046875, 4.5712890625, 4.72509765625, 4.87890625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 5.0, 19.0, 109.0, 362.0, 324.0, 129.0, 24.0, 12.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-92.21549987792969, -90.16929626464844, -88.12309265136719, -86.07688903808594, -84.03068542480469, -81.98448181152344, -79.93827819824219, -77.89208221435547, -75.84587860107422, -73.79967498779297, -71.75347137451172, -69.70726776123047, -67.66106414794922, -65.6148681640625, -63.568660736083984, -61.522457122802734, -59.476253509521484, -57.430049896240234, -55.383846282958984, -53.337646484375, -51.29144287109375, -49.2452392578125, -47.19903564453125, -45.15283203125, -43.10662841796875, -41.0604248046875, -39.01422119140625, -36.968017578125, -34.921817779541016, -32.875614166259766, -30.829410552978516, -28.783206939697266, -26.73700714111328, -24.69080352783203, -22.644601821899414, -20.598398208618164, -18.552196502685547, -16.505992889404297, -14.459789276123047, -12.413586616516113, -10.36738395690918, -8.321181297302246, -6.274978160858154, -4.2287750244140625, -2.182572364807129, -0.1363697052001953, 1.9098339080810547, 3.9560365676879883, 6.002239227294922, 8.048441886901855, 10.094644546508789, 12.140848159790039, 14.187050819396973, 16.233253479003906, 18.279457092285156, 20.325660705566406, 22.371862411499023, 24.418066024780273, 26.46426773071289, 28.51047134399414, 30.55667495727539, 32.602874755859375, 34.649078369140625, 36.695281982421875, 38.741485595703125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 10.0, 11.0, 8.0, 18.0, 28.0, 30.0, 33.0, 50.0, 60.0, 67.0, 90.0, 86.0, 97.0, 80.0, 59.0, 65.0, 53.0, 43.0, 30.0, 19.0, 24.0, 14.0, 13.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-27.23350715637207, -26.613506317138672, -25.993505477905273, -25.373504638671875, -24.753503799438477, -24.133502960205078, -23.51350212097168, -22.89350128173828, -22.273500442504883, -21.653499603271484, -21.033498764038086, -20.413497924804688, -19.79349708557129, -19.17349624633789, -18.553495407104492, -17.933494567871094, -17.313493728637695, -16.693492889404297, -16.0734920501709, -15.4534912109375, -14.833490371704102, -14.213489532470703, -13.593488693237305, -12.973487854003906, -12.353487014770508, -11.73348617553711, -11.113485336303711, -10.493484497070312, -9.873483657836914, -9.253482818603516, -8.633481979370117, -8.013481140136719, -7.393481254577637, -6.773480415344238, -6.15347957611084, -5.533478736877441, -4.913477897644043, -4.2934770584106445, -3.673476219177246, -3.0534753799438477, -2.433474540710449, -1.8134737014770508, -1.1934728622436523, -0.5734720230102539, 0.04652881622314453, 0.666529655456543, 1.2865304946899414, 1.9065313339233398, 2.5265321731567383, 3.1465330123901367, 3.766533851623535, 4.386534690856934, 5.006535530090332, 5.6265363693237305, 6.246537208557129, 6.866538047790527, 7.486538887023926, 8.106539726257324, 8.726540565490723, 9.346541404724121, 9.96654224395752, 10.586543083190918, 11.206543922424316, 11.826544761657715, 12.446545600891113]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 16.0, 23.0, 17.0, 29.0, 49.0, 79.0, 109.0, 195.0, 341.0, 723.0, 1983.0, 8619.0, 61820.0, 507388.0, 411142.0, 46150.0, 6724.0, 1731.0, 615.0, 299.0, 182.0, 103.0, 59.0, 41.0, 32.0, 18.0, 12.0, 12.0, 6.0, 5.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.55078125, -5.39630126953125, -5.2418212890625, -5.08734130859375, -4.932861328125, -4.77838134765625, -4.6239013671875, -4.46942138671875, -4.31494140625, -4.16046142578125, -4.0059814453125, -3.85150146484375, -3.697021484375, -3.54254150390625, -3.3880615234375, -3.23358154296875, -3.0791015625, -2.92462158203125, -2.7701416015625, -2.61566162109375, -2.461181640625, -2.30670166015625, -2.1522216796875, -1.99774169921875, -1.84326171875, -1.68878173828125, -1.5343017578125, -1.37982177734375, -1.225341796875, -1.07086181640625, -0.9163818359375, -0.76190185546875, -0.607421875, -0.45294189453125, -0.2984619140625, -0.14398193359375, 0.010498046875, 0.16497802734375, 0.3194580078125, 0.47393798828125, 0.62841796875, 0.78289794921875, 0.9373779296875, 1.09185791015625, 1.246337890625, 1.40081787109375, 1.5552978515625, 1.70977783203125, 1.8642578125, 2.01873779296875, 2.1732177734375, 2.32769775390625, 2.482177734375, 2.63665771484375, 2.7911376953125, 2.94561767578125, 3.10009765625, 3.25457763671875, 3.4090576171875, 3.56353759765625, 3.718017578125, 3.87249755859375, 4.0269775390625, 4.18145751953125, 4.3359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 11.0, 13.0, 16.0, 23.0, 37.0, 46.0, 51.0, 71.0, 84.0, 97.0, 77.0, 80.0, 74.0, 60.0, 65.0, 51.0, 44.0, 28.0, 21.0, 21.0, 15.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.224609375, -2.1566162109375, -2.088623046875, -2.0206298828125, -1.95263671875, -1.8846435546875, -1.816650390625, -1.7486572265625, -1.6806640625, -1.6126708984375, -1.544677734375, -1.4766845703125, -1.40869140625, -1.3406982421875, -1.272705078125, -1.2047119140625, -1.13671875, -1.0687255859375, -1.000732421875, -0.9327392578125, -0.86474609375, -0.7967529296875, -0.728759765625, -0.6607666015625, -0.5927734375, -0.5247802734375, -0.456787109375, -0.3887939453125, -0.32080078125, -0.2528076171875, -0.184814453125, -0.1168212890625, -0.048828125, 0.0191650390625, 0.087158203125, 0.1551513671875, 0.22314453125, 0.2911376953125, 0.359130859375, 0.4271240234375, 0.4951171875, 0.5631103515625, 0.631103515625, 0.6990966796875, 0.76708984375, 0.8350830078125, 0.903076171875, 0.9710693359375, 1.0390625, 1.1070556640625, 1.175048828125, 1.2430419921875, 1.31103515625, 1.3790283203125, 1.447021484375, 1.5150146484375, 1.5830078125, 1.6510009765625, 1.718994140625, 1.7869873046875, 1.85498046875, 1.9229736328125, 1.990966796875, 2.0589599609375, 2.126953125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 9.0, 13.0, 12.0, 10.0, 21.0, 35.0, 27.0, 61.0, 79.0, 122.0, 235.0, 373.0, 841.0, 2165.0, 6679.0, 26440.0, 152477.0, 670691.0, 151395.0, 26357.0, 6503.0, 2177.0, 845.0, 393.0, 197.0, 124.0, 90.0, 54.0, 41.0, 19.0, 17.0, 11.0, 10.0, 8.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.22265625, -4.100250244140625, -3.97784423828125, -3.855438232421875, -3.7330322265625, -3.610626220703125, -3.48822021484375, -3.365814208984375, -3.243408203125, -3.121002197265625, -2.99859619140625, -2.876190185546875, -2.7537841796875, -2.631378173828125, -2.50897216796875, -2.386566162109375, -2.26416015625, -2.141754150390625, -2.01934814453125, -1.896942138671875, -1.7745361328125, -1.652130126953125, -1.52972412109375, -1.407318115234375, -1.284912109375, -1.162506103515625, -1.04010009765625, -0.917694091796875, -0.7952880859375, -0.672882080078125, -0.55047607421875, -0.428070068359375, -0.3056640625, -0.183258056640625, -0.06085205078125, 0.061553955078125, 0.1839599609375, 0.306365966796875, 0.42877197265625, 0.551177978515625, 0.673583984375, 0.795989990234375, 0.91839599609375, 1.040802001953125, 1.1632080078125, 1.285614013671875, 1.40802001953125, 1.530426025390625, 1.65283203125, 1.775238037109375, 1.89764404296875, 2.020050048828125, 2.1424560546875, 2.264862060546875, 2.38726806640625, 2.509674072265625, 2.632080078125, 2.754486083984375, 2.87689208984375, 2.999298095703125, 3.1217041015625, 3.244110107421875, 3.36651611328125, 3.488922119140625, 3.611328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 2.0, 6.0, 8.0, 14.0, 18.0, 16.0, 21.0, 23.0, 30.0, 35.0, 37.0, 57.0, 68.0, 51.0, 61.0, 62.0, 56.0, 51.0, 61.0, 43.0, 50.0, 38.0, 41.0, 18.0, 19.0, 32.0, 14.0, 11.0, 9.0, 11.0, 8.0, 9.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.658935546875, -5.48583984375, -5.312744140625, -5.1396484375, -4.966552734375, -4.79345703125, -4.620361328125, -4.447265625, -4.274169921875, -4.10107421875, -3.927978515625, -3.7548828125, -3.581787109375, -3.40869140625, -3.235595703125, -3.0625, -2.889404296875, -2.71630859375, -2.543212890625, -2.3701171875, -2.197021484375, -2.02392578125, -1.850830078125, -1.677734375, -1.504638671875, -1.33154296875, -1.158447265625, -0.9853515625, -0.812255859375, -0.63916015625, -0.466064453125, -0.29296875, -0.119873046875, 0.05322265625, 0.226318359375, 0.3994140625, 0.572509765625, 0.74560546875, 0.918701171875, 1.091796875, 1.264892578125, 1.43798828125, 1.611083984375, 1.7841796875, 1.957275390625, 2.13037109375, 2.303466796875, 2.4765625, 2.649658203125, 2.82275390625, 2.995849609375, 3.1689453125, 3.342041015625, 3.51513671875, 3.688232421875, 3.861328125, 4.034423828125, 4.20751953125, 4.380615234375, 4.5537109375, 4.726806640625, 4.89990234375, 5.072998046875, 5.24609375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 13.0, 22.0, 27.0, 38.0, 95.0, 228.0, 672.0, 2478.0, 12680.0, 105485.0, 770615.0, 136558.0, 15569.0, 2825.0, 779.0, 231.0, 110.0, 49.0, 29.0, 23.0, 13.0, 6.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.025390625, -1.9754486083984375, -1.925506591796875, -1.8755645751953125, -1.82562255859375, -1.7756805419921875, -1.725738525390625, -1.6757965087890625, -1.6258544921875, -1.5759124755859375, -1.525970458984375, -1.4760284423828125, -1.42608642578125, -1.3761444091796875, -1.326202392578125, -1.2762603759765625, -1.226318359375, -1.1763763427734375, -1.126434326171875, -1.0764923095703125, -1.02655029296875, -0.9766082763671875, -0.926666259765625, -0.8767242431640625, -0.8267822265625, -0.7768402099609375, -0.726898193359375, -0.6769561767578125, -0.62701416015625, -0.5770721435546875, -0.527130126953125, -0.4771881103515625, -0.42724609375, -0.3773040771484375, -0.327362060546875, -0.2774200439453125, -0.22747802734375, -0.1775360107421875, -0.127593994140625, -0.0776519775390625, -0.0277099609375, 0.0222320556640625, 0.072174072265625, 0.1221160888671875, 0.17205810546875, 0.2220001220703125, 0.271942138671875, 0.3218841552734375, 0.371826171875, 0.4217681884765625, 0.471710205078125, 0.5216522216796875, 0.57159423828125, 0.6215362548828125, 0.671478271484375, 0.7214202880859375, 0.7713623046875, 0.8213043212890625, 0.871246337890625, 0.9211883544921875, 0.97113037109375, 1.0210723876953125, 1.071014404296875, 1.1209564208984375, 1.1708984375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 10.0, 11.0, 10.0, 9.0, 7.0, 21.0, 37.0, 43.0, 47.0, 62.0, 79.0, 95.0, 94.0, 108.0, 71.0, 61.0, 50.0, 37.0, 31.0, 33.0, 24.0, 11.0, 13.0, 7.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.00027251243591308594, -0.000265609472990036, -0.0002587065100669861, -0.00025180354714393616, -0.00024490058422088623, -0.0002379976212978363, -0.00023109465837478638, -0.00022419169545173645, -0.00021728873252868652, -0.0002103857696056366, -0.00020348280668258667, -0.00019657984375953674, -0.00018967688083648682, -0.0001827739179134369, -0.00017587095499038696, -0.00016896799206733704, -0.0001620650291442871, -0.00015516206622123718, -0.00014825910329818726, -0.00014135614037513733, -0.0001344531774520874, -0.00012755021452903748, -0.00012064725160598755, -0.00011374428868293762, -0.0001068413257598877, -9.993836283683777e-05, -9.303539991378784e-05, -8.613243699073792e-05, -7.922947406768799e-05, -7.232651114463806e-05, -6.542354822158813e-05, -5.852058529853821e-05, -5.161762237548828e-05, -4.4714659452438354e-05, -3.781169652938843e-05, -3.09087336063385e-05, -2.4005770683288574e-05, -1.7102807760238647e-05, -1.019984483718872e-05, -3.296881914138794e-06, 3.606081008911133e-06, 1.050904393196106e-05, 1.7412006855010986e-05, 2.4314969778060913e-05, 3.121793270111084e-05, 3.8120895624160767e-05, 4.502385854721069e-05, 5.192682147026062e-05, 5.882978439331055e-05, 6.573274731636047e-05, 7.26357102394104e-05, 7.953867316246033e-05, 8.644163608551025e-05, 9.334459900856018e-05, 0.00010024756193161011, 0.00010715052485466003, 0.00011405348777770996, 0.00012095645070075989, 0.00012785941362380981, 0.00013476237654685974, 0.00014166533946990967, 0.0001485683023929596, 0.00015547126531600952, 0.00016237422823905945, 0.00016927719116210938]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 24.0, 23.0, 33.0, 47.0, 84.0, 110.0, 218.0, 388.0, 843.0, 1915.0, 4698.0, 14528.0, 59261.0, 297939.0, 556255.0, 83002.0, 18910.0, 5902.0, 2221.0, 1036.0, 476.0, 230.0, 131.0, 83.0, 62.0, 34.0, 19.0, 18.0, 10.0, 10.0, 7.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9462890625, -0.911376953125, -0.87646484375, -0.841552734375, -0.806640625, -0.771728515625, -0.73681640625, -0.701904296875, -0.6669921875, -0.632080078125, -0.59716796875, -0.562255859375, -0.52734375, -0.492431640625, -0.45751953125, -0.422607421875, -0.3876953125, -0.352783203125, -0.31787109375, -0.282958984375, -0.248046875, -0.213134765625, -0.17822265625, -0.143310546875, -0.1083984375, -0.073486328125, -0.03857421875, -0.003662109375, 0.03125, 0.066162109375, 0.10107421875, 0.135986328125, 0.1708984375, 0.205810546875, 0.24072265625, 0.275634765625, 0.310546875, 0.345458984375, 0.38037109375, 0.415283203125, 0.4501953125, 0.485107421875, 0.52001953125, 0.554931640625, 0.58984375, 0.624755859375, 0.65966796875, 0.694580078125, 0.7294921875, 0.764404296875, 0.79931640625, 0.834228515625, 0.869140625, 0.904052734375, 0.93896484375, 0.973876953125, 1.0087890625, 1.043701171875, 1.07861328125, 1.113525390625, 1.1484375, 1.183349609375, 1.21826171875, 1.253173828125, 1.2880859375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 10.0, 7.0, 11.0, 16.0, 23.0, 29.0, 43.0, 62.0, 78.0, 69.0, 109.0, 108.0, 94.0, 80.0, 67.0, 52.0, 40.0, 22.0, 20.0, 13.0, 10.0, 5.0, 6.0, 8.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1181640625, -1.07879638671875, -1.0394287109375, -1.00006103515625, -0.960693359375, -0.92132568359375, -0.8819580078125, -0.84259033203125, -0.80322265625, -0.76385498046875, -0.7244873046875, -0.68511962890625, -0.645751953125, -0.60638427734375, -0.5670166015625, -0.52764892578125, -0.48828125, -0.44891357421875, -0.4095458984375, -0.37017822265625, -0.330810546875, -0.29144287109375, -0.2520751953125, -0.21270751953125, -0.17333984375, -0.13397216796875, -0.0946044921875, -0.05523681640625, -0.015869140625, 0.02349853515625, 0.0628662109375, 0.10223388671875, 0.1416015625, 0.18096923828125, 0.2203369140625, 0.25970458984375, 0.299072265625, 0.33843994140625, 0.3778076171875, 0.41717529296875, 0.45654296875, 0.49591064453125, 0.5352783203125, 0.57464599609375, 0.614013671875, 0.65338134765625, 0.6927490234375, 0.73211669921875, 0.771484375, 0.81085205078125, 0.8502197265625, 0.88958740234375, 0.928955078125, 0.96832275390625, 1.0076904296875, 1.04705810546875, 1.08642578125, 1.12579345703125, 1.1651611328125, 1.20452880859375, 1.243896484375, 1.28326416015625, 1.3226318359375, 1.36199951171875, 1.4013671875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 13.0, 17.0, 39.0, 82.0, 182.0, 291.0, 153.0, 88.0, 45.0, 31.0, 23.0, 9.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.356670379638672, -30.38308334350586, -29.40949821472168, -28.435911178588867, -27.462326049804688, -26.488739013671875, -25.515151977539062, -24.541566848754883, -23.567981719970703, -22.59439468383789, -21.62080955505371, -20.6472225189209, -19.67363739013672, -18.700050354003906, -17.726463317871094, -16.752878189086914, -15.779291152954102, -14.805705070495605, -13.83211898803711, -12.858531951904297, -11.884946823120117, -10.911359786987305, -9.937773704528809, -8.964187622070312, -7.990601539611816, -7.01701545715332, -6.043429374694824, -5.06984281539917, -4.096256732940674, -3.1226706504821777, -2.1490840911865234, -1.1754980087280273, -0.20191001892089844, 0.7716761827468872, 1.7452623844146729, 2.718848705291748, 3.692434787750244, 4.66602087020874, 5.6396074295043945, 6.613193511962891, 7.586779594421387, 8.560365676879883, 9.533951759338379, 10.507537841796875, 11.481124877929688, 12.454710006713867, 13.42829704284668, 14.401883125305176, 15.375469207763672, 16.349056243896484, 17.322641372680664, 18.296228408813477, 19.269813537597656, 20.24340057373047, 21.21698760986328, 22.19057273864746, 23.16415786743164, 24.137744903564453, 25.111330032348633, 26.084917068481445, 27.058502197265625, 28.032089233398438, 29.00567626953125, 29.97926139831543, 30.952848434448242]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 10.0, 5.0, 7.0, 9.0, 14.0, 21.0, 15.0, 30.0, 16.0, 18.0, 19.0, 19.0, 27.0, 38.0, 45.0, 40.0, 81.0, 70.0, 79.0, 65.0, 63.0, 34.0, 36.0, 44.0, 24.0, 29.0, 28.0, 14.0, 18.0, 14.0, 9.0, 11.0, 9.0, 16.0, 4.0, 7.0, 5.0, 2.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.64261245727539, -16.072528839111328, -15.502445220947266, -14.932361602783203, -14.36227798461914, -13.792194366455078, -13.2221097946167, -12.652026176452637, -12.081942558288574, -11.511858940124512, -10.94177532196045, -10.371691703796387, -9.801607131958008, -9.231523513793945, -8.661439895629883, -8.09135627746582, -7.521272659301758, -6.951189041137695, -6.381105422973633, -5.811021327972412, -5.24093770980835, -4.670854091644287, -4.100769996643066, -3.530686378479004, -2.9606027603149414, -2.390519142150879, -1.8204352855682373, -1.2503515481948853, -0.6802678108215332, -0.1101841926574707, 0.4598996639251709, 1.0299835205078125, 1.600067138671875, 2.1701507568359375, 2.740234613418579, 3.3103184700012207, 3.880402088165283, 4.450485706329346, 5.020569801330566, 5.590653419494629, 6.160737037658691, 6.730820655822754, 7.300904273986816, 7.870988368988037, 8.441072463989258, 9.01115608215332, 9.581239700317383, 10.151323318481445, 10.721406936645508, 11.29149055480957, 11.861574172973633, 12.431657791137695, 13.001741409301758, 13.57182502746582, 14.1419095993042, 14.711993217468262, 15.282076835632324, 15.852160453796387, 16.422245025634766, 16.992328643798828, 17.56241226196289, 18.132495880126953, 18.702579498291016, 19.272663116455078, 19.84274673461914]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 9.0, 6.0, 6.0, 9.0, 15.0, 24.0, 39.0, 58.0, 104.0, 190.0, 325.0, 655.0, 1918.0, 6768.0, 42140.0, 1300025.0, 2748030.0, 80708.0, 9264.0, 2355.0, 810.0, 349.0, 175.0, 100.0, 62.0, 40.0, 28.0, 21.0, 16.0, 8.0, 12.0, 7.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.138671875, -3.037811279296875, -2.93695068359375, -2.836090087890625, -2.7352294921875, -2.634368896484375, -2.53350830078125, -2.432647705078125, -2.331787109375, -2.230926513671875, -2.13006591796875, -2.029205322265625, -1.9283447265625, -1.827484130859375, -1.72662353515625, -1.625762939453125, -1.52490234375, -1.424041748046875, -1.32318115234375, -1.222320556640625, -1.1214599609375, -1.020599365234375, -0.91973876953125, -0.818878173828125, -0.718017578125, -0.617156982421875, -0.51629638671875, -0.415435791015625, -0.3145751953125, -0.213714599609375, -0.11285400390625, -0.011993408203125, 0.0888671875, 0.189727783203125, 0.29058837890625, 0.391448974609375, 0.4923095703125, 0.593170166015625, 0.69403076171875, 0.794891357421875, 0.895751953125, 0.996612548828125, 1.09747314453125, 1.198333740234375, 1.2991943359375, 1.400054931640625, 1.50091552734375, 1.601776123046875, 1.70263671875, 1.803497314453125, 1.90435791015625, 2.005218505859375, 2.1060791015625, 2.206939697265625, 2.30780029296875, 2.408660888671875, 2.509521484375, 2.610382080078125, 2.71124267578125, 2.812103271484375, 2.9129638671875, 3.013824462890625, 3.11468505859375, 3.215545654296875, 3.31640625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 3.0, 17.0, 16.0, 22.0, 26.0, 38.0, 44.0, 52.0, 54.0, 81.0, 93.0, 76.0, 68.0, 69.0, 65.0, 66.0, 47.0, 44.0, 30.0, 27.0, 22.0, 13.0, 12.0, 7.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6787109375, -1.6183929443359375, -1.558074951171875, -1.4977569580078125, -1.43743896484375, -1.3771209716796875, -1.316802978515625, -1.2564849853515625, -1.1961669921875, -1.1358489990234375, -1.075531005859375, -1.0152130126953125, -0.95489501953125, -0.8945770263671875, -0.834259033203125, -0.7739410400390625, -0.713623046875, -0.6533050537109375, -0.592987060546875, -0.5326690673828125, -0.47235107421875, -0.4120330810546875, -0.351715087890625, -0.2913970947265625, -0.2310791015625, -0.1707611083984375, -0.110443115234375, -0.0501251220703125, 0.01019287109375, 0.0705108642578125, 0.130828857421875, 0.1911468505859375, 0.25146484375, 0.3117828369140625, 0.372100830078125, 0.4324188232421875, 0.49273681640625, 0.5530548095703125, 0.613372802734375, 0.6736907958984375, 0.7340087890625, 0.7943267822265625, 0.854644775390625, 0.9149627685546875, 0.97528076171875, 1.0355987548828125, 1.095916748046875, 1.1562347412109375, 1.216552734375, 1.2768707275390625, 1.337188720703125, 1.3975067138671875, 1.45782470703125, 1.5181427001953125, 1.578460693359375, 1.6387786865234375, 1.6990966796875, 1.7594146728515625, 1.819732666015625, 1.8800506591796875, 1.94036865234375, 2.0006866455078125, 2.061004638671875, 2.1213226318359375, 2.181640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 8.0, 6.0, 8.0, 11.0, 20.0, 17.0, 39.0, 46.0, 79.0, 141.0, 288.0, 757.0, 2509.0, 10103.0, 65612.0, 1763364.0, 2258490.0, 77509.0, 11092.0, 2638.0, 782.0, 344.0, 151.0, 76.0, 62.0, 28.0, 20.0, 12.0, 8.0, 18.0, 8.0, 13.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.359375, -3.26348876953125, -3.1676025390625, -3.07171630859375, -2.975830078125, -2.87994384765625, -2.7840576171875, -2.68817138671875, -2.59228515625, -2.49639892578125, -2.4005126953125, -2.30462646484375, -2.208740234375, -2.11285400390625, -2.0169677734375, -1.92108154296875, -1.8251953125, -1.72930908203125, -1.6334228515625, -1.53753662109375, -1.441650390625, -1.34576416015625, -1.2498779296875, -1.15399169921875, -1.05810546875, -0.96221923828125, -0.8663330078125, -0.77044677734375, -0.674560546875, -0.57867431640625, -0.4827880859375, -0.38690185546875, -0.291015625, -0.19512939453125, -0.0992431640625, -0.00335693359375, 0.092529296875, 0.18841552734375, 0.2843017578125, 0.38018798828125, 0.47607421875, 0.57196044921875, 0.6678466796875, 0.76373291015625, 0.859619140625, 0.95550537109375, 1.0513916015625, 1.14727783203125, 1.2431640625, 1.33905029296875, 1.4349365234375, 1.53082275390625, 1.626708984375, 1.72259521484375, 1.8184814453125, 1.91436767578125, 2.01025390625, 2.10614013671875, 2.2020263671875, 2.29791259765625, 2.393798828125, 2.48968505859375, 2.5855712890625, 2.68145751953125, 2.77734375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 4.0, 11.0, 6.0, 5.0, 14.0, 19.0, 12.0, 31.0, 34.0, 53.0, 84.0, 122.0, 173.0, 275.0, 423.0, 630.0, 624.0, 526.0, 363.0, 226.0, 120.0, 83.0, 74.0, 51.0, 26.0, 18.0, 11.0, 11.0, 13.0, 11.0, 1.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0234375, -1.95416259765625, -1.8848876953125, -1.81561279296875, -1.746337890625, -1.67706298828125, -1.6077880859375, -1.53851318359375, -1.46923828125, -1.39996337890625, -1.3306884765625, -1.26141357421875, -1.192138671875, -1.12286376953125, -1.0535888671875, -0.98431396484375, -0.9150390625, -0.84576416015625, -0.7764892578125, -0.70721435546875, -0.637939453125, -0.56866455078125, -0.4993896484375, -0.43011474609375, -0.36083984375, -0.29156494140625, -0.2222900390625, -0.15301513671875, -0.083740234375, -0.01446533203125, 0.0548095703125, 0.12408447265625, 0.193359375, 0.26263427734375, 0.3319091796875, 0.40118408203125, 0.470458984375, 0.53973388671875, 0.6090087890625, 0.67828369140625, 0.74755859375, 0.81683349609375, 0.8861083984375, 0.95538330078125, 1.024658203125, 1.09393310546875, 1.1632080078125, 1.23248291015625, 1.3017578125, 1.37103271484375, 1.4403076171875, 1.50958251953125, 1.578857421875, 1.64813232421875, 1.7174072265625, 1.78668212890625, 1.85595703125, 1.92523193359375, 1.9945068359375, 2.06378173828125, 2.133056640625, 2.20233154296875, 2.2716064453125, 2.34088134765625, 2.41015625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 24.0, 59.0, 147.0, 231.0, 229.0, 177.0, 73.0, 19.0, 17.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.10642623901367, -38.13414001464844, -37.16185760498047, -36.189571380615234, -35.21728515625, -34.244998931884766, -33.2727165222168, -32.30043029785156, -31.328144073486328, -30.355859756469727, -29.383573532104492, -28.41128921508789, -27.439002990722656, -26.466718673706055, -25.49443244934082, -24.52214813232422, -23.549861907958984, -22.577577590942383, -21.60529136657715, -20.633007049560547, -19.660720825195312, -18.68843650817871, -17.716150283813477, -16.743865966796875, -15.771581649780273, -14.799296379089355, -13.827011108398438, -12.85472583770752, -11.882440567016602, -10.91015625, -9.937870025634766, -8.965585708618164, -7.99329948425293, -7.021014213562012, -6.048728942871094, -5.076443672180176, -4.104158401489258, -3.131873607635498, -2.15958833694458, -1.187303066253662, -0.21501779556274414, 0.757267415523529, 1.7295526266098022, 2.7018377780914307, 3.6741230487823486, 4.6464080810546875, 5.6186933517456055, 6.590978622436523, 7.563263893127441, 8.53554916381836, 9.507834434509277, 10.480119705200195, 11.452404975891113, 12.424690246582031, 13.396974563598633, 14.369260787963867, 15.341545104980469, 16.31382942199707, 17.286115646362305, 18.258399963378906, 19.23068618774414, 20.202970504760742, 21.175256729125977, 22.147541046142578, 23.119827270507812]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 5.0, 11.0, 12.0, 20.0, 19.0, 14.0, 21.0, 23.0, 36.0, 26.0, 51.0, 35.0, 61.0, 59.0, 68.0, 74.0, 60.0, 65.0, 48.0, 49.0, 34.0, 35.0, 35.0, 20.0, 27.0, 12.0, 12.0, 9.0, 17.0, 3.0, 11.0, 9.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.409591674804688, -12.008337020874023, -11.607081413269043, -11.205826759338379, -10.804571151733398, -10.403316497802734, -10.00206184387207, -9.60080623626709, -9.19955062866211, -8.798295974731445, -8.397040367126465, -7.995785713195801, -7.59453010559082, -7.193275451660156, -6.792020320892334, -6.390765190124512, -5.989510536193848, -5.588255405426025, -5.187000274658203, -4.785745620727539, -4.384490013122559, -3.9832351207733154, -3.5819802284240723, -3.18072509765625, -2.7794699668884277, -2.3782148361206055, -1.9769598245620728, -1.57570481300354, -1.1744496822357178, -0.7731945514678955, -0.37193965911865234, 0.029315471649169922, 0.4305706024169922, 0.8318256735801697, 1.2330807447433472, 1.6343357563018799, 2.035590887069702, 2.4368460178375244, 2.8381009101867676, 3.23935604095459, 3.640611171722412, 4.041866302490234, 4.443121433258057, 4.844376564025879, 5.245631217956543, 5.646886825561523, 6.0481414794921875, 6.44939661026001, 6.850651741027832, 7.251906871795654, 7.653162002563477, 8.05441665649414, 8.455672264099121, 8.856926918029785, 9.258182525634766, 9.65943717956543, 10.060691833496094, 10.461946487426758, 10.863202095031738, 11.264456748962402, 11.665712356567383, 12.066967010498047, 12.468221664428711, 12.869477272033691, 13.270732879638672]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 11.0, 20.0, 10.0, 20.0, 32.0, 49.0, 71.0, 102.0, 169.0, 317.0, 554.0, 1198.0, 2859.0, 9242.0, 36362.0, 176512.0, 552859.0, 209282.0, 42347.0, 10459.0, 3402.0, 1220.0, 587.0, 321.0, 165.0, 125.0, 65.0, 47.0, 32.0, 23.0, 20.0, 18.0, 13.0, 5.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.345703125, -3.248870849609375, -3.15203857421875, -3.055206298828125, -2.9583740234375, -2.861541748046875, -2.76470947265625, -2.667877197265625, -2.571044921875, -2.474212646484375, -2.37738037109375, -2.280548095703125, -2.1837158203125, -2.086883544921875, -1.99005126953125, -1.893218994140625, -1.79638671875, -1.699554443359375, -1.60272216796875, -1.505889892578125, -1.4090576171875, -1.312225341796875, -1.21539306640625, -1.118560791015625, -1.021728515625, -0.924896240234375, -0.82806396484375, -0.731231689453125, -0.6343994140625, -0.537567138671875, -0.44073486328125, -0.343902587890625, -0.2470703125, -0.150238037109375, -0.05340576171875, 0.043426513671875, 0.1402587890625, 0.237091064453125, 0.33392333984375, 0.430755615234375, 0.527587890625, 0.624420166015625, 0.72125244140625, 0.818084716796875, 0.9149169921875, 1.011749267578125, 1.10858154296875, 1.205413818359375, 1.30224609375, 1.399078369140625, 1.49591064453125, 1.592742919921875, 1.6895751953125, 1.786407470703125, 1.88323974609375, 1.980072021484375, 2.076904296875, 2.173736572265625, 2.27056884765625, 2.367401123046875, 2.4642333984375, 2.561065673828125, 2.65789794921875, 2.754730224609375, 2.8515625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 3.0, 11.0, 16.0, 26.0, 23.0, 33.0, 46.0, 55.0, 48.0, 63.0, 81.0, 90.0, 69.0, 68.0, 86.0, 56.0, 39.0, 55.0, 38.0, 30.0, 17.0, 9.0, 14.0, 9.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7041015625, -1.6433563232421875, -1.582611083984375, -1.5218658447265625, -1.46112060546875, -1.4003753662109375, -1.339630126953125, -1.2788848876953125, -1.2181396484375, -1.1573944091796875, -1.096649169921875, -1.0359039306640625, -0.97515869140625, -0.9144134521484375, -0.853668212890625, -0.7929229736328125, -0.732177734375, -0.6714324951171875, -0.610687255859375, -0.5499420166015625, -0.48919677734375, -0.4284515380859375, -0.367706298828125, -0.3069610595703125, -0.2462158203125, -0.1854705810546875, -0.124725341796875, -0.0639801025390625, -0.00323486328125, 0.0575103759765625, 0.118255615234375, 0.1790008544921875, 0.23974609375, 0.3004913330078125, 0.361236572265625, 0.4219818115234375, 0.48272705078125, 0.5434722900390625, 0.604217529296875, 0.6649627685546875, 0.7257080078125, 0.7864532470703125, 0.847198486328125, 0.9079437255859375, 0.96868896484375, 1.0294342041015625, 1.090179443359375, 1.1509246826171875, 1.211669921875, 1.2724151611328125, 1.333160400390625, 1.3939056396484375, 1.45465087890625, 1.5153961181640625, 1.576141357421875, 1.6368865966796875, 1.6976318359375, 1.7583770751953125, 1.819122314453125, 1.8798675537109375, 1.94061279296875, 2.0013580322265625, 2.062103271484375, 2.1228485107421875, 2.18359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 9.0, 11.0, 11.0, 10.0, 13.0, 24.0, 39.0, 60.0, 88.0, 135.0, 177.0, 289.0, 500.0, 902.0, 2159.0, 7325.0, 38500.0, 347956.0, 592291.0, 45043.0, 8048.0, 2421.0, 980.0, 534.0, 372.0, 187.0, 141.0, 101.0, 61.0, 35.0, 35.0, 23.0, 15.0, 15.0, 8.0, 4.0, 3.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-4.6796875, -4.5533447265625, -4.427001953125, -4.3006591796875, -4.17431640625, -4.0479736328125, -3.921630859375, -3.7952880859375, -3.6689453125, -3.5426025390625, -3.416259765625, -3.2899169921875, -3.16357421875, -3.0372314453125, -2.910888671875, -2.7845458984375, -2.658203125, -2.5318603515625, -2.405517578125, -2.2791748046875, -2.15283203125, -2.0264892578125, -1.900146484375, -1.7738037109375, -1.6474609375, -1.5211181640625, -1.394775390625, -1.2684326171875, -1.14208984375, -1.0157470703125, -0.889404296875, -0.7630615234375, -0.63671875, -0.5103759765625, -0.384033203125, -0.2576904296875, -0.13134765625, -0.0050048828125, 0.121337890625, 0.2476806640625, 0.3740234375, 0.5003662109375, 0.626708984375, 0.7530517578125, 0.87939453125, 1.0057373046875, 1.132080078125, 1.2584228515625, 1.384765625, 1.5111083984375, 1.637451171875, 1.7637939453125, 1.89013671875, 2.0164794921875, 2.142822265625, 2.2691650390625, 2.3955078125, 2.5218505859375, 2.648193359375, 2.7745361328125, 2.90087890625, 3.0272216796875, 3.153564453125, 3.2799072265625, 3.40625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 10.0, 6.0, 15.0, 5.0, 13.0, 14.0, 13.0, 20.0, 24.0, 22.0, 35.0, 28.0, 45.0, 44.0, 54.0, 41.0, 55.0, 52.0, 54.0, 51.0, 49.0, 59.0, 46.0, 40.0, 27.0, 34.0, 29.0, 25.0, 19.0, 12.0, 8.0, 8.0, 11.0, 6.0, 5.0, 2.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.71875, -4.569580078125, -4.42041015625, -4.271240234375, -4.1220703125, -3.972900390625, -3.82373046875, -3.674560546875, -3.525390625, -3.376220703125, -3.22705078125, -3.077880859375, -2.9287109375, -2.779541015625, -2.63037109375, -2.481201171875, -2.33203125, -2.182861328125, -2.03369140625, -1.884521484375, -1.7353515625, -1.586181640625, -1.43701171875, -1.287841796875, -1.138671875, -0.989501953125, -0.84033203125, -0.691162109375, -0.5419921875, -0.392822265625, -0.24365234375, -0.094482421875, 0.0546875, 0.203857421875, 0.35302734375, 0.502197265625, 0.6513671875, 0.800537109375, 0.94970703125, 1.098876953125, 1.248046875, 1.397216796875, 1.54638671875, 1.695556640625, 1.8447265625, 1.993896484375, 2.14306640625, 2.292236328125, 2.44140625, 2.590576171875, 2.73974609375, 2.888916015625, 3.0380859375, 3.187255859375, 3.33642578125, 3.485595703125, 3.634765625, 3.783935546875, 3.93310546875, 4.082275390625, 4.2314453125, 4.380615234375, 4.52978515625, 4.678955078125, 4.828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 8.0, 16.0, 25.0, 29.0, 31.0, 69.0, 116.0, 167.0, 357.0, 735.0, 1697.0, 4631.0, 15244.0, 81430.0, 798509.0, 116796.0, 19641.0, 5409.0, 1929.0, 798.0, 358.0, 205.0, 118.0, 65.0, 44.0, 24.0, 21.0, 15.0, 16.0, 9.0, 2.0, 4.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.40625, -1.361724853515625, -1.31719970703125, -1.272674560546875, -1.2281494140625, -1.183624267578125, -1.13909912109375, -1.094573974609375, -1.050048828125, -1.005523681640625, -0.96099853515625, -0.916473388671875, -0.8719482421875, -0.827423095703125, -0.78289794921875, -0.738372802734375, -0.69384765625, -0.649322509765625, -0.60479736328125, -0.560272216796875, -0.5157470703125, -0.471221923828125, -0.42669677734375, -0.382171630859375, -0.337646484375, -0.293121337890625, -0.24859619140625, -0.204071044921875, -0.1595458984375, -0.115020751953125, -0.07049560546875, -0.025970458984375, 0.0185546875, 0.063079833984375, 0.10760498046875, 0.152130126953125, 0.1966552734375, 0.241180419921875, 0.28570556640625, 0.330230712890625, 0.374755859375, 0.419281005859375, 0.46380615234375, 0.508331298828125, 0.5528564453125, 0.597381591796875, 0.64190673828125, 0.686431884765625, 0.73095703125, 0.775482177734375, 0.82000732421875, 0.864532470703125, 0.9090576171875, 0.953582763671875, 0.99810791015625, 1.042633056640625, 1.087158203125, 1.131683349609375, 1.17620849609375, 1.220733642578125, 1.2652587890625, 1.309783935546875, 1.35430908203125, 1.398834228515625, 1.443359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 2.0, 1.0, 5.0, 4.0, 6.0, 8.0, 14.0, 12.0, 20.0, 28.0, 25.0, 32.0, 55.0, 60.0, 100.0, 118.0, 140.0, 83.0, 72.0, 60.0, 32.0, 32.0, 22.0, 14.0, 13.0, 5.0, 13.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.000278472900390625, -0.0002713017165660858, -0.00026413053274154663, -0.00025695934891700745, -0.00024978816509246826, -0.00024261698126792908, -0.0002354457974433899, -0.0002282746136188507, -0.00022110342979431152, -0.00021393224596977234, -0.00020676106214523315, -0.00019958987832069397, -0.00019241869449615479, -0.0001852475106716156, -0.00017807632684707642, -0.00017090514302253723, -0.00016373395919799805, -0.00015656277537345886, -0.00014939159154891968, -0.0001422204077243805, -0.0001350492238998413, -0.00012787804007530212, -0.00012070685625076294, -0.00011353567242622375, -0.00010636448860168457, -9.919330477714539e-05, -9.20221209526062e-05, -8.485093712806702e-05, -7.767975330352783e-05, -7.050856947898865e-05, -6.333738565444946e-05, -5.616620182991028e-05, -4.8995018005371094e-05, -4.182383418083191e-05, -3.4652650356292725e-05, -2.748146653175354e-05, -2.0310282707214355e-05, -1.3139098882675171e-05, -5.967915058135986e-06, 1.2032687664031982e-06, 8.374452590942383e-06, 1.5545636415481567e-05, 2.2716820240020752e-05, 2.9888004064559937e-05, 3.705918788909912e-05, 4.4230371713638306e-05, 5.140155553817749e-05, 5.8572739362716675e-05, 6.574392318725586e-05, 7.291510701179504e-05, 8.008629083633423e-05, 8.725747466087341e-05, 9.44286584854126e-05, 0.00010159984230995178, 0.00010877102613449097, 0.00011594220995903015, 0.00012311339378356934, 0.00013028457760810852, 0.0001374557614326477, 0.0001446269452571869, 0.00015179812908172607, 0.00015896931290626526, 0.00016614049673080444, 0.00017331168055534363, 0.0001804828643798828]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 13.0, 12.0, 16.0, 17.0, 28.0, 39.0, 62.0, 82.0, 153.0, 237.0, 446.0, 746.0, 1485.0, 3372.0, 7946.0, 24404.0, 109729.0, 718381.0, 136716.0, 28251.0, 9158.0, 3542.0, 1658.0, 825.0, 441.0, 262.0, 183.0, 111.0, 74.0, 36.0, 30.0, 24.0, 14.0, 14.0, 10.0, 7.0, 4.0, 4.0, 2.0, 1.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.20703125, -1.1721038818359375, -1.137176513671875, -1.1022491455078125, -1.06732177734375, -1.0323944091796875, -0.997467041015625, -0.9625396728515625, -0.9276123046875, -0.8926849365234375, -0.857757568359375, -0.8228302001953125, -0.78790283203125, -0.7529754638671875, -0.718048095703125, -0.6831207275390625, -0.648193359375, -0.6132659912109375, -0.578338623046875, -0.5434112548828125, -0.50848388671875, -0.4735565185546875, -0.438629150390625, -0.4037017822265625, -0.3687744140625, -0.3338470458984375, -0.298919677734375, -0.2639923095703125, -0.22906494140625, -0.1941375732421875, -0.159210205078125, -0.1242828369140625, -0.08935546875, -0.0544281005859375, -0.019500732421875, 0.0154266357421875, 0.05035400390625, 0.0852813720703125, 0.120208740234375, 0.1551361083984375, 0.1900634765625, 0.2249908447265625, 0.259918212890625, 0.2948455810546875, 0.32977294921875, 0.3647003173828125, 0.399627685546875, 0.4345550537109375, 0.469482421875, 0.5044097900390625, 0.539337158203125, 0.5742645263671875, 0.60919189453125, 0.6441192626953125, 0.679046630859375, 0.7139739990234375, 0.7489013671875, 0.7838287353515625, 0.818756103515625, 0.8536834716796875, 0.88861083984375, 0.9235382080078125, 0.958465576171875, 0.9933929443359375, 1.0283203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 9.0, 11.0, 12.0, 16.0, 18.0, 29.0, 60.0, 91.0, 110.0, 118.0, 163.0, 113.0, 87.0, 56.0, 35.0, 19.0, 11.0, 11.0, 13.0, 3.0, 3.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3671875, -1.3186187744140625, -1.270050048828125, -1.2214813232421875, -1.17291259765625, -1.1243438720703125, -1.075775146484375, -1.0272064208984375, -0.9786376953125, -0.9300689697265625, -0.881500244140625, -0.8329315185546875, -0.78436279296875, -0.7357940673828125, -0.687225341796875, -0.6386566162109375, -0.590087890625, -0.5415191650390625, -0.492950439453125, -0.4443817138671875, -0.39581298828125, -0.3472442626953125, -0.298675537109375, -0.2501068115234375, -0.2015380859375, -0.1529693603515625, -0.104400634765625, -0.0558319091796875, -0.00726318359375, 0.0413055419921875, 0.089874267578125, 0.1384429931640625, 0.18701171875, 0.2355804443359375, 0.284149169921875, 0.3327178955078125, 0.38128662109375, 0.4298553466796875, 0.478424072265625, 0.5269927978515625, 0.5755615234375, 0.6241302490234375, 0.672698974609375, 0.7212677001953125, 0.76983642578125, 0.8184051513671875, 0.866973876953125, 0.9155426025390625, 0.964111328125, 1.0126800537109375, 1.061248779296875, 1.1098175048828125, 1.15838623046875, 1.2069549560546875, 1.255523681640625, 1.3040924072265625, 1.3526611328125, 1.4012298583984375, 1.449798583984375, 1.4983673095703125, 1.54693603515625, 1.5955047607421875, 1.644073486328125, 1.6926422119140625, 1.7412109375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 8.0, 16.0, 50.0, 174.0, 476.0, 176.0, 65.0, 24.0, 4.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.036376953125, -63.43166732788086, -61.826961517333984, -60.222251892089844, -58.6175422668457, -57.01283264160156, -55.40812683105469, -53.80341720581055, -52.198707580566406, -50.593997955322266, -48.98929214477539, -47.38458251953125, -45.77987289428711, -44.17516326904297, -42.570457458496094, -40.96574783325195, -39.36103820800781, -37.75632858276367, -36.1516227722168, -34.546913146972656, -32.942203521728516, -31.337495803833008, -29.7327880859375, -28.12807846069336, -26.523372650146484, -24.918664932250977, -23.313955307006836, -21.709247589111328, -20.104537963867188, -18.49983024597168, -16.895122528076172, -15.290412902832031, -13.68570327758789, -12.080994606018066, -10.476285934448242, -8.871578216552734, -7.266869068145752, -5.662160873413086, -4.057452201843262, -2.4527435302734375, -0.8480348587036133, 0.7566736936569214, 2.361382246017456, 3.966090679168701, 5.570799350738525, 7.175507545471191, 8.780216217041016, 10.38492488861084, 11.989633560180664, 13.594342231750488, 15.199050903320312, 16.80375862121582, 18.40846824645996, 20.01317596435547, 21.61788558959961, 23.222593307495117, 24.827301025390625, 26.432008743286133, 28.036718368530273, 29.64142608642578, 31.246135711669922, 32.85084533691406, 34.45555114746094, 36.06026077270508, 37.66497039794922]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 6.0, 10.0, 6.0, 6.0, 8.0, 6.0, 8.0, 11.0, 17.0, 19.0, 19.0, 15.0, 38.0, 22.0, 35.0, 32.0, 53.0, 57.0, 84.0, 95.0, 86.0, 63.0, 44.0, 31.0, 33.0, 33.0, 24.0, 18.0, 19.0, 18.0, 13.0, 18.0, 14.0, 11.0, 6.0, 5.0, 3.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.469680786132812, -14.959761619567871, -14.449843406677246, -13.939924240112305, -13.430005073547363, -12.920085906982422, -12.410167694091797, -11.900248527526855, -11.390329360961914, -10.880410194396973, -10.370491981506348, -9.860572814941406, -9.350653648376465, -8.840734481811523, -8.330816268920898, -7.820897102355957, -7.310978889465332, -6.801060199737549, -6.291141033172607, -5.781222343444824, -5.271303176879883, -4.7613844871521, -4.251465797424316, -3.741546869277954, -3.231627941131592, -2.7217090129852295, -2.211790084838867, -1.701871395111084, -1.1919524669647217, -0.6820335388183594, -0.17211484909057617, 0.33780407905578613, 0.8477230072021484, 1.3576419353485107, 1.8675607442855835, 2.3774795532226562, 2.8873984813690186, 3.397317409515381, 3.907236099243164, 4.4171552658081055, 4.927073955535889, 5.436992645263672, 5.946911811828613, 6.4568305015563965, 6.96674919128418, 7.476668357849121, 7.986587047576904, 8.496505737304688, 9.006424903869629, 9.51634407043457, 10.026262283325195, 10.536181449890137, 11.046100616455078, 11.556018829345703, 12.065937995910645, 12.575857162475586, 13.085775375366211, 13.595694541931152, 14.105612754821777, 14.615531921386719, 15.12545108795166, 15.635370254516602, 16.145288467407227, 16.65520668029785, 17.16512680053711]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 10.0, 23.0, 49.0, 78.0, 190.0, 355.0, 964.0, 3011.0, 15095.0, 227364.0, 3640143.0, 285446.0, 16174.0, 3227.0, 1076.0, 483.0, 215.0, 133.0, 76.0, 56.0, 26.0, 14.0, 11.0, 10.0, 11.0, 11.0, 4.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.36334228515625, -2.2423095703125, -2.12127685546875, -2.000244140625, -1.87921142578125, -1.7581787109375, -1.63714599609375, -1.51611328125, -1.39508056640625, -1.2740478515625, -1.15301513671875, -1.031982421875, -0.91094970703125, -0.7899169921875, -0.66888427734375, -0.5478515625, -0.42681884765625, -0.3057861328125, -0.18475341796875, -0.063720703125, 0.05731201171875, 0.1783447265625, 0.29937744140625, 0.42041015625, 0.54144287109375, 0.6624755859375, 0.78350830078125, 0.904541015625, 1.02557373046875, 1.1466064453125, 1.26763916015625, 1.388671875, 1.50970458984375, 1.6307373046875, 1.75177001953125, 1.872802734375, 1.99383544921875, 2.1148681640625, 2.23590087890625, 2.35693359375, 2.47796630859375, 2.5989990234375, 2.72003173828125, 2.841064453125, 2.96209716796875, 3.0831298828125, 3.20416259765625, 3.3251953125, 3.44622802734375, 3.5672607421875, 3.68829345703125, 3.809326171875, 3.93035888671875, 4.0513916015625, 4.17242431640625, 4.29345703125, 4.41448974609375, 4.5355224609375, 4.65655517578125, 4.777587890625, 4.89862060546875, 5.0196533203125, 5.14068603515625, 5.26171875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 8.0, 3.0, 6.0, 5.0, 10.0, 10.0, 16.0, 16.0, 14.0, 19.0, 35.0, 34.0, 39.0, 47.0, 46.0, 65.0, 60.0, 56.0, 66.0, 68.0, 57.0, 49.0, 63.0, 38.0, 33.0, 28.0, 28.0, 23.0, 16.0, 17.0, 7.0, 5.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4521484375, -1.406890869140625, -1.36163330078125, -1.316375732421875, -1.2711181640625, -1.225860595703125, -1.18060302734375, -1.135345458984375, -1.090087890625, -1.044830322265625, -0.99957275390625, -0.954315185546875, -0.9090576171875, -0.863800048828125, -0.81854248046875, -0.773284912109375, -0.72802734375, -0.682769775390625, -0.63751220703125, -0.592254638671875, -0.5469970703125, -0.501739501953125, -0.45648193359375, -0.411224365234375, -0.365966796875, -0.320709228515625, -0.27545166015625, -0.230194091796875, -0.1849365234375, -0.139678955078125, -0.09442138671875, -0.049163818359375, -0.00390625, 0.041351318359375, 0.08660888671875, 0.131866455078125, 0.1771240234375, 0.222381591796875, 0.26763916015625, 0.312896728515625, 0.358154296875, 0.403411865234375, 0.44866943359375, 0.493927001953125, 0.5391845703125, 0.584442138671875, 0.62969970703125, 0.674957275390625, 0.72021484375, 0.765472412109375, 0.81072998046875, 0.855987548828125, 0.9012451171875, 0.946502685546875, 0.99176025390625, 1.037017822265625, 1.082275390625, 1.127532958984375, 1.17279052734375, 1.218048095703125, 1.2633056640625, 1.308563232421875, 1.35382080078125, 1.399078369140625, 1.4443359375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 4.0, 9.0, 15.0, 20.0, 21.0, 35.0, 51.0, 98.0, 152.0, 406.0, 1211.0, 6648.0, 78208.0, 3542919.0, 541820.0, 18656.0, 2716.0, 722.0, 254.0, 133.0, 64.0, 44.0, 12.0, 21.0, 10.0, 7.0, 8.0, 8.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.11328125, -3.98370361328125, -3.8541259765625, -3.72454833984375, -3.594970703125, -3.46539306640625, -3.3358154296875, -3.20623779296875, -3.07666015625, -2.94708251953125, -2.8175048828125, -2.68792724609375, -2.558349609375, -2.42877197265625, -2.2991943359375, -2.16961669921875, -2.0400390625, -1.91046142578125, -1.7808837890625, -1.65130615234375, -1.521728515625, -1.39215087890625, -1.2625732421875, -1.13299560546875, -1.00341796875, -0.87384033203125, -0.7442626953125, -0.61468505859375, -0.485107421875, -0.35552978515625, -0.2259521484375, -0.09637451171875, 0.033203125, 0.16278076171875, 0.2923583984375, 0.42193603515625, 0.551513671875, 0.68109130859375, 0.8106689453125, 0.94024658203125, 1.06982421875, 1.19940185546875, 1.3289794921875, 1.45855712890625, 1.588134765625, 1.71771240234375, 1.8472900390625, 1.97686767578125, 2.1064453125, 2.23602294921875, 2.3656005859375, 2.49517822265625, 2.624755859375, 2.75433349609375, 2.8839111328125, 3.01348876953125, 3.14306640625, 3.27264404296875, 3.4022216796875, 3.53179931640625, 3.661376953125, 3.79095458984375, 3.9205322265625, 4.05010986328125, 4.1796875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 11.0, 13.0, 23.0, 39.0, 39.0, 61.0, 77.0, 118.0, 156.0, 301.0, 440.0, 567.0, 620.0, 524.0, 348.0, 237.0, 148.0, 93.0, 67.0, 46.0, 31.0, 29.0, 30.0, 11.0, 7.0, 3.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.076171875, -2.00006103515625, -1.9239501953125, -1.84783935546875, -1.771728515625, -1.69561767578125, -1.6195068359375, -1.54339599609375, -1.46728515625, -1.39117431640625, -1.3150634765625, -1.23895263671875, -1.162841796875, -1.08673095703125, -1.0106201171875, -0.93450927734375, -0.8583984375, -0.78228759765625, -0.7061767578125, -0.63006591796875, -0.553955078125, -0.47784423828125, -0.4017333984375, -0.32562255859375, -0.24951171875, -0.17340087890625, -0.0972900390625, -0.02117919921875, 0.054931640625, 0.13104248046875, 0.2071533203125, 0.28326416015625, 0.359375, 0.43548583984375, 0.5115966796875, 0.58770751953125, 0.663818359375, 0.73992919921875, 0.8160400390625, 0.89215087890625, 0.96826171875, 1.04437255859375, 1.1204833984375, 1.19659423828125, 1.272705078125, 1.34881591796875, 1.4249267578125, 1.50103759765625, 1.5771484375, 1.65325927734375, 1.7293701171875, 1.80548095703125, 1.881591796875, 1.95770263671875, 2.0338134765625, 2.10992431640625, 2.18603515625, 2.26214599609375, 2.3382568359375, 2.41436767578125, 2.490478515625, 2.56658935546875, 2.6427001953125, 2.71881103515625, 2.794921875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 8.0, 19.0, 60.0, 170.0, 306.0, 280.0, 104.0, 36.0, 11.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-53.57251739501953, -52.19485092163086, -50.81718444824219, -49.43951416015625, -48.06184768676758, -46.684181213378906, -45.306514739990234, -43.92884826660156, -42.551177978515625, -41.17351150512695, -39.79584503173828, -38.418174743652344, -37.04050827026367, -35.662841796875, -34.28517532348633, -32.907508850097656, -31.52984046936035, -30.15217399597168, -28.774505615234375, -27.396839141845703, -26.0191707611084, -24.641504287719727, -23.263835906982422, -21.88616943359375, -20.508502960205078, -19.130836486816406, -17.7531681060791, -16.37550163269043, -14.997833251953125, -13.620166778564453, -12.242499351501465, -10.864831924438477, -9.487163543701172, -8.109496116638184, -6.731828689575195, -5.354161739349365, -3.976494312286377, -2.5988268852233887, -1.2211599349975586, 0.1565074920654297, 1.534174919128418, 2.9118423461914062, 4.2895097732543945, 5.667176723480225, 7.044844150543213, 8.42251205444336, 9.800178527832031, 11.17784595489502, 12.555513381958008, 13.933180809020996, 15.310848236083984, 16.688514709472656, 18.06618309020996, 19.443849563598633, 20.821517944335938, 22.19918441772461, 23.57685089111328, 24.954517364501953, 26.332185745239258, 27.70985221862793, 29.087520599365234, 30.465187072753906, 31.842853546142578, 33.22052001953125, 34.59819030761719]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 2.0, 7.0, 8.0, 10.0, 11.0, 14.0, 18.0, 13.0, 17.0, 27.0, 23.0, 20.0, 28.0, 32.0, 39.0, 41.0, 36.0, 55.0, 55.0, 65.0, 58.0, 46.0, 50.0, 49.0, 34.0, 31.0, 35.0, 30.0, 30.0, 21.0, 18.0, 11.0, 14.0, 9.0, 12.0, 6.0, 4.0, 7.0, 7.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.042563438415527, -11.701725959777832, -11.360889434814453, -11.020051956176758, -10.679214477539062, -10.338376998901367, -9.997539520263672, -9.656702995300293, -9.315865516662598, -8.975028038024902, -8.634191513061523, -8.293354034423828, -7.952516555786133, -7.6116790771484375, -7.2708420753479, -6.930005073547363, -6.589167594909668, -6.248330116271973, -5.9074931144714355, -5.566656112670898, -5.225818634033203, -4.884981155395508, -4.544144153594971, -4.203307151794434, -3.8624696731567383, -3.521632432937622, -3.180795192718506, -2.8399579524993896, -2.4991207122802734, -2.1582834720611572, -1.817446231842041, -1.4766089916229248, -1.135772705078125, -0.7949354648590088, -0.4540982246398926, -0.11326098442077637, 0.22757625579833984, 0.568413496017456, 0.9092507362365723, 1.2500879764556885, 1.5909252166748047, 1.931762456893921, 2.272599697113037, 2.6134369373321533, 2.9542741775512695, 3.2951114177703857, 3.635948657989502, 3.976785898208618, 4.317623138427734, 4.65846061706543, 4.999297618865967, 5.340134620666504, 5.680972099304199, 6.0218095779418945, 6.362646579742432, 6.703483581542969, 7.044321060180664, 7.385158538818359, 7.7259955406188965, 8.066832542419434, 8.407670021057129, 8.748507499694824, 9.089344024658203, 9.430181503295898, 9.771018981933594]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 5.0, 5.0, 3.0, 8.0, 4.0, 13.0, 16.0, 23.0, 28.0, 37.0, 64.0, 83.0, 149.0, 257.0, 437.0, 845.0, 1621.0, 3280.0, 7783.0, 19730.0, 56786.0, 190512.0, 456463.0, 211362.0, 62243.0, 21198.0, 8061.0, 3670.0, 1733.0, 897.0, 499.0, 274.0, 142.0, 103.0, 70.0, 48.0, 28.0, 24.0, 18.0, 8.0, 6.0, 3.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 5.0], "bins": [-2.62109375, -2.5493621826171875, -2.477630615234375, -2.4058990478515625, -2.33416748046875, -2.2624359130859375, -2.190704345703125, -2.1189727783203125, -2.0472412109375, -1.9755096435546875, -1.903778076171875, -1.8320465087890625, -1.76031494140625, -1.6885833740234375, -1.616851806640625, -1.5451202392578125, -1.473388671875, -1.4016571044921875, -1.329925537109375, -1.2581939697265625, -1.18646240234375, -1.1147308349609375, -1.042999267578125, -0.9712677001953125, -0.8995361328125, -0.8278045654296875, -0.756072998046875, -0.6843414306640625, -0.61260986328125, -0.5408782958984375, -0.469146728515625, -0.3974151611328125, -0.32568359375, -0.2539520263671875, -0.182220458984375, -0.1104888916015625, -0.03875732421875, 0.0329742431640625, 0.104705810546875, 0.1764373779296875, 0.2481689453125, 0.3199005126953125, 0.391632080078125, 0.4633636474609375, 0.53509521484375, 0.6068267822265625, 0.678558349609375, 0.7502899169921875, 0.822021484375, 0.8937530517578125, 0.965484619140625, 1.0372161865234375, 1.10894775390625, 1.1806793212890625, 1.252410888671875, 1.3241424560546875, 1.3958740234375, 1.4676055908203125, 1.539337158203125, 1.6110687255859375, 1.68280029296875, 1.7545318603515625, 1.826263427734375, 1.8979949951171875, 1.9697265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 7.0, 2.0, 18.0, 21.0, 14.0, 12.0, 18.0, 28.0, 26.0, 34.0, 41.0, 46.0, 44.0, 66.0, 56.0, 51.0, 48.0, 66.0, 73.0, 61.0, 34.0, 38.0, 33.0, 33.0, 28.0, 30.0, 16.0, 17.0, 11.0, 7.0, 5.0, 5.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4716796875, -1.4258575439453125, -1.380035400390625, -1.3342132568359375, -1.28839111328125, -1.2425689697265625, -1.196746826171875, -1.1509246826171875, -1.1051025390625, -1.0592803955078125, -1.013458251953125, -0.9676361083984375, -0.92181396484375, -0.8759918212890625, -0.830169677734375, -0.7843475341796875, -0.738525390625, -0.6927032470703125, -0.646881103515625, -0.6010589599609375, -0.55523681640625, -0.5094146728515625, -0.463592529296875, -0.4177703857421875, -0.3719482421875, -0.3261260986328125, -0.280303955078125, -0.2344818115234375, -0.18865966796875, -0.1428375244140625, -0.097015380859375, -0.0511932373046875, -0.00537109375, 0.0404510498046875, 0.086273193359375, 0.1320953369140625, 0.17791748046875, 0.2237396240234375, 0.269561767578125, 0.3153839111328125, 0.3612060546875, 0.4070281982421875, 0.452850341796875, 0.4986724853515625, 0.54449462890625, 0.5903167724609375, 0.636138916015625, 0.6819610595703125, 0.727783203125, 0.7736053466796875, 0.819427490234375, 0.8652496337890625, 0.91107177734375, 0.9568939208984375, 1.002716064453125, 1.0485382080078125, 1.0943603515625, 1.1401824951171875, 1.186004638671875, 1.2318267822265625, 1.27764892578125, 1.3234710693359375, 1.369293212890625, 1.4151153564453125, 1.4609375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 11.0, 13.0, 19.0, 35.0, 46.0, 69.0, 90.0, 208.0, 347.0, 648.0, 1243.0, 3400.0, 18600.0, 709519.0, 294828.0, 13907.0, 2964.0, 1170.0, 579.0, 323.0, 194.0, 116.0, 76.0, 44.0, 36.0, 15.0, 15.0, 10.0, 3.0, 6.0, 1.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.984375, -5.80267333984375, -5.6209716796875, -5.43927001953125, -5.257568359375, -5.07586669921875, -4.8941650390625, -4.71246337890625, -4.53076171875, -4.34906005859375, -4.1673583984375, -3.98565673828125, -3.803955078125, -3.62225341796875, -3.4405517578125, -3.25885009765625, -3.0771484375, -2.89544677734375, -2.7137451171875, -2.53204345703125, -2.350341796875, -2.16864013671875, -1.9869384765625, -1.80523681640625, -1.62353515625, -1.44183349609375, -1.2601318359375, -1.07843017578125, -0.896728515625, -0.71502685546875, -0.5333251953125, -0.35162353515625, -0.169921875, 0.01177978515625, 0.1934814453125, 0.37518310546875, 0.556884765625, 0.73858642578125, 0.9202880859375, 1.10198974609375, 1.28369140625, 1.46539306640625, 1.6470947265625, 1.82879638671875, 2.010498046875, 2.19219970703125, 2.3739013671875, 2.55560302734375, 2.7373046875, 2.91900634765625, 3.1007080078125, 3.28240966796875, 3.464111328125, 3.64581298828125, 3.8275146484375, 4.00921630859375, 4.19091796875, 4.37261962890625, 4.5543212890625, 4.73602294921875, 4.917724609375, 5.09942626953125, 5.2811279296875, 5.46282958984375, 5.64453125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 9.0, 8.0, 14.0, 11.0, 26.0, 24.0, 27.0, 29.0, 33.0, 42.0, 57.0, 55.0, 59.0, 56.0, 60.0, 68.0, 54.0, 58.0, 50.0, 51.0, 34.0, 30.0, 26.0, 20.0, 26.0, 9.0, 19.0, 7.0, 7.0, 7.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.77734375, -4.61505126953125, -4.4527587890625, -4.29046630859375, -4.128173828125, -3.96588134765625, -3.8035888671875, -3.64129638671875, -3.47900390625, -3.31671142578125, -3.1544189453125, -2.99212646484375, -2.829833984375, -2.66754150390625, -2.5052490234375, -2.34295654296875, -2.1806640625, -2.01837158203125, -1.8560791015625, -1.69378662109375, -1.531494140625, -1.36920166015625, -1.2069091796875, -1.04461669921875, -0.88232421875, -0.72003173828125, -0.5577392578125, -0.39544677734375, -0.233154296875, -0.07086181640625, 0.0914306640625, 0.25372314453125, 0.416015625, 0.57830810546875, 0.7406005859375, 0.90289306640625, 1.065185546875, 1.22747802734375, 1.3897705078125, 1.55206298828125, 1.71435546875, 1.87664794921875, 2.0389404296875, 2.20123291015625, 2.363525390625, 2.52581787109375, 2.6881103515625, 2.85040283203125, 3.0126953125, 3.17498779296875, 3.3372802734375, 3.49957275390625, 3.661865234375, 3.82415771484375, 3.9864501953125, 4.14874267578125, 4.31103515625, 4.47332763671875, 4.6356201171875, 4.79791259765625, 4.960205078125, 5.12249755859375, 5.2847900390625, 5.44708251953125, 5.609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 8.0, 16.0, 19.0, 24.0, 42.0, 62.0, 109.0, 211.0, 399.0, 1074.0, 3300.0, 16520.0, 761578.0, 248806.0, 11928.0, 2644.0, 921.0, 357.0, 186.0, 116.0, 67.0, 29.0, 29.0, 15.0, 24.0, 17.0, 6.0, 3.0, 5.0, 7.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.923828125, -1.865386962890625, -1.80694580078125, -1.748504638671875, -1.6900634765625, -1.631622314453125, -1.57318115234375, -1.514739990234375, -1.456298828125, -1.397857666015625, -1.33941650390625, -1.280975341796875, -1.2225341796875, -1.164093017578125, -1.10565185546875, -1.047210693359375, -0.98876953125, -0.930328369140625, -0.87188720703125, -0.813446044921875, -0.7550048828125, -0.696563720703125, -0.63812255859375, -0.579681396484375, -0.521240234375, -0.462799072265625, -0.40435791015625, -0.345916748046875, -0.2874755859375, -0.229034423828125, -0.17059326171875, -0.112152099609375, -0.0537109375, 0.004730224609375, 0.06317138671875, 0.121612548828125, 0.1800537109375, 0.238494873046875, 0.29693603515625, 0.355377197265625, 0.413818359375, 0.472259521484375, 0.53070068359375, 0.589141845703125, 0.6475830078125, 0.706024169921875, 0.76446533203125, 0.822906494140625, 0.88134765625, 0.939788818359375, 0.99822998046875, 1.056671142578125, 1.1151123046875, 1.173553466796875, 1.23199462890625, 1.290435791015625, 1.348876953125, 1.407318115234375, 1.46575927734375, 1.524200439453125, 1.5826416015625, 1.641082763671875, 1.69952392578125, 1.757965087890625, 1.81640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 5.0, 8.0, 13.0, 16.0, 28.0, 55.0, 101.0, 247.0, 256.0, 118.0, 50.0, 28.0, 17.0, 12.0, 10.0, 8.0, 5.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005054473876953125, -0.0004921481013298035, -0.00047884881496429443, -0.0004655495285987854, -0.00045225024223327637, -0.00043895095586776733, -0.0004256516695022583, -0.00041235238313674927, -0.00039905309677124023, -0.0003857538104057312, -0.00037245452404022217, -0.00035915523767471313, -0.0003458559513092041, -0.00033255666494369507, -0.00031925737857818604, -0.000305958092212677, -0.00029265880584716797, -0.00027935951948165894, -0.0002660602331161499, -0.00025276094675064087, -0.00023946166038513184, -0.0002261623740196228, -0.00021286308765411377, -0.00019956380128860474, -0.0001862645149230957, -0.00017296522855758667, -0.00015966594219207764, -0.0001463666558265686, -0.00013306736946105957, -0.00011976808309555054, -0.0001064687967300415, -9.316951036453247e-05, -7.987022399902344e-05, -6.65709376335144e-05, -5.327165126800537e-05, -3.997236490249634e-05, -2.6673078536987305e-05, -1.3373792171478271e-05, -7.450580596923828e-08, 1.3224780559539795e-05, 2.6524066925048828e-05, 3.982335329055786e-05, 5.3122639656066895e-05, 6.642192602157593e-05, 7.972121238708496e-05, 9.3020498752594e-05, 0.00010631978511810303, 0.00011961907148361206, 0.0001329183578491211, 0.00014621764421463013, 0.00015951693058013916, 0.0001728162169456482, 0.00018611550331115723, 0.00019941478967666626, 0.0002127140760421753, 0.00022601336240768433, 0.00023931264877319336, 0.0002526119351387024, 0.0002659112215042114, 0.00027921050786972046, 0.0002925097942352295, 0.0003058090806007385, 0.00031910836696624756, 0.0003324076533317566, 0.0003457069396972656]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 8.0, 9.0, 9.0, 15.0, 18.0, 11.0, 24.0, 43.0, 57.0, 67.0, 107.0, 168.0, 297.0, 428.0, 722.0, 1306.0, 2679.0, 6010.0, 17749.0, 81625.0, 706758.0, 181657.0, 31667.0, 9177.0, 3670.0, 1849.0, 932.0, 520.0, 324.0, 196.0, 135.0, 88.0, 69.0, 41.0, 27.0, 29.0, 12.0, 11.0, 12.0, 6.0, 6.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.880859375, -0.8554840087890625, -0.830108642578125, -0.8047332763671875, -0.77935791015625, -0.7539825439453125, -0.728607177734375, -0.7032318115234375, -0.6778564453125, -0.6524810791015625, -0.627105712890625, -0.6017303466796875, -0.57635498046875, -0.5509796142578125, -0.525604248046875, -0.5002288818359375, -0.474853515625, -0.4494781494140625, -0.424102783203125, -0.3987274169921875, -0.37335205078125, -0.3479766845703125, -0.322601318359375, -0.2972259521484375, -0.2718505859375, -0.2464752197265625, -0.221099853515625, -0.1957244873046875, -0.17034912109375, -0.1449737548828125, -0.119598388671875, -0.0942230224609375, -0.06884765625, -0.0434722900390625, -0.018096923828125, 0.0072784423828125, 0.03265380859375, 0.0580291748046875, 0.083404541015625, 0.1087799072265625, 0.1341552734375, 0.1595306396484375, 0.184906005859375, 0.2102813720703125, 0.23565673828125, 0.2610321044921875, 0.286407470703125, 0.3117828369140625, 0.337158203125, 0.3625335693359375, 0.387908935546875, 0.4132843017578125, 0.43865966796875, 0.4640350341796875, 0.489410400390625, 0.5147857666015625, 0.5401611328125, 0.5655364990234375, 0.590911865234375, 0.6162872314453125, 0.64166259765625, 0.6670379638671875, 0.692413330078125, 0.7177886962890625, 0.7431640625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 2.0, 7.0, 13.0, 13.0, 7.0, 14.0, 12.0, 18.0, 22.0, 29.0, 23.0, 52.0, 70.0, 58.0, 81.0, 73.0, 85.0, 70.0, 62.0, 43.0, 45.0, 36.0, 35.0, 34.0, 13.0, 10.0, 11.0, 16.0, 7.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.70654296875, -0.6836929321289062, -0.6608428955078125, -0.6379928588867188, -0.615142822265625, -0.5922927856445312, -0.5694427490234375, -0.5465927124023438, -0.52374267578125, -0.5008926391601562, -0.4780426025390625, -0.45519256591796875, -0.432342529296875, -0.40949249267578125, -0.3866424560546875, -0.36379241943359375, -0.3409423828125, -0.31809234619140625, -0.2952423095703125, -0.27239227294921875, -0.249542236328125, -0.22669219970703125, -0.2038421630859375, -0.18099212646484375, -0.15814208984375, -0.13529205322265625, -0.1124420166015625, -0.08959197998046875, -0.066741943359375, -0.04389190673828125, -0.0210418701171875, 0.00180816650390625, 0.024658203125, 0.04750823974609375, 0.0703582763671875, 0.09320831298828125, 0.116058349609375, 0.13890838623046875, 0.1617584228515625, 0.18460845947265625, 0.20745849609375, 0.23030853271484375, 0.2531585693359375, 0.27600860595703125, 0.298858642578125, 0.32170867919921875, 0.3445587158203125, 0.36740875244140625, 0.3902587890625, 0.41310882568359375, 0.4359588623046875, 0.45880889892578125, 0.481658935546875, 0.5045089721679688, 0.5273590087890625, 0.5502090454101562, 0.57305908203125, 0.5959091186523438, 0.6187591552734375, 0.6416091918945312, 0.664459228515625, 0.6873092651367188, 0.7101593017578125, 0.7330093383789062, 0.755859375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 23.0, 40.0, 82.0, 363.0, 300.0, 99.0, 47.0, 19.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.59895324707031, -41.30607604980469, -40.01319885253906, -38.72032165527344, -37.42744064331055, -36.13456344604492, -34.8416862487793, -33.54880905151367, -32.25593185424805, -30.963054656982422, -29.670175552368164, -28.37729835510254, -27.084421157836914, -25.791542053222656, -24.49866485595703, -23.205787658691406, -21.91290855407715, -20.620031356811523, -19.327152252197266, -18.03427505493164, -16.741397857666016, -15.448519706726074, -14.155641555786133, -12.862764358520508, -11.569886207580566, -10.277008056640625, -8.984130859375, -7.691252708435059, -6.398375034332275, -5.105497360229492, -3.812619209289551, -2.519742012023926, -1.2268638610839844, 0.06601393222808838, 1.3588917255401611, 2.6517696380615234, 3.9446473121643066, 5.23752498626709, 6.530403137207031, 7.823280334472656, 9.116158485412598, 10.409036636352539, 11.701913833618164, 12.994791984558105, 14.287670135498047, 15.580547332763672, 16.873424530029297, 18.166301727294922, 19.45918083190918, 20.752058029174805, 22.044937133789062, 23.337814331054688, 24.630691528320312, 25.923568725585938, 27.216447830200195, 28.50932502746582, 29.802204132080078, 31.095081329345703, 32.38795852661133, 33.68083953857422, 34.973716735839844, 36.26659393310547, 37.559471130371094, 38.85234832763672, 40.145225524902344]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 6.0, 12.0, 18.0, 21.0, 24.0, 24.0, 22.0, 17.0, 40.0, 36.0, 41.0, 46.0, 97.0, 169.0, 91.0, 42.0, 40.0, 24.0, 31.0, 30.0, 26.0, 25.0, 23.0, 15.0, 17.0, 8.0, 12.0, 7.0, 10.0, 8.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.061260223388672, -17.449214935302734, -16.83717155456543, -16.225128173828125, -15.613082885742188, -15.001038551330566, -14.388994216918945, -13.776949882507324, -13.164905548095703, -12.552861213684082, -11.940816879272461, -11.32877254486084, -10.716728210449219, -10.104683876037598, -9.492639541625977, -8.880595207214355, -8.268550872802734, -7.656506538391113, -7.044462203979492, -6.432417869567871, -5.82037353515625, -5.208329200744629, -4.596284866333008, -3.9842405319213867, -3.3721961975097656, -2.7601518630981445, -2.1481075286865234, -1.5360631942749023, -0.9240188598632812, -0.31197452545166016, 0.30006980895996094, 0.912114143371582, 1.5241584777832031, 2.136202812194824, 2.7482471466064453, 3.3602914810180664, 3.9723358154296875, 4.584380149841309, 5.19642448425293, 5.808468818664551, 6.420513153076172, 7.032557487487793, 7.644601821899414, 8.256646156311035, 8.868690490722656, 9.480734825134277, 10.092779159545898, 10.70482349395752, 11.31686782836914, 11.928912162780762, 12.540956497192383, 13.153000831604004, 13.765045166015625, 14.377089500427246, 14.989133834838867, 15.601178169250488, 16.21322250366211, 16.825267791748047, 17.43731117248535, 18.049354553222656, 18.661399841308594, 19.27344512939453, 19.885488510131836, 20.49753189086914, 21.109577178955078]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 3.0, 6.0, 10.0, 18.0, 20.0, 30.0, 45.0, 100.0, 178.0, 434.0, 982.0, 2533.0, 7857.0, 38020.0, 591365.0, 3014207.0, 494369.0, 33421.0, 6629.0, 2222.0, 893.0, 437.0, 178.0, 122.0, 74.0, 42.0, 23.0, 18.0, 14.0, 8.0, 8.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.373046875, -2.267425537109375, -2.16180419921875, -2.056182861328125, -1.9505615234375, -1.844940185546875, -1.73931884765625, -1.633697509765625, -1.528076171875, -1.422454833984375, -1.31683349609375, -1.211212158203125, -1.1055908203125, -0.999969482421875, -0.89434814453125, -0.788726806640625, -0.68310546875, -0.577484130859375, -0.47186279296875, -0.366241455078125, -0.2606201171875, -0.154998779296875, -0.04937744140625, 0.056243896484375, 0.161865234375, 0.267486572265625, 0.37310791015625, 0.478729248046875, 0.5843505859375, 0.689971923828125, 0.79559326171875, 0.901214599609375, 1.0068359375, 1.112457275390625, 1.21807861328125, 1.323699951171875, 1.4293212890625, 1.534942626953125, 1.64056396484375, 1.746185302734375, 1.851806640625, 1.957427978515625, 2.06304931640625, 2.168670654296875, 2.2742919921875, 2.379913330078125, 2.48553466796875, 2.591156005859375, 2.69677734375, 2.802398681640625, 2.90802001953125, 3.013641357421875, 3.1192626953125, 3.224884033203125, 3.33050537109375, 3.436126708984375, 3.541748046875, 3.647369384765625, 3.75299072265625, 3.858612060546875, 3.9642333984375, 4.069854736328125, 4.17547607421875, 4.281097412109375, 4.38671875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 4.0, 9.0, 12.0, 13.0, 13.0, 14.0, 13.0, 22.0, 18.0, 26.0, 21.0, 37.0, 38.0, 43.0, 48.0, 42.0, 31.0, 52.0, 38.0, 56.0, 55.0, 47.0, 44.0, 50.0, 50.0, 20.0, 31.0, 25.0, 15.0, 26.0, 13.0, 18.0, 12.0, 5.0, 6.0, 12.0, 4.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0869140625, -1.0500335693359375, -1.013153076171875, -0.9762725830078125, -0.93939208984375, -0.9025115966796875, -0.865631103515625, -0.8287506103515625, -0.7918701171875, -0.7549896240234375, -0.718109130859375, -0.6812286376953125, -0.64434814453125, -0.6074676513671875, -0.570587158203125, -0.5337066650390625, -0.496826171875, -0.4599456787109375, -0.423065185546875, -0.3861846923828125, -0.34930419921875, -0.3124237060546875, -0.275543212890625, -0.2386627197265625, -0.2017822265625, -0.1649017333984375, -0.128021240234375, -0.0911407470703125, -0.05426025390625, -0.0173797607421875, 0.019500732421875, 0.0563812255859375, 0.09326171875, 0.1301422119140625, 0.167022705078125, 0.2039031982421875, 0.24078369140625, 0.2776641845703125, 0.314544677734375, 0.3514251708984375, 0.3883056640625, 0.4251861572265625, 0.462066650390625, 0.4989471435546875, 0.53582763671875, 0.5727081298828125, 0.609588623046875, 0.6464691162109375, 0.683349609375, 0.7202301025390625, 0.757110595703125, 0.7939910888671875, 0.83087158203125, 0.8677520751953125, 0.904632568359375, 0.9415130615234375, 0.9783935546875, 1.0152740478515625, 1.052154541015625, 1.0890350341796875, 1.12591552734375, 1.1627960205078125, 1.199676513671875, 1.2365570068359375, 1.2734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 10.0, 9.0, 6.0, 17.0, 27.0, 37.0, 93.0, 177.0, 287.0, 637.0, 1329.0, 4083.0, 31617.0, 3982947.0, 162869.0, 6607.0, 1943.0, 738.0, 410.0, 164.0, 106.0, 65.0, 38.0, 20.0, 8.0, 11.0, 3.0, 5.0, 1.0, 3.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.9453125, -6.703125, -6.4609375, -6.21875, -5.9765625, -5.734375, -5.4921875, -5.25, -5.0078125, -4.765625, -4.5234375, -4.28125, -4.0390625, -3.796875, -3.5546875, -3.3125, -3.0703125, -2.828125, -2.5859375, -2.34375, -2.1015625, -1.859375, -1.6171875, -1.375, -1.1328125, -0.890625, -0.6484375, -0.40625, -0.1640625, 0.078125, 0.3203125, 0.5625, 0.8046875, 1.046875, 1.2890625, 1.53125, 1.7734375, 2.015625, 2.2578125, 2.5, 2.7421875, 2.984375, 3.2265625, 3.46875, 3.7109375, 3.953125, 4.1953125, 4.4375, 4.6796875, 4.921875, 5.1640625, 5.40625, 5.6484375, 5.890625, 6.1328125, 6.375, 6.6171875, 6.859375, 7.1015625, 7.34375, 7.5859375, 7.828125, 8.0703125, 8.3125, 8.5546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 9.0, 15.0, 22.0, 37.0, 65.0, 83.0, 151.0, 276.0, 419.0, 623.0, 808.0, 640.0, 393.0, 213.0, 127.0, 75.0, 50.0, 29.0, 9.0, 12.0, 9.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.01953125, -6.8575439453125, -6.695556640625, -6.5335693359375, -6.37158203125, -6.2095947265625, -6.047607421875, -5.8856201171875, -5.7236328125, -5.5616455078125, -5.399658203125, -5.2376708984375, -5.07568359375, -4.9136962890625, -4.751708984375, -4.5897216796875, -4.427734375, -4.2657470703125, -4.103759765625, -3.9417724609375, -3.77978515625, -3.6177978515625, -3.455810546875, -3.2938232421875, -3.1318359375, -2.9698486328125, -2.807861328125, -2.6458740234375, -2.48388671875, -2.3218994140625, -2.159912109375, -1.9979248046875, -1.8359375, -1.6739501953125, -1.511962890625, -1.3499755859375, -1.18798828125, -1.0260009765625, -0.864013671875, -0.7020263671875, -0.5400390625, -0.3780517578125, -0.216064453125, -0.0540771484375, 0.10791015625, 0.2698974609375, 0.431884765625, 0.5938720703125, 0.755859375, 0.9178466796875, 1.079833984375, 1.2418212890625, 1.40380859375, 1.5657958984375, 1.727783203125, 1.8897705078125, 2.0517578125, 2.2137451171875, 2.375732421875, 2.5377197265625, 2.69970703125, 2.8616943359375, 3.023681640625, 3.1856689453125, 3.34765625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 4.0, 7.0, 17.0, 26.0, 64.0, 139.0, 201.0, 228.0, 141.0, 72.0, 37.0, 20.0, 9.0, 11.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.42120361328125, -53.84810256958008, -52.275001525878906, -50.70189666748047, -49.1287956237793, -47.555694580078125, -45.98258972167969, -44.409488677978516, -42.836387634277344, -41.26328659057617, -39.690185546875, -38.11708068847656, -36.54397964477539, -34.97087860107422, -33.39777374267578, -31.82467269897461, -30.251571655273438, -28.678470611572266, -27.10536766052246, -25.532264709472656, -23.959163665771484, -22.386062622070312, -20.812959671020508, -19.239856719970703, -17.66675567626953, -16.09365463256836, -14.520551681518555, -12.947449684143066, -11.374347686767578, -9.80124568939209, -8.228143692016602, -6.655041694641113, -5.081939697265625, -3.5088376998901367, -1.9357357025146484, -0.36263370513916016, 1.2104682922363281, 2.7835702896118164, 4.356672286987305, 5.929774284362793, 7.502876281738281, 9.07597827911377, 10.649080276489258, 12.222182273864746, 13.795284271240234, 15.368386268615723, 16.94148826599121, 18.514591217041016, 20.087692260742188, 21.66079330444336, 23.233896255493164, 24.80699920654297, 26.38010025024414, 27.953201293945312, 29.526304244995117, 31.099407196044922, 32.672508239746094, 34.245609283447266, 35.81871032714844, 37.391815185546875, 38.96491622924805, 40.53801727294922, 42.111122131347656, 43.68422317504883, 45.25732421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 4.0, 4.0, 9.0, 10.0, 17.0, 17.0, 19.0, 31.0, 22.0, 41.0, 45.0, 50.0, 50.0, 50.0, 66.0, 67.0, 78.0, 50.0, 59.0, 41.0, 50.0, 39.0, 35.0, 30.0, 14.0, 16.0, 9.0, 15.0, 15.0, 11.0, 12.0, 6.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.485164642333984, -23.771251678466797, -23.057340621948242, -22.343427658081055, -21.6295166015625, -20.915603637695312, -20.201690673828125, -19.48777961730957, -18.773866653442383, -18.059953689575195, -17.34604263305664, -16.632129669189453, -15.918217658996582, -15.204305648803711, -14.49039363861084, -13.776481628417969, -13.062569618225098, -12.348657608032227, -11.634745597839355, -10.920833587646484, -10.206920623779297, -9.493008613586426, -8.779096603393555, -8.065183639526367, -7.351272106170654, -6.637360095977783, -5.923447608947754, -5.209535598754883, -4.495623588562012, -3.7817111015319824, -3.0677990913391113, -2.353886604309082, -1.639974594116211, -0.9260624051094055, -0.2121502161026001, 0.5017619132995605, 1.2156741619110107, 1.929586410522461, 2.643498420715332, 3.3574109077453613, 4.071322917938232, 4.7852349281311035, 5.499147415161133, 6.213059425354004, 6.926971435546875, 7.640883922576904, 8.354795455932617, 9.068708419799805, 9.782620429992676, 10.496532440185547, 11.210444450378418, 11.924356460571289, 12.638269424438477, 13.352181434631348, 14.066093444824219, 14.780006408691406, 15.493917465209961, 16.20783042907715, 16.921741485595703, 17.63565444946289, 18.349565505981445, 19.063478469848633, 19.777389526367188, 20.491302490234375, 21.205215454101562]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 3.0, 6.0, 8.0, 15.0, 26.0, 38.0, 51.0, 68.0, 117.0, 189.0, 358.0, 659.0, 1228.0, 2631.0, 5579.0, 13876.0, 41348.0, 174992.0, 626497.0, 127297.0, 32560.0, 11362.0, 4927.0, 2231.0, 1153.0, 569.0, 306.0, 151.0, 120.0, 63.0, 36.0, 31.0, 22.0, 11.0, 7.0, 5.0, 7.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8310546875, -1.7665863037109375, -1.702117919921875, -1.6376495361328125, -1.57318115234375, -1.5087127685546875, -1.444244384765625, -1.3797760009765625, -1.3153076171875, -1.2508392333984375, -1.186370849609375, -1.1219024658203125, -1.05743408203125, -0.9929656982421875, -0.928497314453125, -0.8640289306640625, -0.799560546875, -0.7350921630859375, -0.670623779296875, -0.6061553955078125, -0.54168701171875, -0.4772186279296875, -0.412750244140625, -0.3482818603515625, -0.2838134765625, -0.2193450927734375, -0.154876708984375, -0.0904083251953125, -0.02593994140625, 0.0385284423828125, 0.102996826171875, 0.1674652099609375, 0.23193359375, 0.2964019775390625, 0.360870361328125, 0.4253387451171875, 0.48980712890625, 0.5542755126953125, 0.618743896484375, 0.6832122802734375, 0.7476806640625, 0.8121490478515625, 0.876617431640625, 0.9410858154296875, 1.00555419921875, 1.0700225830078125, 1.134490966796875, 1.1989593505859375, 1.263427734375, 1.3278961181640625, 1.392364501953125, 1.4568328857421875, 1.52130126953125, 1.5857696533203125, 1.650238037109375, 1.7147064208984375, 1.7791748046875, 1.8436431884765625, 1.908111572265625, 1.9725799560546875, 2.03704833984375, 2.1015167236328125, 2.165985107421875, 2.2304534912109375, 2.294921875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 7.0, 7.0, 9.0, 8.0, 19.0, 12.0, 12.0, 25.0, 23.0, 22.0, 34.0, 40.0, 44.0, 41.0, 35.0, 45.0, 46.0, 41.0, 56.0, 58.0, 28.0, 47.0, 42.0, 47.0, 38.0, 25.0, 24.0, 26.0, 24.0, 27.0, 14.0, 9.0, 7.0, 7.0, 14.0, 7.0, 3.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2412109375, -1.2014617919921875, -1.161712646484375, -1.1219635009765625, -1.08221435546875, -1.0424652099609375, -1.002716064453125, -0.9629669189453125, -0.9232177734375, -0.8834686279296875, -0.843719482421875, -0.8039703369140625, -0.76422119140625, -0.7244720458984375, -0.684722900390625, -0.6449737548828125, -0.605224609375, -0.5654754638671875, -0.525726318359375, -0.4859771728515625, -0.44622802734375, -0.4064788818359375, -0.366729736328125, -0.3269805908203125, -0.2872314453125, -0.2474822998046875, -0.207733154296875, -0.1679840087890625, -0.12823486328125, -0.0884857177734375, -0.048736572265625, -0.0089874267578125, 0.03076171875, 0.0705108642578125, 0.110260009765625, 0.1500091552734375, 0.18975830078125, 0.2295074462890625, 0.269256591796875, 0.3090057373046875, 0.3487548828125, 0.3885040283203125, 0.428253173828125, 0.4680023193359375, 0.50775146484375, 0.5475006103515625, 0.587249755859375, 0.6269989013671875, 0.666748046875, 0.7064971923828125, 0.746246337890625, 0.7859954833984375, 0.82574462890625, 0.8654937744140625, 0.905242919921875, 0.9449920654296875, 0.9847412109375, 1.0244903564453125, 1.064239501953125, 1.1039886474609375, 1.14373779296875, 1.1834869384765625, 1.223236083984375, 1.2629852294921875, 1.302734375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 6.0, 8.0, 6.0, 4.0, 8.0, 21.0, 28.0, 38.0, 46.0, 65.0, 90.0, 148.0, 214.0, 338.0, 574.0, 1245.0, 3533.0, 17864.0, 224574.0, 769113.0, 23304.0, 4256.0, 1345.0, 615.0, 351.0, 219.0, 153.0, 108.0, 58.0, 53.0, 44.0, 31.0, 25.0, 22.0, 12.0, 11.0, 8.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.478515625, -2.39019775390625, -2.3018798828125, -2.21356201171875, -2.125244140625, -2.03692626953125, -1.9486083984375, -1.86029052734375, -1.77197265625, -1.68365478515625, -1.5953369140625, -1.50701904296875, -1.418701171875, -1.33038330078125, -1.2420654296875, -1.15374755859375, -1.0654296875, -0.97711181640625, -0.8887939453125, -0.80047607421875, -0.712158203125, -0.62384033203125, -0.5355224609375, -0.44720458984375, -0.35888671875, -0.27056884765625, -0.1822509765625, -0.09393310546875, -0.005615234375, 0.08270263671875, 0.1710205078125, 0.25933837890625, 0.34765625, 0.43597412109375, 0.5242919921875, 0.61260986328125, 0.700927734375, 0.78924560546875, 0.8775634765625, 0.96588134765625, 1.05419921875, 1.14251708984375, 1.2308349609375, 1.31915283203125, 1.407470703125, 1.49578857421875, 1.5841064453125, 1.67242431640625, 1.7607421875, 1.84906005859375, 1.9373779296875, 2.02569580078125, 2.114013671875, 2.20233154296875, 2.2906494140625, 2.37896728515625, 2.46728515625, 2.55560302734375, 2.6439208984375, 2.73223876953125, 2.820556640625, 2.90887451171875, 2.9971923828125, 3.08551025390625, 3.173828125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 9.0, 6.0, 7.0, 16.0, 23.0, 21.0, 24.0, 26.0, 20.0, 27.0, 34.0, 57.0, 52.0, 67.0, 83.0, 86.0, 77.0, 50.0, 58.0, 31.0, 36.0, 28.0, 20.0, 19.0, 16.0, 15.0, 17.0, 13.0, 11.0, 5.0, 9.0, 2.0, 4.0, 3.0, 3.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.8099365234375, -4.655029296875, -4.5001220703125, -4.34521484375, -4.1903076171875, -4.035400390625, -3.8804931640625, -3.7255859375, -3.5706787109375, -3.415771484375, -3.2608642578125, -3.10595703125, -2.9510498046875, -2.796142578125, -2.6412353515625, -2.486328125, -2.3314208984375, -2.176513671875, -2.0216064453125, -1.86669921875, -1.7117919921875, -1.556884765625, -1.4019775390625, -1.2470703125, -1.0921630859375, -0.937255859375, -0.7823486328125, -0.62744140625, -0.4725341796875, -0.317626953125, -0.1627197265625, -0.0078125, 0.1470947265625, 0.302001953125, 0.4569091796875, 0.61181640625, 0.7667236328125, 0.921630859375, 1.0765380859375, 1.2314453125, 1.3863525390625, 1.541259765625, 1.6961669921875, 1.85107421875, 2.0059814453125, 2.160888671875, 2.3157958984375, 2.470703125, 2.6256103515625, 2.780517578125, 2.9354248046875, 3.09033203125, 3.2452392578125, 3.400146484375, 3.5550537109375, 3.7099609375, 3.8648681640625, 4.019775390625, 4.1746826171875, 4.32958984375, 4.4844970703125, 4.639404296875, 4.7943115234375, 4.94921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 1.0, 3.0, 6.0, 6.0, 24.0, 18.0, 36.0, 26.0, 41.0, 66.0, 97.0, 160.0, 288.0, 513.0, 1237.0, 3191.0, 11662.0, 69201.0, 881493.0, 63810.0, 11128.0, 3097.0, 1153.0, 532.0, 283.0, 148.0, 109.0, 67.0, 46.0, 31.0, 21.0, 22.0, 10.0, 8.0, 4.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.481689453125, -0.4663887023925781, -0.45108795166015625, -0.4357872009277344, -0.4204864501953125, -0.4051856994628906, -0.38988494873046875, -0.3745841979980469, -0.359283447265625, -0.3439826965332031, -0.32868194580078125, -0.3133811950683594, -0.2980804443359375, -0.2827796936035156, -0.26747894287109375, -0.2521781921386719, -0.23687744140625, -0.22157669067382812, -0.20627593994140625, -0.19097518920898438, -0.1756744384765625, -0.16037368774414062, -0.14507293701171875, -0.12977218627929688, -0.114471435546875, -0.09917068481445312, -0.08386993408203125, -0.06856918334960938, -0.0532684326171875, -0.037967681884765625, -0.02266693115234375, -0.007366180419921875, 0.0079345703125, 0.023235321044921875, 0.03853607177734375, 0.053836822509765625, 0.0691375732421875, 0.08443832397460938, 0.09973907470703125, 0.11503982543945312, 0.130340576171875, 0.14564132690429688, 0.16094207763671875, 0.17624282836914062, 0.1915435791015625, 0.20684432983398438, 0.22214508056640625, 0.23744583129882812, 0.25274658203125, 0.2680473327636719, 0.28334808349609375, 0.2986488342285156, 0.3139495849609375, 0.3292503356933594, 0.34455108642578125, 0.3598518371582031, 0.375152587890625, 0.3904533386230469, 0.40575408935546875, 0.4210548400878906, 0.4363555908203125, 0.4516563415527344, 0.46695709228515625, 0.4822578430175781, 0.49755859375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 0.0, 5.0, 7.0, 7.0, 11.0, 6.0, 10.0, 11.0, 20.0, 27.0, 32.0, 41.0, 46.0, 74.0, 92.0, 129.0, 130.0, 98.0, 63.0, 59.0, 35.0, 23.0, 17.0, 11.0, 14.0, 9.0, 7.0, 13.0, 3.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011265277862548828, -0.00010940246284008026, -0.00010615214705467224, -0.00010290183126926422, -9.96515154838562e-05, -9.640119969844818e-05, -9.315088391304016e-05, -8.990056812763214e-05, -8.665025234222412e-05, -8.33999365568161e-05, -8.014962077140808e-05, -7.689930498600006e-05, -7.364898920059204e-05, -7.039867341518402e-05, -6.7148357629776e-05, -6.389804184436798e-05, -6.064772605895996e-05, -5.739741027355194e-05, -5.414709448814392e-05, -5.08967787027359e-05, -4.764646291732788e-05, -4.439614713191986e-05, -4.114583134651184e-05, -3.789551556110382e-05, -3.46451997756958e-05, -3.139488399028778e-05, -2.814456820487976e-05, -2.489425241947174e-05, -2.164393663406372e-05, -1.83936208486557e-05, -1.514330506324768e-05, -1.189298927783966e-05, -8.64267349243164e-06, -5.392357707023621e-06, -2.1420419216156006e-06, 1.1082738637924194e-06, 4.3585896492004395e-06, 7.6089054346084595e-06, 1.085922122001648e-05, 1.41095370054245e-05, 1.735985279083252e-05, 2.061016857624054e-05, 2.386048436164856e-05, 2.711080014705658e-05, 3.03611159324646e-05, 3.361143171787262e-05, 3.686174750328064e-05, 4.011206328868866e-05, 4.336237907409668e-05, 4.66126948595047e-05, 4.986301064491272e-05, 5.311332643032074e-05, 5.636364221572876e-05, 5.961395800113678e-05, 6.28642737865448e-05, 6.611458957195282e-05, 6.936490535736084e-05, 7.261522114276886e-05, 7.586553692817688e-05, 7.91158527135849e-05, 8.236616849899292e-05, 8.561648428440094e-05, 8.886680006980896e-05, 9.211711585521698e-05, 9.5367431640625e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 4.0, 7.0, 10.0, 18.0, 26.0, 20.0, 32.0, 48.0, 69.0, 94.0, 145.0, 204.0, 335.0, 546.0, 878.0, 1502.0, 2747.0, 5635.0, 12727.0, 32844.0, 121252.0, 743791.0, 80071.0, 25066.0, 10053.0, 4592.0, 2325.0, 1318.0, 765.0, 451.0, 313.0, 211.0, 136.0, 86.0, 55.0, 49.0, 46.0, 25.0, 14.0, 9.0, 9.0, 4.0, 5.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.293212890625, -0.28492164611816406, -0.2766304016113281, -0.2683391571044922, -0.26004791259765625, -0.2517566680908203, -0.24346542358398438, -0.23517417907714844, -0.2268829345703125, -0.21859169006347656, -0.21030044555664062, -0.2020092010498047, -0.19371795654296875, -0.1854267120361328, -0.17713546752929688, -0.16884422302246094, -0.160552978515625, -0.15226173400878906, -0.14397048950195312, -0.1356792449951172, -0.12738800048828125, -0.11909675598144531, -0.11080551147460938, -0.10251426696777344, -0.0942230224609375, -0.08593177795410156, -0.07764053344726562, -0.06934928894042969, -0.06105804443359375, -0.05276679992675781, -0.044475555419921875, -0.03618431091308594, -0.02789306640625, -0.019601821899414062, -0.011310577392578125, -0.0030193328857421875, 0.00527191162109375, 0.013563156127929688, 0.021854400634765625, 0.030145645141601562, 0.0384368896484375, 0.04672813415527344, 0.055019378662109375, 0.06331062316894531, 0.07160186767578125, 0.07989311218261719, 0.08818435668945312, 0.09647560119628906, 0.104766845703125, 0.11305809020996094, 0.12134933471679688, 0.1296405792236328, 0.13793182373046875, 0.1462230682373047, 0.15451431274414062, 0.16280555725097656, 0.1710968017578125, 0.17938804626464844, 0.18767929077148438, 0.1959705352783203, 0.20426177978515625, 0.2125530242919922, 0.22084426879882812, 0.22913551330566406, 0.2374267578125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 4.0, 6.0, 11.0, 7.0, 10.0, 12.0, 13.0, 12.0, 21.0, 25.0, 30.0, 33.0, 61.0, 101.0, 101.0, 110.0, 106.0, 98.0, 57.0, 35.0, 30.0, 18.0, 17.0, 17.0, 13.0, 12.0, 5.0, 5.0, 3.0, 7.0, 7.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.478271484375, -0.46384429931640625, -0.4494171142578125, -0.43498992919921875, -0.420562744140625, -0.40613555908203125, -0.3917083740234375, -0.37728118896484375, -0.36285400390625, -0.34842681884765625, -0.3339996337890625, -0.31957244873046875, -0.305145263671875, -0.29071807861328125, -0.2762908935546875, -0.26186370849609375, -0.2474365234375, -0.23300933837890625, -0.2185821533203125, -0.20415496826171875, -0.189727783203125, -0.17530059814453125, -0.1608734130859375, -0.14644622802734375, -0.13201904296875, -0.11759185791015625, -0.1031646728515625, -0.08873748779296875, -0.074310302734375, -0.05988311767578125, -0.0454559326171875, -0.03102874755859375, -0.0166015625, -0.00217437744140625, 0.0122528076171875, 0.02667999267578125, 0.041107177734375, 0.05553436279296875, 0.0699615478515625, 0.08438873291015625, 0.09881591796875, 0.11324310302734375, 0.1276702880859375, 0.14209747314453125, 0.156524658203125, 0.17095184326171875, 0.1853790283203125, 0.19980621337890625, 0.2142333984375, 0.22866058349609375, 0.2430877685546875, 0.25751495361328125, 0.271942138671875, 0.28636932373046875, 0.3007965087890625, 0.31522369384765625, 0.32965087890625, 0.34407806396484375, 0.3585052490234375, 0.37293243408203125, 0.387359619140625, 0.40178680419921875, 0.4162139892578125, 0.43064117431640625, 0.445068359375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 10.0, 5.0, 17.0, 12.0, 33.0, 74.0, 170.0, 493.0, 101.0, 43.0, 30.0, 11.0, 5.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.719642639160156, -22.934696197509766, -22.149751663208008, -21.364805221557617, -20.579858779907227, -19.79491424560547, -19.009967803955078, -18.225021362304688, -17.440074920654297, -16.655128479003906, -15.870182991027832, -15.085237503051758, -14.300291061401367, -13.515345573425293, -12.730400085449219, -11.945453643798828, -11.16050910949707, -10.375563621520996, -9.590617179870605, -8.805671691894531, -8.02072525024414, -7.235779762268066, -6.450834274291992, -5.66588830947876, -4.880942344665527, -4.095996379852295, -3.3110506534576416, -2.5261049270629883, -1.7411589622497559, -0.9562129974365234, -0.17126750946044922, 0.6136784553527832, 1.3986244201660156, 2.183570384979248, 2.9685161113739014, 3.7534618377685547, 4.538407802581787, 5.3233537673950195, 6.108299255371094, 6.893245220184326, 7.678191184997559, 8.463136672973633, 9.248083114624023, 10.033028602600098, 10.817974090576172, 11.602920532226562, 12.387866020202637, 13.172811508178711, 13.957757949829102, 14.742703437805176, 15.527649879455566, 16.31259536743164, 17.09754180908203, 17.882488250732422, 18.66743278503418, 19.45237922668457, 20.237323760986328, 21.02227020263672, 21.807214736938477, 22.592161178588867, 23.377107620239258, 24.162052154541016, 24.946998596191406, 25.731945037841797, 26.516891479492188]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 3.0, 7.0, 7.0, 12.0, 9.0, 12.0, 14.0, 12.0, 10.0, 23.0, 21.0, 19.0, 18.0, 27.0, 36.0, 104.0, 216.0, 169.0, 42.0, 25.0, 23.0, 25.0, 27.0, 17.0, 22.0, 16.0, 7.0, 10.0, 13.0, 9.0, 5.0, 1.0, 5.0, 5.0, 6.0, 1.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.317230224609375, -12.882458686828613, -12.447688102722168, -12.012916564941406, -11.578145027160645, -11.143373489379883, -10.708602905273438, -10.273831367492676, -9.839059829711914, -9.404288291931152, -8.969517707824707, -8.534746170043945, -8.099974632263184, -7.66520357131958, -7.230432510375977, -6.795660972595215, -6.3608903884887695, -5.926119327545166, -5.491347789764404, -5.056576728820801, -4.621805191040039, -4.1870341300964355, -3.752263069152832, -3.3174917697906494, -2.882720470428467, -2.447949171066284, -2.0131778717041016, -1.578406810760498, -1.1436355113983154, -0.7088642120361328, -0.2740931510925293, 0.16067814826965332, 0.5954494476318359, 1.0302207469940186, 1.4649919271469116, 1.8997631072998047, 2.3345344066619873, 2.76930570602417, 3.2040767669677734, 3.638848066329956, 4.073619365692139, 4.508390426635742, 4.943161964416504, 5.377933025360107, 5.812704086303711, 6.247475624084473, 6.682246685028076, 7.11701774597168, 7.551789283752441, 7.986560344696045, 8.421331405639648, 8.85610294342041, 9.290874481201172, 9.725645065307617, 10.160416603088379, 10.59518814086914, 11.029958724975586, 11.464730262756348, 11.899500846862793, 12.334272384643555, 12.769043922424316, 13.203815460205078, 13.638586044311523, 14.073357582092285, 14.508129119873047]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 10.0, 14.0, 32.0, 37.0, 43.0, 53.0, 75.0, 348.0, 167.0, 69.0, 39.0, 32.0, 32.0, 19.0, 10.0, 8.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.04296875, -3.9526824951171875, -3.862396240234375, -3.7721099853515625, -3.68182373046875, -3.5915374755859375, -3.501251220703125, -3.4109649658203125, -3.3206787109375, -3.2303924560546875, -3.140106201171875, -3.0498199462890625, -2.95953369140625, -2.8692474365234375, -2.778961181640625, -2.6886749267578125, -2.598388671875, -2.5081024169921875, -2.417816162109375, -2.3275299072265625, -2.23724365234375, -2.1469573974609375, -2.056671142578125, -1.9663848876953125, -1.8760986328125, -1.7858123779296875, -1.695526123046875, -1.6052398681640625, -1.51495361328125, -1.4246673583984375, -1.334381103515625, -1.2440948486328125, -1.15380859375, -1.0635223388671875, -0.973236083984375, -0.8829498291015625, -0.79266357421875, -0.7023773193359375, -0.612091064453125, -0.5218048095703125, -0.4315185546875, -0.3412322998046875, -0.250946044921875, -0.1606597900390625, -0.07037353515625, 0.0199127197265625, 0.110198974609375, 0.2004852294921875, 0.290771484375, 0.3810577392578125, 0.471343994140625, 0.5616302490234375, 0.65191650390625, 0.7422027587890625, 0.832489013671875, 0.9227752685546875, 1.0130615234375, 1.1033477783203125, 1.193634033203125, 1.2839202880859375, 1.37420654296875, 1.4644927978515625, 1.554779052734375, 1.6450653076171875, 1.7353515625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 10.0, 21.0, 24.0, 36.0, 52.0, 112.0, 348.0, 1816.0, 8324823.0, 59453.0, 1356.0, 249.0, 121.0, 58.0, 27.0, 23.0, 10.0, 12.0, 6.0, 0.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.916542053222656, -28.882083892822266, -27.847623825073242, -26.81316566467285, -25.778705596923828, -24.744247436523438, -23.709789276123047, -22.675331115722656, -21.640871047973633, -20.606412887573242, -19.57195281982422, -18.537494659423828, -17.503036499023438, -16.468576431274414, -15.434118270874023, -14.399659156799316, -13.36520004272461, -12.330740928649902, -11.296281814575195, -10.261823654174805, -9.227364540100098, -8.19290542602539, -7.158446788787842, -6.123988151550293, -5.089529037475586, -4.055069923400879, -3.02061128616333, -1.9861524105072021, -0.9516935348510742, 0.08276557922363281, 1.1172242164611816, 2.1516828536987305, 3.186138153076172, 4.220597267150879, 5.255055904388428, 6.289514541625977, 7.323973655700684, 8.35843276977539, 9.392890930175781, 10.427350044250488, 11.461809158325195, 12.496268272399902, 13.53072738647461, 14.565185546875, 15.599644660949707, 16.634103775024414, 17.668561935424805, 18.703022003173828, 19.73748016357422, 20.77193832397461, 21.806398391723633, 22.840856552124023, 23.875316619873047, 24.909774780273438, 25.944232940673828, 26.97869110107422, 28.013151168823242, 29.047609329223633, 30.082069396972656, 31.116527557373047, 32.15098571777344, 33.185447692871094, 34.219905853271484, 35.254364013671875, 36.288822174072266]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 7.0, 4.0, 4.0, 4.0, 5.0, 5.0, 5.0, 4.0, 3.0, 8.0, 4.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 6.0, 1.0, 0.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.23875045776367, -33.82707595825195, -32.415401458740234, -31.003725051879883, -29.592050552368164, -28.180374145507812, -26.768699645996094, -25.357025146484375, -23.945350646972656, -22.533676147460938, -21.121999740600586, -19.710325241088867, -18.29865074157715, -16.886974334716797, -15.475299835205078, -14.06362533569336, -12.651948928833008, -11.240273475646973, -9.828598976135254, -8.416923522949219, -7.005248546600342, -5.593573570251465, -4.18189811706543, -2.770223617553711, -1.3585481643676758, 0.05312693119049072, 1.4648020267486572, 2.8764772415161133, 4.28815221786499, 5.699827194213867, 7.111502647399902, 8.523177146911621, 9.934852600097656, 11.346528053283691, 12.75820255279541, 14.169878005981445, 15.581552505493164, 16.993228912353516, 18.404903411865234, 19.816577911376953, 21.228252410888672, 22.63992691040039, 24.051603317260742, 25.46327781677246, 26.87495231628418, 28.28662872314453, 29.69830322265625, 31.10997772216797, 32.52165222167969, 33.933326721191406, 35.345001220703125, 36.756675720214844, 38.16835403442383, 39.58002853393555, 40.991703033447266, 42.403377532958984, 43.81505584716797, 45.22673034667969, 46.638404846191406, 48.050079345703125, 49.46175765991211, 50.87343215942383, 52.28510665893555, 53.696781158447266, 55.108455657958984]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 14.0, 14.0, 11.0, 11.0, 35.0, 49.0, 63.0, 98.0, 105.0, 174.0, 279.0, 459.0, 868.0, 1642.0, 3608.0, 8148.0, 20248.0, 55000.0, 148974.0, 173121.0, 69008.0, 24537.0, 9519.0, 4006.0, 1783.0, 913.0, 536.0, 317.0, 202.0, 161.0, 99.0, 80.0, 32.0, 37.0, 32.0, 31.0, 13.0, 8.0, 10.0, 7.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.328125, -10.01611328125, -9.7041015625, -9.39208984375, -9.080078125, -8.76806640625, -8.4560546875, -8.14404296875, -7.83203125, -7.52001953125, -7.2080078125, -6.89599609375, -6.583984375, -6.27197265625, -5.9599609375, -5.64794921875, -5.3359375, -5.02392578125, -4.7119140625, -4.39990234375, -4.087890625, -3.77587890625, -3.4638671875, -3.15185546875, -2.83984375, -2.52783203125, -2.2158203125, -1.90380859375, -1.591796875, -1.27978515625, -0.9677734375, -0.65576171875, -0.34375, -0.03173828125, 0.2802734375, 0.59228515625, 0.904296875, 1.21630859375, 1.5283203125, 1.84033203125, 2.15234375, 2.46435546875, 2.7763671875, 3.08837890625, 3.400390625, 3.71240234375, 4.0244140625, 4.33642578125, 4.6484375, 4.96044921875, 5.2724609375, 5.58447265625, 5.896484375, 6.20849609375, 6.5205078125, 6.83251953125, 7.14453125, 7.45654296875, 7.7685546875, 8.08056640625, 8.392578125, 8.70458984375, 9.0166015625, 9.32861328125, 9.640625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 4.0, 6.0, 8.0, 4.0, 10.0, 24.0, 30.0, 26.0, 31.0, 46.0, 54.0, 69.0, 77.0, 99.0, 91.0, 79.0, 65.0, 55.0, 46.0, 27.0, 41.0, 25.0, 26.0, 16.0, 9.0, 7.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4365234375, -1.3769378662109375, -1.317352294921875, -1.2577667236328125, -1.19818115234375, -1.1385955810546875, -1.079010009765625, -1.0194244384765625, -0.9598388671875, -0.9002532958984375, -0.840667724609375, -0.7810821533203125, -0.72149658203125, -0.6619110107421875, -0.602325439453125, -0.5427398681640625, -0.483154296875, -0.4235687255859375, -0.363983154296875, -0.3043975830078125, -0.24481201171875, -0.1852264404296875, -0.125640869140625, -0.0660552978515625, -0.0064697265625, 0.0531158447265625, 0.112701416015625, 0.1722869873046875, 0.23187255859375, 0.2914581298828125, 0.351043701171875, 0.4106292724609375, 0.47021484375, 0.5298004150390625, 0.589385986328125, 0.6489715576171875, 0.70855712890625, 0.7681427001953125, 0.827728271484375, 0.8873138427734375, 0.9468994140625, 1.0064849853515625, 1.066070556640625, 1.1256561279296875, 1.18524169921875, 1.2448272705078125, 1.304412841796875, 1.3639984130859375, 1.423583984375, 1.4831695556640625, 1.542755126953125, 1.6023406982421875, 1.66192626953125, 1.7215118408203125, 1.781097412109375, 1.8406829833984375, 1.9002685546875, 1.9598541259765625, 2.019439697265625, 2.0790252685546875, 2.13861083984375, 2.1981964111328125, 2.257781982421875, 2.3173675537109375, 2.376953125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 1.0, 8.0, 5.0, 4.0, 7.0, 15.0, 18.0, 19.0, 30.0, 34.0, 47.0, 47.0, 49.0, 36.0, 47.0, 31.0, 18.0, 17.0, 13.0, 9.0, 7.0, 4.0, 6.0, 4.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.602139472961426, -9.308943748474121, -9.015748023986816, -8.722552299499512, -8.429356575012207, -8.136160850524902, -7.842965126037598, -7.549769401550293, -7.256573677062988, -6.963377952575684, -6.670182228088379, -6.376986503601074, -6.0837907791137695, -5.790595054626465, -5.49739933013916, -5.2042036056518555, -4.911007881164551, -4.617812156677246, -4.324616432189941, -4.031420707702637, -3.738224983215332, -3.4450292587280273, -3.1518335342407227, -2.858637809753418, -2.5654420852661133, -2.2722463607788086, -1.979050636291504, -1.6858549118041992, -1.3926591873168945, -1.0994634628295898, -0.8062677383422852, -0.5130720138549805, -0.2198772430419922, 0.0733184814453125, 0.3665142059326172, 0.6597099304199219, 0.9529056549072266, 1.2461013793945312, 1.539297103881836, 1.8324928283691406, 2.1256885528564453, 2.41888427734375, 2.7120800018310547, 3.0052757263183594, 3.298471450805664, 3.5916671752929688, 3.8848628997802734, 4.178058624267578, 4.471254348754883, 4.7644500732421875, 5.057645797729492, 5.350841522216797, 5.644037246704102, 5.937232971191406, 6.230428695678711, 6.523624420166016, 6.81682014465332, 7.110015869140625, 7.40321159362793, 7.696407318115234, 7.989603042602539, 8.282798767089844, 8.575994491577148, 8.869190216064453, 9.162385940551758]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 3.0, 6.0, 16.0, 13.0, 16.0, 18.0, 19.0, 41.0, 44.0, 51.0, 53.0, 54.0, 32.0, 25.0, 22.0, 17.0, 13.0, 8.0, 13.0, 4.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.531839370727539, -7.186500072479248, -6.841160297393799, -6.495820999145508, -6.150481700897217, -5.805142402648926, -5.459802627563477, -5.1144633293151855, -4.7691240310668945, -4.4237847328186035, -4.078444957733154, -3.7331056594848633, -3.3877663612365723, -3.042426824569702, -2.697087287902832, -2.351747989654541, -2.006408214569092, -1.6610687971115112, -1.3157293796539307, -0.9703898429870605, -0.62505042552948, -0.2797110080718994, 0.0656285285949707, 0.4109678268432617, 0.7563073635101318, 1.1016467809677124, 1.446986198425293, 1.792325735092163, 2.137665271759033, 2.483004570007324, 2.8283441066741943, 3.1736834049224854, 3.5190229415893555, 3.8643624782562256, 4.209702014923096, 4.555041313171387, 4.900380611419678, 5.245719909667969, 5.591059684753418, 5.936398983001709, 6.28173828125, 6.627077579498291, 6.97241735458374, 7.317756652832031, 7.663095951080322, 8.008435249328613, 8.353775024414062, 8.699113845825195, 9.044454574584961, 9.38979434967041, 9.735133171081543, 10.080472946166992, 10.425812721252441, 10.771151542663574, 11.116491317749023, 11.461830139160156, 11.807169914245605, 12.152509689331055, 12.497848510742188, 12.843188285827637, 13.188528060913086, 13.533866882324219, 13.879206657409668, 14.224546432495117, 14.56988525390625]}, "eval/loss": 7.756877899169922, "eval/wer": 1.9964482012818223, "eval/runtime": 950.641, "eval/samples_per_second": 2.779, "eval/steps_per_second": 0.348} \ No newline at end of file